diff --git "a/wandb/run-20220310_205608-mf17w61i/files/wandb-summary.json" "b/wandb/run-20220310_205608-mf17w61i/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220310_205608-mf17w61i/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 6.6781, "train/learning_rate": 2.9118171021377674e-05, "train/epoch": 1.68, "train/global_step": 1500, "_runtime": 9779, "_timestamp": 1646955547, "_step": 1500, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 9.0, 11.0, 7.0, 3.0, 106.0, 28.0, 11.0, 7.0, 30219.0, 73.0, 16.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.77960205078125, -6.4068603515625, -6.03411865234375, -5.661376953125, -5.28863525390625, -4.9158935546875, -4.54315185546875, -4.17041015625, -3.79766845703125, -3.4249267578125, -3.05218505859375, -2.679443359375, -2.30670166015625, -1.9339599609375, -1.56121826171875, -1.1884765625, -0.81573486328125, -0.4429931640625, -0.07025146484375, 0.302490234375, 0.67523193359375, 1.0479736328125, 1.42071533203125, 1.79345703125, 2.16619873046875, 2.5389404296875, 2.91168212890625, 3.284423828125, 3.65716552734375, 4.0299072265625, 4.40264892578125, 4.775390625, 5.14813232421875, 5.5208740234375, 5.89361572265625, 6.266357421875, 6.63909912109375, 7.0118408203125, 7.38458251953125, 7.75732421875, 8.13006591796875, 8.5028076171875, 8.87554931640625, 9.248291015625, 9.62103271484375, 9.9937744140625, 10.36651611328125, 10.7392578125, 11.11199951171875, 11.4847412109375, 11.85748291015625, 12.230224609375, 12.60296630859375, 12.9757080078125, 13.34844970703125, 13.72119140625, 14.09393310546875, 14.4666748046875, 14.83941650390625, 15.212158203125, 15.58489990234375, 15.9576416015625, 16.33038330078125, 16.703125]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 36.0, 226.0, 671.0, 70.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.65150833129883, -32.98121643066406, -32.3109245300293, -31.6406307220459, -30.9703369140625, -30.300045013427734, -29.62975311279297, -28.95945930480957, -28.289165496826172, -27.618873596191406, -26.948579788208008, -26.278287887573242, -25.607994079589844, -24.937702178955078, -24.267410278320312, -23.597116470336914, -22.92682456970215, -22.256532669067383, -21.586238861083984, -20.91594696044922, -20.24565315246582, -19.575361251831055, -18.905067443847656, -18.23477554321289, -17.564483642578125, -16.89419174194336, -16.22389793395996, -15.553606033325195, -14.883312225341797, -14.213020324707031, -13.54272747039795, -12.872434616088867, -12.202141761779785, -11.531848907470703, -10.861556053161621, -10.191263198852539, -9.520971298217773, -8.850677490234375, -8.18038558959961, -7.510092735290527, -6.839799880981445, -6.169507026672363, -5.499214172363281, -4.828921794891357, -4.158628940582275, -3.4883360862731934, -2.8180437088012695, -2.1477508544921875, -1.4774580001831055, -0.807165265083313, -0.1368725299835205, 0.5334200859069824, 1.2037129402160645, 1.8740057945251465, 2.5442981719970703, 3.2145910263061523, 3.8848838806152344, 4.555176734924316, 5.225469589233398, 5.895761966705322, 6.566054821014404, 7.236347675323486, 7.90664005279541, 8.576932907104492, 9.247225761413574]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 8.0, 4.0, 3.0, 8.0, 7.0, 8.0, 14.0, 17.0, 24.0, 21.0, 38.0, 32.0, 42.0, 43.0, 66.0, 50.0, 48.0, 62.0, 56.0, 49.0, 49.0, 49.0, 54.0, 36.0, 37.0, 35.0, 22.0, 25.0, 19.0, 15.0, 16.0, 14.0, 11.0, 6.0, 7.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.171442747116089, -3.0303826332092285, -2.889322519302368, -2.748262405395508, -2.6072020530700684, -2.466141939163208, -2.3250818252563477, -2.1840217113494873, -2.042961597442627, -1.9019014835357666, -1.7608412504196167, -1.6197811365127563, -1.4787209033966064, -1.337660789489746, -1.1966006755828857, -1.0555405616760254, -0.9144802093505859, -0.7734200358390808, -0.6323598623275757, -0.49129974842071533, -0.3502395749092102, -0.20917940139770508, -0.06811928749084473, 0.0729408860206604, 0.21400105953216553, 0.35506123304367065, 0.4961213767528534, 0.6371815204620361, 0.7782416939735413, 0.9193018674850464, 1.0603619813919067, 1.2014222145080566, 1.342482566833496, 1.4835426807403564, 1.6246029138565063, 1.7656630277633667, 1.9067232608795166, 2.047783374786377, 2.1888434886932373, 2.3299036026000977, 2.470963954925537, 2.6120240688323975, 2.753084182739258, 2.8941445350646973, 3.0352046489715576, 3.176264762878418, 3.3173248767852783, 3.4583849906921387, 3.599445104598999, 3.7405052185058594, 3.8815653324127197, 4.02262544631958, 4.1636857986450195, 4.304745674133301, 4.44580602645874, 4.58686637878418, 4.727926254272461, 4.8689866065979, 5.010046482086182, 5.151106834411621, 5.292166709899902, 5.433227062225342, 5.574287414550781, 5.7153472900390625, 5.856407642364502]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 5.0, 10.0, 8.0, 6.0, 10.0, 21.0, 27.0, 30.0, 49.0, 87.0, 151.0, 288.0, 628.0, 1503.0, 3735.0, 10276.0, 35594.0, 162227.0, 576604.0, 195920.0, 42323.0, 11908.0, 3995.0, 1653.0, 693.0, 344.0, 188.0, 120.0, 52.0, 28.0, 18.0, 20.0, 15.0, 5.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4375, -9.05322265625, -8.6689453125, -8.28466796875, -7.900390625, -7.51611328125, -7.1318359375, -6.74755859375, -6.36328125, -5.97900390625, -5.5947265625, -5.21044921875, -4.826171875, -4.44189453125, -4.0576171875, -3.67333984375, -3.2890625, -2.90478515625, -2.5205078125, -2.13623046875, -1.751953125, -1.36767578125, -0.9833984375, -0.59912109375, -0.21484375, 0.16943359375, 0.5537109375, 0.93798828125, 1.322265625, 1.70654296875, 2.0908203125, 2.47509765625, 2.859375, 3.24365234375, 3.6279296875, 4.01220703125, 4.396484375, 4.78076171875, 5.1650390625, 5.54931640625, 5.93359375, 6.31787109375, 6.7021484375, 7.08642578125, 7.470703125, 7.85498046875, 8.2392578125, 8.62353515625, 9.0078125, 9.39208984375, 9.7763671875, 10.16064453125, 10.544921875, 10.92919921875, 11.3134765625, 11.69775390625, 12.08203125, 12.46630859375, 12.8505859375, 13.23486328125, 13.619140625, 14.00341796875, 14.3876953125, 14.77197265625, 15.15625]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 2.0, 4.0, 10.0, 11.0, 12.0, 12.0, 29.0, 17.0, 31.0, 39.0, 37.0, 46.0, 65.0, 56.0, 54.0, 108.0, 75.0, 45.0, 43.0, 55.0, 45.0, 37.0, 32.0, 28.0, 28.0, 17.0, 13.0, 9.0, 9.0, 10.0, 9.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.296875, -2.200286865234375, -2.10369873046875, -2.007110595703125, -1.9105224609375, -1.813934326171875, -1.71734619140625, -1.620758056640625, -1.524169921875, -1.427581787109375, -1.33099365234375, -1.234405517578125, -1.1378173828125, -1.041229248046875, -0.94464111328125, -0.848052978515625, -0.75146484375, -0.654876708984375, -0.55828857421875, -0.461700439453125, -0.3651123046875, -0.268524169921875, -0.17193603515625, -0.075347900390625, 0.021240234375, 0.117828369140625, 0.21441650390625, 0.311004638671875, 0.4075927734375, 0.504180908203125, 0.60076904296875, 0.697357177734375, 0.7939453125, 0.890533447265625, 0.98712158203125, 1.083709716796875, 1.1802978515625, 1.276885986328125, 1.37347412109375, 1.470062255859375, 1.566650390625, 1.663238525390625, 1.75982666015625, 1.856414794921875, 1.9530029296875, 2.049591064453125, 2.14617919921875, 2.242767333984375, 2.33935546875, 2.435943603515625, 2.53253173828125, 2.629119873046875, 2.7257080078125, 2.822296142578125, 2.91888427734375, 3.015472412109375, 3.112060546875, 3.208648681640625, 3.30523681640625, 3.401824951171875, 3.4984130859375, 3.595001220703125, 3.69158935546875, 3.788177490234375, 3.884765625]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 9.0, 5.0, 11.0, 16.0, 23.0, 21.0, 44.0, 45.0, 56.0, 74.0, 109.0, 99.0, 89.0, 96.0, 87.0, 48.0, 32.0, 23.0, 21.0, 16.0, 18.0, 10.0, 8.0, 4.0, 9.0, 6.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.656081676483154, -4.529134750366211, -4.402188301086426, -4.275241374969482, -4.148294448852539, -4.021347522735596, -3.8944008350372314, -3.767454147338867, -3.640507221221924, -3.5135602951049805, -3.386613607406616, -3.259666919708252, -3.1327199935913086, -3.0057730674743652, -2.878826379776001, -2.7518796920776367, -2.6249327659606934, -2.49798583984375, -2.3710391521453857, -2.2440924644470215, -2.117145538330078, -1.9901987314224243, -1.8632519245147705, -1.7363051176071167, -1.609358310699463, -1.482411503791809, -1.3554646968841553, -1.2285178899765015, -1.1015710830688477, -0.9746242761611938, -0.84767746925354, -0.7207306623458862, -0.5937840938568115, -0.4668372869491577, -0.3398904800415039, -0.2129436731338501, -0.08599686622619629, 0.04094994068145752, 0.16789674758911133, 0.29484355449676514, 0.42179036140441895, 0.5487371683120728, 0.6756839752197266, 0.8026307821273804, 0.9295775890350342, 1.056524395942688, 1.1834712028503418, 1.3104180097579956, 1.4373648166656494, 1.5643116235733032, 1.691258430480957, 1.8182052373886108, 1.9451520442962646, 2.072098731994629, 2.1990456581115723, 2.3259925842285156, 2.45293927192688, 2.579885959625244, 2.7068328857421875, 2.833779811859131, 2.960726499557495, 3.0876731872558594, 3.2146201133728027, 3.341567039489746, 3.4685137271881104]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 2.0, 5.0, 3.0, 8.0, 15.0, 9.0, 13.0, 17.0, 21.0, 23.0, 16.0, 24.0, 32.0, 41.0, 36.0, 44.0, 57.0, 44.0, 41.0, 47.0, 56.0, 35.0, 43.0, 44.0, 35.0, 35.0, 39.0, 33.0, 32.0, 26.0, 25.0, 21.0, 15.0, 18.0, 14.0, 9.0, 8.0, 4.0, 4.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.090424060821533, -3.977288246154785, -3.864152193069458, -3.75101637840271, -3.637880563735962, -3.5247445106506348, -3.4116086959838867, -3.2984728813171387, -3.1853370666503906, -3.0722012519836426, -2.9590651988983154, -2.8459293842315674, -2.7327935695648193, -2.619657516479492, -2.506521701812744, -2.393385887145996, -2.280249834060669, -2.167114019393921, -2.0539779663085938, -1.9408421516418457, -1.8277063369750977, -1.71457040309906, -1.6014344692230225, -1.4882986545562744, -1.3751627206802368, -1.2620267868041992, -1.1488909721374512, -1.0357550382614136, -0.9226191639900208, -0.8094832897186279, -0.6963473558425903, -0.5832114815711975, -0.4700758457183838, -0.35693997144699097, -0.24380406737327576, -0.13066816329956055, -0.017532289028167725, 0.0956035852432251, 0.2087395191192627, 0.3218753933906555, 0.43501126766204834, 0.5481471419334412, 0.661283016204834, 0.7744189500808716, 0.8875548243522644, 1.0006906986236572, 1.1138266324996948, 1.2269625663757324, 1.3400983810424805, 1.453234314918518, 1.5663701295852661, 1.6795060634613037, 1.7926418781280518, 1.9057778120040894, 2.018913745880127, 2.132049560546875, 2.245185375213623, 2.358321189880371, 2.4714572429656982, 2.5845930576324463, 2.6977288722991943, 2.8108649253845215, 2.9240007400512695, 3.0371365547180176, 3.1502726078033447]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 10.0, 4.0, 11.0, 14.0, 14.0, 38.0, 43.0, 52.0, 66.0, 91.0, 102.0, 152.0, 207.0, 310.0, 432.0, 680.0, 1097.0, 2130.0, 4461.0, 15477.0, 475070.0, 3532342.0, 143765.0, 9429.0, 3460.0, 1738.0, 951.0, 615.0, 427.0, 289.0, 202.0, 163.0, 134.0, 62.0, 63.0, 49.0, 36.0, 30.0, 14.0, 17.0, 12.0, 7.0, 6.0, 1.0, 2.0, 4.0, 4.0, 0.0, 0.0, 2.0], "bins": [-5.53515625, -5.37860107421875, -5.2220458984375, -5.06549072265625, -4.908935546875, -4.75238037109375, -4.5958251953125, -4.43927001953125, -4.28271484375, -4.12615966796875, -3.9696044921875, -3.81304931640625, -3.656494140625, -3.49993896484375, -3.3433837890625, -3.18682861328125, -3.0302734375, -2.87371826171875, -2.7171630859375, -2.56060791015625, -2.404052734375, -2.24749755859375, -2.0909423828125, -1.93438720703125, -1.77783203125, -1.62127685546875, -1.4647216796875, -1.30816650390625, -1.151611328125, -0.99505615234375, -0.8385009765625, -0.68194580078125, -0.525390625, -0.36883544921875, -0.2122802734375, -0.05572509765625, 0.100830078125, 0.25738525390625, 0.4139404296875, 0.57049560546875, 0.72705078125, 0.88360595703125, 1.0401611328125, 1.19671630859375, 1.353271484375, 1.50982666015625, 1.6663818359375, 1.82293701171875, 1.9794921875, 2.13604736328125, 2.2926025390625, 2.44915771484375, 2.605712890625, 2.76226806640625, 2.9188232421875, 3.07537841796875, 3.23193359375, 3.38848876953125, 3.5450439453125, 3.70159912109375, 3.858154296875, 4.01470947265625, 4.1712646484375, 4.32781982421875, 4.484375]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 5.0, 6.0, 5.0, 6.0, 9.0, 17.0, 17.0, 11.0, 20.0, 19.0, 22.0, 22.0, 36.0, 43.0, 31.0, 47.0, 43.0, 40.0, 42.0, 45.0, 32.0, 45.0, 45.0, 52.0, 38.0, 33.0, 42.0, 27.0, 30.0, 38.0, 31.0, 23.0, 14.0, 13.0, 11.0, 10.0, 5.0, 10.0, 9.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.01171875, -1.951324462890625, -1.89093017578125, -1.830535888671875, -1.7701416015625, -1.709747314453125, -1.64935302734375, -1.588958740234375, -1.528564453125, -1.468170166015625, -1.40777587890625, -1.347381591796875, -1.2869873046875, -1.226593017578125, -1.16619873046875, -1.105804443359375, -1.04541015625, -0.985015869140625, -0.92462158203125, -0.864227294921875, -0.8038330078125, -0.743438720703125, -0.68304443359375, -0.622650146484375, -0.562255859375, -0.501861572265625, -0.44146728515625, -0.381072998046875, -0.3206787109375, -0.260284423828125, -0.19989013671875, -0.139495849609375, -0.0791015625, -0.018707275390625, 0.04168701171875, 0.102081298828125, 0.1624755859375, 0.222869873046875, 0.28326416015625, 0.343658447265625, 0.404052734375, 0.464447021484375, 0.52484130859375, 0.585235595703125, 0.6456298828125, 0.706024169921875, 0.76641845703125, 0.826812744140625, 0.88720703125, 0.947601318359375, 1.00799560546875, 1.068389892578125, 1.1287841796875, 1.189178466796875, 1.24957275390625, 1.309967041015625, 1.370361328125, 1.430755615234375, 1.49114990234375, 1.551544189453125, 1.6119384765625, 1.672332763671875, 1.73272705078125, 1.793121337890625, 1.853515625]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 6.0, 4.0, 11.0, 13.0, 21.0, 54.0, 126.0, 839.0, 106378.0, 4085141.0, 1354.0, 218.0, 37.0, 32.0, 19.0, 12.0, 4.0, 4.0, 1.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.53125, -41.44384765625, -40.3564453125, -39.26904296875, -38.181640625, -37.09423828125, -36.0068359375, -34.91943359375, -33.83203125, -32.74462890625, -31.6572265625, -30.56982421875, -29.482421875, -28.39501953125, -27.3076171875, -26.22021484375, -25.1328125, -24.04541015625, -22.9580078125, -21.87060546875, -20.783203125, -19.69580078125, -18.6083984375, -17.52099609375, -16.43359375, -15.34619140625, -14.2587890625, -13.17138671875, -12.083984375, -10.99658203125, -9.9091796875, -8.82177734375, -7.734375, -6.64697265625, -5.5595703125, -4.47216796875, -3.384765625, -2.29736328125, -1.2099609375, -0.12255859375, 0.96484375, 2.05224609375, 3.1396484375, 4.22705078125, 5.314453125, 6.40185546875, 7.4892578125, 8.57666015625, 9.6640625, 10.75146484375, 11.8388671875, 12.92626953125, 14.013671875, 15.10107421875, 16.1884765625, 17.27587890625, 18.36328125, 19.45068359375, 20.5380859375, 21.62548828125, 22.712890625, 23.80029296875, 24.8876953125, 25.97509765625, 27.0625]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 11.0, 13.0, 26.0, 45.0, 86.0, 349.0, 916.0, 1520.0, 710.0, 220.0, 73.0, 27.0, 20.0, 17.0, 10.0, 8.0, 1.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.802734375, -1.7544708251953125, -1.706207275390625, -1.6579437255859375, -1.60968017578125, -1.5614166259765625, -1.513153076171875, -1.4648895263671875, -1.4166259765625, -1.3683624267578125, -1.320098876953125, -1.2718353271484375, -1.22357177734375, -1.1753082275390625, -1.127044677734375, -1.0787811279296875, -1.030517578125, -0.9822540283203125, -0.933990478515625, -0.8857269287109375, -0.83746337890625, -0.7891998291015625, -0.740936279296875, -0.6926727294921875, -0.6444091796875, -0.5961456298828125, -0.547882080078125, -0.4996185302734375, -0.45135498046875, -0.4030914306640625, -0.354827880859375, -0.3065643310546875, -0.25830078125, -0.2100372314453125, -0.161773681640625, -0.1135101318359375, -0.06524658203125, -0.0169830322265625, 0.031280517578125, 0.0795440673828125, 0.1278076171875, 0.1760711669921875, 0.224334716796875, 0.2725982666015625, 0.32086181640625, 0.3691253662109375, 0.417388916015625, 0.4656524658203125, 0.513916015625, 0.5621795654296875, 0.610443115234375, 0.6587066650390625, 0.70697021484375, 0.7552337646484375, 0.803497314453125, 0.8517608642578125, 0.9000244140625, 0.9482879638671875, 0.996551513671875, 1.0448150634765625, 1.09307861328125, 1.1413421630859375, 1.189605712890625, 1.2378692626953125, 1.2861328125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 10.0, 11.0, 12.0, 19.0, 17.0, 26.0, 34.0, 44.0, 55.0, 57.0, 77.0, 81.0, 81.0, 82.0, 61.0, 68.0, 52.0, 32.0, 29.0, 22.0, 20.0, 21.0, 12.0, 13.0, 5.0, 6.0, 7.0, 6.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.9721152782440186, -1.9180643558502197, -1.8640133142471313, -1.8099623918533325, -1.7559114694595337, -1.7018604278564453, -1.6478095054626465, -1.5937585830688477, -1.5397076606750488, -1.48565673828125, -1.4316056966781616, -1.3775547742843628, -1.323503851890564, -1.2694528102874756, -1.2154018878936768, -1.161350965499878, -1.107300043106079, -1.0532491207122803, -0.9991981387138367, -0.9451471567153931, -0.8910962343215942, -0.8370452523231506, -0.782994270324707, -0.7289433479309082, -0.6748923063278198, -0.6208413243293762, -0.5667904019355774, -0.5127394199371338, -0.45868849754333496, -0.40463751554489136, -0.35058656334877014, -0.2965356111526489, -0.2424846887588501, -0.18843373656272888, -0.13438278436660767, -0.08033181726932526, -0.02628086507320404, 0.02777010202407837, 0.08182105422019958, 0.1358720064163208, 0.18992295861244202, 0.24397391080856323, 0.29802486300468445, 0.35207581520080566, 0.40612679719924927, 0.4601777493953705, 0.5142287015914917, 0.5682796239852905, 0.6223306059837341, 0.6763815879821777, 0.7304325103759766, 0.7844834923744202, 0.838534414768219, 0.8925853967666626, 0.9466363191604614, 1.0006873607635498, 1.0547382831573486, 1.1087892055511475, 1.1628402471542358, 1.2168911695480347, 1.2709420919418335, 1.3249931335449219, 1.3790440559387207, 1.4330949783325195, 1.4871459007263184]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 7.0, 5.0, 4.0, 6.0, 9.0, 11.0, 15.0, 12.0, 23.0, 21.0, 16.0, 24.0, 25.0, 25.0, 39.0, 35.0, 38.0, 43.0, 41.0, 43.0, 33.0, 55.0, 39.0, 47.0, 33.0, 48.0, 40.0, 33.0, 34.0, 32.0, 29.0, 28.0, 22.0, 16.0, 24.0, 9.0, 9.0, 7.0, 6.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.804324984550476, -1.7467538118362427, -1.6891826391220093, -1.6316114664077759, -1.574040412902832, -1.5164692401885986, -1.4588980674743652, -1.4013268947601318, -1.3437557220458984, -1.286184549331665, -1.2286133766174316, -1.1710422039031982, -1.1134710311889648, -1.0558998584747314, -0.9983288049697876, -0.9407576322555542, -0.8831864595413208, -0.8256152868270874, -0.768044114112854, -0.7104730010032654, -0.652901828289032, -0.5953306555747986, -0.53775954246521, -0.48018836975097656, -0.42261719703674316, -0.36504602432250977, -0.30747488141059875, -0.24990372359752655, -0.19233256578445435, -0.13476139307022095, -0.07719025015830994, -0.019619107246398926, 0.03795218467712402, 0.09552334249019623, 0.15309450030326843, 0.21066565811634064, 0.26823681592941284, 0.32580798864364624, 0.38337913155555725, 0.44095027446746826, 0.49852144718170166, 0.5560926198959351, 0.6136637926101685, 0.6712349057197571, 0.7288060784339905, 0.7863772511482239, 0.8439483642578125, 0.9015195369720459, 0.9590907096862793, 1.0166618824005127, 1.074233055114746, 1.1318042278289795, 1.189375400543213, 1.2469465732574463, 1.3045176267623901, 1.3620887994766235, 1.419659972190857, 1.4772311449050903, 1.5348023176193237, 1.5923734903335571, 1.649944543838501, 1.7075157165527344, 1.7650868892669678, 1.8226580619812012, 1.8802292346954346]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 9.0, 27.0, 31.0, 44.0, 58.0, 78.0, 146.0, 178.0, 313.0, 462.0, 823.0, 1382.0, 2326.0, 4105.0, 7590.0, 14617.0, 29722.0, 62161.0, 137039.0, 307638.0, 261480.0, 112910.0, 52493.0, 25126.0, 12529.0, 6447.0, 3599.0, 2043.0, 1204.0, 697.0, 430.0, 284.0, 173.0, 131.0, 75.0, 56.0, 43.0, 24.0, 15.0, 13.0, 10.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.625, -1.5770416259765625, -1.529083251953125, -1.4811248779296875, -1.43316650390625, -1.3852081298828125, -1.337249755859375, -1.2892913818359375, -1.2413330078125, -1.1933746337890625, -1.145416259765625, -1.0974578857421875, -1.04949951171875, -1.0015411376953125, -0.953582763671875, -0.9056243896484375, -0.857666015625, -0.8097076416015625, -0.761749267578125, -0.7137908935546875, -0.66583251953125, -0.6178741455078125, -0.569915771484375, -0.5219573974609375, -0.4739990234375, -0.4260406494140625, -0.378082275390625, -0.3301239013671875, -0.28216552734375, -0.2342071533203125, -0.186248779296875, -0.1382904052734375, -0.09033203125, -0.0423736572265625, 0.005584716796875, 0.0535430908203125, 0.10150146484375, 0.1494598388671875, 0.197418212890625, 0.2453765869140625, 0.2933349609375, 0.3412933349609375, 0.389251708984375, 0.4372100830078125, 0.48516845703125, 0.5331268310546875, 0.581085205078125, 0.6290435791015625, 0.677001953125, 0.7249603271484375, 0.772918701171875, 0.8208770751953125, 0.86883544921875, 0.9167938232421875, 0.964752197265625, 1.0127105712890625, 1.0606689453125, 1.1086273193359375, 1.156585693359375, 1.2045440673828125, 1.25250244140625, 1.3004608154296875, 1.348419189453125, 1.3963775634765625, 1.4443359375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 9.0, 7.0, 14.0, 9.0, 17.0, 15.0, 17.0, 14.0, 26.0, 29.0, 29.0, 29.0, 38.0, 40.0, 44.0, 44.0, 40.0, 38.0, 42.0, 43.0, 45.0, 46.0, 39.0, 34.0, 38.0, 36.0, 36.0, 28.0, 22.0, 20.0, 26.0, 17.0, 13.0, 18.0, 6.0, 7.0, 7.0, 4.0, 2.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3671875, -1.31951904296875, -1.2718505859375, -1.22418212890625, -1.176513671875, -1.12884521484375, -1.0811767578125, -1.03350830078125, -0.98583984375, -0.93817138671875, -0.8905029296875, -0.84283447265625, -0.795166015625, -0.74749755859375, -0.6998291015625, -0.65216064453125, -0.6044921875, -0.55682373046875, -0.5091552734375, -0.46148681640625, -0.413818359375, -0.36614990234375, -0.3184814453125, -0.27081298828125, -0.22314453125, -0.17547607421875, -0.1278076171875, -0.08013916015625, -0.032470703125, 0.01519775390625, 0.0628662109375, 0.11053466796875, 0.158203125, 0.20587158203125, 0.2535400390625, 0.30120849609375, 0.348876953125, 0.39654541015625, 0.4442138671875, 0.49188232421875, 0.53955078125, 0.58721923828125, 0.6348876953125, 0.68255615234375, 0.730224609375, 0.77789306640625, 0.8255615234375, 0.87322998046875, 0.9208984375, 0.96856689453125, 1.0162353515625, 1.06390380859375, 1.111572265625, 1.15924072265625, 1.2069091796875, 1.25457763671875, 1.30224609375, 1.34991455078125, 1.3975830078125, 1.44525146484375, 1.492919921875, 1.54058837890625, 1.5882568359375, 1.63592529296875, 1.68359375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 13.0, 17.0, 18.0, 30.0, 53.0, 63.0, 111.0, 161.0, 249.0, 434.0, 674.0, 1118.0, 2042.0, 3696.0, 7101.0, 13550.0, 28814.0, 63358.0, 160921.0, 414687.0, 205221.0, 78034.0, 33914.0, 16091.0, 8084.0, 4305.0, 2377.0, 1290.0, 773.0, 468.0, 306.0, 183.0, 130.0, 85.0, 62.0, 34.0, 21.0, 24.0, 11.0, 11.0, 8.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9462890625, -0.9181365966796875, -0.889984130859375, -0.8618316650390625, -0.83367919921875, -0.8055267333984375, -0.777374267578125, -0.7492218017578125, -0.7210693359375, -0.6929168701171875, -0.664764404296875, -0.6366119384765625, -0.60845947265625, -0.5803070068359375, -0.552154541015625, -0.5240020751953125, -0.495849609375, -0.4676971435546875, -0.439544677734375, -0.4113922119140625, -0.38323974609375, -0.3550872802734375, -0.326934814453125, -0.2987823486328125, -0.2706298828125, -0.2424774169921875, -0.214324951171875, -0.1861724853515625, -0.15802001953125, -0.1298675537109375, -0.101715087890625, -0.0735626220703125, -0.04541015625, -0.0172576904296875, 0.010894775390625, 0.0390472412109375, 0.06719970703125, 0.0953521728515625, 0.123504638671875, 0.1516571044921875, 0.1798095703125, 0.2079620361328125, 0.236114501953125, 0.2642669677734375, 0.29241943359375, 0.3205718994140625, 0.348724365234375, 0.3768768310546875, 0.405029296875, 0.4331817626953125, 0.461334228515625, 0.4894866943359375, 0.51763916015625, 0.5457916259765625, 0.573944091796875, 0.6020965576171875, 0.6302490234375, 0.6584014892578125, 0.686553955078125, 0.7147064208984375, 0.74285888671875, 0.7710113525390625, 0.799163818359375, 0.8273162841796875, 0.85546875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 5.0, 11.0, 9.0, 10.0, 18.0, 16.0, 16.0, 32.0, 26.0, 26.0, 42.0, 30.0, 32.0, 31.0, 40.0, 47.0, 37.0, 35.0, 38.0, 41.0, 40.0, 40.0, 31.0, 29.0, 36.0, 35.0, 31.0, 24.0, 22.0, 27.0, 21.0, 25.0, 12.0, 18.0, 11.0, 4.0, 8.0, 7.0, 4.0, 7.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8115234375, -0.7833099365234375, -0.755096435546875, -0.7268829345703125, -0.69866943359375, -0.6704559326171875, -0.642242431640625, -0.6140289306640625, -0.5858154296875, -0.5576019287109375, -0.529388427734375, -0.5011749267578125, -0.47296142578125, -0.4447479248046875, -0.416534423828125, -0.3883209228515625, -0.360107421875, -0.3318939208984375, -0.303680419921875, -0.2754669189453125, -0.24725341796875, -0.2190399169921875, -0.190826416015625, -0.1626129150390625, -0.1343994140625, -0.1061859130859375, -0.077972412109375, -0.0497589111328125, -0.02154541015625, 0.0066680908203125, 0.034881591796875, 0.0630950927734375, 0.09130859375, 0.1195220947265625, 0.147735595703125, 0.1759490966796875, 0.20416259765625, 0.2323760986328125, 0.260589599609375, 0.2888031005859375, 0.3170166015625, 0.3452301025390625, 0.373443603515625, 0.4016571044921875, 0.42987060546875, 0.4580841064453125, 0.486297607421875, 0.5145111083984375, 0.542724609375, 0.5709381103515625, 0.599151611328125, 0.6273651123046875, 0.65557861328125, 0.6837921142578125, 0.712005615234375, 0.7402191162109375, 0.7684326171875, 0.7966461181640625, 0.824859619140625, 0.8530731201171875, 0.88128662109375, 0.9095001220703125, 0.937713623046875, 0.9659271240234375, 0.994140625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 5.0, 7.0, 7.0, 11.0, 13.0, 23.0, 20.0, 35.0, 62.0, 68.0, 89.0, 125.0, 152.0, 244.0, 366.0, 540.0, 895.0, 1438.0, 2502.0, 5131.0, 11833.0, 36073.0, 208774.0, 682378.0, 64040.0, 18013.0, 7124.0, 3414.0, 1834.0, 1106.0, 677.0, 461.0, 298.0, 218.0, 159.0, 118.0, 60.0, 55.0, 44.0, 39.0, 30.0, 22.0, 15.0, 13.0, 11.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.30078125, -0.2911415100097656, -0.28150177001953125, -0.2718620300292969, -0.2622222900390625, -0.2525825500488281, -0.24294281005859375, -0.23330307006835938, -0.223663330078125, -0.21402359008789062, -0.20438385009765625, -0.19474411010742188, -0.1851043701171875, -0.17546463012695312, -0.16582489013671875, -0.15618515014648438, -0.14654541015625, -0.13690567016601562, -0.12726593017578125, -0.11762619018554688, -0.1079864501953125, -0.09834671020507812, -0.08870697021484375, -0.07906723022460938, -0.069427490234375, -0.059787750244140625, -0.05014801025390625, -0.040508270263671875, -0.0308685302734375, -0.021228790283203125, -0.01158905029296875, -0.001949310302734375, 0.0076904296875, 0.017330169677734375, 0.02696990966796875, 0.036609649658203125, 0.0462493896484375, 0.055889129638671875, 0.06552886962890625, 0.07516860961914062, 0.084808349609375, 0.09444808959960938, 0.10408782958984375, 0.11372756958007812, 0.1233673095703125, 0.13300704956054688, 0.14264678955078125, 0.15228652954101562, 0.16192626953125, 0.17156600952148438, 0.18120574951171875, 0.19084548950195312, 0.2004852294921875, 0.21012496948242188, 0.21976470947265625, 0.22940444946289062, 0.239044189453125, 0.24868392944335938, 0.25832366943359375, 0.2679634094238281, 0.2776031494140625, 0.2872428894042969, 0.29688262939453125, 0.3065223693847656, 0.316162109375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 6.0, 8.0, 3.0, 5.0, 8.0, 9.0, 14.0, 12.0, 23.0, 31.0, 65.0, 96.0, 163.0, 173.0, 143.0, 89.0, 37.0, 28.0, 26.0, 15.0, 11.0, 6.0, 5.0, 3.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2782554626464844e-05, -3.170128911733627e-05, -3.06200236082077e-05, -2.9538758099079132e-05, -2.845749258995056e-05, -2.737622708082199e-05, -2.629496157169342e-05, -2.521369606256485e-05, -2.413243055343628e-05, -2.305116504430771e-05, -2.1969899535179138e-05, -2.0888634026050568e-05, -1.9807368516921997e-05, -1.8726103007793427e-05, -1.7644837498664856e-05, -1.6563571989536285e-05, -1.5482306480407715e-05, -1.4401040971279144e-05, -1.3319775462150574e-05, -1.2238509953022003e-05, -1.1157244443893433e-05, -1.0075978934764862e-05, -8.994713425636292e-06, -7.913447916507721e-06, -6.83218240737915e-06, -5.75091689825058e-06, -4.669651389122009e-06, -3.5883858799934387e-06, -2.507120370864868e-06, -1.4258548617362976e-06, -3.4458935260772705e-07, 7.366761565208435e-07, 1.817941665649414e-06, 2.8992071747779846e-06, 3.980472683906555e-06, 5.061738193035126e-06, 6.143003702163696e-06, 7.224269211292267e-06, 8.305534720420837e-06, 9.386800229549408e-06, 1.0468065738677979e-05, 1.1549331247806549e-05, 1.263059675693512e-05, 1.371186226606369e-05, 1.479312777519226e-05, 1.587439328432083e-05, 1.6955658793449402e-05, 1.8036924302577972e-05, 1.9118189811706543e-05, 2.0199455320835114e-05, 2.1280720829963684e-05, 2.2361986339092255e-05, 2.3443251848220825e-05, 2.4524517357349396e-05, 2.5605782866477966e-05, 2.6687048375606537e-05, 2.7768313884735107e-05, 2.8849579393863678e-05, 2.993084490299225e-05, 3.101211041212082e-05, 3.209337592124939e-05, 3.317464143037796e-05, 3.425590693950653e-05, 3.53371724486351e-05, 3.641843795776367e-05]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 10.0, 5.0, 11.0, 19.0, 21.0, 40.0, 59.0, 368.0, 4276.0, 495285.0, 543707.0, 4183.0, 350.0, 63.0, 30.0, 18.0, 17.0, 10.0, 7.0, 14.0, 10.0, 6.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.185546875, -2.12310791015625, -2.0606689453125, -1.99822998046875, -1.935791015625, -1.87335205078125, -1.8109130859375, -1.74847412109375, -1.68603515625, -1.62359619140625, -1.5611572265625, -1.49871826171875, -1.436279296875, -1.37384033203125, -1.3114013671875, -1.24896240234375, -1.1865234375, -1.12408447265625, -1.0616455078125, -0.99920654296875, -0.936767578125, -0.87432861328125, -0.8118896484375, -0.74945068359375, -0.68701171875, -0.62457275390625, -0.5621337890625, -0.49969482421875, -0.437255859375, -0.37481689453125, -0.3123779296875, -0.24993896484375, -0.1875, -0.12506103515625, -0.0626220703125, -0.00018310546875, 0.062255859375, 0.12469482421875, 0.1871337890625, 0.24957275390625, 0.31201171875, 0.37445068359375, 0.4368896484375, 0.49932861328125, 0.561767578125, 0.62420654296875, 0.6866455078125, 0.74908447265625, 0.8115234375, 0.87396240234375, 0.9364013671875, 0.99884033203125, 1.061279296875, 1.12371826171875, 1.1861572265625, 1.24859619140625, 1.31103515625, 1.37347412109375, 1.4359130859375, 1.49835205078125, 1.560791015625, 1.62322998046875, 1.6856689453125, 1.74810791015625, 1.810546875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 7.0, 6.0, 7.0, 8.0, 7.0, 17.0, 24.0, 31.0, 44.0, 83.0, 109.0, 143.0, 158.0, 94.0, 80.0, 45.0, 29.0, 16.0, 16.0, 10.0, 11.0, 9.0, 8.0, 4.0, 12.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1065673828125, -0.10352897644042969, -0.10049057006835938, -0.09745216369628906, -0.09441375732421875, -0.09137535095214844, -0.08833694458007812, -0.08529853820800781, -0.0822601318359375, -0.07922172546386719, -0.07618331909179688, -0.07314491271972656, -0.07010650634765625, -0.06706809997558594, -0.06402969360351562, -0.06099128723144531, -0.057952880859375, -0.05491447448730469, -0.051876068115234375, -0.04883766174316406, -0.04579925537109375, -0.04276084899902344, -0.039722442626953125, -0.03668403625488281, -0.0336456298828125, -0.030607223510742188, -0.027568817138671875, -0.024530410766601562, -0.02149200439453125, -0.018453598022460938, -0.015415191650390625, -0.012376785278320312, -0.00933837890625, -0.0062999725341796875, -0.003261566162109375, -0.0002231597900390625, 0.00281524658203125, 0.0058536529541015625, 0.008892059326171875, 0.011930465698242188, 0.0149688720703125, 0.018007278442382812, 0.021045684814453125, 0.024084091186523438, 0.02712249755859375, 0.030160903930664062, 0.033199310302734375, 0.03623771667480469, 0.039276123046875, 0.04231452941894531, 0.045352935791015625, 0.04839134216308594, 0.05142974853515625, 0.05446815490722656, 0.057506561279296875, 0.06054496765136719, 0.0635833740234375, 0.06662178039550781, 0.06966018676757812, 0.07269859313964844, 0.07573699951171875, 0.07877540588378906, 0.08181381225585938, 0.08485221862792969, 0.087890625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 12.0, 10.0, 15.0, 11.0, 16.0, 21.0, 34.0, 34.0, 47.0, 47.0, 67.0, 72.0, 79.0, 82.0, 86.0, 66.0, 55.0, 54.0, 33.0, 22.0, 22.0, 26.0, 12.0, 18.0, 4.0, 10.0, 7.0, 4.0, 5.0, 2.0, 4.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7483004331588745, -1.6972051858901978, -1.646109938621521, -1.5950146913528442, -1.543919324874878, -1.4928240776062012, -1.4417288303375244, -1.3906335830688477, -1.339538335800171, -1.2884430885314941, -1.2373478412628174, -1.1862525939941406, -1.1351573467254639, -1.084062099456787, -1.0329667329788208, -0.981871485710144, -0.9307762384414673, -0.8796809911727905, -0.8285857439041138, -0.7774904370307922, -0.7263951897621155, -0.6752999424934387, -0.6242046356201172, -0.5731093883514404, -0.5220141410827637, -0.4709188938140869, -0.41982361674308777, -0.3687283396720886, -0.31763309240341187, -0.2665378451347351, -0.21544256806373596, -0.16434729099273682, -0.11325204372406006, -0.06215678155422211, -0.011061519384384155, 0.040033742785453796, 0.09112900495529175, 0.1422242522239685, 0.19331952929496765, 0.2444148063659668, 0.29551005363464355, 0.3466053009033203, 0.39770057797431946, 0.4487958550453186, 0.49989110231399536, 0.5509863495826721, 0.6020816564559937, 0.6531769037246704, 0.7042721509933472, 0.7553673982620239, 0.8064626455307007, 0.8575579524040222, 0.908653199672699, 0.9597484469413757, 1.0108437538146973, 1.061939001083374, 1.1130342483520508, 1.1641294956207275, 1.2152247428894043, 1.266319990158081, 1.3174152374267578, 1.3685104846954346, 1.4196058511734009, 1.4707010984420776, 1.5217963457107544]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 8.0, 4.0, 6.0, 10.0, 13.0, 18.0, 15.0, 26.0, 18.0, 21.0, 28.0, 23.0, 31.0, 38.0, 38.0, 47.0, 42.0, 35.0, 48.0, 41.0, 49.0, 37.0, 43.0, 42.0, 37.0, 43.0, 30.0, 30.0, 31.0, 20.0, 29.0, 19.0, 16.0, 15.0, 10.0, 5.0, 9.0, 9.0, 5.0, 5.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4440767765045166, -1.3982326984405518, -1.352388620376587, -1.306544542312622, -1.2607004642486572, -1.2148562669754028, -1.169012188911438, -1.1231681108474731, -1.0773240327835083, -1.0314799547195435, -0.9856358766555786, -0.939791738986969, -0.8939476609230042, -0.8481035828590393, -0.8022594451904297, -0.7564153671264648, -0.7105712890625, -0.6647272109985352, -0.6188831329345703, -0.5730389952659607, -0.5271949172019958, -0.481350839138031, -0.4355067312717438, -0.38966262340545654, -0.3438185453414917, -0.29797446727752686, -0.2521303594112396, -0.2062862664461136, -0.16044217348098755, -0.11459808051586151, -0.06875398755073547, -0.022909879684448242, 0.0229341983795166, 0.06877829134464264, 0.11462238430976868, 0.16046647727489471, 0.20631057024002075, 0.2521546483039856, 0.2979987561702728, 0.34384286403656006, 0.3896869421005249, 0.43553102016448975, 0.481375128030777, 0.5272192358970642, 0.573063313961029, 0.6189073920249939, 0.6647515296936035, 0.7105956077575684, 0.7564396858215332, 0.802283763885498, 0.8481278419494629, 0.8939719796180725, 0.9398160576820374, 0.9856601357460022, 1.0315042734146118, 1.0773483514785767, 1.1231924295425415, 1.1690365076065063, 1.2148805856704712, 1.260724663734436, 1.3065688610076904, 1.3524129390716553, 1.3982570171356201, 1.444101095199585, 1.4899451732635498]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 5.0, 7.0, 12.0, 12.0, 26.0, 38.0, 48.0, 79.0, 112.0, 184.0, 314.0, 528.0, 1023.0, 1967.0, 3910.0, 8624.0, 20681.0, 52442.0, 134686.0, 291609.0, 296941.0, 141189.0, 54622.0, 21836.0, 9183.0, 4036.0, 1980.0, 1044.0, 549.0, 329.0, 194.0, 114.0, 78.0, 61.0, 26.0, 27.0, 10.0, 11.0, 7.0, 5.0, 5.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.732421875, -2.64434814453125, -2.5562744140625, -2.46820068359375, -2.380126953125, -2.29205322265625, -2.2039794921875, -2.11590576171875, -2.02783203125, -1.93975830078125, -1.8516845703125, -1.76361083984375, -1.675537109375, -1.58746337890625, -1.4993896484375, -1.41131591796875, -1.3232421875, -1.23516845703125, -1.1470947265625, -1.05902099609375, -0.970947265625, -0.88287353515625, -0.7947998046875, -0.70672607421875, -0.61865234375, -0.53057861328125, -0.4425048828125, -0.35443115234375, -0.266357421875, -0.17828369140625, -0.0902099609375, -0.00213623046875, 0.0859375, 0.17401123046875, 0.2620849609375, 0.35015869140625, 0.438232421875, 0.52630615234375, 0.6143798828125, 0.70245361328125, 0.79052734375, 0.87860107421875, 0.9666748046875, 1.05474853515625, 1.142822265625, 1.23089599609375, 1.3189697265625, 1.40704345703125, 1.4951171875, 1.58319091796875, 1.6712646484375, 1.75933837890625, 1.847412109375, 1.93548583984375, 2.0235595703125, 2.11163330078125, 2.19970703125, 2.28778076171875, 2.3758544921875, 2.46392822265625, 2.552001953125, 2.64007568359375, 2.7281494140625, 2.81622314453125, 2.904296875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 13.0, 14.0, 13.0, 13.0, 16.0, 24.0, 17.0, 26.0, 29.0, 42.0, 34.0, 40.0, 41.0, 38.0, 43.0, 63.0, 55.0, 50.0, 47.0, 53.0, 40.0, 42.0, 28.0, 35.0, 25.0, 26.0, 25.0, 23.0, 23.0, 14.0, 10.0, 7.0, 8.0, 3.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84716796875, -0.8184814453125, -0.789794921875, -0.7611083984375, -0.732421875, -0.7037353515625, -0.675048828125, -0.6463623046875, -0.61767578125, -0.5889892578125, -0.560302734375, -0.5316162109375, -0.5029296875, -0.4742431640625, -0.445556640625, -0.4168701171875, -0.38818359375, -0.3594970703125, -0.330810546875, -0.3021240234375, -0.2734375, -0.2447509765625, -0.216064453125, -0.1873779296875, -0.15869140625, -0.1300048828125, -0.101318359375, -0.0726318359375, -0.0439453125, -0.0152587890625, 0.013427734375, 0.0421142578125, 0.07080078125, 0.0994873046875, 0.128173828125, 0.1568603515625, 0.185546875, 0.2142333984375, 0.242919921875, 0.2716064453125, 0.30029296875, 0.3289794921875, 0.357666015625, 0.3863525390625, 0.4150390625, 0.4437255859375, 0.472412109375, 0.5010986328125, 0.52978515625, 0.5584716796875, 0.587158203125, 0.6158447265625, 0.64453125, 0.6732177734375, 0.701904296875, 0.7305908203125, 0.75927734375, 0.7879638671875, 0.816650390625, 0.8453369140625, 0.8740234375, 0.9027099609375, 0.931396484375, 0.9600830078125, 0.98876953125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 6.0, 12.0, 6.0, 11.0, 11.0, 14.0, 16.0, 22.0, 33.0, 27.0, 31.0, 38.0, 35.0, 59.0, 69.0, 921.0, 86126.0, 939304.0, 21065.0, 349.0, 57.0, 62.0, 49.0, 32.0, 36.0, 28.0, 20.0, 34.0, 23.0, 12.0, 11.0, 11.0, 5.0, 3.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9765625, -10.575439453125, -10.17431640625, -9.773193359375, -9.3720703125, -8.970947265625, -8.56982421875, -8.168701171875, -7.767578125, -7.366455078125, -6.96533203125, -6.564208984375, -6.1630859375, -5.761962890625, -5.36083984375, -4.959716796875, -4.55859375, -4.157470703125, -3.75634765625, -3.355224609375, -2.9541015625, -2.552978515625, -2.15185546875, -1.750732421875, -1.349609375, -0.948486328125, -0.54736328125, -0.146240234375, 0.2548828125, 0.656005859375, 1.05712890625, 1.458251953125, 1.859375, 2.260498046875, 2.66162109375, 3.062744140625, 3.4638671875, 3.864990234375, 4.26611328125, 4.667236328125, 5.068359375, 5.469482421875, 5.87060546875, 6.271728515625, 6.6728515625, 7.073974609375, 7.47509765625, 7.876220703125, 8.27734375, 8.678466796875, 9.07958984375, 9.480712890625, 9.8818359375, 10.282958984375, 10.68408203125, 11.085205078125, 11.486328125, 11.887451171875, 12.28857421875, 12.689697265625, 13.0908203125, 13.491943359375, 13.89306640625, 14.294189453125, 14.6953125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 5.0, 6.0, 7.0, 14.0, 16.0, 21.0, 14.0, 16.0, 24.0, 22.0, 29.0, 36.0, 45.0, 55.0, 46.0, 61.0, 40.0, 45.0, 49.0, 39.0, 60.0, 41.0, 38.0, 47.0, 34.0, 30.0, 31.0, 26.0, 28.0, 15.0, 17.0, 14.0, 5.0, 5.0, 6.0, 4.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72607421875, -0.6953506469726562, -0.6646270751953125, -0.6339035034179688, -0.603179931640625, -0.5724563598632812, -0.5417327880859375, -0.5110092163085938, -0.48028564453125, -0.44956207275390625, -0.4188385009765625, -0.38811492919921875, -0.357391357421875, -0.32666778564453125, -0.2959442138671875, -0.26522064208984375, -0.2344970703125, -0.20377349853515625, -0.1730499267578125, -0.14232635498046875, -0.111602783203125, -0.08087921142578125, -0.0501556396484375, -0.01943206787109375, 0.01129150390625, 0.04201507568359375, 0.0727386474609375, 0.10346221923828125, 0.134185791015625, 0.16490936279296875, 0.1956329345703125, 0.22635650634765625, 0.257080078125, 0.28780364990234375, 0.3185272216796875, 0.34925079345703125, 0.379974365234375, 0.41069793701171875, 0.4414215087890625, 0.47214508056640625, 0.50286865234375, 0.5335922241210938, 0.5643157958984375, 0.5950393676757812, 0.625762939453125, 0.6564865112304688, 0.6872100830078125, 0.7179336547851562, 0.7486572265625, 0.7793807983398438, 0.8101043701171875, 0.8408279418945312, 0.871551513671875, 0.9022750854492188, 0.9329986572265625, 0.9637222290039062, 0.99444580078125, 1.0251693725585938, 1.0558929443359375, 1.0866165161132812, 1.117340087890625, 1.1480636596679688, 1.1787872314453125, 1.2095108032226562, 1.240234375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 4.0, 6.0, 14.0, 17.0, 10.0, 30.0, 46.0, 119.0, 562.0, 4221.0, 71066.0, 947728.0, 22202.0, 1994.0, 313.0, 81.0, 43.0, 18.0, 20.0, 8.0, 11.0, 4.0, 2.0, 6.0, 4.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4853515625, -1.4243011474609375, -1.363250732421875, -1.3022003173828125, -1.24114990234375, -1.1800994873046875, -1.119049072265625, -1.0579986572265625, -0.9969482421875, -0.9358978271484375, -0.874847412109375, -0.8137969970703125, -0.75274658203125, -0.6916961669921875, -0.630645751953125, -0.5695953369140625, -0.508544921875, -0.4474945068359375, -0.386444091796875, -0.3253936767578125, -0.26434326171875, -0.2032928466796875, -0.142242431640625, -0.0811920166015625, -0.0201416015625, 0.0409088134765625, 0.101959228515625, 0.1630096435546875, 0.22406005859375, 0.2851104736328125, 0.346160888671875, 0.4072113037109375, 0.46826171875, 0.5293121337890625, 0.590362548828125, 0.6514129638671875, 0.71246337890625, 0.7735137939453125, 0.834564208984375, 0.8956146240234375, 0.9566650390625, 1.0177154541015625, 1.078765869140625, 1.1398162841796875, 1.20086669921875, 1.2619171142578125, 1.322967529296875, 1.3840179443359375, 1.445068359375, 1.5061187744140625, 1.567169189453125, 1.6282196044921875, 1.68927001953125, 1.7503204345703125, 1.811370849609375, 1.8724212646484375, 1.9334716796875, 1.9945220947265625, 2.055572509765625, 2.1166229248046875, 2.17767333984375, 2.2387237548828125, 2.299774169921875, 2.3608245849609375, 2.421875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 3.0, 7.0, 12.0, 11.0, 15.0, 38.0, 67.0, 64.0, 100.0, 126.0, 169.0, 122.0, 88.0, 61.0, 36.0, 23.0, 13.0, 12.0, 9.0, 6.0, 5.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5789947509765625e-05, -5.415920168161392e-05, -5.252845585346222e-05, -5.0897710025310516e-05, -4.9266964197158813e-05, -4.763621836900711e-05, -4.600547254085541e-05, -4.4374726712703705e-05, -4.2743980884552e-05, -4.11132350564003e-05, -3.9482489228248596e-05, -3.785174340009689e-05, -3.622099757194519e-05, -3.459025174379349e-05, -3.2959505915641785e-05, -3.132876008749008e-05, -2.969801425933838e-05, -2.8067268431186676e-05, -2.6436522603034973e-05, -2.480577677488327e-05, -2.3175030946731567e-05, -2.1544285118579865e-05, -1.991353929042816e-05, -1.828279346227646e-05, -1.6652047634124756e-05, -1.5021301805973053e-05, -1.339055597782135e-05, -1.1759810149669647e-05, -1.0129064321517944e-05, -8.498318493366241e-06, -6.8675726652145386e-06, -5.236826837062836e-06, -3.606081008911133e-06, -1.97533518075943e-06, -3.4458935260772705e-07, 1.2861564755439758e-06, 2.9169023036956787e-06, 4.547648131847382e-06, 6.1783939599990845e-06, 7.809139788150787e-06, 9.43988561630249e-06, 1.1070631444454193e-05, 1.2701377272605896e-05, 1.4332123100757599e-05, 1.5962868928909302e-05, 1.7593614757061005e-05, 1.9224360585212708e-05, 2.085510641336441e-05, 2.2485852241516113e-05, 2.4116598069667816e-05, 2.574734389781952e-05, 2.7378089725971222e-05, 2.9008835554122925e-05, 3.063958138227463e-05, 3.227032721042633e-05, 3.3901073038578033e-05, 3.5531818866729736e-05, 3.716256469488144e-05, 3.879331052303314e-05, 4.0424056351184845e-05, 4.205480217933655e-05, 4.368554800748825e-05, 4.5316293835639954e-05, 4.6947039663791656e-05, 4.857778549194336e-05]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 8.0, 5.0, 8.0, 8.0, 18.0, 25.0, 19.0, 26.0, 32.0, 61.0, 260.0, 4302.0, 960748.0, 81300.0, 1377.0, 150.0, 47.0, 44.0, 25.0, 15.0, 19.0, 15.0, 3.0, 9.0, 6.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.970703125, -2.882843017578125, -2.79498291015625, -2.707122802734375, -2.6192626953125, -2.531402587890625, -2.44354248046875, -2.355682373046875, -2.267822265625, -2.179962158203125, -2.09210205078125, -2.004241943359375, -1.9163818359375, -1.828521728515625, -1.74066162109375, -1.652801513671875, -1.56494140625, -1.477081298828125, -1.38922119140625, -1.301361083984375, -1.2135009765625, -1.125640869140625, -1.03778076171875, -0.949920654296875, -0.862060546875, -0.774200439453125, -0.68634033203125, -0.598480224609375, -0.5106201171875, -0.422760009765625, -0.33489990234375, -0.247039794921875, -0.1591796875, -0.071319580078125, 0.01654052734375, 0.104400634765625, 0.1922607421875, 0.280120849609375, 0.36798095703125, 0.455841064453125, 0.543701171875, 0.631561279296875, 0.71942138671875, 0.807281494140625, 0.8951416015625, 0.983001708984375, 1.07086181640625, 1.158721923828125, 1.24658203125, 1.334442138671875, 1.42230224609375, 1.510162353515625, 1.5980224609375, 1.685882568359375, 1.77374267578125, 1.861602783203125, 1.949462890625, 2.037322998046875, 2.12518310546875, 2.213043212890625, 2.3009033203125, 2.388763427734375, 2.47662353515625, 2.564483642578125, 2.65234375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 6.0, 6.0, 5.0, 11.0, 14.0, 15.0, 27.0, 24.0, 28.0, 32.0, 56.0, 73.0, 97.0, 150.0, 123.0, 70.0, 55.0, 53.0, 37.0, 23.0, 18.0, 21.0, 13.0, 7.0, 6.0, 3.0, 8.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1885986328125, -0.1831531524658203, -0.17770767211914062, -0.17226219177246094, -0.16681671142578125, -0.16137123107910156, -0.15592575073242188, -0.1504802703857422, -0.1450347900390625, -0.1395893096923828, -0.13414382934570312, -0.12869834899902344, -0.12325286865234375, -0.11780738830566406, -0.11236190795898438, -0.10691642761230469, -0.101470947265625, -0.09602546691894531, -0.09057998657226562, -0.08513450622558594, -0.07968902587890625, -0.07424354553222656, -0.06879806518554688, -0.06335258483886719, -0.0579071044921875, -0.05246162414550781, -0.047016143798828125, -0.04157066345214844, -0.03612518310546875, -0.030679702758789062, -0.025234222412109375, -0.019788742065429688, -0.01434326171875, -0.008897781372070312, -0.003452301025390625, 0.0019931793212890625, 0.00743865966796875, 0.012884140014648438, 0.018329620361328125, 0.023775100708007812, 0.0292205810546875, 0.03466606140136719, 0.040111541748046875, 0.04555702209472656, 0.05100250244140625, 0.05644798278808594, 0.061893463134765625, 0.06733894348144531, 0.072784423828125, 0.07822990417480469, 0.08367538452148438, 0.08912086486816406, 0.09456634521484375, 0.10001182556152344, 0.10545730590820312, 0.11090278625488281, 0.1163482666015625, 0.12179374694824219, 0.12723922729492188, 0.13268470764160156, 0.13813018798828125, 0.14357566833496094, 0.14902114868164062, 0.1544666290283203, 0.159912109375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 15.0, 48.0, 176.0, 420.0, 255.0, 76.0, 15.0, 7.0, 1.0, 1.0], "bins": [-10.27995491027832, -10.101747512817383, -9.923540115356445, -9.745332717895508, -9.56712532043457, -9.388916969299316, -9.210709571838379, -9.032502174377441, -8.854294776916504, -8.676087379455566, -8.497879981994629, -8.319672584533691, -8.141464233398438, -7.963257312774658, -7.7850494384765625, -7.606842041015625, -7.4286346435546875, -7.25042724609375, -7.0722198486328125, -6.894011974334717, -6.715804576873779, -6.537597179412842, -6.359389305114746, -6.181181907653809, -6.002974510192871, -5.824767112731934, -5.646559715270996, -5.4683518409729, -5.290144443511963, -5.111937046051025, -4.93372917175293, -4.755521774291992, -4.577314853668213, -4.399107456207275, -4.22089958190918, -4.042692184448242, -3.8644847869873047, -3.686277389526367, -3.5080697536468506, -3.329862117767334, -3.1516547203063965, -2.973447322845459, -2.7952396869659424, -2.617032051086426, -2.4388246536254883, -2.260617256164551, -2.082409620285034, -1.9042021036148071, -1.7259944677352905, -1.5477869510650635, -1.3695794343948364, -1.1913719177246094, -1.0131644010543823, -0.8349568843841553, -0.6567493677139282, -0.47854185104370117, -0.3003343343734741, -0.12212681770324707, 0.05608069896697998, 0.23428821563720703, 0.4124957323074341, 0.5907032489776611, 0.7689107656478882, 0.9471182823181152, 1.1253257989883423]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 4.0, 10.0, 11.0, 13.0, 10.0, 22.0, 21.0, 21.0, 18.0, 30.0, 28.0, 23.0, 32.0, 41.0, 36.0, 43.0, 40.0, 34.0, 54.0, 39.0, 42.0, 44.0, 43.0, 26.0, 33.0, 29.0, 26.0, 39.0, 30.0, 29.0, 29.0, 13.0, 14.0, 10.0, 19.0, 6.0, 8.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1654218435287476, -1.1266916990280151, -1.0879616737365723, -1.0492315292358398, -1.010501503944397, -0.9717713594436646, -0.9330412745475769, -0.8943111896514893, -0.8555810451507568, -0.8168509602546692, -0.7781208753585815, -0.7393907308578491, -0.7006606459617615, -0.6619305610656738, -0.6232004761695862, -0.5844703912734985, -0.5457403063774109, -0.5070102214813232, -0.4682801067829132, -0.42955002188682556, -0.3908199071884155, -0.3520898222923279, -0.31335973739624023, -0.2746296226978302, -0.23589953780174255, -0.1971694380044937, -0.15843933820724487, -0.11970925331115723, -0.08097915351390839, -0.042249053716659546, -0.0035189688205718994, 0.035211145877838135, 0.07394123077392578, 0.11267133057117462, 0.15140143036842346, 0.1901315152645111, 0.22886161506175995, 0.2675917148590088, 0.30632179975509644, 0.34505191445350647, 0.3837819993495941, 0.42251208424568176, 0.4612421989440918, 0.49997228384017944, 0.5387023687362671, 0.5774325132369995, 0.6161625385284424, 0.6548926830291748, 0.6936227679252625, 0.7323528528213501, 0.7710829377174377, 0.8098130226135254, 0.8485431671142578, 0.8872732520103455, 0.9260033369064331, 0.9647334814071655, 1.0034635066986084, 1.0421936511993408, 1.0809236764907837, 1.1196538209915161, 1.158383846282959, 1.1971139907836914, 1.2358441352844238, 1.2745741605758667, 1.3133043050765991]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 9.0, 14.0, 14.0, 42.0, 40.0, 69.0, 93.0, 138.0, 220.0, 362.0, 567.0, 914.0, 1453.0, 2465.0, 4116.0, 7155.0, 12518.0, 24870.0, 81104.0, 505531.0, 2206380.0, 1105277.0, 164855.0, 37054.0, 16030.0, 8908.0, 5274.0, 3196.0, 1971.0, 1233.0, 753.0, 558.0, 374.0, 225.0, 152.0, 108.0, 74.0, 50.0, 31.0, 27.0, 12.0, 17.0, 9.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.1396484375, -1.1068191528320312, -1.0739898681640625, -1.0411605834960938, -1.008331298828125, -0.9755020141601562, -0.9426727294921875, -0.9098434448242188, -0.87701416015625, -0.8441848754882812, -0.8113555908203125, -0.7785263061523438, -0.745697021484375, -0.7128677368164062, -0.6800384521484375, -0.6472091674804688, -0.6143798828125, -0.5815505981445312, -0.5487213134765625, -0.5158920288085938, -0.483062744140625, -0.45023345947265625, -0.4174041748046875, -0.38457489013671875, -0.35174560546875, -0.31891632080078125, -0.2860870361328125, -0.25325775146484375, -0.220428466796875, -0.18759918212890625, -0.1547698974609375, -0.12194061279296875, -0.089111328125, -0.05628204345703125, -0.0234527587890625, 0.00937652587890625, 0.042205810546875, 0.07503509521484375, 0.1078643798828125, 0.14069366455078125, 0.17352294921875, 0.20635223388671875, 0.2391815185546875, 0.27201080322265625, 0.304840087890625, 0.33766937255859375, 0.3704986572265625, 0.40332794189453125, 0.4361572265625, 0.46898651123046875, 0.5018157958984375, 0.5346450805664062, 0.567474365234375, 0.6003036499023438, 0.6331329345703125, 0.6659622192382812, 0.69879150390625, 0.7316207885742188, 0.7644500732421875, 0.7972793579101562, 0.830108642578125, 0.8629379272460938, 0.8957672119140625, 0.9285964965820312, 0.96142578125]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 9.0, 7.0, 6.0, 11.0, 14.0, 14.0, 21.0, 18.0, 25.0, 22.0, 31.0, 20.0, 31.0, 24.0, 38.0, 37.0, 36.0, 40.0, 40.0, 49.0, 38.0, 35.0, 33.0, 38.0, 38.0, 37.0, 36.0, 28.0, 32.0, 28.0, 27.0, 17.0, 24.0, 14.0, 19.0, 10.0, 10.0, 9.0, 7.0, 6.0, 5.0, 9.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6650390625, -0.6444168090820312, -0.6237945556640625, -0.6031723022460938, -0.582550048828125, -0.5619277954101562, -0.5413055419921875, -0.5206832885742188, -0.50006103515625, -0.47943878173828125, -0.4588165283203125, -0.43819427490234375, -0.417572021484375, -0.39694976806640625, -0.3763275146484375, -0.35570526123046875, -0.3350830078125, -0.31446075439453125, -0.2938385009765625, -0.27321624755859375, -0.252593994140625, -0.23197174072265625, -0.2113494873046875, -0.19072723388671875, -0.17010498046875, -0.14948272705078125, -0.1288604736328125, -0.10823822021484375, -0.087615966796875, -0.06699371337890625, -0.0463714599609375, -0.02574920654296875, -0.005126953125, 0.01549530029296875, 0.0361175537109375, 0.05673980712890625, 0.077362060546875, 0.09798431396484375, 0.1186065673828125, 0.13922882080078125, 0.15985107421875, 0.18047332763671875, 0.2010955810546875, 0.22171783447265625, 0.242340087890625, 0.26296234130859375, 0.2835845947265625, 0.30420684814453125, 0.3248291015625, 0.34545135498046875, 0.3660736083984375, 0.38669586181640625, 0.407318115234375, 0.42794036865234375, 0.4485626220703125, 0.46918487548828125, 0.48980712890625, 0.5104293823242188, 0.5310516357421875, 0.5516738891601562, 0.572296142578125, 0.5929183959960938, 0.6135406494140625, 0.6341629028320312, 0.65478515625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 5.0, 10.0, 12.0, 30.0, 34.0, 51.0, 74.0, 189.0, 480.0, 6068.0, 4147878.0, 38242.0, 687.0, 229.0, 122.0, 54.0, 27.0, 23.0, 22.0, 11.0, 11.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8046875, -6.50439453125, -6.2041015625, -5.90380859375, -5.603515625, -5.30322265625, -5.0029296875, -4.70263671875, -4.40234375, -4.10205078125, -3.8017578125, -3.50146484375, -3.201171875, -2.90087890625, -2.6005859375, -2.30029296875, -2.0, -1.69970703125, -1.3994140625, -1.09912109375, -0.798828125, -0.49853515625, -0.1982421875, 0.10205078125, 0.40234375, 0.70263671875, 1.0029296875, 1.30322265625, 1.603515625, 1.90380859375, 2.2041015625, 2.50439453125, 2.8046875, 3.10498046875, 3.4052734375, 3.70556640625, 4.005859375, 4.30615234375, 4.6064453125, 4.90673828125, 5.20703125, 5.50732421875, 5.8076171875, 6.10791015625, 6.408203125, 6.70849609375, 7.0087890625, 7.30908203125, 7.609375, 7.90966796875, 8.2099609375, 8.51025390625, 8.810546875, 9.11083984375, 9.4111328125, 9.71142578125, 10.01171875, 10.31201171875, 10.6123046875, 10.91259765625, 11.212890625, 11.51318359375, 11.8134765625, 12.11376953125, 12.4140625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 2.0, 4.0, 11.0, 11.0, 20.0, 30.0, 54.0, 61.0, 87.0, 198.0, 384.0, 667.0, 915.0, 657.0, 438.0, 215.0, 111.0, 59.0, 32.0, 31.0, 20.0, 22.0, 9.0, 12.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.296142578125, -0.2830085754394531, -0.26987457275390625, -0.2567405700683594, -0.2436065673828125, -0.23047256469726562, -0.21733856201171875, -0.20420455932617188, -0.191070556640625, -0.17793655395507812, -0.16480255126953125, -0.15166854858398438, -0.1385345458984375, -0.12540054321289062, -0.11226654052734375, -0.09913253784179688, -0.08599853515625, -0.07286453247070312, -0.05973052978515625, -0.046596527099609375, -0.0334625244140625, -0.020328521728515625, -0.00719451904296875, 0.005939483642578125, 0.019073486328125, 0.032207489013671875, 0.04534149169921875, 0.058475494384765625, 0.0716094970703125, 0.08474349975585938, 0.09787750244140625, 0.11101150512695312, 0.1241455078125, 0.13727951049804688, 0.15041351318359375, 0.16354751586914062, 0.1766815185546875, 0.18981552124023438, 0.20294952392578125, 0.21608352661132812, 0.229217529296875, 0.24235153198242188, 0.25548553466796875, 0.2686195373535156, 0.2817535400390625, 0.2948875427246094, 0.30802154541015625, 0.3211555480957031, 0.33428955078125, 0.3474235534667969, 0.36055755615234375, 0.3736915588378906, 0.3868255615234375, 0.3999595642089844, 0.41309356689453125, 0.4262275695800781, 0.439361572265625, 0.4524955749511719, 0.46562957763671875, 0.4787635803222656, 0.4918975830078125, 0.5050315856933594, 0.5181655883789062, 0.5312995910644531, 0.54443359375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 10.0, 14.0, 17.0, 29.0, 45.0, 79.0, 109.0, 169.0, 162.0, 114.0, 89.0, 63.0, 31.0, 28.0, 16.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.094085216522217, -2.051387071609497, -2.0086886882781982, -1.9659905433654785, -1.9232923984527588, -1.8805941343307495, -1.8378958702087402, -1.7951977252960205, -1.7524995803833008, -1.7098013162612915, -1.6671031713485718, -1.6244049072265625, -1.5817067623138428, -1.5390084981918335, -1.4963102340698242, -1.4536120891571045, -1.4109138250350952, -1.368215560913086, -1.3255174160003662, -1.282819151878357, -1.2401210069656372, -1.197422742843628, -1.1547245979309082, -1.112026333808899, -1.0693280696868896, -1.0266298055648804, -0.9839316606521606, -0.9412333965301514, -0.8985352516174316, -0.8558369874954224, -0.8131387829780579, -0.7704405784606934, -0.7277424931526184, -0.6850442886352539, -0.6423460841178894, -0.5996478796005249, -0.5569496154785156, -0.5142514705657959, -0.4715532064437866, -0.4288550019264221, -0.3861567974090576, -0.3434585928916931, -0.3007603883743286, -0.2580621540546417, -0.21536394953727722, -0.17266574501991272, -0.12996751070022583, -0.08726930618286133, -0.044571101665496826, -0.0018728896975517273, 0.04082532227039337, 0.08352354168891907, 0.12622174620628357, 0.16891995072364807, 0.21161818504333496, 0.25431638956069946, 0.29701459407806396, 0.33971279859542847, 0.38241100311279297, 0.42510923743247986, 0.46780744194984436, 0.5105056762695312, 0.5532038807868958, 0.5959020853042603, 0.6386002898216248]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 7.0, 7.0, 6.0, 12.0, 15.0, 9.0, 22.0, 20.0, 33.0, 35.0, 29.0, 29.0, 41.0, 36.0, 45.0, 47.0, 42.0, 45.0, 37.0, 46.0, 33.0, 48.0, 39.0, 49.0, 36.0, 37.0, 27.0, 22.0, 24.0, 21.0, 20.0, 17.0, 13.0, 15.0, 6.0, 5.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7655501961708069, -0.7402287125587463, -0.7149072289466858, -0.6895856857299805, -0.6642642021179199, -0.6389427185058594, -0.6136212348937988, -0.5882997512817383, -0.5629782676696777, -0.5376567840576172, -0.5123353004455566, -0.4870137870311737, -0.46169230341911316, -0.4363707900047302, -0.4110493063926697, -0.38572782278060913, -0.3604063093662262, -0.33508482575416565, -0.3097633123397827, -0.28444182872772217, -0.2591203451156616, -0.23379884660243988, -0.20847734808921814, -0.1831558644771576, -0.15783436596393585, -0.1325128674507141, -0.10719138383865356, -0.08186988532543182, -0.05654839426279068, -0.031226903200149536, -0.005905404686927795, 0.01941607892513275, 0.04473757743835449, 0.07005906850099564, 0.09538055956363678, 0.12070205807685852, 0.14602354168891907, 0.1713450402021408, 0.19666653871536255, 0.2219880223274231, 0.24730952084064484, 0.2726310193538666, 0.2979525029659271, 0.32327401638031006, 0.3485954999923706, 0.37391698360443115, 0.3992384672164917, 0.42455995082855225, 0.4498814642429352, 0.4752029478549957, 0.5005244612693787, 0.5258459448814392, 0.5511674284934998, 0.5764889121055603, 0.6018104553222656, 0.6271319389343262, 0.6524534225463867, 0.6777749061584473, 0.7030963897705078, 0.7284178733825684, 0.7537394165992737, 0.7790609002113342, 0.8043823838233948, 0.8297038674354553, 0.8550253510475159]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 10.0, 6.0, 5.0, 16.0, 19.0, 30.0, 32.0, 47.0, 72.0, 98.0, 145.0, 188.0, 289.0, 419.0, 593.0, 886.0, 1272.0, 2050.0, 2945.0, 4723.0, 7452.0, 12261.0, 20387.0, 35573.0, 65036.0, 125351.0, 247022.0, 244968.0, 123919.0, 64254.0, 35174.0, 20077.0, 12052.0, 7408.0, 4583.0, 3002.0, 1966.0, 1323.0, 920.0, 590.0, 393.0, 287.0, 215.0, 136.0, 97.0, 76.0, 62.0, 33.0, 30.0, 20.0, 12.0, 6.0, 10.0, 6.0, 7.0, 6.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.52099609375, -0.5036239624023438, -0.4862518310546875, -0.46887969970703125, -0.451507568359375, -0.43413543701171875, -0.4167633056640625, -0.39939117431640625, -0.38201904296875, -0.36464691162109375, -0.3472747802734375, -0.32990264892578125, -0.312530517578125, -0.29515838623046875, -0.2777862548828125, -0.26041412353515625, -0.2430419921875, -0.22566986083984375, -0.2082977294921875, -0.19092559814453125, -0.173553466796875, -0.15618133544921875, -0.1388092041015625, -0.12143707275390625, -0.10406494140625, -0.08669281005859375, -0.0693206787109375, -0.05194854736328125, -0.034576416015625, -0.01720428466796875, 0.0001678466796875, 0.01753997802734375, 0.034912109375, 0.05228424072265625, 0.0696563720703125, 0.08702850341796875, 0.104400634765625, 0.12177276611328125, 0.1391448974609375, 0.15651702880859375, 0.17388916015625, 0.19126129150390625, 0.2086334228515625, 0.22600555419921875, 0.243377685546875, 0.26074981689453125, 0.2781219482421875, 0.29549407958984375, 0.3128662109375, 0.33023834228515625, 0.3476104736328125, 0.36498260498046875, 0.382354736328125, 0.39972686767578125, 0.4170989990234375, 0.43447113037109375, 0.45184326171875, 0.46921539306640625, 0.4865875244140625, 0.5039596557617188, 0.521331787109375, 0.5387039184570312, 0.5560760498046875, 0.5734481811523438, 0.5908203125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 8.0, 8.0, 12.0, 12.0, 12.0, 15.0, 15.0, 16.0, 27.0, 28.0, 33.0, 35.0, 40.0, 38.0, 42.0, 44.0, 41.0, 40.0, 45.0, 47.0, 34.0, 46.0, 38.0, 39.0, 37.0, 47.0, 30.0, 37.0, 21.0, 18.0, 20.0, 19.0, 7.0, 7.0, 13.0, 10.0, 5.0, 2.0, 1.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.697265625, -0.6751480102539062, -0.6530303955078125, -0.6309127807617188, -0.608795166015625, -0.5866775512695312, -0.5645599365234375, -0.5424423217773438, -0.52032470703125, -0.49820709228515625, -0.4760894775390625, -0.45397186279296875, -0.431854248046875, -0.40973663330078125, -0.3876190185546875, -0.36550140380859375, -0.3433837890625, -0.32126617431640625, -0.2991485595703125, -0.27703094482421875, -0.254913330078125, -0.23279571533203125, -0.2106781005859375, -0.18856048583984375, -0.16644287109375, -0.14432525634765625, -0.1222076416015625, -0.10009002685546875, -0.077972412109375, -0.05585479736328125, -0.0337371826171875, -0.01161956787109375, 0.010498046875, 0.03261566162109375, 0.0547332763671875, 0.07685089111328125, 0.098968505859375, 0.12108612060546875, 0.1432037353515625, 0.16532135009765625, 0.18743896484375, 0.20955657958984375, 0.2316741943359375, 0.25379180908203125, 0.275909423828125, 0.29802703857421875, 0.3201446533203125, 0.34226226806640625, 0.3643798828125, 0.38649749755859375, 0.4086151123046875, 0.43073272705078125, 0.452850341796875, 0.47496795654296875, 0.4970855712890625, 0.5192031860351562, 0.54132080078125, 0.5634384155273438, 0.5855560302734375, 0.6076736450195312, 0.629791259765625, 0.6519088745117188, 0.6740264892578125, 0.6961441040039062, 0.71826171875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 6.0, 7.0, 11.0, 8.0, 11.0, 24.0, 25.0, 32.0, 59.0, 74.0, 105.0, 171.0, 216.0, 338.0, 502.0, 740.0, 1083.0, 1725.0, 2758.0, 4485.0, 7544.0, 12762.0, 22102.0, 39885.0, 75465.0, 161614.0, 335815.0, 189966.0, 86126.0, 44457.0, 24527.0, 14107.0, 8350.0, 4923.0, 3045.0, 1881.0, 1100.0, 802.0, 511.0, 349.0, 263.0, 162.0, 125.0, 96.0, 57.0, 51.0, 25.0, 22.0, 17.0, 9.0, 8.0, 12.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.382080078125, -0.3703575134277344, -0.35863494873046875, -0.3469123840332031, -0.3351898193359375, -0.3234672546386719, -0.31174468994140625, -0.3000221252441406, -0.288299560546875, -0.2765769958496094, -0.26485443115234375, -0.2531318664550781, -0.2414093017578125, -0.22968673706054688, -0.21796417236328125, -0.20624160766601562, -0.19451904296875, -0.18279647827148438, -0.17107391357421875, -0.15935134887695312, -0.1476287841796875, -0.13590621948242188, -0.12418365478515625, -0.11246109008789062, -0.100738525390625, -0.08901596069335938, -0.07729339599609375, -0.06557083129882812, -0.0538482666015625, -0.042125701904296875, -0.03040313720703125, -0.018680572509765625, -0.0069580078125, 0.004764556884765625, 0.01648712158203125, 0.028209686279296875, 0.0399322509765625, 0.051654815673828125, 0.06337738037109375, 0.07509994506835938, 0.086822509765625, 0.09854507446289062, 0.11026763916015625, 0.12199020385742188, 0.1337127685546875, 0.14543533325195312, 0.15715789794921875, 0.16888046264648438, 0.18060302734375, 0.19232559204101562, 0.20404815673828125, 0.21577072143554688, 0.2274932861328125, 0.23921585083007812, 0.25093841552734375, 0.2626609802246094, 0.274383544921875, 0.2861061096191406, 0.29782867431640625, 0.3095512390136719, 0.3212738037109375, 0.3329963684082031, 0.34471893310546875, 0.3564414978027344, 0.3681640625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 2.0, 2.0, 6.0, 7.0, 7.0, 8.0, 11.0, 15.0, 14.0, 12.0, 25.0, 23.0, 21.0, 30.0, 25.0, 35.0, 33.0, 31.0, 33.0, 34.0, 43.0, 45.0, 41.0, 36.0, 32.0, 45.0, 43.0, 29.0, 28.0, 28.0, 34.0, 43.0, 27.0, 18.0, 19.0, 15.0, 20.0, 11.0, 6.0, 18.0, 11.0, 11.0, 9.0, 4.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.436279296875, -0.4231681823730469, -0.41005706787109375, -0.3969459533691406, -0.3838348388671875, -0.3707237243652344, -0.35761260986328125, -0.3445014953613281, -0.331390380859375, -0.3182792663574219, -0.30516815185546875, -0.2920570373535156, -0.2789459228515625, -0.2658348083496094, -0.25272369384765625, -0.23961257934570312, -0.22650146484375, -0.21339035034179688, -0.20027923583984375, -0.18716812133789062, -0.1740570068359375, -0.16094589233398438, -0.14783477783203125, -0.13472366333007812, -0.121612548828125, -0.10850143432617188, -0.09539031982421875, -0.08227920532226562, -0.0691680908203125, -0.056056976318359375, -0.04294586181640625, -0.029834747314453125, -0.0167236328125, -0.003612518310546875, 0.00949859619140625, 0.022609710693359375, 0.0357208251953125, 0.048831939697265625, 0.06194305419921875, 0.07505416870117188, 0.088165283203125, 0.10127639770507812, 0.11438751220703125, 0.12749862670898438, 0.1406097412109375, 0.15372085571289062, 0.16683197021484375, 0.17994308471679688, 0.19305419921875, 0.20616531372070312, 0.21927642822265625, 0.23238754272460938, 0.2454986572265625, 0.2586097717285156, 0.27172088623046875, 0.2848320007324219, 0.297943115234375, 0.3110542297363281, 0.32416534423828125, 0.3372764587402344, 0.3503875732421875, 0.3634986877441406, 0.37660980224609375, 0.3897209167480469, 0.40283203125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 12.0, 10.0, 21.0, 27.0, 37.0, 43.0, 69.0, 76.0, 104.0, 167.0, 221.0, 342.0, 484.0, 760.0, 1200.0, 1890.0, 3019.0, 5327.0, 9862.0, 19965.0, 44241.0, 121766.0, 546357.0, 182528.0, 57215.0, 24677.0, 12028.0, 6351.0, 3637.0, 2085.0, 1300.0, 796.0, 563.0, 371.0, 287.0, 173.0, 141.0, 93.0, 75.0, 53.0, 32.0, 29.0, 19.0, 21.0, 18.0, 14.0, 11.0, 5.0, 8.0, 8.0, 3.0, 1.0, 5.0, 2.0], "bins": [-0.0633544921875, -0.06141376495361328, -0.05947303771972656, -0.057532310485839844, -0.055591583251953125, -0.053650856018066406, -0.05171012878417969, -0.04976940155029297, -0.04782867431640625, -0.04588794708251953, -0.04394721984863281, -0.042006492614746094, -0.040065765380859375, -0.038125038146972656, -0.03618431091308594, -0.03424358367919922, -0.0323028564453125, -0.03036212921142578, -0.028421401977539062, -0.026480674743652344, -0.024539947509765625, -0.022599220275878906, -0.020658493041992188, -0.01871776580810547, -0.01677703857421875, -0.014836311340332031, -0.012895584106445312, -0.010954856872558594, -0.009014129638671875, -0.007073402404785156, -0.0051326751708984375, -0.0031919479370117188, -0.001251220703125, 0.0006895065307617188, 0.0026302337646484375, 0.004570960998535156, 0.006511688232421875, 0.008452415466308594, 0.010393142700195312, 0.012333869934082031, 0.01427459716796875, 0.01621532440185547, 0.018156051635742188, 0.020096778869628906, 0.022037506103515625, 0.023978233337402344, 0.025918960571289062, 0.02785968780517578, 0.0298004150390625, 0.03174114227294922, 0.03368186950683594, 0.035622596740722656, 0.037563323974609375, 0.039504051208496094, 0.04144477844238281, 0.04338550567626953, 0.04532623291015625, 0.04726696014404297, 0.04920768737792969, 0.051148414611816406, 0.053089141845703125, 0.055029869079589844, 0.05697059631347656, 0.05891132354736328, 0.06085205078125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 5.0, 9.0, 6.0, 7.0, 10.0, 9.0, 19.0, 20.0, 62.0, 61.0, 118.0, 118.0, 129.0, 120.0, 78.0, 65.0, 42.0, 31.0, 14.0, 19.0, 11.0, 7.0, 7.0, 5.0, 4.0, 6.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8431415557861328e-05, -2.7649104595184326e-05, -2.6866793632507324e-05, -2.6084482669830322e-05, -2.530217170715332e-05, -2.451986074447632e-05, -2.3737549781799316e-05, -2.2955238819122314e-05, -2.2172927856445312e-05, -2.139061689376831e-05, -2.060830593109131e-05, -1.9825994968414307e-05, -1.9043684005737305e-05, -1.8261373043060303e-05, -1.74790620803833e-05, -1.66967511177063e-05, -1.5914440155029297e-05, -1.5132129192352295e-05, -1.4349818229675293e-05, -1.3567507266998291e-05, -1.2785196304321289e-05, -1.2002885341644287e-05, -1.1220574378967285e-05, -1.0438263416290283e-05, -9.655952453613281e-06, -8.87364149093628e-06, -8.091330528259277e-06, -7.309019565582275e-06, -6.5267086029052734e-06, -5.7443976402282715e-06, -4.9620866775512695e-06, -4.179775714874268e-06, -3.3974647521972656e-06, -2.6151537895202637e-06, -1.8328428268432617e-06, -1.0505318641662598e-06, -2.682209014892578e-07, 5.140900611877441e-07, 1.296401023864746e-06, 2.078711986541748e-06, 2.86102294921875e-06, 3.643333911895752e-06, 4.425644874572754e-06, 5.207955837249756e-06, 5.990266799926758e-06, 6.77257776260376e-06, 7.554888725280762e-06, 8.337199687957764e-06, 9.119510650634766e-06, 9.901821613311768e-06, 1.068413257598877e-05, 1.1466443538665771e-05, 1.2248754501342773e-05, 1.3031065464019775e-05, 1.3813376426696777e-05, 1.459568738937378e-05, 1.537799835205078e-05, 1.6160309314727783e-05, 1.6942620277404785e-05, 1.7724931240081787e-05, 1.850724220275879e-05, 1.928955316543579e-05, 2.0071864128112793e-05, 2.0854175090789795e-05, 2.1636486053466797e-05]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 9.0, 8.0, 12.0, 19.0, 24.0, 19.0, 42.0, 95.0, 951.0, 399919.0, 646147.0, 1052.0, 97.0, 42.0, 24.0, 21.0, 15.0, 14.0, 10.0, 7.0, 3.0, 3.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.798828125, -0.7766494750976562, -0.7544708251953125, -0.7322921752929688, -0.710113525390625, -0.6879348754882812, -0.6657562255859375, -0.6435775756835938, -0.62139892578125, -0.5992202758789062, -0.5770416259765625, -0.5548629760742188, -0.532684326171875, -0.5105056762695312, -0.4883270263671875, -0.46614837646484375, -0.4439697265625, -0.42179107666015625, -0.3996124267578125, -0.37743377685546875, -0.355255126953125, -0.33307647705078125, -0.3108978271484375, -0.28871917724609375, -0.26654052734375, -0.24436187744140625, -0.2221832275390625, -0.20000457763671875, -0.177825927734375, -0.15564727783203125, -0.1334686279296875, -0.11128997802734375, -0.089111328125, -0.06693267822265625, -0.0447540283203125, -0.02257537841796875, -0.000396728515625, 0.02178192138671875, 0.0439605712890625, 0.06613922119140625, 0.08831787109375, 0.11049652099609375, 0.1326751708984375, 0.15485382080078125, 0.177032470703125, 0.19921112060546875, 0.2213897705078125, 0.24356842041015625, 0.2657470703125, 0.28792572021484375, 0.3101043701171875, 0.33228302001953125, 0.354461669921875, 0.37664031982421875, 0.3988189697265625, 0.42099761962890625, 0.44317626953125, 0.46535491943359375, 0.4875335693359375, 0.5097122192382812, 0.531890869140625, 0.5540695190429688, 0.5762481689453125, 0.5984268188476562, 0.62060546875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 5.0, 12.0, 8.0, 16.0, 17.0, 41.0, 36.0, 56.0, 80.0, 139.0, 160.0, 134.0, 85.0, 52.0, 42.0, 24.0, 20.0, 16.0, 16.0, 7.0, 6.0, 6.0, 6.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0318603515625, -0.030963659286499023, -0.030066967010498047, -0.02917027473449707, -0.028273582458496094, -0.027376890182495117, -0.02648019790649414, -0.025583505630493164, -0.024686813354492188, -0.02379012107849121, -0.022893428802490234, -0.021996736526489258, -0.02110004425048828, -0.020203351974487305, -0.019306659698486328, -0.01840996742248535, -0.017513275146484375, -0.0166165828704834, -0.015719890594482422, -0.014823198318481445, -0.013926506042480469, -0.013029813766479492, -0.012133121490478516, -0.011236429214477539, -0.010339736938476562, -0.009443044662475586, -0.00854635238647461, -0.007649660110473633, -0.006752967834472656, -0.00585627555847168, -0.004959583282470703, -0.0040628910064697266, -0.00316619873046875, -0.0022695064544677734, -0.0013728141784667969, -0.0004761219024658203, 0.00042057037353515625, 0.0013172626495361328, 0.0022139549255371094, 0.003110647201538086, 0.0040073394775390625, 0.004904031753540039, 0.005800724029541016, 0.006697416305541992, 0.007594108581542969, 0.008490800857543945, 0.009387493133544922, 0.010284185409545898, 0.011180877685546875, 0.012077569961547852, 0.012974262237548828, 0.013870954513549805, 0.014767646789550781, 0.015664339065551758, 0.016561031341552734, 0.01745772361755371, 0.018354415893554688, 0.019251108169555664, 0.02014780044555664, 0.021044492721557617, 0.021941184997558594, 0.02283787727355957, 0.023734569549560547, 0.024631261825561523, 0.0255279541015625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 10.0, 6.0, 5.0, 8.0, 15.0, 12.0, 26.0, 29.0, 39.0, 55.0, 86.0, 89.0, 116.0, 122.0, 84.0, 63.0, 65.0, 52.0, 30.0, 29.0, 13.0, 11.0, 13.0, 4.0, 2.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2407941818237305, -1.2118333578109741, -1.1828725337982178, -1.1539115905761719, -1.1249507665634155, -1.0959899425506592, -1.0670291185379028, -1.038068175315857, -1.0091073513031006, -0.9801465272903442, -0.9511856436729431, -0.9222248196601868, -0.8932639360427856, -0.8643031120300293, -0.8353422284126282, -0.8063814043998718, -0.7774205207824707, -0.7484596967697144, -0.7194988131523132, -0.6905379891395569, -0.6615771055221558, -0.6326162815093994, -0.6036553978919983, -0.5746945738792419, -0.5457337498664856, -0.5167729258537292, -0.4878120422363281, -0.4588511884212494, -0.42989033460617065, -0.4009295105934143, -0.3719686269760132, -0.34300780296325684, -0.3140469193458557, -0.285086065530777, -0.25612521171569824, -0.2271643579006195, -0.19820350408554077, -0.16924266517162323, -0.1402818113565445, -0.11132095754146576, -0.08236010372638702, -0.05339924991130829, -0.02443839982151985, 0.004522450268268585, 0.03348330408334732, 0.06244415044784546, 0.0914050042629242, 0.12036585807800293, 0.14932671189308167, 0.1782875657081604, 0.20724841952323914, 0.23620927333831787, 0.2651701271533966, 0.29413098096847534, 0.3230918049812317, 0.3520526885986328, 0.38101351261138916, 0.4099743664264679, 0.43893522024154663, 0.46789607405662537, 0.4968569278717041, 0.5258177518844604, 0.5547786355018616, 0.5837394595146179, 0.612700343132019]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 6.0, 6.0, 5.0, 12.0, 4.0, 9.0, 11.0, 15.0, 19.0, 19.0, 26.0, 36.0, 34.0, 30.0, 31.0, 41.0, 40.0, 43.0, 47.0, 42.0, 40.0, 42.0, 47.0, 31.0, 40.0, 53.0, 36.0, 35.0, 34.0, 22.0, 28.0, 25.0, 16.0, 15.0, 17.0, 12.0, 10.0, 6.0, 9.0, 2.0, 4.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.661052942276001, -0.6395013332366943, -0.6179497241973877, -0.596398115158081, -0.5748464465141296, -0.553294837474823, -0.5317432284355164, -0.5101916193962097, -0.4886399805545807, -0.46708837151527405, -0.445536732673645, -0.4239851236343384, -0.40243351459503174, -0.3808818757534027, -0.35933026671409607, -0.33777862787246704, -0.3162270188331604, -0.29467540979385376, -0.27312377095222473, -0.2515721619129181, -0.23002053797245026, -0.20846891403198242, -0.18691730499267578, -0.16536568105220795, -0.1438140571117401, -0.12226243317127228, -0.10071081668138504, -0.0791592001914978, -0.05760757625102997, -0.036055952310562134, -0.014504343271255493, 0.007047280669212341, 0.028598904609680176, 0.05015052482485771, 0.07170214504003525, 0.09325376152992249, 0.11480538547039032, 0.13635700941085815, 0.1579086184501648, 0.17946024239063263, 0.20101186633110046, 0.2225634902715683, 0.24411511421203613, 0.2656667232513428, 0.2872183322906494, 0.30876997113227844, 0.3303215801715851, 0.3518732190132141, 0.37342482805252075, 0.3949764370918274, 0.4165280759334564, 0.43807968497276306, 0.4596313238143921, 0.48118293285369873, 0.5027345418930054, 0.524286150932312, 0.5458377599716187, 0.5673893690109253, 0.5889409780502319, 0.6104925870895386, 0.63204425573349, 0.6535958647727966, 0.6751474738121033, 0.6966990828514099, 0.7182507514953613]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 13.0, 15.0, 28.0, 23.0, 35.0, 57.0, 65.0, 106.0, 198.0, 250.0, 405.0, 691.0, 1111.0, 1795.0, 3055.0, 5157.0, 9121.0, 16322.0, 29770.0, 54769.0, 100447.0, 166936.0, 215588.0, 184652.0, 115602.0, 63724.0, 34434.0, 18944.0, 10536.0, 5820.0, 3497.0, 2082.0, 1190.0, 705.0, 447.0, 315.0, 203.0, 131.0, 99.0, 67.0, 44.0, 31.0, 18.0, 20.0, 3.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0], "bins": [-0.94482421875, -0.915863037109375, -0.88690185546875, -0.857940673828125, -0.8289794921875, -0.800018310546875, -0.77105712890625, -0.742095947265625, -0.713134765625, -0.684173583984375, -0.65521240234375, -0.626251220703125, -0.5972900390625, -0.568328857421875, -0.53936767578125, -0.510406494140625, -0.4814453125, -0.452484130859375, -0.42352294921875, -0.394561767578125, -0.3656005859375, -0.336639404296875, -0.30767822265625, -0.278717041015625, -0.249755859375, -0.220794677734375, -0.19183349609375, -0.162872314453125, -0.1339111328125, -0.104949951171875, -0.07598876953125, -0.047027587890625, -0.01806640625, 0.010894775390625, 0.03985595703125, 0.068817138671875, 0.0977783203125, 0.126739501953125, 0.15570068359375, 0.184661865234375, 0.213623046875, 0.242584228515625, 0.27154541015625, 0.300506591796875, 0.3294677734375, 0.358428955078125, 0.38739013671875, 0.416351318359375, 0.4453125, 0.474273681640625, 0.50323486328125, 0.532196044921875, 0.5611572265625, 0.590118408203125, 0.61907958984375, 0.648040771484375, 0.677001953125, 0.705963134765625, 0.73492431640625, 0.763885498046875, 0.7928466796875, 0.821807861328125, 0.85076904296875, 0.879730224609375, 0.90869140625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 3.0, 6.0, 5.0, 7.0, 8.0, 10.0, 20.0, 14.0, 24.0, 20.0, 21.0, 33.0, 34.0, 37.0, 28.0, 48.0, 48.0, 46.0, 40.0, 38.0, 35.0, 43.0, 46.0, 46.0, 46.0, 41.0, 34.0, 33.0, 25.0, 28.0, 23.0, 23.0, 13.0, 18.0, 12.0, 13.0, 12.0, 8.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.42138671875, -0.40692138671875, -0.3924560546875, -0.37799072265625, -0.363525390625, -0.34906005859375, -0.3345947265625, -0.32012939453125, -0.3056640625, -0.29119873046875, -0.2767333984375, -0.26226806640625, -0.247802734375, -0.23333740234375, -0.2188720703125, -0.20440673828125, -0.18994140625, -0.17547607421875, -0.1610107421875, -0.14654541015625, -0.132080078125, -0.11761474609375, -0.1031494140625, -0.08868408203125, -0.07421875, -0.05975341796875, -0.0452880859375, -0.03082275390625, -0.016357421875, -0.00189208984375, 0.0125732421875, 0.02703857421875, 0.04150390625, 0.05596923828125, 0.0704345703125, 0.08489990234375, 0.099365234375, 0.11383056640625, 0.1282958984375, 0.14276123046875, 0.1572265625, 0.17169189453125, 0.1861572265625, 0.20062255859375, 0.215087890625, 0.22955322265625, 0.2440185546875, 0.25848388671875, 0.27294921875, 0.28741455078125, 0.3018798828125, 0.31634521484375, 0.330810546875, 0.34527587890625, 0.3597412109375, 0.37420654296875, 0.388671875, 0.40313720703125, 0.4176025390625, 0.43206787109375, 0.446533203125, 0.46099853515625, 0.4754638671875, 0.48992919921875, 0.50439453125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 8.0, 9.0, 13.0, 12.0, 14.0, 17.0, 21.0, 23.0, 20.0, 26.0, 24.0, 26.0, 31.0, 35.0, 31.0, 67.0, 448.0, 13222.0, 668273.0, 359307.0, 6312.0, 234.0, 63.0, 36.0, 35.0, 33.0, 38.0, 27.0, 24.0, 14.0, 9.0, 19.0, 19.0, 15.0, 4.0, 9.0, 7.0, 4.0, 5.0, 1.0, 9.0, 0.0, 2.0, 4.0, 2.0, 2.0], "bins": [-7.12109375, -6.9281005859375, -6.735107421875, -6.5421142578125, -6.34912109375, -6.1561279296875, -5.963134765625, -5.7701416015625, -5.5771484375, -5.3841552734375, -5.191162109375, -4.9981689453125, -4.80517578125, -4.6121826171875, -4.419189453125, -4.2261962890625, -4.033203125, -3.8402099609375, -3.647216796875, -3.4542236328125, -3.26123046875, -3.0682373046875, -2.875244140625, -2.6822509765625, -2.4892578125, -2.2962646484375, -2.103271484375, -1.9102783203125, -1.71728515625, -1.5242919921875, -1.331298828125, -1.1383056640625, -0.9453125, -0.7523193359375, -0.559326171875, -0.3663330078125, -0.17333984375, 0.0196533203125, 0.212646484375, 0.4056396484375, 0.5986328125, 0.7916259765625, 0.984619140625, 1.1776123046875, 1.37060546875, 1.5635986328125, 1.756591796875, 1.9495849609375, 2.142578125, 2.3355712890625, 2.528564453125, 2.7215576171875, 2.91455078125, 3.1075439453125, 3.300537109375, 3.4935302734375, 3.6865234375, 3.8795166015625, 4.072509765625, 4.2655029296875, 4.45849609375, 4.6514892578125, 4.844482421875, 5.0374755859375, 5.23046875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 12.0, 6.0, 4.0, 12.0, 12.0, 14.0, 20.0, 25.0, 18.0, 33.0, 21.0, 27.0, 39.0, 32.0, 37.0, 49.0, 52.0, 40.0, 40.0, 43.0, 45.0, 53.0, 44.0, 41.0, 41.0, 29.0, 32.0, 29.0, 23.0, 16.0, 13.0, 24.0, 17.0, 16.0, 11.0, 2.0, 7.0, 6.0, 8.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0], "bins": [-0.587890625, -0.5721168518066406, -0.5563430786132812, -0.5405693054199219, -0.5247955322265625, -0.5090217590332031, -0.49324798583984375, -0.4774742126464844, -0.461700439453125, -0.4459266662597656, -0.43015289306640625, -0.4143791198730469, -0.3986053466796875, -0.3828315734863281, -0.36705780029296875, -0.3512840270996094, -0.33551025390625, -0.3197364807128906, -0.30396270751953125, -0.2881889343261719, -0.2724151611328125, -0.2566413879394531, -0.24086761474609375, -0.22509384155273438, -0.209320068359375, -0.19354629516601562, -0.17777252197265625, -0.16199874877929688, -0.1462249755859375, -0.13045120239257812, -0.11467742919921875, -0.09890365600585938, -0.0831298828125, -0.06735610961914062, -0.05158233642578125, -0.035808563232421875, -0.0200347900390625, -0.004261016845703125, 0.01151275634765625, 0.027286529541015625, 0.043060302734375, 0.058834075927734375, 0.07460784912109375, 0.09038162231445312, 0.1061553955078125, 0.12192916870117188, 0.13770294189453125, 0.15347671508789062, 0.16925048828125, 0.18502426147460938, 0.20079803466796875, 0.21657180786132812, 0.2323455810546875, 0.24811935424804688, 0.26389312744140625, 0.2796669006347656, 0.295440673828125, 0.3112144470214844, 0.32698822021484375, 0.3427619934082031, 0.3585357666015625, 0.3743095397949219, 0.39008331298828125, 0.4058570861816406, 0.421630859375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 7.0, 12.0, 11.0, 14.0, 24.0, 32.0, 43.0, 74.0, 131.0, 213.0, 399.0, 674.0, 1288.0, 2458.0, 5359.0, 13538.0, 43288.0, 330409.0, 571749.0, 51574.0, 15623.0, 5917.0, 2643.0, 1361.0, 718.0, 406.0, 242.0, 110.0, 80.0, 60.0, 24.0, 21.0, 20.0, 7.0, 9.0, 6.0, 9.0, 4.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36328125, -0.3507804870605469, -0.33827972412109375, -0.3257789611816406, -0.3132781982421875, -0.3007774353027344, -0.28827667236328125, -0.2757759094238281, -0.263275146484375, -0.2507743835449219, -0.23827362060546875, -0.22577285766601562, -0.2132720947265625, -0.20077133178710938, -0.18827056884765625, -0.17576980590820312, -0.16326904296875, -0.15076828002929688, -0.13826751708984375, -0.12576675415039062, -0.1132659912109375, -0.10076522827148438, -0.08826446533203125, -0.07576370239257812, -0.063262939453125, -0.050762176513671875, -0.03826141357421875, -0.025760650634765625, -0.0132598876953125, -0.000759124755859375, 0.01174163818359375, 0.024242401123046875, 0.0367431640625, 0.049243927001953125, 0.06174468994140625, 0.07424545288085938, 0.0867462158203125, 0.09924697875976562, 0.11174774169921875, 0.12424850463867188, 0.136749267578125, 0.14925003051757812, 0.16175079345703125, 0.17425155639648438, 0.1867523193359375, 0.19925308227539062, 0.21175384521484375, 0.22425460815429688, 0.23675537109375, 0.24925613403320312, 0.26175689697265625, 0.2742576599121094, 0.2867584228515625, 0.2992591857910156, 0.31175994873046875, 0.3242607116699219, 0.336761474609375, 0.3492622375488281, 0.36176300048828125, 0.3742637634277344, 0.3867645263671875, 0.3992652893066406, 0.41176605224609375, 0.4242668151855469, 0.436767578125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 4.0, 1.0, 5.0, 10.0, 24.0, 36.0, 88.0, 147.0, 222.0, 191.0, 135.0, 57.0, 35.0, 19.0, 10.0, 8.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.181529998779297e-05, -2.043507993221283e-05, -1.905485987663269e-05, -1.767463982105255e-05, -1.6294419765472412e-05, -1.4914199709892273e-05, -1.3533979654312134e-05, -1.2153759598731995e-05, -1.0773539543151855e-05, -9.393319487571716e-06, -8.013099431991577e-06, -6.632879376411438e-06, -5.252659320831299e-06, -3.87243926525116e-06, -2.4922192096710205e-06, -1.1119991540908813e-06, 2.682209014892578e-07, 1.648440957069397e-06, 3.028661012649536e-06, 4.408881068229675e-06, 5.7891011238098145e-06, 7.169321179389954e-06, 8.549541234970093e-06, 9.929761290550232e-06, 1.1309981346130371e-05, 1.269020140171051e-05, 1.407042145729065e-05, 1.545064151287079e-05, 1.6830861568450928e-05, 1.8211081624031067e-05, 1.9591301679611206e-05, 2.0971521735191345e-05, 2.2351741790771484e-05, 2.3731961846351624e-05, 2.5112181901931763e-05, 2.6492401957511902e-05, 2.787262201309204e-05, 2.925284206867218e-05, 3.063306212425232e-05, 3.201328217983246e-05, 3.33935022354126e-05, 3.477372229099274e-05, 3.6153942346572876e-05, 3.7534162402153015e-05, 3.8914382457733154e-05, 4.0294602513313293e-05, 4.167482256889343e-05, 4.305504262447357e-05, 4.443526268005371e-05, 4.581548273563385e-05, 4.719570279121399e-05, 4.857592284679413e-05, 4.995614290237427e-05, 5.133636295795441e-05, 5.2716583013534546e-05, 5.4096803069114685e-05, 5.5477023124694824e-05, 5.685724318027496e-05, 5.82374632358551e-05, 5.961768329143524e-05, 6.099790334701538e-05, 6.237812340259552e-05, 6.375834345817566e-05, 6.51385635137558e-05, 6.651878356933594e-05]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 6.0, 4.0, 4.0, 16.0, 15.0, 11.0, 19.0, 17.0, 23.0, 32.0, 124.0, 1090.0, 25339.0, 1010144.0, 10821.0, 650.0, 95.0, 36.0, 22.0, 12.0, 12.0, 16.0, 7.0, 4.0, 8.0, 5.0, 8.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.189453125, -2.121856689453125, -2.05426025390625, -1.986663818359375, -1.9190673828125, -1.851470947265625, -1.78387451171875, -1.716278076171875, -1.648681640625, -1.581085205078125, -1.51348876953125, -1.445892333984375, -1.3782958984375, -1.310699462890625, -1.24310302734375, -1.175506591796875, -1.10791015625, -1.040313720703125, -0.97271728515625, -0.905120849609375, -0.8375244140625, -0.769927978515625, -0.70233154296875, -0.634735107421875, -0.567138671875, -0.499542236328125, -0.43194580078125, -0.364349365234375, -0.2967529296875, -0.229156494140625, -0.16156005859375, -0.093963623046875, -0.0263671875, 0.041229248046875, 0.10882568359375, 0.176422119140625, 0.2440185546875, 0.311614990234375, 0.37921142578125, 0.446807861328125, 0.514404296875, 0.582000732421875, 0.64959716796875, 0.717193603515625, 0.7847900390625, 0.852386474609375, 0.91998291015625, 0.987579345703125, 1.05517578125, 1.122772216796875, 1.19036865234375, 1.257965087890625, 1.3255615234375, 1.393157958984375, 1.46075439453125, 1.528350830078125, 1.595947265625, 1.663543701171875, 1.73114013671875, 1.798736572265625, 1.8663330078125, 1.933929443359375, 2.00152587890625, 2.069122314453125, 2.13671875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 5.0, 12.0, 14.0, 8.0, 24.0, 14.0, 22.0, 20.0, 34.0, 38.0, 76.0, 161.0, 261.0, 74.0, 52.0, 43.0, 33.0, 15.0, 15.0, 14.0, 11.0, 10.0, 3.0, 8.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1680908203125, -0.16317176818847656, -0.15825271606445312, -0.1533336639404297, -0.14841461181640625, -0.1434955596923828, -0.13857650756835938, -0.13365745544433594, -0.1287384033203125, -0.12381935119628906, -0.11890029907226562, -0.11398124694824219, -0.10906219482421875, -0.10414314270019531, -0.09922409057617188, -0.09430503845214844, -0.089385986328125, -0.08446693420410156, -0.07954788208007812, -0.07462882995605469, -0.06970977783203125, -0.06479072570800781, -0.059871673583984375, -0.05495262145996094, -0.0500335693359375, -0.04511451721191406, -0.040195465087890625, -0.03527641296386719, -0.03035736083984375, -0.025438308715820312, -0.020519256591796875, -0.015600204467773438, -0.01068115234375, -0.0057621002197265625, -0.000843048095703125, 0.0040760040283203125, 0.00899505615234375, 0.013914108276367188, 0.018833160400390625, 0.023752212524414062, 0.0286712646484375, 0.03359031677246094, 0.038509368896484375, 0.04342842102050781, 0.04834747314453125, 0.05326652526855469, 0.058185577392578125, 0.06310462951660156, 0.068023681640625, 0.07294273376464844, 0.07786178588867188, 0.08278083801269531, 0.08769989013671875, 0.09261894226074219, 0.09753799438476562, 0.10245704650878906, 0.1073760986328125, 0.11229515075683594, 0.11721420288085938, 0.12213325500488281, 0.12705230712890625, 0.1319713592529297, 0.13689041137695312, 0.14180946350097656, 0.146728515625]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 10.0, 31.0, 150.0, 474.0, 265.0, 57.0, 22.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1559226512908936, -2.056489944458008, -1.9570574760437012, -1.8576247692108154, -1.7581921815872192, -1.658759593963623, -1.5593268871307373, -1.4598942995071411, -1.360461711883545, -1.2610291242599487, -1.1615965366363525, -1.0621638298034668, -0.9627312421798706, -0.8632986545562744, -0.7638660073280334, -0.6644333600997925, -0.5650007724761963, -0.4655681550502777, -0.36613553762435913, -0.26670292019844055, -0.16727030277252197, -0.0678376853466034, 0.031594932079315186, 0.13102757930755615, 0.23046016693115234, 0.3298927843570709, 0.4293254017829895, 0.5287580490112305, 0.6281906366348267, 0.7276232242584229, 0.8270558714866638, 0.9264885187149048, 1.02592134475708, 1.1253539323806763, 1.2247865200042725, 1.3242192268371582, 1.4236518144607544, 1.5230844020843506, 1.6225171089172363, 1.7219496965408325, 1.8213822841644287, 1.920814871788025, 2.020247459411621, 2.119680166244507, 2.2191128730773926, 2.318545341491699, 2.417978048324585, 2.5174107551574707, 2.6168432235717773, 2.716275930404663, 2.8157083988189697, 2.9151411056518555, 3.014573574066162, 3.114006280899048, 3.2134389877319336, 3.3128714561462402, 3.412304162979126, 3.5117368698120117, 3.6111693382263184, 3.710602045059204, 3.81003475189209, 3.9094672203063965, 4.008899688720703, 4.108332633972168, 4.207765102386475]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 10.0, 5.0, 12.0, 9.0, 20.0, 12.0, 16.0, 25.0, 28.0, 27.0, 34.0, 37.0, 35.0, 39.0, 40.0, 54.0, 43.0, 45.0, 49.0, 34.0, 49.0, 37.0, 40.0, 36.0, 36.0, 27.0, 26.0, 38.0, 22.0, 17.0, 17.0, 14.0, 17.0, 12.0, 9.0, 2.0, 4.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5870530605316162, -0.5667250156402588, -0.5463969111442566, -0.5260688662528992, -0.5057408213615417, -0.48541274666786194, -0.46508467197418213, -0.4447566270828247, -0.4244285821914673, -0.4041005074977875, -0.38377246260643005, -0.36344438791275024, -0.3431163430213928, -0.322788268327713, -0.3024601936340332, -0.2821321487426758, -0.26180407404899597, -0.24147601425647736, -0.22114795446395874, -0.20081987977027893, -0.1804918348789215, -0.1601637601852417, -0.13983570039272308, -0.11950764060020447, -0.09917958080768585, -0.07885152101516724, -0.05852345749735832, -0.03819539397954941, -0.017867334187030792, 0.0024607256054878235, 0.022788792848587036, 0.04311685264110565, 0.06344491243362427, 0.08377297222614288, 0.1041010320186615, 0.12442909926176071, 0.14475715160369873, 0.16508522629737854, 0.18541328608989716, 0.20574134588241577, 0.2260694056749344, 0.246397465467453, 0.2667255401611328, 0.28705358505249023, 0.30738165974617004, 0.32770970463752747, 0.3480377793312073, 0.3683658242225647, 0.3886938989162445, 0.4090219736099243, 0.42935001850128174, 0.44967809319496155, 0.47000613808631897, 0.4903342127799988, 0.5106622576713562, 0.5309903621673584, 0.5513184070587158, 0.5716464519500732, 0.5919745564460754, 0.6123026013374329, 0.6326306462287903, 0.6529586911201477, 0.6732867956161499, 0.6936148405075073, 0.7139428853988647]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 4.0, 8.0, 17.0, 12.0, 23.0, 26.0, 39.0, 56.0, 103.0, 163.0, 262.0, 418.0, 778.0, 1265.0, 2424.0, 4427.0, 9431.0, 27460.0, 173803.0, 1244159.0, 2198149.0, 445094.0, 58763.0, 13923.0, 6144.0, 3151.0, 1731.0, 972.0, 567.0, 290.0, 237.0, 122.0, 84.0, 64.0, 36.0, 17.0, 13.0, 11.0, 12.0, 6.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5947265625, -0.5743789672851562, -0.5540313720703125, -0.5336837768554688, -0.513336181640625, -0.49298858642578125, -0.4726409912109375, -0.45229339599609375, -0.43194580078125, -0.41159820556640625, -0.3912506103515625, -0.37090301513671875, -0.350555419921875, -0.33020782470703125, -0.3098602294921875, -0.28951263427734375, -0.2691650390625, -0.24881744384765625, -0.2284698486328125, -0.20812225341796875, -0.187774658203125, -0.16742706298828125, -0.1470794677734375, -0.12673187255859375, -0.10638427734375, -0.08603668212890625, -0.0656890869140625, -0.04534149169921875, -0.024993896484375, -0.00464630126953125, 0.0157012939453125, 0.03604888916015625, 0.056396484375, 0.07674407958984375, 0.0970916748046875, 0.11743927001953125, 0.137786865234375, 0.15813446044921875, 0.1784820556640625, 0.19882965087890625, 0.21917724609375, 0.23952484130859375, 0.2598724365234375, 0.28022003173828125, 0.300567626953125, 0.32091522216796875, 0.3412628173828125, 0.36161041259765625, 0.3819580078125, 0.40230560302734375, 0.4226531982421875, 0.44300079345703125, 0.463348388671875, 0.48369598388671875, 0.5040435791015625, 0.5243911743164062, 0.54473876953125, 0.5650863647460938, 0.5854339599609375, 0.6057815551757812, 0.626129150390625, 0.6464767456054688, 0.6668243408203125, 0.6871719360351562, 0.70751953125]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 8.0, 8.0, 6.0, 17.0, 11.0, 20.0, 15.0, 19.0, 21.0, 29.0, 30.0, 37.0, 46.0, 31.0, 47.0, 45.0, 33.0, 52.0, 37.0, 50.0, 39.0, 43.0, 43.0, 33.0, 30.0, 33.0, 27.0, 30.0, 31.0, 24.0, 14.0, 15.0, 16.0, 12.0, 8.0, 8.0, 8.0, 5.0, 2.0, 8.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.39208984375, -0.3792533874511719, -0.36641693115234375, -0.3535804748535156, -0.3407440185546875, -0.3279075622558594, -0.31507110595703125, -0.3022346496582031, -0.289398193359375, -0.2765617370605469, -0.26372528076171875, -0.2508888244628906, -0.2380523681640625, -0.22521591186523438, -0.21237945556640625, -0.19954299926757812, -0.18670654296875, -0.17387008666992188, -0.16103363037109375, -0.14819717407226562, -0.1353607177734375, -0.12252426147460938, -0.10968780517578125, -0.09685134887695312, -0.084014892578125, -0.07117843627929688, -0.05834197998046875, -0.045505523681640625, -0.0326690673828125, -0.019832611083984375, -0.00699615478515625, 0.005840301513671875, 0.0186767578125, 0.031513214111328125, 0.04434967041015625, 0.057186126708984375, 0.0700225830078125, 0.08285903930664062, 0.09569549560546875, 0.10853195190429688, 0.121368408203125, 0.13420486450195312, 0.14704132080078125, 0.15987777709960938, 0.1727142333984375, 0.18555068969726562, 0.19838714599609375, 0.21122360229492188, 0.22406005859375, 0.23689651489257812, 0.24973297119140625, 0.2625694274902344, 0.2754058837890625, 0.2882423400878906, 0.30107879638671875, 0.3139152526855469, 0.326751708984375, 0.3395881652832031, 0.35242462158203125, 0.3652610778808594, 0.3780975341796875, 0.3909339904785156, 0.40377044677734375, 0.4166069030761719, 0.429443359375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 5.0, 3.0, 11.0, 5.0, 13.0, 11.0, 17.0, 21.0, 39.0, 82.0, 126.0, 233.0, 416.0, 1312.0, 105184.0, 4080620.0, 4883.0, 596.0, 269.0, 170.0, 94.0, 50.0, 37.0, 19.0, 16.0, 13.0, 7.0, 5.0, 7.0, 2.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.1031494140625, -3.975830078125, -3.8485107421875, -3.72119140625, -3.5938720703125, -3.466552734375, -3.3392333984375, -3.2119140625, -3.0845947265625, -2.957275390625, -2.8299560546875, -2.70263671875, -2.5753173828125, -2.447998046875, -2.3206787109375, -2.193359375, -2.0660400390625, -1.938720703125, -1.8114013671875, -1.68408203125, -1.5567626953125, -1.429443359375, -1.3021240234375, -1.1748046875, -1.0474853515625, -0.920166015625, -0.7928466796875, -0.66552734375, -0.5382080078125, -0.410888671875, -0.2835693359375, -0.15625, -0.0289306640625, 0.098388671875, 0.2257080078125, 0.35302734375, 0.4803466796875, 0.607666015625, 0.7349853515625, 0.8623046875, 0.9896240234375, 1.116943359375, 1.2442626953125, 1.37158203125, 1.4989013671875, 1.626220703125, 1.7535400390625, 1.880859375, 2.0081787109375, 2.135498046875, 2.2628173828125, 2.39013671875, 2.5174560546875, 2.644775390625, 2.7720947265625, 2.8994140625, 3.0267333984375, 3.154052734375, 3.2813720703125, 3.40869140625, 3.5360107421875, 3.663330078125, 3.7906494140625, 3.91796875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 11.0, 9.0, 6.0, 7.0, 5.0, 15.0, 18.0, 23.0, 25.0, 52.0, 85.0, 121.0, 208.0, 302.0, 483.0, 588.0, 589.0, 510.0, 350.0, 235.0, 125.0, 92.0, 68.0, 35.0, 35.0, 21.0, 14.0, 12.0, 11.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.170654296875, -0.16535377502441406, -0.16005325317382812, -0.1547527313232422, -0.14945220947265625, -0.1441516876220703, -0.13885116577148438, -0.13355064392089844, -0.1282501220703125, -0.12294960021972656, -0.11764907836914062, -0.11234855651855469, -0.10704803466796875, -0.10174751281738281, -0.09644699096679688, -0.09114646911621094, -0.085845947265625, -0.08054542541503906, -0.07524490356445312, -0.06994438171386719, -0.06464385986328125, -0.05934333801269531, -0.054042816162109375, -0.04874229431152344, -0.0434417724609375, -0.03814125061035156, -0.032840728759765625, -0.027540206909179688, -0.02223968505859375, -0.016939163208007812, -0.011638641357421875, -0.0063381195068359375, -0.00103759765625, 0.0042629241943359375, 0.009563446044921875, 0.014863967895507812, 0.02016448974609375, 0.025465011596679688, 0.030765533447265625, 0.03606605529785156, 0.0413665771484375, 0.04666709899902344, 0.051967620849609375, 0.05726814270019531, 0.06256866455078125, 0.06786918640136719, 0.07316970825195312, 0.07847023010253906, 0.083770751953125, 0.08907127380371094, 0.09437179565429688, 0.09967231750488281, 0.10497283935546875, 0.11027336120605469, 0.11557388305664062, 0.12087440490722656, 0.1261749267578125, 0.13147544860839844, 0.13677597045898438, 0.1420764923095703, 0.14737701416015625, 0.1526775360107422, 0.15797805786132812, 0.16327857971191406, 0.1685791015625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 11.0, 16.0, 10.0, 17.0, 26.0, 42.0, 73.0, 84.0, 90.0, 101.0, 120.0, 94.0, 69.0, 77.0, 49.0, 27.0, 27.0, 20.0, 9.0, 11.0, 3.0, 7.0, 3.0, 7.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.6752675175666809, -0.6595718264579773, -0.6438761353492737, -0.6281804442405701, -0.6124847531318665, -0.5967890620231628, -0.5810933709144592, -0.5653976798057556, -0.549701988697052, -0.5340062975883484, -0.5183106064796448, -0.5026149153709412, -0.48691922426223755, -0.47122353315353394, -0.4555278420448303, -0.4398321509361267, -0.4241364598274231, -0.4084407687187195, -0.39274507761001587, -0.37704938650131226, -0.36135369539260864, -0.34565800428390503, -0.3299623131752014, -0.3142666220664978, -0.2985709309577942, -0.2828752398490906, -0.26717954874038696, -0.25148385763168335, -0.23578816652297974, -0.22009247541427612, -0.2043967843055725, -0.1887010931968689, -0.1730053722858429, -0.15730968117713928, -0.14161399006843567, -0.12591829895973206, -0.11022260785102844, -0.09452691674232483, -0.07883122563362122, -0.0631355345249176, -0.04743984341621399, -0.031744152307510376, -0.016048461198806763, -0.0003527700901031494, 0.015342921018600464, 0.031038612127304077, 0.04673430323600769, 0.062429994344711304, 0.07812568545341492, 0.09382137656211853, 0.10951706767082214, 0.12521275877952576, 0.14090844988822937, 0.15660414099693298, 0.1722998321056366, 0.1879955232143402, 0.20369121432304382, 0.21938690543174744, 0.23508259654045105, 0.25077828764915466, 0.2664739787578583, 0.2821696698665619, 0.2978653609752655, 0.3135610520839691, 0.32925674319267273]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 8.0, 9.0, 13.0, 13.0, 14.0, 15.0, 28.0, 17.0, 33.0, 35.0, 30.0, 35.0, 45.0, 49.0, 39.0, 66.0, 58.0, 46.0, 46.0, 51.0, 40.0, 35.0, 28.0, 43.0, 37.0, 32.0, 20.0, 24.0, 15.0, 15.0, 13.0, 15.0, 9.0, 11.0, 4.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4223138689994812, -0.40715429186820984, -0.39199474453926086, -0.3768351674079895, -0.36167559027671814, -0.3465160131454468, -0.3313564658164978, -0.31619688868522644, -0.3010373115539551, -0.2858777344226837, -0.27071818709373474, -0.2555586099624634, -0.24039903283119202, -0.22523947060108185, -0.21007990837097168, -0.19492033123970032, -0.17976078391075134, -0.16460122168064117, -0.1494416445493698, -0.13428208231925964, -0.11912251263856888, -0.10396294295787811, -0.08880338072776794, -0.07364381104707718, -0.058484241366386414, -0.04332467168569565, -0.02816510573029518, -0.013005539774894714, 0.002154029905796051, 0.017313599586486816, 0.032473161816596985, 0.04763273149728775, 0.06279230117797852, 0.07795187085866928, 0.09311144053936005, 0.10827100276947021, 0.12343057245016098, 0.13859014213085175, 0.15374970436096191, 0.16890928149223328, 0.18406884372234344, 0.1992284059524536, 0.21438798308372498, 0.22954754531383514, 0.2447071075439453, 0.2598666846752167, 0.27502626180648804, 0.290185809135437, 0.3053453862667084, 0.32050496339797974, 0.3356645107269287, 0.3508240878582001, 0.36598366498947144, 0.3811432123184204, 0.3963027894496918, 0.41146236658096313, 0.4266219139099121, 0.44178149104118347, 0.45694103837013245, 0.4721006155014038, 0.48726019263267517, 0.5024197697639465, 0.5175793170928955, 0.5327388644218445, 0.5478984713554382]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 8.0, 14.0, 18.0, 15.0, 35.0, 44.0, 54.0, 76.0, 95.0, 135.0, 186.0, 251.0, 435.0, 652.0, 1039.0, 1609.0, 2461.0, 3988.0, 6447.0, 10938.0, 19167.0, 33754.0, 62745.0, 124113.0, 247110.0, 254524.0, 129308.0, 65475.0, 34990.0, 19442.0, 11192.0, 6723.0, 4078.0, 2580.0, 1722.0, 1054.0, 673.0, 424.0, 297.0, 186.0, 136.0, 87.0, 76.0, 61.0, 39.0, 32.0, 22.0, 15.0, 15.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.27294921875, -0.26415252685546875, -0.2553558349609375, -0.24655914306640625, -0.237762451171875, -0.22896575927734375, -0.2201690673828125, -0.21137237548828125, -0.20257568359375, -0.19377899169921875, -0.1849822998046875, -0.17618560791015625, -0.167388916015625, -0.15859222412109375, -0.1497955322265625, -0.14099884033203125, -0.1322021484375, -0.12340545654296875, -0.1146087646484375, -0.10581207275390625, -0.097015380859375, -0.08821868896484375, -0.0794219970703125, -0.07062530517578125, -0.06182861328125, -0.05303192138671875, -0.0442352294921875, -0.03543853759765625, -0.026641845703125, -0.01784515380859375, -0.0090484619140625, -0.00025177001953125, 0.008544921875, 0.01734161376953125, 0.0261383056640625, 0.03493499755859375, 0.043731689453125, 0.05252838134765625, 0.0613250732421875, 0.07012176513671875, 0.07891845703125, 0.08771514892578125, 0.0965118408203125, 0.10530853271484375, 0.114105224609375, 0.12290191650390625, 0.1316986083984375, 0.14049530029296875, 0.1492919921875, 0.15808868408203125, 0.1668853759765625, 0.17568206787109375, 0.184478759765625, 0.19327545166015625, 0.2020721435546875, 0.21086883544921875, 0.21966552734375, 0.22846221923828125, 0.2372589111328125, 0.24605560302734375, 0.254852294921875, 0.26364898681640625, 0.2724456787109375, 0.28124237060546875, 0.2900390625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 4.0, 8.0, 11.0, 16.0, 19.0, 9.0, 22.0, 16.0, 34.0, 33.0, 30.0, 37.0, 35.0, 51.0, 51.0, 46.0, 44.0, 52.0, 52.0, 52.0, 43.0, 31.0, 45.0, 34.0, 32.0, 36.0, 33.0, 26.0, 16.0, 21.0, 6.0, 7.0, 15.0, 10.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.333984375, -0.32171630859375, -0.3094482421875, -0.29718017578125, -0.284912109375, -0.27264404296875, -0.2603759765625, -0.24810791015625, -0.23583984375, -0.22357177734375, -0.2113037109375, -0.19903564453125, -0.186767578125, -0.17449951171875, -0.1622314453125, -0.14996337890625, -0.1376953125, -0.12542724609375, -0.1131591796875, -0.10089111328125, -0.088623046875, -0.07635498046875, -0.0640869140625, -0.05181884765625, -0.03955078125, -0.02728271484375, -0.0150146484375, -0.00274658203125, 0.009521484375, 0.02178955078125, 0.0340576171875, 0.04632568359375, 0.05859375, 0.07086181640625, 0.0831298828125, 0.09539794921875, 0.107666015625, 0.11993408203125, 0.1322021484375, 0.14447021484375, 0.15673828125, 0.16900634765625, 0.1812744140625, 0.19354248046875, 0.205810546875, 0.21807861328125, 0.2303466796875, 0.24261474609375, 0.2548828125, 0.26715087890625, 0.2794189453125, 0.29168701171875, 0.303955078125, 0.31622314453125, 0.3284912109375, 0.34075927734375, 0.35302734375, 0.36529541015625, 0.3775634765625, 0.38983154296875, 0.402099609375, 0.41436767578125, 0.4266357421875, 0.43890380859375, 0.451171875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 9.0, 12.0, 12.0, 20.0, 29.0, 46.0, 60.0, 96.0, 137.0, 217.0, 318.0, 476.0, 746.0, 1224.0, 2201.0, 3605.0, 6752.0, 12482.0, 24235.0, 50903.0, 113504.0, 311176.0, 306282.0, 111775.0, 49872.0, 24236.0, 12480.0, 6598.0, 3586.0, 2003.0, 1331.0, 760.0, 489.0, 303.0, 191.0, 130.0, 89.0, 47.0, 43.0, 32.0, 21.0, 14.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2359619140625, -0.22858619689941406, -0.22121047973632812, -0.2138347625732422, -0.20645904541015625, -0.1990833282470703, -0.19170761108398438, -0.18433189392089844, -0.1769561767578125, -0.16958045959472656, -0.16220474243164062, -0.1548290252685547, -0.14745330810546875, -0.1400775909423828, -0.13270187377929688, -0.12532615661621094, -0.117950439453125, -0.11057472229003906, -0.10319900512695312, -0.09582328796386719, -0.08844757080078125, -0.08107185363769531, -0.07369613647460938, -0.06632041931152344, -0.0589447021484375, -0.05156898498535156, -0.044193267822265625, -0.03681755065917969, -0.02944183349609375, -0.022066116333007812, -0.014690399169921875, -0.0073146820068359375, 6.103515625e-05, 0.0074367523193359375, 0.014812469482421875, 0.022188186645507812, 0.02956390380859375, 0.03693962097167969, 0.044315338134765625, 0.05169105529785156, 0.0590667724609375, 0.06644248962402344, 0.07381820678710938, 0.08119392395019531, 0.08856964111328125, 0.09594535827636719, 0.10332107543945312, 0.11069679260253906, 0.118072509765625, 0.12544822692871094, 0.13282394409179688, 0.1401996612548828, 0.14757537841796875, 0.1549510955810547, 0.16232681274414062, 0.16970252990722656, 0.1770782470703125, 0.18445396423339844, 0.19182968139648438, 0.1992053985595703, 0.20658111572265625, 0.2139568328857422, 0.22133255004882812, 0.22870826721191406, 0.236083984375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 5.0, 6.0, 12.0, 9.0, 17.0, 16.0, 26.0, 28.0, 22.0, 29.0, 36.0, 43.0, 41.0, 45.0, 44.0, 45.0, 60.0, 47.0, 63.0, 50.0, 34.0, 26.0, 42.0, 33.0, 39.0, 27.0, 29.0, 20.0, 21.0, 12.0, 16.0, 16.0, 8.0, 8.0, 6.0, 4.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1949462890625, -0.1869640350341797, -0.17898178100585938, -0.17099952697753906, -0.16301727294921875, -0.15503501892089844, -0.14705276489257812, -0.1390705108642578, -0.1310882568359375, -0.12310600280761719, -0.11512374877929688, -0.10714149475097656, -0.09915924072265625, -0.09117698669433594, -0.08319473266601562, -0.07521247863769531, -0.067230224609375, -0.05924797058105469, -0.051265716552734375, -0.04328346252441406, -0.03530120849609375, -0.027318954467773438, -0.019336700439453125, -0.011354446411132812, -0.0033721923828125, 0.0046100616455078125, 0.012592315673828125, 0.020574569702148438, 0.02855682373046875, 0.03653907775878906, 0.044521331787109375, 0.05250358581542969, 0.06048583984375, 0.06846809387207031, 0.07645034790039062, 0.08443260192871094, 0.09241485595703125, 0.10039710998535156, 0.10837936401367188, 0.11636161804199219, 0.1243438720703125, 0.1323261260986328, 0.14030838012695312, 0.14829063415527344, 0.15627288818359375, 0.16425514221191406, 0.17223739624023438, 0.1802196502685547, 0.188201904296875, 0.1961841583251953, 0.20416641235351562, 0.21214866638183594, 0.22013092041015625, 0.22811317443847656, 0.23609542846679688, 0.2440776824951172, 0.2520599365234375, 0.2600421905517578, 0.2680244445800781, 0.27600669860839844, 0.28398895263671875, 0.29197120666503906, 0.2999534606933594, 0.3079357147216797, 0.31591796875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 8.0, 11.0, 7.0, 11.0, 16.0, 9.0, 27.0, 28.0, 36.0, 56.0, 87.0, 117.0, 148.0, 220.0, 345.0, 531.0, 860.0, 1387.0, 2359.0, 4153.0, 7694.0, 16015.0, 40913.0, 159690.0, 604355.0, 139542.0, 37833.0, 14848.0, 7330.0, 3900.0, 2236.0, 1313.0, 814.0, 516.0, 352.0, 227.0, 167.0, 103.0, 82.0, 44.0, 38.0, 39.0, 26.0, 22.0, 8.0, 5.0, 12.0, 5.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0], "bins": [-0.0252838134765625, -0.024504899978637695, -0.02372598648071289, -0.022947072982788086, -0.02216815948486328, -0.021389245986938477, -0.020610332489013672, -0.019831418991088867, -0.019052505493164062, -0.018273591995239258, -0.017494678497314453, -0.01671576499938965, -0.015936851501464844, -0.015157938003540039, -0.014379024505615234, -0.01360011100769043, -0.012821197509765625, -0.01204228401184082, -0.011263370513916016, -0.010484457015991211, -0.009705543518066406, -0.008926630020141602, -0.008147716522216797, -0.007368803024291992, -0.0065898895263671875, -0.005810976028442383, -0.005032062530517578, -0.0042531490325927734, -0.0034742355346679688, -0.002695322036743164, -0.0019164085388183594, -0.0011374950408935547, -0.00035858154296875, 0.0004203319549560547, 0.0011992454528808594, 0.001978158950805664, 0.0027570724487304688, 0.0035359859466552734, 0.004314899444580078, 0.005093812942504883, 0.0058727264404296875, 0.006651639938354492, 0.007430553436279297, 0.008209466934204102, 0.008988380432128906, 0.009767293930053711, 0.010546207427978516, 0.01132512092590332, 0.012104034423828125, 0.01288294792175293, 0.013661861419677734, 0.014440774917602539, 0.015219688415527344, 0.01599860191345215, 0.016777515411376953, 0.017556428909301758, 0.018335342407226562, 0.019114255905151367, 0.019893169403076172, 0.020672082901000977, 0.02145099639892578, 0.022229909896850586, 0.02300882339477539, 0.023787736892700195, 0.024566650390625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 5.0, 2.0, 3.0, 10.0, 7.0, 15.0, 11.0, 17.0, 10.0, 19.0, 14.0, 39.0, 35.0, 56.0, 91.0, 125.0, 140.0, 97.0, 82.0, 33.0, 38.0, 25.0, 11.0, 14.0, 14.0, 12.0, 14.0, 14.0, 4.0, 5.0, 6.0, 3.0, 2.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.396106719970703e-05, -2.3215077817440033e-05, -2.2469088435173035e-05, -2.1723099052906036e-05, -2.0977109670639038e-05, -2.023112028837204e-05, -1.948513090610504e-05, -1.8739141523838043e-05, -1.7993152141571045e-05, -1.7247162759304047e-05, -1.650117337703705e-05, -1.575518399477005e-05, -1.5009194612503052e-05, -1.4263205230236053e-05, -1.3517215847969055e-05, -1.2771226465702057e-05, -1.2025237083435059e-05, -1.127924770116806e-05, -1.0533258318901062e-05, -9.787268936634064e-06, -9.041279554367065e-06, -8.295290172100067e-06, -7.549300789833069e-06, -6.8033114075660706e-06, -6.057322025299072e-06, -5.311332643032074e-06, -4.565343260765076e-06, -3.819353878498077e-06, -3.073364496231079e-06, -2.327375113964081e-06, -1.5813857316970825e-06, -8.353963494300842e-07, -8.940696716308594e-08, 6.565824151039124e-07, 1.4025717973709106e-06, 2.148561179637909e-06, 2.8945505619049072e-06, 3.6405399441719055e-06, 4.386529326438904e-06, 5.132518708705902e-06, 5.8785080909729e-06, 6.624497473239899e-06, 7.370486855506897e-06, 8.116476237773895e-06, 8.862465620040894e-06, 9.608455002307892e-06, 1.035444438457489e-05, 1.1100433766841888e-05, 1.1846423149108887e-05, 1.2592412531375885e-05, 1.3338401913642883e-05, 1.4084391295909882e-05, 1.483038067817688e-05, 1.5576370060443878e-05, 1.6322359442710876e-05, 1.7068348824977875e-05, 1.7814338207244873e-05, 1.856032758951187e-05, 1.930631697177887e-05, 2.0052306354045868e-05, 2.0798295736312866e-05, 2.1544285118579865e-05, 2.2290274500846863e-05, 2.303626388311386e-05, 2.378225326538086e-05]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 8.0, 9.0, 11.0, 21.0, 29.0, 45.0, 40.0, 93.0, 345.0, 7556.0, 1019025.0, 20524.0, 493.0, 115.0, 63.0, 41.0, 29.0, 22.0, 16.0, 7.0, 7.0, 2.0, 5.0, 8.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.232177734375, -0.22406005859375, -0.2159423828125, -0.20782470703125, -0.19970703125, -0.19158935546875, -0.1834716796875, -0.17535400390625, -0.167236328125, -0.15911865234375, -0.1510009765625, -0.14288330078125, -0.134765625, -0.12664794921875, -0.1185302734375, -0.11041259765625, -0.102294921875, -0.09417724609375, -0.0860595703125, -0.07794189453125, -0.06982421875, -0.06170654296875, -0.0535888671875, -0.04547119140625, -0.037353515625, -0.02923583984375, -0.0211181640625, -0.01300048828125, -0.0048828125, 0.00323486328125, 0.0113525390625, 0.01947021484375, 0.027587890625, 0.03570556640625, 0.0438232421875, 0.05194091796875, 0.06005859375, 0.06817626953125, 0.0762939453125, 0.08441162109375, 0.092529296875, 0.10064697265625, 0.1087646484375, 0.11688232421875, 0.125, 0.13311767578125, 0.1412353515625, 0.14935302734375, 0.157470703125, 0.16558837890625, 0.1737060546875, 0.18182373046875, 0.18994140625, 0.19805908203125, 0.2061767578125, 0.21429443359375, 0.222412109375, 0.23052978515625, 0.2386474609375, 0.24676513671875, 0.2548828125, 0.26300048828125, 0.2711181640625, 0.27923583984375, 0.287353515625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 9.0, 7.0, 4.0, 16.0, 15.0, 21.0, 15.0, 35.0, 78.0, 132.0, 242.0, 169.0, 68.0, 34.0, 31.0, 25.0, 13.0, 18.0, 6.0, 5.0, 5.0, 4.0, 3.0, 6.0, 7.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00873565673828125, -0.008430004119873047, -0.008124351501464844, -0.00781869888305664, -0.0075130462646484375, -0.007207393646240234, -0.006901741027832031, -0.006596088409423828, -0.006290435791015625, -0.005984783172607422, -0.005679130554199219, -0.005373477935791016, -0.0050678253173828125, -0.004762172698974609, -0.004456520080566406, -0.004150867462158203, -0.00384521484375, -0.003539562225341797, -0.0032339096069335938, -0.0029282569885253906, -0.0026226043701171875, -0.0023169517517089844, -0.0020112991333007812, -0.0017056465148925781, -0.001399993896484375, -0.0010943412780761719, -0.0007886886596679688, -0.0004830360412597656, -0.0001773834228515625, 0.00012826919555664062, 0.00043392181396484375, 0.0007395744323730469, 0.00104522705078125, 0.0013508796691894531, 0.0016565322875976562, 0.0019621849060058594, 0.0022678375244140625, 0.0025734901428222656, 0.0028791427612304688, 0.003184795379638672, 0.003490447998046875, 0.003796100616455078, 0.004101753234863281, 0.004407405853271484, 0.0047130584716796875, 0.005018711090087891, 0.005324363708496094, 0.005630016326904297, 0.0059356689453125, 0.006241321563720703, 0.006546974182128906, 0.006852626800537109, 0.0071582794189453125, 0.007463932037353516, 0.007769584655761719, 0.008075237274169922, 0.008380889892578125, 0.008686542510986328, 0.008992195129394531, 0.009297847747802734, 0.009603500366210938, 0.00990915298461914, 0.010214805603027344, 0.010520458221435547, 0.01082611083984375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 13.0, 15.0, 15.0, 29.0, 42.0, 54.0, 86.0, 111.0, 125.0, 130.0, 117.0, 58.0, 73.0, 38.0, 30.0, 16.0, 11.0, 12.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.8512006402015686, -0.8318063020706177, -0.8124119639396667, -0.7930176258087158, -0.7736232876777649, -0.754228949546814, -0.7348345518112183, -0.7154402136802673, -0.6960458755493164, -0.6766515374183655, -0.6572571992874146, -0.6378628611564636, -0.6184685230255127, -0.599074125289917, -0.5796798467636108, -0.5602854490280151, -0.540891170501709, -0.5214968323707581, -0.5021024942398071, -0.4827081561088562, -0.4633137881755829, -0.44391945004463196, -0.42452511191368103, -0.4051307439804077, -0.3857364058494568, -0.36634206771850586, -0.34694772958755493, -0.327553391456604, -0.3081590235233307, -0.28876468539237976, -0.26937034726142883, -0.2499759942293167, -0.2305816113948822, -0.21118727326393127, -0.19179292023181915, -0.17239858210086823, -0.1530042290687561, -0.13360989093780518, -0.11421555280685425, -0.09482119977474213, -0.0754268616437912, -0.056032516062259674, -0.03663817420601845, -0.01724383234977722, 0.002150513231754303, 0.021544858813285828, 0.040939196944236755, 0.06033354997634888, 0.0797278881072998, 0.09912223368883133, 0.11851657927036285, 0.13791091740131378, 0.1573052704334259, 0.17669960856437683, 0.19609394669532776, 0.21548829972743988, 0.2348826378583908, 0.25427699089050293, 0.27367132902145386, 0.2930656671524048, 0.3124600052833557, 0.33185434341430664, 0.35124868154525757, 0.3706430494785309, 0.3900373876094818]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 13.0, 10.0, 12.0, 14.0, 18.0, 27.0, 21.0, 32.0, 30.0, 31.0, 36.0, 47.0, 54.0, 49.0, 58.0, 53.0, 55.0, 51.0, 50.0, 33.0, 39.0, 38.0, 38.0, 35.0, 27.0, 21.0, 22.0, 18.0, 13.0, 12.0, 10.0, 12.0, 8.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34968361258506775, -0.3370632529258728, -0.32444289326667786, -0.3118225336074829, -0.29920220375061035, -0.2865818440914154, -0.27396148443222046, -0.2613411247730255, -0.24872078001499176, -0.23610042035579681, -0.22348007559776306, -0.21085971593856812, -0.19823935627937317, -0.18561901152133942, -0.17299865186214447, -0.16037830710411072, -0.14775794744491577, -0.13513758778572083, -0.12251724302768707, -0.10989688336849213, -0.09727653115987778, -0.08465617895126343, -0.07203581929206848, -0.05941546708345413, -0.04679511487483978, -0.03417476266622543, -0.021554406732320786, -0.008934050798416138, 0.0036863014101982117, 0.01630665361881256, 0.028927013278007507, 0.04154736548662186, 0.05416768789291382, 0.06678804010152817, 0.07940839231014252, 0.09202875196933746, 0.10464910417795181, 0.11726945638656616, 0.1298898160457611, 0.14251017570495605, 0.1551305204629898, 0.16775088012218475, 0.1803712248802185, 0.19299158453941345, 0.2056119441986084, 0.21823228895664215, 0.2308526486158371, 0.24347299337387085, 0.2560933530330658, 0.26871371269226074, 0.2813340723514557, 0.29395443201065063, 0.3065747618675232, 0.31919512152671814, 0.3318154811859131, 0.34443584084510803, 0.357056200504303, 0.3696765601634979, 0.38229691982269287, 0.39491724967956543, 0.4075376093387604, 0.4201579689979553, 0.43277832865715027, 0.4453986883163452, 0.4580190181732178]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 10.0, 27.0, 30.0, 56.0, 74.0, 108.0, 142.0, 213.0, 366.0, 548.0, 867.0, 1369.0, 2179.0, 3568.0, 5921.0, 9750.0, 16908.0, 29429.0, 52745.0, 95291.0, 165267.0, 225974.0, 184888.0, 109434.0, 61255.0, 33957.0, 19297.0, 11254.0, 6625.0, 4170.0, 2554.0, 1551.0, 954.0, 606.0, 393.0, 298.0, 136.0, 110.0, 82.0, 51.0, 32.0, 19.0, 16.0, 12.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4931640625, -0.4765167236328125, -0.459869384765625, -0.4432220458984375, -0.42657470703125, -0.4099273681640625, -0.393280029296875, -0.3766326904296875, -0.3599853515625, -0.3433380126953125, -0.326690673828125, -0.3100433349609375, -0.29339599609375, -0.2767486572265625, -0.260101318359375, -0.2434539794921875, -0.226806640625, -0.2101593017578125, -0.193511962890625, -0.1768646240234375, -0.16021728515625, -0.1435699462890625, -0.126922607421875, -0.1102752685546875, -0.0936279296875, -0.0769805908203125, -0.060333251953125, -0.0436859130859375, -0.02703857421875, -0.0103912353515625, 0.006256103515625, 0.0229034423828125, 0.03955078125, 0.0561981201171875, 0.072845458984375, 0.0894927978515625, 0.10614013671875, 0.1227874755859375, 0.139434814453125, 0.1560821533203125, 0.1727294921875, 0.1893768310546875, 0.206024169921875, 0.2226715087890625, 0.23931884765625, 0.2559661865234375, 0.272613525390625, 0.2892608642578125, 0.305908203125, 0.3225555419921875, 0.339202880859375, 0.3558502197265625, 0.37249755859375, 0.3891448974609375, 0.405792236328125, 0.4224395751953125, 0.4390869140625, 0.4557342529296875, 0.472381591796875, 0.4890289306640625, 0.50567626953125, 0.5223236083984375, 0.538970947265625, 0.5556182861328125, 0.572265625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 5.0, 6.0, 11.0, 7.0, 10.0, 18.0, 8.0, 20.0, 36.0, 26.0, 31.0, 42.0, 36.0, 46.0, 48.0, 52.0, 52.0, 50.0, 43.0, 53.0, 43.0, 43.0, 45.0, 39.0, 33.0, 28.0, 18.0, 38.0, 25.0, 17.0, 22.0, 12.0, 13.0, 6.0, 7.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48779296875, -0.4709320068359375, -0.454071044921875, -0.4372100830078125, -0.42034912109375, -0.4034881591796875, -0.386627197265625, -0.3697662353515625, -0.3529052734375, -0.3360443115234375, -0.319183349609375, -0.3023223876953125, -0.28546142578125, -0.2686004638671875, -0.251739501953125, -0.2348785400390625, -0.218017578125, -0.2011566162109375, -0.184295654296875, -0.1674346923828125, -0.15057373046875, -0.1337127685546875, -0.116851806640625, -0.0999908447265625, -0.0831298828125, -0.0662689208984375, -0.049407958984375, -0.0325469970703125, -0.01568603515625, 0.0011749267578125, 0.018035888671875, 0.0348968505859375, 0.0517578125, 0.0686187744140625, 0.085479736328125, 0.1023406982421875, 0.11920166015625, 0.1360626220703125, 0.152923583984375, 0.1697845458984375, 0.1866455078125, 0.2035064697265625, 0.220367431640625, 0.2372283935546875, 0.25408935546875, 0.2709503173828125, 0.287811279296875, 0.3046722412109375, 0.321533203125, 0.3383941650390625, 0.355255126953125, 0.3721160888671875, 0.38897705078125, 0.4058380126953125, 0.422698974609375, 0.4395599365234375, 0.4564208984375, 0.4732818603515625, 0.490142822265625, 0.5070037841796875, 0.52386474609375, 0.5407257080078125, 0.557586669921875, 0.5744476318359375, 0.59130859375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 9.0, 6.0, 8.0, 7.0, 8.0, 15.0, 17.0, 18.0, 25.0, 31.0, 34.0, 34.0, 42.0, 63.0, 72.0, 187.0, 1753.0, 85793.0, 932281.0, 26850.0, 808.0, 146.0, 70.0, 49.0, 32.0, 32.0, 27.0, 22.0, 27.0, 18.0, 18.0, 12.0, 11.0, 6.0, 4.0, 6.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.787109375, -3.658172607421875, -3.52923583984375, -3.400299072265625, -3.2713623046875, -3.142425537109375, -3.01348876953125, -2.884552001953125, -2.755615234375, -2.626678466796875, -2.49774169921875, -2.368804931640625, -2.2398681640625, -2.110931396484375, -1.98199462890625, -1.853057861328125, -1.72412109375, -1.595184326171875, -1.46624755859375, -1.337310791015625, -1.2083740234375, -1.079437255859375, -0.95050048828125, -0.821563720703125, -0.692626953125, -0.563690185546875, -0.43475341796875, -0.305816650390625, -0.1768798828125, -0.047943115234375, 0.08099365234375, 0.209930419921875, 0.3388671875, 0.467803955078125, 0.59674072265625, 0.725677490234375, 0.8546142578125, 0.983551025390625, 1.11248779296875, 1.241424560546875, 1.370361328125, 1.499298095703125, 1.62823486328125, 1.757171630859375, 1.8861083984375, 2.015045166015625, 2.14398193359375, 2.272918701171875, 2.40185546875, 2.530792236328125, 2.65972900390625, 2.788665771484375, 2.9176025390625, 3.046539306640625, 3.17547607421875, 3.304412841796875, 3.433349609375, 3.562286376953125, 3.69122314453125, 3.820159912109375, 3.9490966796875, 4.078033447265625, 4.20697021484375, 4.335906982421875, 4.46484375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 7.0, 8.0, 7.0, 9.0, 6.0, 14.0, 23.0, 27.0, 16.0, 32.0, 38.0, 25.0, 47.0, 48.0, 33.0, 44.0, 52.0, 47.0, 67.0, 50.0, 39.0, 46.0, 53.0, 34.0, 45.0, 24.0, 25.0, 27.0, 18.0, 19.0, 18.0, 10.0, 12.0, 4.0, 5.0, 6.0, 2.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.55615234375, -0.5376968383789062, -0.5192413330078125, -0.5007858276367188, -0.482330322265625, -0.46387481689453125, -0.4454193115234375, -0.42696380615234375, -0.40850830078125, -0.39005279541015625, -0.3715972900390625, -0.35314178466796875, -0.334686279296875, -0.31623077392578125, -0.2977752685546875, -0.27931976318359375, -0.2608642578125, -0.24240875244140625, -0.2239532470703125, -0.20549774169921875, -0.187042236328125, -0.16858673095703125, -0.1501312255859375, -0.13167572021484375, -0.11322021484375, -0.09476470947265625, -0.0763092041015625, -0.05785369873046875, -0.039398193359375, -0.02094268798828125, -0.0024871826171875, 0.01596832275390625, 0.034423828125, 0.05287933349609375, 0.0713348388671875, 0.08979034423828125, 0.108245849609375, 0.12670135498046875, 0.1451568603515625, 0.16361236572265625, 0.18206787109375, 0.20052337646484375, 0.2189788818359375, 0.23743438720703125, 0.255889892578125, 0.27434539794921875, 0.2928009033203125, 0.31125640869140625, 0.3297119140625, 0.34816741943359375, 0.3666229248046875, 0.38507843017578125, 0.403533935546875, 0.42198944091796875, 0.4404449462890625, 0.45890045166015625, 0.47735595703125, 0.49581146240234375, 0.5142669677734375, 0.5327224731445312, 0.551177978515625, 0.5696334838867188, 0.5880889892578125, 0.6065444946289062, 0.625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 5.0, 5.0, 10.0, 16.0, 23.0, 25.0, 26.0, 35.0, 60.0, 82.0, 105.0, 154.0, 241.0, 356.0, 578.0, 891.0, 1754.0, 3087.0, 6390.0, 14564.0, 43114.0, 296232.0, 596005.0, 52737.0, 16751.0, 7083.0, 3458.0, 1913.0, 1033.0, 600.0, 398.0, 242.0, 148.0, 133.0, 86.0, 46.0, 42.0, 36.0, 29.0, 9.0, 13.0, 9.0, 11.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2587890625, -0.2507209777832031, -0.24265289306640625, -0.23458480834960938, -0.2265167236328125, -0.21844863891601562, -0.21038055419921875, -0.20231246948242188, -0.194244384765625, -0.18617630004882812, -0.17810821533203125, -0.17004013061523438, -0.1619720458984375, -0.15390396118164062, -0.14583587646484375, -0.13776779174804688, -0.12969970703125, -0.12163162231445312, -0.11356353759765625, -0.10549545288085938, -0.0974273681640625, -0.08935928344726562, -0.08129119873046875, -0.07322311401367188, -0.065155029296875, -0.057086944580078125, -0.04901885986328125, -0.040950775146484375, -0.0328826904296875, -0.024814605712890625, -0.01674652099609375, -0.008678436279296875, -0.0006103515625, 0.007457733154296875, 0.01552581787109375, 0.023593902587890625, 0.0316619873046875, 0.039730072021484375, 0.04779815673828125, 0.055866241455078125, 0.063934326171875, 0.07200241088867188, 0.08007049560546875, 0.08813858032226562, 0.0962066650390625, 0.10427474975585938, 0.11234283447265625, 0.12041091918945312, 0.12847900390625, 0.13654708862304688, 0.14461517333984375, 0.15268325805664062, 0.1607513427734375, 0.16881942749023438, 0.17688751220703125, 0.18495559692382812, 0.193023681640625, 0.20109176635742188, 0.20915985107421875, 0.21722793579101562, 0.2252960205078125, 0.23336410522460938, 0.24143218994140625, 0.24950027465820312, 0.257568359375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 12.0, 11.0, 22.0, 48.0, 92.0, 195.0, 282.0, 160.0, 61.0, 35.0, 20.0, 15.0, 7.0, 6.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.218650817871094e-05, -3.1159259378910065e-05, -3.0132010579109192e-05, -2.910476177930832e-05, -2.8077512979507446e-05, -2.7050264179706573e-05, -2.60230153799057e-05, -2.4995766580104828e-05, -2.3968517780303955e-05, -2.2941268980503082e-05, -2.191402018070221e-05, -2.0886771380901337e-05, -1.9859522581100464e-05, -1.883227378129959e-05, -1.7805024981498718e-05, -1.6777776181697845e-05, -1.5750527381896973e-05, -1.47232785820961e-05, -1.3696029782295227e-05, -1.2668780982494354e-05, -1.1641532182693481e-05, -1.0614283382892609e-05, -9.587034583091736e-06, -8.559785783290863e-06, -7.53253698348999e-06, -6.5052881836891174e-06, -5.478039383888245e-06, -4.450790584087372e-06, -3.423541784286499e-06, -2.3962929844856262e-06, -1.3690441846847534e-06, -3.417953848838806e-07, 6.854534149169922e-07, 1.712702214717865e-06, 2.739951014518738e-06, 3.7671998143196106e-06, 4.794448614120483e-06, 5.821697413921356e-06, 6.848946213722229e-06, 7.876195013523102e-06, 8.903443813323975e-06, 9.930692613124847e-06, 1.095794141292572e-05, 1.1985190212726593e-05, 1.3012439012527466e-05, 1.4039687812328339e-05, 1.5066936612129211e-05, 1.6094185411930084e-05, 1.7121434211730957e-05, 1.814868301153183e-05, 1.9175931811332703e-05, 2.0203180611133575e-05, 2.1230429410934448e-05, 2.225767821073532e-05, 2.3284927010536194e-05, 2.4312175810337067e-05, 2.533942461013794e-05, 2.6366673409938812e-05, 2.7393922209739685e-05, 2.8421171009540558e-05, 2.944841980934143e-05, 3.0475668609142303e-05, 3.1502917408943176e-05, 3.253016620874405e-05, 3.355741500854492e-05]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 18.0, 15.0, 35.0, 74.0, 207.0, 2245.0, 1000800.0, 44132.0, 768.0, 118.0, 44.0, 25.0, 17.0, 10.0, 8.0, 6.0, 2.0, 2.0, 3.0, 8.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3681640625, -1.3151702880859375, -1.262176513671875, -1.2091827392578125, -1.15618896484375, -1.1031951904296875, -1.050201416015625, -0.9972076416015625, -0.9442138671875, -0.8912200927734375, -0.838226318359375, -0.7852325439453125, -0.73223876953125, -0.6792449951171875, -0.626251220703125, -0.5732574462890625, -0.520263671875, -0.4672698974609375, -0.414276123046875, -0.3612823486328125, -0.30828857421875, -0.2552947998046875, -0.202301025390625, -0.1493072509765625, -0.0963134765625, -0.0433197021484375, 0.009674072265625, 0.0626678466796875, 0.11566162109375, 0.1686553955078125, 0.221649169921875, 0.2746429443359375, 0.32763671875, 0.3806304931640625, 0.433624267578125, 0.4866180419921875, 0.53961181640625, 0.5926055908203125, 0.645599365234375, 0.6985931396484375, 0.7515869140625, 0.8045806884765625, 0.857574462890625, 0.9105682373046875, 0.96356201171875, 1.0165557861328125, 1.069549560546875, 1.1225433349609375, 1.175537109375, 1.2285308837890625, 1.281524658203125, 1.3345184326171875, 1.38751220703125, 1.4405059814453125, 1.493499755859375, 1.5464935302734375, 1.5994873046875, 1.6524810791015625, 1.705474853515625, 1.7584686279296875, 1.81146240234375, 1.8644561767578125, 1.917449951171875, 1.9704437255859375, 2.0234375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 11.0, 17.0, 16.0, 32.0, 46.0, 68.0, 150.0, 294.0, 130.0, 82.0, 52.0, 27.0, 15.0, 14.0, 9.0, 7.0, 6.0, 1.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2034912109375, -0.1954975128173828, -0.18750381469726562, -0.17951011657714844, -0.17151641845703125, -0.16352272033691406, -0.15552902221679688, -0.1475353240966797, -0.1395416259765625, -0.1315479278564453, -0.12355422973632812, -0.11556053161621094, -0.10756683349609375, -0.09957313537597656, -0.09157943725585938, -0.08358573913574219, -0.075592041015625, -0.06759834289550781, -0.059604644775390625, -0.05161094665527344, -0.04361724853515625, -0.03562355041503906, -0.027629852294921875, -0.019636154174804688, -0.0116424560546875, -0.0036487579345703125, 0.004344940185546875, 0.012338638305664062, 0.02033233642578125, 0.028326034545898438, 0.036319732666015625, 0.04431343078613281, 0.05230712890625, 0.06030082702636719, 0.06829452514648438, 0.07628822326660156, 0.08428192138671875, 0.09227561950683594, 0.10026931762695312, 0.10826301574707031, 0.1162567138671875, 0.12425041198730469, 0.13224411010742188, 0.14023780822753906, 0.14823150634765625, 0.15622520446777344, 0.16421890258789062, 0.1722126007080078, 0.180206298828125, 0.1881999969482422, 0.19619369506835938, 0.20418739318847656, 0.21218109130859375, 0.22017478942871094, 0.22816848754882812, 0.2361621856689453, 0.2441558837890625, 0.2521495819091797, 0.2601432800292969, 0.26813697814941406, 0.27613067626953125, 0.28412437438964844, 0.2921180725097656, 0.3001117706298828, 0.30810546875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 58.0, 383.0, 456.0, 87.0, 18.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0021957159042358, -0.9312325716018677, -0.8602694869041443, -0.7893063426017761, -0.7183432579040527, -0.6473801136016846, -0.5764169692993164, -0.5054538249969482, -0.43449074029922485, -0.3635276257991791, -0.2925645112991333, -0.22160136699676514, -0.15063825249671936, -0.07967513799667358, -0.00871199369430542, 0.062251120805740356, 0.13321423530578613, 0.2041773498058319, 0.2751404643058777, 0.34610360860824585, 0.4170667231082916, 0.4880298376083374, 0.5589929819107056, 0.6299561262130737, 0.7009192109107971, 0.7718823552131653, 0.8428454399108887, 0.9138085842132568, 0.984771728515625, 1.0557348728179932, 1.1266980171203613, 1.19766104221344, 1.2686240673065186, 1.3395872116088867, 1.4105503559112549, 1.481513500213623, 1.5524765253067017, 1.6234396696090698, 1.694402813911438, 1.7653659582138062, 1.8363289833068848, 1.907292127609253, 1.978255271911621, 2.0492184162139893, 2.1201815605163574, 2.1911444664001465, 2.2621078491210938, 2.333070755004883, 2.40403413772583, 2.4749972820281982, 2.5459604263305664, 2.6169235706329346, 2.6878867149353027, 2.758849620819092, 2.829813003540039, 2.900775909423828, 2.9717390537261963, 3.0427021980285645, 3.1136653423309326, 3.184628486633301, 3.255591630935669, 3.326554775238037, 3.397517681121826, 3.4684808254241943, 3.5394439697265625]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 7.0, 5.0, 7.0, 6.0, 8.0, 10.0, 20.0, 19.0, 21.0, 31.0, 24.0, 33.0, 41.0, 42.0, 42.0, 51.0, 40.0, 55.0, 41.0, 49.0, 42.0, 47.0, 40.0, 52.0, 36.0, 32.0, 27.0, 23.0, 24.0, 30.0, 17.0, 20.0, 16.0, 7.0, 4.0, 12.0, 9.0, 3.0, 6.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6164748668670654, -0.5962536334991455, -0.5760324001312256, -0.5558111667633057, -0.5355899333953857, -0.515368640422821, -0.4951474070549011, -0.4749261736869812, -0.4547049403190613, -0.43448370695114136, -0.41426247358322144, -0.3940412104129791, -0.3738199770450592, -0.3535987436771393, -0.333377480506897, -0.31315624713897705, -0.29293501377105713, -0.2727137804031372, -0.2524925470352173, -0.23227128386497498, -0.21205005049705505, -0.19182881712913513, -0.17160756886005402, -0.1513863205909729, -0.13116508722305298, -0.11094384640455246, -0.09072260558605194, -0.07050136476755142, -0.0502801239490509, -0.030058883130550385, -0.009837642312049866, 0.01038360595703125, 0.030604898929595947, 0.050826139748096466, 0.07104738056659698, 0.0912686213850975, 0.11148986220359802, 0.13171109557151794, 0.15193234384059906, 0.17215359210968018, 0.1923748254776001, 0.21259605884552002, 0.23281730711460114, 0.25303855538368225, 0.2732597887516022, 0.2934810221195221, 0.3137022852897644, 0.3339235186576843, 0.35414475202560425, 0.37436598539352417, 0.3945872187614441, 0.4148084819316864, 0.4350297152996063, 0.45525094866752625, 0.47547221183776855, 0.4956934452056885, 0.5159146785736084, 0.5361359119415283, 0.5563571453094482, 0.5765783786773682, 0.5967996120452881, 0.6170209050178528, 0.6372421383857727, 0.6574633717536926, 0.6776846051216125]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 7.0, 10.0, 23.0, 20.0, 31.0, 50.0, 46.0, 83.0, 121.0, 151.0, 227.0, 355.0, 529.0, 789.0, 1336.0, 2227.0, 4174.0, 9192.0, 40099.0, 1287922.0, 2745184.0, 76476.0, 12610.0, 5313.0, 2729.0, 1508.0, 991.0, 617.0, 407.0, 284.0, 221.0, 137.0, 109.0, 75.0, 55.0, 45.0, 35.0, 28.0, 17.0, 14.0, 8.0, 7.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.58837890625, -0.5688629150390625, -0.549346923828125, -0.5298309326171875, -0.51031494140625, -0.4907989501953125, -0.471282958984375, -0.4517669677734375, -0.4322509765625, -0.4127349853515625, -0.393218994140625, -0.3737030029296875, -0.35418701171875, -0.3346710205078125, -0.315155029296875, -0.2956390380859375, -0.276123046875, -0.2566070556640625, -0.237091064453125, -0.2175750732421875, -0.19805908203125, -0.1785430908203125, -0.159027099609375, -0.1395111083984375, -0.1199951171875, -0.1004791259765625, -0.080963134765625, -0.0614471435546875, -0.04193115234375, -0.0224151611328125, -0.002899169921875, 0.0166168212890625, 0.0361328125, 0.0556488037109375, 0.075164794921875, 0.0946807861328125, 0.11419677734375, 0.1337127685546875, 0.153228759765625, 0.1727447509765625, 0.1922607421875, 0.2117767333984375, 0.231292724609375, 0.2508087158203125, 0.27032470703125, 0.2898406982421875, 0.309356689453125, 0.3288726806640625, 0.348388671875, 0.3679046630859375, 0.387420654296875, 0.4069366455078125, 0.42645263671875, 0.4459686279296875, 0.465484619140625, 0.4850006103515625, 0.5045166015625, 0.5240325927734375, 0.543548583984375, 0.5630645751953125, 0.58258056640625, 0.6020965576171875, 0.621612548828125, 0.6411285400390625, 0.66064453125]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 12.0, 4.0, 10.0, 13.0, 26.0, 16.0, 21.0, 28.0, 39.0, 32.0, 39.0, 47.0, 41.0, 40.0, 45.0, 46.0, 54.0, 57.0, 42.0, 41.0, 36.0, 49.0, 26.0, 33.0, 24.0, 31.0, 30.0, 19.0, 15.0, 20.0, 17.0, 7.0, 6.0, 8.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2178955078125, -0.21102142333984375, -0.2041473388671875, -0.19727325439453125, -0.190399169921875, -0.18352508544921875, -0.1766510009765625, -0.16977691650390625, -0.16290283203125, -0.15602874755859375, -0.1491546630859375, -0.14228057861328125, -0.135406494140625, -0.12853240966796875, -0.1216583251953125, -0.11478424072265625, -0.10791015625, -0.10103607177734375, -0.0941619873046875, -0.08728790283203125, -0.080413818359375, -0.07353973388671875, -0.0666656494140625, -0.05979156494140625, -0.05291748046875, -0.04604339599609375, -0.0391693115234375, -0.03229522705078125, -0.025421142578125, -0.01854705810546875, -0.0116729736328125, -0.00479888916015625, 0.0020751953125, 0.00894927978515625, 0.0158233642578125, 0.02269744873046875, 0.029571533203125, 0.03644561767578125, 0.0433197021484375, 0.05019378662109375, 0.05706787109375, 0.06394195556640625, 0.0708160400390625, 0.07769012451171875, 0.084564208984375, 0.09143829345703125, 0.0983123779296875, 0.10518646240234375, 0.112060546875, 0.11893463134765625, 0.1258087158203125, 0.13268280029296875, 0.139556884765625, 0.14643096923828125, 0.1533050537109375, 0.16017913818359375, 0.16705322265625, 0.17392730712890625, 0.1808013916015625, 0.18767547607421875, 0.194549560546875, 0.20142364501953125, 0.2082977294921875, 0.21517181396484375, 0.2220458984375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 10.0, 25.0, 40.0, 85.0, 193.0, 671.0, 7206.0, 4175786.0, 9123.0, 731.0, 178.0, 85.0, 48.0, 25.0, 10.0, 16.0, 12.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.181640625, -2.069915771484375, -1.95819091796875, -1.846466064453125, -1.7347412109375, -1.623016357421875, -1.51129150390625, -1.399566650390625, -1.287841796875, -1.176116943359375, -1.06439208984375, -0.952667236328125, -0.8409423828125, -0.729217529296875, -0.61749267578125, -0.505767822265625, -0.39404296875, -0.282318115234375, -0.17059326171875, -0.058868408203125, 0.0528564453125, 0.164581298828125, 0.27630615234375, 0.388031005859375, 0.499755859375, 0.611480712890625, 0.72320556640625, 0.834930419921875, 0.9466552734375, 1.058380126953125, 1.17010498046875, 1.281829833984375, 1.3935546875, 1.505279541015625, 1.61700439453125, 1.728729248046875, 1.8404541015625, 1.952178955078125, 2.06390380859375, 2.175628662109375, 2.287353515625, 2.399078369140625, 2.51080322265625, 2.622528076171875, 2.7342529296875, 2.845977783203125, 2.95770263671875, 3.069427490234375, 3.18115234375, 3.292877197265625, 3.40460205078125, 3.516326904296875, 3.6280517578125, 3.739776611328125, 3.85150146484375, 3.963226318359375, 4.074951171875, 4.186676025390625, 4.29840087890625, 4.410125732421875, 4.5218505859375, 4.633575439453125, 4.74530029296875, 4.857025146484375, 4.96875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 5.0, 7.0, 5.0, 6.0, 12.0, 24.0, 26.0, 67.0, 123.0, 313.0, 722.0, 1128.0, 877.0, 385.0, 164.0, 65.0, 53.0, 29.0, 16.0, 23.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10748291015625, -0.10251331329345703, -0.09754371643066406, -0.0925741195678711, -0.08760452270507812, -0.08263492584228516, -0.07766532897949219, -0.07269573211669922, -0.06772613525390625, -0.06275653839111328, -0.05778694152832031, -0.052817344665527344, -0.047847747802734375, -0.042878150939941406, -0.03790855407714844, -0.03293895721435547, -0.0279693603515625, -0.02299976348876953, -0.018030166625976562, -0.013060569763183594, -0.008090972900390625, -0.0031213760375976562, 0.0018482208251953125, 0.006817817687988281, 0.01178741455078125, 0.01675701141357422, 0.021726608276367188, 0.026696205139160156, 0.031665802001953125, 0.036635398864746094, 0.04160499572753906, 0.04657459259033203, 0.051544189453125, 0.05651378631591797, 0.06148338317871094, 0.0664529800415039, 0.07142257690429688, 0.07639217376708984, 0.08136177062988281, 0.08633136749267578, 0.09130096435546875, 0.09627056121826172, 0.10124015808105469, 0.10620975494384766, 0.11117935180664062, 0.1161489486694336, 0.12111854553222656, 0.12608814239501953, 0.1310577392578125, 0.13602733612060547, 0.14099693298339844, 0.1459665298461914, 0.15093612670898438, 0.15590572357177734, 0.1608753204345703, 0.16584491729736328, 0.17081451416015625, 0.17578411102294922, 0.1807537078857422, 0.18572330474853516, 0.19069290161132812, 0.1956624984741211, 0.20063209533691406, 0.20560169219970703, 0.2105712890625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 4.0, 7.0, 18.0, 26.0, 35.0, 48.0, 89.0, 122.0, 141.0, 132.0, 119.0, 76.0, 62.0, 35.0, 23.0, 12.0, 15.0, 11.0, 5.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3934672474861145, -0.38337281346321106, -0.37327840924263, -0.36318397521972656, -0.3530895411968231, -0.3429951071739197, -0.3329007029533386, -0.3228062689304352, -0.31271183490753174, -0.3026174008846283, -0.29252299666404724, -0.2824285626411438, -0.27233412861824036, -0.2622396945953369, -0.25214529037475586, -0.24205085635185242, -0.23195645213127136, -0.2218620330095291, -0.21176759898662567, -0.20167317986488342, -0.19157874584197998, -0.18148432672023773, -0.17138990759849548, -0.16129547357559204, -0.1512010544538498, -0.14110663533210754, -0.1310122013092041, -0.12091778218746185, -0.11082335561513901, -0.10072892904281616, -0.09063450992107391, -0.08054008334875107, -0.07044562697410583, -0.06035120040178299, -0.05025677755475044, -0.040162354707717896, -0.03006792813539505, -0.019973501563072205, -0.009879078716039658, 0.0002153441309928894, 0.010309770703315735, 0.02040419541299343, 0.030498620122671127, 0.040593042969703674, 0.05068746954202652, 0.060781896114349365, 0.07087631523609161, 0.08097074180841446, 0.0910651683807373, 0.10115959495306015, 0.111254021525383, 0.12134844064712524, 0.1314428746700287, 0.14153729379177094, 0.15163171291351318, 0.16172614693641663, 0.17182056605815887, 0.18191498517990112, 0.19200941920280457, 0.20210383832454681, 0.21219825744628906, 0.2222926914691925, 0.23238711059093475, 0.242481529712677, 0.25257596373558044]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 4.0, 7.0, 14.0, 14.0, 12.0, 21.0, 32.0, 32.0, 26.0, 41.0, 33.0, 45.0, 45.0, 40.0, 40.0, 43.0, 46.0, 73.0, 40.0, 33.0, 29.0, 37.0, 38.0, 41.0, 28.0, 28.0, 19.0, 23.0, 20.0, 17.0, 15.0, 8.0, 7.0, 7.0, 4.0, 8.0, 4.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2139837145805359, -0.20708398520946503, -0.20018425583839417, -0.1932845264673233, -0.18638479709625244, -0.17948505282402039, -0.17258532345294952, -0.16568559408187866, -0.1587858647108078, -0.15188613533973694, -0.14498640596866608, -0.13808667659759521, -0.13118693232536316, -0.1242872104048729, -0.11738747358322144, -0.11048774421215057, -0.10358801484107971, -0.09668828547000885, -0.08978855609893799, -0.08288881927728653, -0.07598908990621567, -0.0690893605351448, -0.062189627438783646, -0.055289894342422485, -0.048390164971351624, -0.04149043560028076, -0.0345907025039196, -0.02769097127020359, -0.02079124003648758, -0.013891510665416718, -0.006991777569055557, -9.204447269439697e-05, 0.006807669997215271, 0.013707401230931282, 0.020607132464647293, 0.027506863698363304, 0.034406594932079315, 0.04130632430315018, 0.04820605739951134, 0.0551057904958725, 0.06200551986694336, 0.06890524923801422, 0.07580497860908508, 0.08270471543073654, 0.0896044448018074, 0.09650417417287827, 0.10340391099452972, 0.11030364036560059, 0.11720336973667145, 0.12410309910774231, 0.13100282847881317, 0.13790255784988403, 0.1448023021221161, 0.15170201659202576, 0.1586017608642578, 0.16550149023532867, 0.17240121960639954, 0.1793009489774704, 0.18620067834854126, 0.19310040771961212, 0.20000013709068298, 0.20689988136291504, 0.2137996107339859, 0.22069934010505676, 0.22759906947612762]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 8.0, 11.0, 14.0, 29.0, 34.0, 46.0, 69.0, 113.0, 154.0, 222.0, 337.0, 527.0, 771.0, 1098.0, 1776.0, 2715.0, 4427.0, 7046.0, 11096.0, 17954.0, 29072.0, 49417.0, 86890.0, 158148.0, 250822.0, 182607.0, 99767.0, 56261.0, 32684.0, 20090.0, 12672.0, 7768.0, 4995.0, 3203.0, 1917.0, 1279.0, 823.0, 553.0, 374.0, 249.0, 168.0, 121.0, 89.0, 47.0, 36.0, 25.0, 17.0, 7.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11981201171875, -0.11589908599853516, -0.11198616027832031, -0.10807323455810547, -0.10416030883789062, -0.10024738311767578, -0.09633445739746094, -0.0924215316772461, -0.08850860595703125, -0.0845956802368164, -0.08068275451660156, -0.07676982879638672, -0.07285690307617188, -0.06894397735595703, -0.06503105163574219, -0.061118125915527344, -0.0572052001953125, -0.053292274475097656, -0.04937934875488281, -0.04546642303466797, -0.041553497314453125, -0.03764057159423828, -0.03372764587402344, -0.029814720153808594, -0.02590179443359375, -0.021988868713378906, -0.018075942993164062, -0.014163017272949219, -0.010250091552734375, -0.006337165832519531, -0.0024242401123046875, 0.0014886856079101562, 0.005401611328125, 0.009314537048339844, 0.013227462768554688, 0.01714038848876953, 0.021053314208984375, 0.02496623992919922, 0.028879165649414062, 0.032792091369628906, 0.03670501708984375, 0.040617942810058594, 0.04453086853027344, 0.04844379425048828, 0.052356719970703125, 0.05626964569091797, 0.06018257141113281, 0.06409549713134766, 0.0680084228515625, 0.07192134857177734, 0.07583427429199219, 0.07974720001220703, 0.08366012573242188, 0.08757305145263672, 0.09148597717285156, 0.0953989028930664, 0.09931182861328125, 0.1032247543334961, 0.10713768005371094, 0.11105060577392578, 0.11496353149414062, 0.11887645721435547, 0.12278938293457031, 0.12670230865478516, 0.130615234375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 9.0, 5.0, 10.0, 15.0, 14.0, 21.0, 21.0, 28.0, 26.0, 30.0, 37.0, 40.0, 32.0, 48.0, 50.0, 41.0, 40.0, 50.0, 47.0, 39.0, 42.0, 28.0, 38.0, 43.0, 26.0, 33.0, 30.0, 17.0, 18.0, 19.0, 12.0, 23.0, 8.0, 9.0, 8.0, 9.0, 2.0, 5.0, 6.0, 7.0, 1.0, 3.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.186767578125, -0.181121826171875, -0.17547607421875, -0.169830322265625, -0.1641845703125, -0.158538818359375, -0.15289306640625, -0.147247314453125, -0.1416015625, -0.135955810546875, -0.13031005859375, -0.124664306640625, -0.1190185546875, -0.113372802734375, -0.10772705078125, -0.102081298828125, -0.096435546875, -0.090789794921875, -0.08514404296875, -0.079498291015625, -0.0738525390625, -0.068206787109375, -0.06256103515625, -0.056915283203125, -0.05126953125, -0.045623779296875, -0.03997802734375, -0.034332275390625, -0.0286865234375, -0.023040771484375, -0.01739501953125, -0.011749267578125, -0.006103515625, -0.000457763671875, 0.00518798828125, 0.010833740234375, 0.0164794921875, 0.022125244140625, 0.02777099609375, 0.033416748046875, 0.0390625, 0.044708251953125, 0.05035400390625, 0.055999755859375, 0.0616455078125, 0.067291259765625, 0.07293701171875, 0.078582763671875, 0.084228515625, 0.089874267578125, 0.09552001953125, 0.101165771484375, 0.1068115234375, 0.112457275390625, 0.11810302734375, 0.123748779296875, 0.12939453125, 0.135040283203125, 0.14068603515625, 0.146331787109375, 0.1519775390625, 0.157623291015625, 0.16326904296875, 0.168914794921875, 0.174560546875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 16.0, 13.0, 32.0, 40.0, 60.0, 92.0, 122.0, 157.0, 265.0, 346.0, 572.0, 810.0, 1232.0, 1877.0, 2960.0, 4769.0, 7527.0, 12152.0, 20387.0, 34979.0, 63681.0, 126664.0, 286962.0, 241137.0, 107467.0, 55539.0, 30752.0, 17982.0, 10994.0, 6820.0, 4172.0, 2712.0, 1783.0, 1180.0, 709.0, 492.0, 324.0, 235.0, 173.0, 96.0, 80.0, 59.0, 40.0, 23.0, 27.0, 14.0, 5.0, 14.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1007080078125, -0.0975503921508789, -0.09439277648925781, -0.09123516082763672, -0.08807754516601562, -0.08491992950439453, -0.08176231384277344, -0.07860469818115234, -0.07544708251953125, -0.07228946685791016, -0.06913185119628906, -0.06597423553466797, -0.06281661987304688, -0.05965900421142578, -0.05650138854980469, -0.053343772888183594, -0.0501861572265625, -0.047028541564941406, -0.04387092590332031, -0.04071331024169922, -0.037555694580078125, -0.03439807891845703, -0.031240463256835938, -0.028082847595214844, -0.02492523193359375, -0.021767616271972656, -0.018610000610351562, -0.015452384948730469, -0.012294769287109375, -0.009137153625488281, -0.0059795379638671875, -0.0028219223022460938, 0.000335693359375, 0.0034933090209960938, 0.0066509246826171875, 0.009808540344238281, 0.012966156005859375, 0.01612377166748047, 0.019281387329101562, 0.022439002990722656, 0.02559661865234375, 0.028754234313964844, 0.03191184997558594, 0.03506946563720703, 0.038227081298828125, 0.04138469696044922, 0.04454231262207031, 0.047699928283691406, 0.0508575439453125, 0.054015159606933594, 0.05717277526855469, 0.06033039093017578, 0.06348800659179688, 0.06664562225341797, 0.06980323791503906, 0.07296085357666016, 0.07611846923828125, 0.07927608489990234, 0.08243370056152344, 0.08559131622314453, 0.08874893188476562, 0.09190654754638672, 0.09506416320800781, 0.0982217788696289, 0.10137939453125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 6.0, 2.0, 5.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 8.0, 15.0, 13.0, 8.0, 11.0, 15.0, 18.0, 19.0, 31.0, 32.0, 27.0, 39.0, 33.0, 33.0, 35.0, 36.0, 36.0, 48.0, 31.0, 43.0, 46.0, 38.0, 34.0, 44.0, 41.0, 32.0, 27.0, 30.0, 25.0, 18.0, 26.0, 16.0, 13.0, 9.0, 9.0, 3.0, 4.0, 4.0, 8.0, 8.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1070556640625, -0.10344600677490234, -0.09983634948730469, -0.09622669219970703, -0.09261703491210938, -0.08900737762451172, -0.08539772033691406, -0.0817880630493164, -0.07817840576171875, -0.0745687484741211, -0.07095909118652344, -0.06734943389892578, -0.06373977661132812, -0.06013011932373047, -0.05652046203613281, -0.052910804748535156, -0.0493011474609375, -0.045691490173339844, -0.04208183288574219, -0.03847217559814453, -0.034862518310546875, -0.03125286102294922, -0.027643203735351562, -0.024033546447753906, -0.02042388916015625, -0.016814231872558594, -0.013204574584960938, -0.009594917297363281, -0.005985260009765625, -0.0023756027221679688, 0.0012340545654296875, 0.004843711853027344, 0.008453369140625, 0.012063026428222656, 0.015672683715820312, 0.01928234100341797, 0.022891998291015625, 0.02650165557861328, 0.030111312866210938, 0.033720970153808594, 0.03733062744140625, 0.040940284729003906, 0.04454994201660156, 0.04815959930419922, 0.051769256591796875, 0.05537891387939453, 0.05898857116699219, 0.06259822845458984, 0.0662078857421875, 0.06981754302978516, 0.07342720031738281, 0.07703685760498047, 0.08064651489257812, 0.08425617218017578, 0.08786582946777344, 0.0914754867553711, 0.09508514404296875, 0.0986948013305664, 0.10230445861816406, 0.10591411590576172, 0.10952377319335938, 0.11313343048095703, 0.11674308776855469, 0.12035274505615234, 0.12396240234375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 9.0, 9.0, 11.0, 9.0, 18.0, 17.0, 36.0, 42.0, 67.0, 111.0, 147.0, 235.0, 328.0, 493.0, 782.0, 1152.0, 1945.0, 3263.0, 5863.0, 11231.0, 26234.0, 74274.0, 370239.0, 418188.0, 79342.0, 27630.0, 11749.0, 5979.0, 3527.0, 2019.0, 1228.0, 789.0, 505.0, 338.0, 226.0, 165.0, 91.0, 69.0, 54.0, 37.0, 36.0, 9.0, 11.0, 10.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.01020050048828125, -0.009871721267700195, -0.00954294204711914, -0.009214162826538086, -0.008885383605957031, -0.008556604385375977, -0.008227825164794922, -0.007899045944213867, -0.0075702667236328125, -0.007241487503051758, -0.006912708282470703, -0.0065839290618896484, -0.006255149841308594, -0.005926370620727539, -0.005597591400146484, -0.00526881217956543, -0.004940032958984375, -0.00461125373840332, -0.004282474517822266, -0.003953695297241211, -0.0036249160766601562, -0.0032961368560791016, -0.002967357635498047, -0.002638578414916992, -0.0023097991943359375, -0.001981019973754883, -0.0016522407531738281, -0.0013234615325927734, -0.0009946823120117188, -0.0006659030914306641, -0.0003371238708496094, -8.344650268554688e-06, 0.0003204345703125, 0.0006492137908935547, 0.0009779930114746094, 0.001306772232055664, 0.0016355514526367188, 0.0019643306732177734, 0.002293109893798828, 0.002621889114379883, 0.0029506683349609375, 0.003279447555541992, 0.003608226776123047, 0.0039370059967041016, 0.004265785217285156, 0.004594564437866211, 0.004923343658447266, 0.00525212287902832, 0.005580902099609375, 0.00590968132019043, 0.006238460540771484, 0.006567239761352539, 0.006896018981933594, 0.0072247982025146484, 0.007553577423095703, 0.007882356643676758, 0.008211135864257812, 0.008539915084838867, 0.008868694305419922, 0.009197473526000977, 0.009526252746582031, 0.009855031967163086, 0.01018381118774414, 0.010512590408325195, 0.01084136962890625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 4.0, 8.0, 10.0, 8.0, 9.0, 12.0, 11.0, 9.0, 7.0, 13.0, 17.0, 13.0, 44.0, 56.0, 104.0, 148.0, 172.0, 120.0, 60.0, 32.0, 17.0, 11.0, 4.0, 12.0, 10.0, 7.0, 15.0, 11.0, 6.0, 10.0, 8.0, 8.0, 3.0, 4.0, 7.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.68952751159668e-05, -3.553275018930435e-05, -3.417022526264191e-05, -3.280770033597946e-05, -3.1445175409317017e-05, -3.008265048265457e-05, -2.8720125555992126e-05, -2.735760062932968e-05, -2.5995075702667236e-05, -2.463255077600479e-05, -2.3270025849342346e-05, -2.19075009226799e-05, -2.0544975996017456e-05, -1.918245106935501e-05, -1.7819926142692566e-05, -1.645740121603012e-05, -1.5094876289367676e-05, -1.373235136270523e-05, -1.2369826436042786e-05, -1.100730150938034e-05, -9.644776582717896e-06, -8.28225165605545e-06, -6.919726729393005e-06, -5.55720180273056e-06, -4.194676876068115e-06, -2.83215194940567e-06, -1.469627022743225e-06, -1.0710209608078003e-07, 1.255422830581665e-06, 2.61794775724411e-06, 3.980472683906555e-06, 5.342997610569e-06, 6.705522537231445e-06, 8.06804746389389e-06, 9.430572390556335e-06, 1.079309731721878e-05, 1.2155622243881226e-05, 1.351814717054367e-05, 1.4880672097206116e-05, 1.624319702386856e-05, 1.7605721950531006e-05, 1.896824687719345e-05, 2.0330771803855896e-05, 2.169329673051834e-05, 2.3055821657180786e-05, 2.441834658384323e-05, 2.5780871510505676e-05, 2.714339643716812e-05, 2.8505921363830566e-05, 2.986844629049301e-05, 3.1230971217155457e-05, 3.25934961438179e-05, 3.395602107048035e-05, 3.531854599714279e-05, 3.668107092380524e-05, 3.804359585046768e-05, 3.940612077713013e-05, 4.076864570379257e-05, 4.213117063045502e-05, 4.349369555711746e-05, 4.485622048377991e-05, 4.621874541044235e-05, 4.75812703371048e-05, 4.894379526376724e-05, 5.030632019042969e-05]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 6.0, 10.0, 7.0, 8.0, 6.0, 15.0, 17.0, 25.0, 30.0, 35.0, 48.0, 53.0, 67.0, 92.0, 140.0, 346.0, 4735.0, 150521.0, 871725.0, 19032.0, 1036.0, 171.0, 98.0, 72.0, 56.0, 52.0, 37.0, 27.0, 13.0, 17.0, 13.0, 9.0, 10.0, 9.0, 5.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.052459716796875, -0.05083179473876953, -0.04920387268066406, -0.047575950622558594, -0.045948028564453125, -0.044320106506347656, -0.04269218444824219, -0.04106426239013672, -0.03943634033203125, -0.03780841827392578, -0.03618049621582031, -0.034552574157714844, -0.032924652099609375, -0.031296730041503906, -0.029668807983398438, -0.02804088592529297, -0.0264129638671875, -0.02478504180908203, -0.023157119750976562, -0.021529197692871094, -0.019901275634765625, -0.018273353576660156, -0.016645431518554688, -0.015017509460449219, -0.01338958740234375, -0.011761665344238281, -0.010133743286132812, -0.008505821228027344, -0.006877899169921875, -0.005249977111816406, -0.0036220550537109375, -0.0019941329956054688, -0.0003662109375, 0.0012617111206054688, 0.0028896331787109375, 0.004517555236816406, 0.006145477294921875, 0.007773399353027344, 0.009401321411132812, 0.011029243469238281, 0.01265716552734375, 0.014285087585449219, 0.015913009643554688, 0.017540931701660156, 0.019168853759765625, 0.020796775817871094, 0.022424697875976562, 0.02405261993408203, 0.0256805419921875, 0.02730846405029297, 0.028936386108398438, 0.030564308166503906, 0.032192230224609375, 0.033820152282714844, 0.03544807434082031, 0.03707599639892578, 0.03870391845703125, 0.04033184051513672, 0.04195976257324219, 0.043587684631347656, 0.045215606689453125, 0.046843528747558594, 0.04847145080566406, 0.05009937286376953, 0.051727294921875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 7.0, 7.0, 10.0, 7.0, 8.0, 12.0, 9.0, 27.0, 31.0, 32.0, 45.0, 62.0, 71.0, 100.0, 128.0, 109.0, 76.0, 68.0, 36.0, 27.0, 32.0, 17.0, 17.0, 11.0, 8.0, 7.0, 8.0, 3.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0027980804443359375, -0.002712070941925049, -0.00262606143951416, -0.0025400519371032715, -0.002454042434692383, -0.002368032932281494, -0.0022820234298706055, -0.002196013927459717, -0.002110004425048828, -0.0020239949226379395, -0.0019379854202270508, -0.0018519759178161621, -0.0017659664154052734, -0.0016799569129943848, -0.001593947410583496, -0.0015079379081726074, -0.0014219284057617188, -0.00133591890335083, -0.0012499094009399414, -0.0011638998985290527, -0.001077890396118164, -0.0009918808937072754, -0.0009058713912963867, -0.000819861888885498, -0.0007338523864746094, -0.0006478428840637207, -0.000561833381652832, -0.00047582387924194336, -0.0003898143768310547, -0.000303804874420166, -0.00021779537200927734, -0.00013178586959838867, -4.57763671875e-05, 4.023313522338867e-05, 0.00012624263763427734, 0.00021225214004516602, 0.0002982616424560547, 0.00038427114486694336, 0.00047028064727783203, 0.0005562901496887207, 0.0006422996520996094, 0.000728309154510498, 0.0008143186569213867, 0.0009003281593322754, 0.000986337661743164, 0.0010723471641540527, 0.0011583566665649414, 0.00124436616897583, 0.0013303756713867188, 0.0014163851737976074, 0.001502394676208496, 0.0015884041786193848, 0.0016744136810302734, 0.0017604231834411621, 0.0018464326858520508, 0.0019324421882629395, 0.002018451690673828, 0.002104461193084717, 0.0021904706954956055, 0.002276480197906494, 0.002362489700317383, 0.0024484992027282715, 0.00253450870513916, 0.002620518207550049, 0.0027065277099609375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 7.0, 8.0, 12.0, 23.0, 30.0, 59.0, 103.0, 138.0, 182.0, 165.0, 95.0, 60.0, 48.0, 24.0, 18.0, 7.0, 6.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.6070498824119568, -0.5937586426734924, -0.5804674029350281, -0.5671761631965637, -0.5538849234580994, -0.540593683719635, -0.5273024439811707, -0.5140112042427063, -0.5007199645042419, -0.4874287247657776, -0.47413748502731323, -0.4608462452888489, -0.4475550055503845, -0.43426376581192017, -0.4209725260734558, -0.40768128633499146, -0.3943900465965271, -0.38109880685806274, -0.3678075671195984, -0.35451632738113403, -0.3412250876426697, -0.3279338479042053, -0.31464260816574097, -0.3013513684272766, -0.28806012868881226, -0.2747688889503479, -0.26147764921188354, -0.2481864094734192, -0.23489516973495483, -0.22160392999649048, -0.20831269025802612, -0.19502145051956177, -0.1817302405834198, -0.16843900084495544, -0.1551477611064911, -0.14185652136802673, -0.12856528162956238, -0.11527404189109802, -0.10198280215263367, -0.08869156241416931, -0.07540032267570496, -0.0621090829372406, -0.048817843198776245, -0.03552660346031189, -0.022235363721847534, -0.008944123983383179, 0.004347115755081177, 0.017638355493545532, 0.030929595232009888, 0.04422083497047424, 0.0575120747089386, 0.07080331444740295, 0.08409455418586731, 0.09738579392433167, 0.11067703366279602, 0.12396827340126038, 0.13725951313972473, 0.1505507528781891, 0.16384199261665344, 0.1771332323551178, 0.19042447209358215, 0.2037157118320465, 0.21700695157051086, 0.23029819130897522, 0.24358943104743958]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 4.0, 5.0, 6.0, 13.0, 11.0, 16.0, 25.0, 25.0, 29.0, 32.0, 38.0, 35.0, 42.0, 39.0, 49.0, 39.0, 39.0, 48.0, 48.0, 62.0, 37.0, 33.0, 33.0, 37.0, 38.0, 31.0, 29.0, 23.0, 18.0, 22.0, 15.0, 13.0, 16.0, 9.0, 3.0, 6.0, 7.0, 5.0, 5.0, 2.0, 5.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17927950620651245, -0.17354115843772888, -0.1678028106689453, -0.16206446290016174, -0.15632611513137817, -0.1505877673625946, -0.14484941959381104, -0.13911107182502747, -0.1333727240562439, -0.12763437628746033, -0.12189602851867676, -0.11615768074989319, -0.11041933298110962, -0.10468098521232605, -0.09894262999296188, -0.09320428222417831, -0.08746592700481415, -0.08172757923603058, -0.07598923146724701, -0.07025088369846344, -0.06451253592967987, -0.058774184435606, -0.053035832941532135, -0.047297485172748566, -0.041559137403964996, -0.03582078963518143, -0.03008244000375271, -0.02434409037232399, -0.01860574260354042, -0.012867394834756851, -0.007129043340682983, -0.001390695571899414, 0.004347652196884155, 0.0100860008969903, 0.015824349597096443, 0.021562699228525162, 0.02730104699730873, 0.0330393947660923, 0.03877774626016617, 0.04451609402894974, 0.05025444179773331, 0.055992789566516876, 0.061731137335300446, 0.06746949255466461, 0.07320784032344818, 0.07894618809223175, 0.08468453586101532, 0.09042288362979889, 0.09616123139858246, 0.10189957916736603, 0.1076379269361496, 0.11337627470493317, 0.11911462247371674, 0.1248529702425003, 0.13059133291244507, 0.13632968068122864, 0.1420680284500122, 0.14780637621879578, 0.15354472398757935, 0.15928307175636292, 0.16502141952514648, 0.17075976729393005, 0.17649811506271362, 0.1822364628314972, 0.18797481060028076]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 9.0, 11.0, 20.0, 38.0, 51.0, 86.0, 146.0, 248.0, 413.0, 670.0, 1180.0, 2395.0, 4523.0, 9184.0, 18972.0, 40773.0, 91554.0, 209338.0, 319460.0, 192883.0, 84023.0, 37409.0, 17681.0, 8478.0, 4201.0, 2168.0, 1115.0, 619.0, 341.0, 201.0, 132.0, 78.0, 61.0, 39.0, 23.0, 14.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.283447265625, -0.272308349609375, -0.26116943359375, -0.250030517578125, -0.2388916015625, -0.227752685546875, -0.21661376953125, -0.205474853515625, -0.1943359375, -0.183197021484375, -0.17205810546875, -0.160919189453125, -0.1497802734375, -0.138641357421875, -0.12750244140625, -0.116363525390625, -0.105224609375, -0.094085693359375, -0.08294677734375, -0.071807861328125, -0.0606689453125, -0.049530029296875, -0.03839111328125, -0.027252197265625, -0.01611328125, -0.004974365234375, 0.00616455078125, 0.017303466796875, 0.0284423828125, 0.039581298828125, 0.05072021484375, 0.061859130859375, 0.072998046875, 0.084136962890625, 0.09527587890625, 0.106414794921875, 0.1175537109375, 0.128692626953125, 0.13983154296875, 0.150970458984375, 0.162109375, 0.173248291015625, 0.18438720703125, 0.195526123046875, 0.2066650390625, 0.217803955078125, 0.22894287109375, 0.240081787109375, 0.251220703125, 0.262359619140625, 0.27349853515625, 0.284637451171875, 0.2957763671875, 0.306915283203125, 0.31805419921875, 0.329193115234375, 0.34033203125, 0.351470947265625, 0.36260986328125, 0.373748779296875, 0.3848876953125, 0.396026611328125, 0.40716552734375, 0.418304443359375, 0.429443359375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 10.0, 13.0, 6.0, 26.0, 19.0, 12.0, 34.0, 36.0, 27.0, 41.0, 40.0, 43.0, 41.0, 62.0, 60.0, 49.0, 49.0, 38.0, 41.0, 36.0, 38.0, 42.0, 36.0, 34.0, 14.0, 21.0, 16.0, 25.0, 22.0, 11.0, 8.0, 6.0, 6.0, 3.0, 10.0, 2.0, 3.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12225341796875, -0.11863040924072266, -0.11500740051269531, -0.11138439178466797, -0.10776138305664062, -0.10413837432861328, -0.10051536560058594, -0.0968923568725586, -0.09326934814453125, -0.0896463394165039, -0.08602333068847656, -0.08240032196044922, -0.07877731323242188, -0.07515430450439453, -0.07153129577636719, -0.06790828704833984, -0.0642852783203125, -0.060662269592285156, -0.05703926086425781, -0.05341625213623047, -0.049793243408203125, -0.04617023468017578, -0.04254722595214844, -0.038924217224121094, -0.03530120849609375, -0.031678199768066406, -0.028055191040039062, -0.02443218231201172, -0.020809173583984375, -0.01718616485595703, -0.013563156127929688, -0.009940147399902344, -0.006317138671875, -0.0026941299438476562, 0.0009288787841796875, 0.004551887512207031, 0.008174896240234375, 0.011797904968261719, 0.015420913696289062, 0.019043922424316406, 0.02266693115234375, 0.026289939880371094, 0.029912948608398438, 0.03353595733642578, 0.037158966064453125, 0.04078197479248047, 0.04440498352050781, 0.048027992248535156, 0.0516510009765625, 0.055274009704589844, 0.05889701843261719, 0.06252002716064453, 0.06614303588867188, 0.06976604461669922, 0.07338905334472656, 0.0770120620727539, 0.08063507080078125, 0.0842580795288086, 0.08788108825683594, 0.09150409698486328, 0.09512710571289062, 0.09875011444091797, 0.10237312316894531, 0.10599613189697266, 0.109619140625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 5.0, 13.0, 9.0, 16.0, 18.0, 30.0, 34.0, 29.0, 29.0, 45.0, 55.0, 65.0, 290.0, 3846.0, 198133.0, 825132.0, 19691.0, 693.0, 97.0, 46.0, 44.0, 35.0, 27.0, 21.0, 17.0, 35.0, 18.0, 15.0, 18.0, 11.0, 8.0, 11.0, 2.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6767578125, -1.624725341796875, -1.57269287109375, -1.520660400390625, -1.4686279296875, -1.416595458984375, -1.36456298828125, -1.312530517578125, -1.260498046875, -1.208465576171875, -1.15643310546875, -1.104400634765625, -1.0523681640625, -1.000335693359375, -0.94830322265625, -0.896270751953125, -0.84423828125, -0.792205810546875, -0.74017333984375, -0.688140869140625, -0.6361083984375, -0.584075927734375, -0.53204345703125, -0.480010986328125, -0.427978515625, -0.375946044921875, -0.32391357421875, -0.271881103515625, -0.2198486328125, -0.167816162109375, -0.11578369140625, -0.063751220703125, -0.01171875, 0.040313720703125, 0.09234619140625, 0.144378662109375, 0.1964111328125, 0.248443603515625, 0.30047607421875, 0.352508544921875, 0.404541015625, 0.456573486328125, 0.50860595703125, 0.560638427734375, 0.6126708984375, 0.664703369140625, 0.71673583984375, 0.768768310546875, 0.82080078125, 0.872833251953125, 0.92486572265625, 0.976898193359375, 1.0289306640625, 1.080963134765625, 1.13299560546875, 1.185028076171875, 1.237060546875, 1.289093017578125, 1.34112548828125, 1.393157958984375, 1.4451904296875, 1.497222900390625, 1.54925537109375, 1.601287841796875, 1.6533203125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 7.0, 8.0, 16.0, 14.0, 25.0, 38.0, 33.0, 39.0, 23.0, 38.0, 51.0, 54.0, 46.0, 44.0, 51.0, 48.0, 49.0, 44.0, 61.0, 40.0, 43.0, 27.0, 31.0, 16.0, 25.0, 28.0, 12.0, 22.0, 15.0, 10.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11334228515625, -0.10951900482177734, -0.10569572448730469, -0.10187244415283203, -0.09804916381835938, -0.09422588348388672, -0.09040260314941406, -0.0865793228149414, -0.08275604248046875, -0.0789327621459961, -0.07510948181152344, -0.07128620147705078, -0.06746292114257812, -0.06363964080810547, -0.05981636047363281, -0.055993080139160156, -0.0521697998046875, -0.048346519470214844, -0.04452323913574219, -0.04069995880126953, -0.036876678466796875, -0.03305339813232422, -0.029230117797851562, -0.025406837463378906, -0.02158355712890625, -0.017760276794433594, -0.013936996459960938, -0.010113716125488281, -0.006290435791015625, -0.0024671554565429688, 0.0013561248779296875, 0.005179405212402344, 0.009002685546875, 0.012825965881347656, 0.016649246215820312, 0.02047252655029297, 0.024295806884765625, 0.02811908721923828, 0.03194236755371094, 0.035765647888183594, 0.03958892822265625, 0.043412208557128906, 0.04723548889160156, 0.05105876922607422, 0.054882049560546875, 0.05870532989501953, 0.06252861022949219, 0.06635189056396484, 0.0701751708984375, 0.07399845123291016, 0.07782173156738281, 0.08164501190185547, 0.08546829223632812, 0.08929157257080078, 0.09311485290527344, 0.0969381332397461, 0.10076141357421875, 0.1045846939086914, 0.10840797424316406, 0.11223125457763672, 0.11605453491210938, 0.11987781524658203, 0.12370109558105469, 0.12752437591552734, 0.13134765625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 5.0, 8.0, 9.0, 17.0, 18.0, 27.0, 30.0, 48.0, 47.0, 94.0, 97.0, 133.0, 231.0, 252.0, 390.0, 558.0, 770.0, 1137.0, 1764.0, 2624.0, 3995.0, 6361.0, 10702.0, 36360.0, 938832.0, 18945.0, 8854.0, 5388.0, 3500.0, 2288.0, 1561.0, 1035.0, 749.0, 491.0, 346.0, 242.0, 184.0, 123.0, 78.0, 56.0, 32.0, 46.0, 33.0, 25.0, 16.0, 8.0, 14.0, 8.0, 7.0, 5.0, 0.0, 2.0, 2.0, 2.0, 5.0], "bins": [-0.0523681640625, -0.050797462463378906, -0.04922676086425781, -0.04765605926513672, -0.046085357666015625, -0.04451465606689453, -0.04294395446777344, -0.041373252868652344, -0.03980255126953125, -0.038231849670410156, -0.03666114807128906, -0.03509044647216797, -0.033519744873046875, -0.03194904327392578, -0.030378341674804688, -0.028807640075683594, -0.0272369384765625, -0.025666236877441406, -0.024095535278320312, -0.02252483367919922, -0.020954132080078125, -0.01938343048095703, -0.017812728881835938, -0.016242027282714844, -0.01467132568359375, -0.013100624084472656, -0.011529922485351562, -0.009959220886230469, -0.008388519287109375, -0.006817817687988281, -0.0052471160888671875, -0.0036764144897460938, -0.002105712890625, -0.0005350112915039062, 0.0010356903076171875, 0.0026063919067382812, 0.004177093505859375, 0.005747795104980469, 0.0073184967041015625, 0.008889198303222656, 0.01045989990234375, 0.012030601501464844, 0.013601303100585938, 0.015172004699707031, 0.016742706298828125, 0.01831340789794922, 0.019884109497070312, 0.021454811096191406, 0.0230255126953125, 0.024596214294433594, 0.026166915893554688, 0.02773761749267578, 0.029308319091796875, 0.03087902069091797, 0.03244972229003906, 0.034020423889160156, 0.03559112548828125, 0.037161827087402344, 0.03873252868652344, 0.04030323028564453, 0.041873931884765625, 0.04344463348388672, 0.04501533508300781, 0.046586036682128906, 0.04815673828125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 6.0, 6.0, 6.0, 11.0, 12.0, 19.0, 23.0, 45.0, 65.0, 98.0, 116.0, 139.0, 134.0, 108.0, 70.0, 56.0, 29.0, 21.0, 14.0, 9.0, 10.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3053417205810547e-05, -1.2686476111412048e-05, -1.231953501701355e-05, -1.1952593922615051e-05, -1.1585652828216553e-05, -1.1218711733818054e-05, -1.0851770639419556e-05, -1.0484829545021057e-05, -1.0117888450622559e-05, -9.75094735622406e-06, -9.384006261825562e-06, -9.017065167427063e-06, -8.650124073028564e-06, -8.283182978630066e-06, -7.916241884231567e-06, -7.549300789833069e-06, -7.18235969543457e-06, -6.815418601036072e-06, -6.448477506637573e-06, -6.081536412239075e-06, -5.714595317840576e-06, -5.347654223442078e-06, -4.980713129043579e-06, -4.6137720346450806e-06, -4.246830940246582e-06, -3.8798898458480835e-06, -3.512948751449585e-06, -3.1460076570510864e-06, -2.779066562652588e-06, -2.4121254682540894e-06, -2.045184373855591e-06, -1.6782432794570923e-06, -1.3113021850585938e-06, -9.443610906600952e-07, -5.774199962615967e-07, -2.1047890186309814e-07, 1.564621925354004e-07, 5.234032869338989e-07, 8.903443813323975e-07, 1.257285475730896e-06, 1.6242265701293945e-06, 1.991167664527893e-06, 2.3581087589263916e-06, 2.72504985332489e-06, 3.0919909477233887e-06, 3.458932042121887e-06, 3.825873136520386e-06, 4.192814230918884e-06, 4.559755325317383e-06, 4.926696419715881e-06, 5.29363751411438e-06, 5.660578608512878e-06, 6.027519702911377e-06, 6.3944607973098755e-06, 6.761401891708374e-06, 7.1283429861068726e-06, 7.495284080505371e-06, 7.86222517490387e-06, 8.229166269302368e-06, 8.596107363700867e-06, 8.963048458099365e-06, 9.329989552497864e-06, 9.696930646896362e-06, 1.006387174129486e-05, 1.043081283569336e-05]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 24.0, 126.0, 1221.0, 30106.0, 1014107.0, 2651.0, 221.0, 34.0, 10.0, 5.0, 6.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.308837890625, -0.29824066162109375, -0.2876434326171875, -0.27704620361328125, -0.266448974609375, -0.25585174560546875, -0.2452545166015625, -0.23465728759765625, -0.22406005859375, -0.21346282958984375, -0.2028656005859375, -0.19226837158203125, -0.181671142578125, -0.17107391357421875, -0.1604766845703125, -0.14987945556640625, -0.1392822265625, -0.12868499755859375, -0.1180877685546875, -0.10749053955078125, -0.096893310546875, -0.08629608154296875, -0.0756988525390625, -0.06510162353515625, -0.05450439453125, -0.04390716552734375, -0.0333099365234375, -0.02271270751953125, -0.012115478515625, -0.00151824951171875, 0.0090789794921875, 0.01967620849609375, 0.0302734375, 0.04087066650390625, 0.0514678955078125, 0.06206512451171875, 0.072662353515625, 0.08325958251953125, 0.0938568115234375, 0.10445404052734375, 0.11505126953125, 0.12564849853515625, 0.1362457275390625, 0.14684295654296875, 0.157440185546875, 0.16803741455078125, 0.1786346435546875, 0.18923187255859375, 0.1998291015625, 0.21042633056640625, 0.2210235595703125, 0.23162078857421875, 0.242218017578125, 0.25281524658203125, 0.2634124755859375, 0.27400970458984375, 0.28460693359375, 0.29520416259765625, 0.3058013916015625, 0.31639862060546875, 0.326995849609375, 0.33759307861328125, 0.3481903076171875, 0.35878753662109375, 0.369384765625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 6.0, 5.0, 8.0, 63.0, 734.0, 115.0, 5.0, 7.0, 4.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0209197998046875, -0.02021193504333496, -0.019504070281982422, -0.018796205520629883, -0.018088340759277344, -0.017380475997924805, -0.016672611236572266, -0.015964746475219727, -0.015256881713867188, -0.014549016952514648, -0.01384115219116211, -0.01313328742980957, -0.012425422668457031, -0.011717557907104492, -0.011009693145751953, -0.010301828384399414, -0.009593963623046875, -0.008886098861694336, -0.008178234100341797, -0.007470369338989258, -0.006762504577636719, -0.00605463981628418, -0.005346775054931641, -0.0046389102935791016, -0.0039310455322265625, -0.0032231807708740234, -0.0025153160095214844, -0.0018074512481689453, -0.0010995864868164062, -0.0003917217254638672, 0.0003161430358886719, 0.001024007797241211, 0.00173187255859375, 0.002439737319946289, 0.003147602081298828, 0.003855466842651367, 0.004563331604003906, 0.005271196365356445, 0.005979061126708984, 0.0066869258880615234, 0.0073947906494140625, 0.008102655410766602, 0.00881052017211914, 0.00951838493347168, 0.010226249694824219, 0.010934114456176758, 0.011641979217529297, 0.012349843978881836, 0.013057708740234375, 0.013765573501586914, 0.014473438262939453, 0.015181303024291992, 0.01588916778564453, 0.01659703254699707, 0.01730489730834961, 0.01801276206970215, 0.018720626831054688, 0.019428491592407227, 0.020136356353759766, 0.020844221115112305, 0.021552085876464844, 0.022259950637817383, 0.022967815399169922, 0.02367568016052246, 0.024383544921875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 20.0, 50.0, 187.0, 430.0, 223.0, 63.0, 28.0, 8.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2737616300582886, -1.2486053705215454, -1.2234491109848022, -1.198292851448059, -1.173136591911316, -1.1479803323745728, -1.1228240728378296, -1.0976678133010864, -1.0725115537643433, -1.0473552942276, -1.022199034690857, -0.9970427751541138, -0.9718865156173706, -0.9467302560806274, -0.9215739965438843, -0.8964176774024963, -0.8712613582611084, -0.8461050987243652, -0.8209488391876221, -0.7957925796508789, -0.7706363201141357, -0.7454800605773926, -0.7203238010406494, -0.6951674818992615, -0.6700112819671631, -0.6448550224304199, -0.6196987628936768, -0.5945425033569336, -0.5693862438201904, -0.5442299842834473, -0.5190737247467041, -0.49391740560531616, -0.4687611758708954, -0.4436049163341522, -0.41844865679740906, -0.3932923674583435, -0.36813610792160034, -0.3429798483848572, -0.317823588848114, -0.29266732931137085, -0.2675110697746277, -0.24235481023788452, -0.21719853579998016, -0.192042276263237, -0.16688600182533264, -0.14172974228858948, -0.11657348275184631, -0.09141720831394196, -0.0662609338760376, -0.04110466688871384, -0.015948403626680374, 0.009207859635353088, 0.03436412662267685, 0.05952039361000061, 0.08467665314674377, 0.10983292758464813, 0.1349891871213913, 0.16014544665813446, 0.18530172109603882, 0.21045798063278198, 0.23561424016952515, 0.2607704997062683, 0.2859267592430115, 0.311083048582077, 0.3362393081188202]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 7.0, 11.0, 7.0, 11.0, 16.0, 8.0, 17.0, 17.0, 18.0, 29.0, 36.0, 26.0, 28.0, 38.0, 37.0, 36.0, 39.0, 38.0, 38.0, 38.0, 42.0, 39.0, 33.0, 41.0, 42.0, 30.0, 35.0, 29.0, 25.0, 23.0, 27.0, 24.0, 13.0, 14.0, 19.0, 11.0, 6.0, 6.0, 10.0, 6.0, 6.0, 6.0, 6.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.13295792043209076, -0.128255233168602, -0.12355255335569382, -0.11884987354278564, -0.11414718627929688, -0.1094445064663887, -0.10474182665348053, -0.10003913938999176, -0.09533645957708359, -0.09063377976417542, -0.08593109250068665, -0.08122841268777847, -0.0765257328748703, -0.07182304561138153, -0.06712036579847336, -0.06241768226027489, -0.057714998722076416, -0.053012315183877945, -0.048309631645679474, -0.0436069518327713, -0.03890426829457283, -0.03420158475637436, -0.029498903080821037, -0.024796221405267715, -0.020093537867069244, -0.015390855260193348, -0.010688172653317451, -0.005985490046441555, -0.0012828074395656586, 0.0034198760986328125, 0.008122557774186134, 0.012825239449739456, 0.017527908086776733, 0.022230591624975204, 0.026933273300528526, 0.03163595497608185, 0.03633863851428032, 0.04104132205247879, 0.04574400186538696, 0.050446685403585434, 0.055149368941783905, 0.059852052479982376, 0.06455473601818085, 0.06925741583108902, 0.07396009564399719, 0.07866278290748596, 0.08336546272039413, 0.08806814253330231, 0.09277082979679108, 0.09747350960969925, 0.10217619687318802, 0.10687887668609619, 0.11158156394958496, 0.11628424376249313, 0.1209869235754013, 0.12568961083889008, 0.13039228320121765, 0.13509497046470642, 0.139797642827034, 0.14450033009052277, 0.14920301735401154, 0.1539056897163391, 0.15860837697982788, 0.16331106424331665, 0.16801375150680542]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 13.0, 7.0, 13.0, 22.0, 16.0, 27.0, 28.0, 23.0, 48.0, 68.0, 77.0, 83.0, 129.0, 191.0, 315.0, 536.0, 1016.0, 2123.0, 4944.0, 16102.0, 411481.0, 3611439.0, 127595.0, 10190.0, 3761.0, 1680.0, 870.0, 464.0, 282.0, 198.0, 113.0, 79.0, 78.0, 55.0, 52.0, 31.0, 26.0, 26.0, 16.0, 12.0, 9.0, 17.0, 7.0, 3.0, 6.0, 6.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.272705078125, -0.263092041015625, -0.25347900390625, -0.243865966796875, -0.2342529296875, -0.224639892578125, -0.21502685546875, -0.205413818359375, -0.19580078125, -0.186187744140625, -0.17657470703125, -0.166961669921875, -0.1573486328125, -0.147735595703125, -0.13812255859375, -0.128509521484375, -0.118896484375, -0.109283447265625, -0.09967041015625, -0.090057373046875, -0.0804443359375, -0.070831298828125, -0.06121826171875, -0.051605224609375, -0.0419921875, -0.032379150390625, -0.02276611328125, -0.013153076171875, -0.0035400390625, 0.006072998046875, 0.01568603515625, 0.025299072265625, 0.034912109375, 0.044525146484375, 0.05413818359375, 0.063751220703125, 0.0733642578125, 0.082977294921875, 0.09259033203125, 0.102203369140625, 0.11181640625, 0.121429443359375, 0.13104248046875, 0.140655517578125, 0.1502685546875, 0.159881591796875, 0.16949462890625, 0.179107666015625, 0.188720703125, 0.198333740234375, 0.20794677734375, 0.217559814453125, 0.2271728515625, 0.236785888671875, 0.24639892578125, 0.256011962890625, 0.265625, 0.275238037109375, 0.28485107421875, 0.294464111328125, 0.3040771484375, 0.313690185546875, 0.32330322265625, 0.332916259765625, 0.342529296875]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 6.0, 12.0, 14.0, 11.0, 14.0, 15.0, 17.0, 23.0, 29.0, 33.0, 42.0, 34.0, 41.0, 29.0, 38.0, 34.0, 39.0, 49.0, 44.0, 47.0, 43.0, 39.0, 26.0, 32.0, 34.0, 34.0, 16.0, 20.0, 23.0, 29.0, 24.0, 16.0, 10.0, 11.0, 12.0, 10.0, 4.0, 5.0, 9.0, 4.0, 8.0, 4.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.08868408203125, -0.08568572998046875, -0.0826873779296875, -0.07968902587890625, -0.076690673828125, -0.07369232177734375, -0.0706939697265625, -0.06769561767578125, -0.064697265625, -0.06169891357421875, -0.0587005615234375, -0.05570220947265625, -0.052703857421875, -0.04970550537109375, -0.0467071533203125, -0.04370880126953125, -0.04071044921875, -0.03771209716796875, -0.0347137451171875, -0.03171539306640625, -0.028717041015625, -0.02571868896484375, -0.0227203369140625, -0.01972198486328125, -0.0167236328125, -0.01372528076171875, -0.0107269287109375, -0.00772857666015625, -0.004730224609375, -0.00173187255859375, 0.0012664794921875, 0.00426483154296875, 0.00726318359375, 0.01026153564453125, 0.0132598876953125, 0.01625823974609375, 0.019256591796875, 0.02225494384765625, 0.0252532958984375, 0.02825164794921875, 0.03125, 0.03424835205078125, 0.0372467041015625, 0.04024505615234375, 0.043243408203125, 0.04624176025390625, 0.0492401123046875, 0.05223846435546875, 0.05523681640625, 0.05823516845703125, 0.0612335205078125, 0.06423187255859375, 0.067230224609375, 0.07022857666015625, 0.0732269287109375, 0.07622528076171875, 0.0792236328125, 0.08222198486328125, 0.0852203369140625, 0.08821868896484375, 0.091217041015625, 0.09421539306640625, 0.0972137451171875, 0.10021209716796875, 0.10321044921875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 27.0, 57.0, 235.0, 1167.0, 45486.0, 4143749.0, 2952.0, 393.0, 111.0, 42.0, 22.0, 8.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.154296875, -2.0912933349609375, -2.028289794921875, -1.9652862548828125, -1.90228271484375, -1.8392791748046875, -1.776275634765625, -1.7132720947265625, -1.6502685546875, -1.5872650146484375, -1.524261474609375, -1.4612579345703125, -1.39825439453125, -1.3352508544921875, -1.272247314453125, -1.2092437744140625, -1.146240234375, -1.0832366943359375, -1.020233154296875, -0.9572296142578125, -0.89422607421875, -0.8312225341796875, -0.768218994140625, -0.7052154541015625, -0.6422119140625, -0.5792083740234375, -0.516204833984375, -0.4532012939453125, -0.39019775390625, -0.3271942138671875, -0.264190673828125, -0.2011871337890625, -0.13818359375, -0.0751800537109375, -0.012176513671875, 0.0508270263671875, 0.11383056640625, 0.1768341064453125, 0.239837646484375, 0.3028411865234375, 0.3658447265625, 0.4288482666015625, 0.491851806640625, 0.5548553466796875, 0.61785888671875, 0.6808624267578125, 0.743865966796875, 0.8068695068359375, 0.869873046875, 0.9328765869140625, 0.995880126953125, 1.0588836669921875, 1.12188720703125, 1.1848907470703125, 1.247894287109375, 1.3108978271484375, 1.3739013671875, 1.4369049072265625, 1.499908447265625, 1.5629119873046875, 1.62591552734375, 1.6889190673828125, 1.751922607421875, 1.8149261474609375, 1.8779296875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 14.0, 23.0, 64.0, 233.0, 824.0, 1766.0, 791.0, 204.0, 62.0, 34.0, 22.0, 8.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1392822265625, -0.13584041595458984, -0.1323986053466797, -0.12895679473876953, -0.12551498413085938, -0.12207317352294922, -0.11863136291503906, -0.1151895523071289, -0.11174774169921875, -0.1083059310913086, -0.10486412048339844, -0.10142230987548828, -0.09798049926757812, -0.09453868865966797, -0.09109687805175781, -0.08765506744384766, -0.0842132568359375, -0.08077144622802734, -0.07732963562011719, -0.07388782501220703, -0.07044601440429688, -0.06700420379638672, -0.06356239318847656, -0.060120582580566406, -0.05667877197265625, -0.053236961364746094, -0.04979515075683594, -0.04635334014892578, -0.042911529541015625, -0.03946971893310547, -0.03602790832519531, -0.032586097717285156, -0.029144287109375, -0.025702476501464844, -0.022260665893554688, -0.01881885528564453, -0.015377044677734375, -0.011935234069824219, -0.008493423461914062, -0.005051612854003906, -0.00160980224609375, 0.0018320083618164062, 0.0052738189697265625, 0.008715629577636719, 0.012157440185546875, 0.015599250793457031, 0.019041061401367188, 0.022482872009277344, 0.0259246826171875, 0.029366493225097656, 0.03280830383300781, 0.03625011444091797, 0.039691925048828125, 0.04313373565673828, 0.04657554626464844, 0.050017356872558594, 0.05345916748046875, 0.056900978088378906, 0.06034278869628906, 0.06378459930419922, 0.06722640991210938, 0.07066822052001953, 0.07411003112792969, 0.07755184173583984, 0.08099365234375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 11.0, 32.0, 85.0, 272.0, 407.0, 126.0, 41.0, 29.0, 9.0, 5.0, 0.0, 2.0], "bins": [-1.042585015296936, -1.0240403413772583, -1.0054956674575806, -0.9869509339332581, -0.9684062004089355, -0.9498615264892578, -0.9313167929649353, -0.9127721190452576, -0.8942273855209351, -0.8756827116012573, -0.8571379780769348, -0.8385933041572571, -0.8200485706329346, -0.8015038967132568, -0.7829591631889343, -0.7644144892692566, -0.7458697557449341, -0.7273250818252563, -0.7087803483009338, -0.6902356743812561, -0.6716909408569336, -0.6531462669372559, -0.6346015334129333, -0.6160568594932556, -0.5975121855735779, -0.5789675116539001, -0.5604227781295776, -0.5418781042098999, -0.5233333706855774, -0.5047886967658997, -0.48624396324157715, -0.4676992893218994, -0.4491545557975769, -0.4306098520755768, -0.41206514835357666, -0.39352044463157654, -0.3749757409095764, -0.3564310371875763, -0.33788633346557617, -0.31934165954589844, -0.3007969260215759, -0.2822522222995758, -0.2637075185775757, -0.24516281485557556, -0.22661811113357544, -0.20807340741157532, -0.1895287185907364, -0.17098401486873627, -0.15243932604789734, -0.13389462232589722, -0.1153499186038971, -0.09680522233247757, -0.07826051861047745, -0.059715814888477325, -0.0411711186170578, -0.022626414895057678, -0.004081711173057556, 0.014462990686297417, 0.03300769254565239, 0.05155239254236221, 0.07009709626436234, 0.08864179998636246, 0.10718649625778198, 0.1257311999797821, 0.14427590370178223]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 4.0, 2.0, 7.0, 6.0, 5.0, 9.0, 14.0, 14.0, 15.0, 16.0, 10.0, 22.0, 28.0, 28.0, 32.0, 33.0, 22.0, 29.0, 37.0, 39.0, 45.0, 39.0, 39.0, 33.0, 41.0, 40.0, 36.0, 26.0, 33.0, 35.0, 30.0, 24.0, 24.0, 23.0, 22.0, 25.0, 21.0, 15.0, 12.0, 12.0, 5.0, 6.0, 10.0, 4.0, 8.0, 5.0, 7.0, 1.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09046391397714615, -0.08749459683895111, -0.08452527970075607, -0.08155596256256104, -0.078586645424366, -0.07561732828617096, -0.07264801859855652, -0.06967869400978088, -0.06670938432216644, -0.0637400671839714, -0.06077075004577637, -0.05780143290758133, -0.05483211576938629, -0.051862798631191254, -0.048893485218286514, -0.045924168080091476, -0.04295484721660614, -0.0399855300784111, -0.037016212940216064, -0.03404689580202103, -0.031077580526471138, -0.0281082633882761, -0.02513894811272621, -0.022169630974531174, -0.019200313836336136, -0.016230996698141098, -0.013261680491268635, -0.010292364284396172, -0.007323047146201134, -0.004353730008006096, -0.0013844147324562073, 0.0015849024057388306, 0.0045542120933532715, 0.007523528765887022, 0.010492845438420773, 0.013462161645293236, 0.016431478783488274, 0.01940079592168331, 0.0223701111972332, 0.025339428335428238, 0.028308745473623276, 0.031278062611818314, 0.03424737975001335, 0.03721669316291809, 0.04018601030111313, 0.043155327439308167, 0.046124644577503204, 0.04909396171569824, 0.05206327885389328, 0.05503259599208832, 0.058001913130283356, 0.060971230268478394, 0.06394054740667343, 0.06690986454486847, 0.06987917423248291, 0.07284849882125854, 0.07581780850887299, 0.07878712564706802, 0.08175644278526306, 0.0847257599234581, 0.08769507706165314, 0.09066439419984818, 0.09363371133804321, 0.09660302102565765, 0.09957234561443329]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 9.0, 20.0, 26.0, 48.0, 61.0, 94.0, 143.0, 229.0, 374.0, 594.0, 862.0, 1500.0, 2229.0, 3852.0, 6284.0, 10402.0, 17736.0, 31530.0, 57904.0, 113148.0, 222642.0, 266163.0, 146176.0, 72975.0, 39392.0, 21755.0, 12724.0, 7605.0, 4477.0, 2870.0, 1746.0, 1075.0, 712.0, 411.0, 274.0, 188.0, 105.0, 83.0, 49.0, 32.0, 24.0, 13.0, 6.0, 1.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08526611328125, -0.08261680603027344, -0.07996749877929688, -0.07731819152832031, -0.07466888427734375, -0.07201957702636719, -0.06937026977539062, -0.06672096252441406, -0.0640716552734375, -0.06142234802246094, -0.058773040771484375, -0.05612373352050781, -0.05347442626953125, -0.05082511901855469, -0.048175811767578125, -0.04552650451660156, -0.042877197265625, -0.04022789001464844, -0.037578582763671875, -0.03492927551269531, -0.03227996826171875, -0.029630661010742188, -0.026981353759765625, -0.024332046508789062, -0.0216827392578125, -0.019033432006835938, -0.016384124755859375, -0.013734817504882812, -0.01108551025390625, -0.008436203002929688, -0.005786895751953125, -0.0031375885009765625, -0.00048828125, 0.0021610260009765625, 0.004810333251953125, 0.0074596405029296875, 0.01010894775390625, 0.012758255004882812, 0.015407562255859375, 0.018056869506835938, 0.0207061767578125, 0.023355484008789062, 0.026004791259765625, 0.028654098510742188, 0.03130340576171875, 0.03395271301269531, 0.036602020263671875, 0.03925132751464844, 0.041900634765625, 0.04454994201660156, 0.047199249267578125, 0.04984855651855469, 0.05249786376953125, 0.05514717102050781, 0.057796478271484375, 0.06044578552246094, 0.0630950927734375, 0.06574440002441406, 0.06839370727539062, 0.07104301452636719, 0.07369232177734375, 0.07634162902832031, 0.07899093627929688, 0.08164024353027344, 0.08428955078125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 6.0, 4.0, 11.0, 12.0, 9.0, 12.0, 13.0, 16.0, 21.0, 16.0, 26.0, 25.0, 24.0, 28.0, 35.0, 38.0, 42.0, 40.0, 47.0, 37.0, 36.0, 48.0, 52.0, 37.0, 32.0, 39.0, 32.0, 34.0, 29.0, 31.0, 25.0, 23.0, 27.0, 21.0, 16.0, 12.0, 5.0, 7.0, 2.0, 5.0, 3.0, 4.0, 5.0, 7.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0943603515625, -0.0913076400756836, -0.08825492858886719, -0.08520221710205078, -0.08214950561523438, -0.07909679412841797, -0.07604408264160156, -0.07299137115478516, -0.06993865966796875, -0.06688594818115234, -0.06383323669433594, -0.06078052520751953, -0.057727813720703125, -0.05467510223388672, -0.05162239074707031, -0.048569679260253906, -0.0455169677734375, -0.042464256286621094, -0.03941154479980469, -0.03635883331298828, -0.033306121826171875, -0.03025341033935547, -0.027200698852539062, -0.024147987365722656, -0.02109527587890625, -0.018042564392089844, -0.014989852905273438, -0.011937141418457031, -0.008884429931640625, -0.005831718444824219, -0.0027790069580078125, 0.00027370452880859375, 0.003326416015625, 0.006379127502441406, 0.009431838989257812, 0.012484550476074219, 0.015537261962890625, 0.01858997344970703, 0.021642684936523438, 0.024695396423339844, 0.02774810791015625, 0.030800819396972656, 0.03385353088378906, 0.03690624237060547, 0.039958953857421875, 0.04301166534423828, 0.04606437683105469, 0.049117088317871094, 0.0521697998046875, 0.055222511291503906, 0.05827522277832031, 0.06132793426513672, 0.06438064575195312, 0.06743335723876953, 0.07048606872558594, 0.07353878021240234, 0.07659149169921875, 0.07964420318603516, 0.08269691467285156, 0.08574962615966797, 0.08880233764648438, 0.09185504913330078, 0.09490776062011719, 0.0979604721069336, 0.10101318359375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 2.0, 8.0, 7.0, 9.0, 17.0, 35.0, 29.0, 52.0, 81.0, 134.0, 171.0, 238.0, 298.0, 479.0, 733.0, 1204.0, 1838.0, 2875.0, 4497.0, 7404.0, 11959.0, 19784.0, 33736.0, 61230.0, 120433.0, 264667.0, 255896.0, 116672.0, 59916.0, 33392.0, 19435.0, 11556.0, 7257.0, 4483.0, 2742.0, 1827.0, 1137.0, 740.0, 495.0, 350.0, 233.0, 161.0, 119.0, 62.0, 46.0, 38.0, 29.0, 20.0, 7.0, 9.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.06439208984375, -0.0624394416809082, -0.060486793518066406, -0.05853414535522461, -0.05658149719238281, -0.054628849029541016, -0.05267620086669922, -0.05072355270385742, -0.048770904541015625, -0.04681825637817383, -0.04486560821533203, -0.042912960052490234, -0.04096031188964844, -0.03900766372680664, -0.037055015563964844, -0.03510236740112305, -0.03314971923828125, -0.031197071075439453, -0.029244422912597656, -0.02729177474975586, -0.025339126586914062, -0.023386478424072266, -0.02143383026123047, -0.019481182098388672, -0.017528533935546875, -0.015575885772705078, -0.013623237609863281, -0.011670589447021484, -0.009717941284179688, -0.007765293121337891, -0.005812644958496094, -0.003859996795654297, -0.0019073486328125, 4.5299530029296875e-05, 0.0019979476928710938, 0.003950595855712891, 0.0059032440185546875, 0.007855892181396484, 0.009808540344238281, 0.011761188507080078, 0.013713836669921875, 0.015666484832763672, 0.01761913299560547, 0.019571781158447266, 0.021524429321289062, 0.02347707748413086, 0.025429725646972656, 0.027382373809814453, 0.02933502197265625, 0.03128767013549805, 0.033240318298339844, 0.03519296646118164, 0.03714561462402344, 0.039098262786865234, 0.04105091094970703, 0.04300355911254883, 0.044956207275390625, 0.04690885543823242, 0.04886150360107422, 0.050814151763916016, 0.05276679992675781, 0.05471944808959961, 0.056672096252441406, 0.0586247444152832, 0.060577392578125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 3.0, 6.0, 14.0, 9.0, 14.0, 14.0, 13.0, 17.0, 29.0, 25.0, 33.0, 27.0, 37.0, 39.0, 30.0, 40.0, 46.0, 31.0, 43.0, 41.0, 42.0, 27.0, 44.0, 21.0, 36.0, 28.0, 36.0, 30.0, 23.0, 26.0, 22.0, 17.0, 20.0, 22.0, 18.0, 11.0, 8.0, 15.0, 7.0, 4.0, 8.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0745849609375, -0.07233619689941406, -0.07008743286132812, -0.06783866882324219, -0.06558990478515625, -0.06334114074707031, -0.061092376708984375, -0.05884361267089844, -0.0565948486328125, -0.05434608459472656, -0.052097320556640625, -0.04984855651855469, -0.04759979248046875, -0.04535102844238281, -0.043102264404296875, -0.04085350036621094, -0.038604736328125, -0.03635597229003906, -0.034107208251953125, -0.03185844421386719, -0.02960968017578125, -0.027360916137695312, -0.025112152099609375, -0.022863388061523438, -0.0206146240234375, -0.018365859985351562, -0.016117095947265625, -0.013868331909179688, -0.01161956787109375, -0.009370803833007812, -0.007122039794921875, -0.0048732757568359375, -0.00262451171875, -0.0003757476806640625, 0.001873016357421875, 0.0041217803955078125, 0.00637054443359375, 0.008619308471679688, 0.010868072509765625, 0.013116836547851562, 0.0153656005859375, 0.017614364624023438, 0.019863128662109375, 0.022111892700195312, 0.02436065673828125, 0.026609420776367188, 0.028858184814453125, 0.031106948852539062, 0.033355712890625, 0.03560447692871094, 0.037853240966796875, 0.04010200500488281, 0.04235076904296875, 0.04459953308105469, 0.046848297119140625, 0.04909706115722656, 0.0513458251953125, 0.05359458923339844, 0.055843353271484375, 0.05809211730957031, 0.06034088134765625, 0.06258964538574219, 0.06483840942382812, 0.06708717346191406, 0.0693359375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 8.0, 12.0, 7.0, 17.0, 23.0, 22.0, 41.0, 73.0, 89.0, 134.0, 187.0, 344.0, 554.0, 1009.0, 1947.0, 4428.0, 11341.0, 41400.0, 509404.0, 419194.0, 38775.0, 10966.0, 4181.0, 1920.0, 995.0, 521.0, 365.0, 180.0, 122.0, 84.0, 57.0, 45.0, 35.0, 21.0, 15.0, 14.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01336669921875, -0.012948751449584961, -0.012530803680419922, -0.012112855911254883, -0.011694908142089844, -0.011276960372924805, -0.010859012603759766, -0.010441064834594727, -0.010023117065429688, -0.009605169296264648, -0.00918722152709961, -0.00876927375793457, -0.008351325988769531, -0.007933378219604492, -0.007515430450439453, -0.007097482681274414, -0.006679534912109375, -0.006261587142944336, -0.005843639373779297, -0.005425691604614258, -0.005007743835449219, -0.00458979606628418, -0.004171848297119141, -0.0037539005279541016, -0.0033359527587890625, -0.0029180049896240234, -0.0025000572204589844, -0.0020821094512939453, -0.0016641616821289062, -0.0012462139129638672, -0.0008282661437988281, -0.00041031837463378906, 7.62939453125e-06, 0.00042557716369628906, 0.0008435249328613281, 0.0012614727020263672, 0.0016794204711914062, 0.0020973682403564453, 0.0025153160095214844, 0.0029332637786865234, 0.0033512115478515625, 0.0037691593170166016, 0.004187107086181641, 0.00460505485534668, 0.005023002624511719, 0.005440950393676758, 0.005858898162841797, 0.006276845932006836, 0.006694793701171875, 0.007112741470336914, 0.007530689239501953, 0.007948637008666992, 0.008366584777832031, 0.00878453254699707, 0.00920248031616211, 0.009620428085327148, 0.010038375854492188, 0.010456323623657227, 0.010874271392822266, 0.011292219161987305, 0.011710166931152344, 0.012128114700317383, 0.012546062469482422, 0.012964010238647461, 0.0133819580078125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0, 10.0, 11.0, 6.0, 6.0, 8.0, 10.0, 15.0, 10.0, 17.0, 12.0, 15.0, 15.0, 15.0, 16.0, 13.0, 21.0, 40.0, 56.0, 59.0, 59.0, 120.0, 79.0, 68.0, 45.0, 47.0, 18.0, 27.0, 20.0, 18.0, 12.0, 24.0, 17.0, 18.0, 9.0, 8.0, 6.0, 8.0, 12.0, 9.0, 4.0, 3.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.647804260253906e-05, -3.5196542739868164e-05, -3.3915042877197266e-05, -3.263354301452637e-05, -3.135204315185547e-05, -3.007054328918457e-05, -2.8789043426513672e-05, -2.7507543563842773e-05, -2.6226043701171875e-05, -2.4944543838500977e-05, -2.3663043975830078e-05, -2.238154411315918e-05, -2.110004425048828e-05, -1.9818544387817383e-05, -1.8537044525146484e-05, -1.7255544662475586e-05, -1.5974044799804688e-05, -1.4692544937133789e-05, -1.341104507446289e-05, -1.2129545211791992e-05, -1.0848045349121094e-05, -9.566545486450195e-06, -8.285045623779297e-06, -7.0035457611083984e-06, -5.7220458984375e-06, -4.4405460357666016e-06, -3.159046173095703e-06, -1.8775463104248047e-06, -5.960464477539062e-07, 6.854534149169922e-07, 1.9669532775878906e-06, 3.248453140258789e-06, 4.5299530029296875e-06, 5.811452865600586e-06, 7.092952728271484e-06, 8.374452590942383e-06, 9.655952453613281e-06, 1.093745231628418e-05, 1.2218952178955078e-05, 1.3500452041625977e-05, 1.4781951904296875e-05, 1.6063451766967773e-05, 1.7344951629638672e-05, 1.862645149230957e-05, 1.990795135498047e-05, 2.1189451217651367e-05, 2.2470951080322266e-05, 2.3752450942993164e-05, 2.5033950805664062e-05, 2.631545066833496e-05, 2.759695053100586e-05, 2.8878450393676758e-05, 3.0159950256347656e-05, 3.1441450119018555e-05, 3.272294998168945e-05, 3.400444984436035e-05, 3.528594970703125e-05, 3.656744956970215e-05, 3.784894943237305e-05, 3.9130449295043945e-05, 4.0411949157714844e-05, 4.169344902038574e-05, 4.297494888305664e-05, 4.425644874572754e-05, 4.553794860839844e-05]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 6.0, 4.0, 7.0, 10.0, 8.0, 6.0, 16.0, 15.0, 16.0, 36.0, 139.0, 526.0, 2140.0, 10474.0, 992642.0, 37352.0, 3753.0, 996.0, 205.0, 81.0, 22.0, 18.0, 11.0, 10.0, 4.0, 8.0, 7.0, 4.0, 4.0, 5.0, 4.0, 5.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07415771484375, -0.07188987731933594, -0.06962203979492188, -0.06735420227050781, -0.06508636474609375, -0.06281852722167969, -0.060550689697265625, -0.05828285217285156, -0.0560150146484375, -0.05374717712402344, -0.051479339599609375, -0.04921150207519531, -0.04694366455078125, -0.04467582702636719, -0.042407989501953125, -0.04014015197753906, -0.037872314453125, -0.03560447692871094, -0.033336639404296875, -0.031068801879882812, -0.02880096435546875, -0.026533126831054688, -0.024265289306640625, -0.021997451782226562, -0.0197296142578125, -0.017461776733398438, -0.015193939208984375, -0.012926101684570312, -0.01065826416015625, -0.008390426635742188, -0.006122589111328125, -0.0038547515869140625, -0.0015869140625, 0.0006809234619140625, 0.002948760986328125, 0.0052165985107421875, 0.00748443603515625, 0.009752273559570312, 0.012020111083984375, 0.014287948608398438, 0.0165557861328125, 0.018823623657226562, 0.021091461181640625, 0.023359298706054688, 0.02562713623046875, 0.027894973754882812, 0.030162811279296875, 0.03243064880371094, 0.034698486328125, 0.03696632385253906, 0.039234161376953125, 0.04150199890136719, 0.04376983642578125, 0.04603767395019531, 0.048305511474609375, 0.05057334899902344, 0.0528411865234375, 0.05510902404785156, 0.057376861572265625, 0.05964469909667969, 0.06191253662109375, 0.06418037414550781, 0.06644821166992188, 0.06871604919433594, 0.07098388671875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 13.0, 50.0, 99.0, 218.0, 249.0, 183.0, 112.0, 34.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00542449951171875, -0.00525742769241333, -0.00509035587310791, -0.00492328405380249, -0.00475621223449707, -0.00458914041519165, -0.0044220685958862305, -0.0042549967765808105, -0.004087924957275391, -0.003920853137969971, -0.0037537813186645508, -0.003586709499359131, -0.003419637680053711, -0.003252565860748291, -0.003085494041442871, -0.002918422222137451, -0.0027513504028320312, -0.0025842785835266113, -0.0024172067642211914, -0.0022501349449157715, -0.0020830631256103516, -0.0019159913063049316, -0.0017489194869995117, -0.0015818476676940918, -0.0014147758483886719, -0.001247704029083252, -0.001080632209777832, -0.0009135603904724121, -0.0007464885711669922, -0.0005794167518615723, -0.00041234493255615234, -0.0002452731132507324, -7.82012939453125e-05, 8.887052536010742e-05, 0.00025594234466552734, 0.00042301416397094727, 0.0005900859832763672, 0.0007571578025817871, 0.000924229621887207, 0.001091301441192627, 0.0012583732604980469, 0.0014254450798034668, 0.0015925168991088867, 0.0017595887184143066, 0.0019266605377197266, 0.0020937323570251465, 0.0022608041763305664, 0.0024278759956359863, 0.0025949478149414062, 0.002762019634246826, 0.002929091453552246, 0.003096163272857666, 0.003263235092163086, 0.003430306911468506, 0.0035973787307739258, 0.0037644505500793457, 0.003931522369384766, 0.0040985941886901855, 0.0042656660079956055, 0.004432737827301025, 0.004599809646606445, 0.004766881465911865, 0.004933953285217285, 0.005101025104522705, 0.005268096923828125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 9.0, 18.0, 27.0, 52.0, 87.0, 184.0, 240.0, 206.0, 80.0, 39.0, 23.0, 20.0, 15.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5717854499816895, -0.5599862337112427, -0.5481870174407959, -0.5363878011703491, -0.5245885848999023, -0.5127893686294556, -0.5009901523590088, -0.4891909658908844, -0.47739177942276, -0.46559256315231323, -0.45379334688186646, -0.4419941306114197, -0.4301949441432953, -0.4183957278728485, -0.40659651160240173, -0.39479729533195496, -0.3829980790615082, -0.3711988627910614, -0.3593996465206146, -0.34760046005249023, -0.33580124378204346, -0.3240020275115967, -0.3122028112411499, -0.3004035949707031, -0.28860437870025635, -0.27680516242980957, -0.2650059461593628, -0.253206729888916, -0.24140754342079163, -0.22960832715034485, -0.21780911087989807, -0.2060098946094513, -0.1942106932401657, -0.18241147696971893, -0.17061227560043335, -0.15881305932998657, -0.1470138430595398, -0.1352146416902542, -0.12341542541980743, -0.11161621659994125, -0.09981700778007507, -0.08801779896020889, -0.07621859014034271, -0.06441937386989594, -0.052620165050029755, -0.040820956230163574, -0.029021739959716797, -0.017222531139850616, -0.005423322319984436, 0.006375888362526894, 0.018175099045038223, 0.029974311590194702, 0.04177352041006088, 0.05357272922992706, 0.06537194550037384, 0.07717115432024002, 0.0889703631401062, 0.10076957195997238, 0.11256878077983856, 0.12436799705028534, 0.13616719841957092, 0.1479664146900177, 0.15976563096046448, 0.17156484723091125, 0.18336404860019684]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 13.0, 8.0, 12.0, 21.0, 14.0, 12.0, 15.0, 43.0, 36.0, 25.0, 26.0, 20.0, 44.0, 38.0, 37.0, 47.0, 38.0, 38.0, 38.0, 38.0, 39.0, 33.0, 25.0, 36.0, 39.0, 27.0, 23.0, 21.0, 25.0, 25.0, 22.0, 18.0, 8.0, 14.0, 4.0, 7.0, 9.0, 8.0, 6.0, 7.0, 2.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0836683064699173, -0.08085262030363083, -0.07803692668676376, -0.0752212405204773, -0.07240554690361023, -0.06958986073732376, -0.0667741671204567, -0.06395848095417023, -0.06114278733730316, -0.058327097445726395, -0.05551140755414963, -0.05269571766257286, -0.049880027770996094, -0.04706433787941933, -0.04424864798784256, -0.04143296182155609, -0.038617271929979324, -0.03580158203840256, -0.03298589214682579, -0.030170202255249023, -0.027354512363672256, -0.02453882247209549, -0.021723134443163872, -0.018907444551587105, -0.016091754660010338, -0.01327606476843357, -0.010460374876856804, -0.0076446859166026115, -0.004828996025025845, -0.0020133061334490776, 0.0008023828268051147, 0.0036180727183818817, 0.006433762609958649, 0.009249452501535416, 0.012065142393112183, 0.014880831353366375, 0.017696522176265717, 0.020512212067842484, 0.0233279000967741, 0.026143589988350868, 0.028959279879927635, 0.03177496790885925, 0.03459065780043602, 0.03740634769201279, 0.040222037583589554, 0.04303772747516632, 0.04585341736674309, 0.048669107258319855, 0.05148479714989662, 0.05430048704147339, 0.057116176933050156, 0.05993186682462692, 0.06274755299091339, 0.06556324660778046, 0.06837893277406693, 0.07119462639093399, 0.07401031255722046, 0.07682599872350693, 0.07964169234037399, 0.08245737850666046, 0.08527307212352753, 0.088088758289814, 0.09090445190668106, 0.09372013807296753, 0.0965358316898346]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 8.0, 13.0, 14.0, 29.0, 44.0, 59.0, 95.0, 137.0, 229.0, 324.0, 512.0, 912.0, 1478.0, 2472.0, 4202.0, 7730.0, 14128.0, 26302.0, 51092.0, 102758.0, 210090.0, 281368.0, 171054.0, 83035.0, 41492.0, 21723.0, 11754.0, 6577.0, 3609.0, 2085.0, 1261.0, 724.0, 422.0, 286.0, 199.0, 116.0, 80.0, 43.0, 38.0, 20.0, 13.0, 13.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.17903709411621094, -0.17313766479492188, -0.1672382354736328, -0.16133880615234375, -0.1554393768310547, -0.14953994750976562, -0.14364051818847656, -0.1377410888671875, -0.13184165954589844, -0.12594223022460938, -0.12004280090332031, -0.11414337158203125, -0.10824394226074219, -0.10234451293945312, -0.09644508361816406, -0.090545654296875, -0.08464622497558594, -0.07874679565429688, -0.07284736633300781, -0.06694793701171875, -0.06104850769042969, -0.055149078369140625, -0.04924964904785156, -0.0433502197265625, -0.03745079040527344, -0.031551361083984375, -0.025651931762695312, -0.01975250244140625, -0.013853073120117188, -0.007953643798828125, -0.0020542144775390625, 0.00384521484375, 0.009744644165039062, 0.015644073486328125, 0.021543502807617188, 0.02744293212890625, 0.03334236145019531, 0.039241790771484375, 0.04514122009277344, 0.0510406494140625, 0.05694007873535156, 0.06283950805664062, 0.06873893737792969, 0.07463836669921875, 0.08053779602050781, 0.08643722534179688, 0.09233665466308594, 0.098236083984375, 0.10413551330566406, 0.11003494262695312, 0.11593437194824219, 0.12183380126953125, 0.1277332305908203, 0.13363265991210938, 0.13953208923339844, 0.1454315185546875, 0.15133094787597656, 0.15723037719726562, 0.1631298065185547, 0.16902923583984375, 0.1749286651611328, 0.18082809448242188, 0.18672752380371094, 0.192626953125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 8.0, 4.0, 6.0, 5.0, 16.0, 13.0, 14.0, 20.0, 31.0, 24.0, 34.0, 34.0, 43.0, 34.0, 43.0, 59.0, 48.0, 43.0, 60.0, 49.0, 60.0, 39.0, 45.0, 33.0, 26.0, 38.0, 29.0, 32.0, 20.0, 16.0, 14.0, 18.0, 13.0, 4.0, 11.0, 7.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07818603515625, -0.07603216171264648, -0.07387828826904297, -0.07172441482543945, -0.06957054138183594, -0.06741666793823242, -0.0652627944946289, -0.06310892105102539, -0.060955047607421875, -0.05880117416381836, -0.056647300720214844, -0.05449342727661133, -0.05233955383300781, -0.0501856803894043, -0.04803180694580078, -0.045877933502197266, -0.04372406005859375, -0.041570186614990234, -0.03941631317138672, -0.0372624397277832, -0.03510856628417969, -0.03295469284057617, -0.030800819396972656, -0.02864694595336914, -0.026493072509765625, -0.02433919906616211, -0.022185325622558594, -0.020031452178955078, -0.017877578735351562, -0.015723705291748047, -0.013569831848144531, -0.011415958404541016, -0.0092620849609375, -0.007108211517333984, -0.004954338073730469, -0.002800464630126953, -0.0006465911865234375, 0.0015072822570800781, 0.0036611557006835938, 0.005815029144287109, 0.007968902587890625, 0.01012277603149414, 0.012276649475097656, 0.014430522918701172, 0.016584396362304688, 0.018738269805908203, 0.02089214324951172, 0.023046016693115234, 0.02519989013671875, 0.027353763580322266, 0.02950763702392578, 0.0316615104675293, 0.03381538391113281, 0.03596925735473633, 0.038123130798339844, 0.04027700424194336, 0.042430877685546875, 0.04458475112915039, 0.046738624572753906, 0.04889249801635742, 0.05104637145996094, 0.05320024490356445, 0.05535411834716797, 0.057507991790771484, 0.059661865234375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 12.0, 12.0, 15.0, 24.0, 26.0, 23.0, 33.0, 32.0, 44.0, 49.0, 73.0, 81.0, 166.0, 509.0, 1999.0, 9493.0, 51981.0, 334229.0, 534198.0, 94677.0, 16200.0, 3252.0, 736.0, 216.0, 83.0, 70.0, 41.0, 61.0, 44.0, 25.0, 26.0, 22.0, 24.0, 15.0, 13.0, 13.0, 6.0, 4.0, 6.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.50146484375, -0.4875984191894531, -0.47373199462890625, -0.4598655700683594, -0.4459991455078125, -0.4321327209472656, -0.41826629638671875, -0.4043998718261719, -0.390533447265625, -0.3766670227050781, -0.36280059814453125, -0.3489341735839844, -0.3350677490234375, -0.3212013244628906, -0.30733489990234375, -0.2934684753417969, -0.27960205078125, -0.2657356262207031, -0.25186920166015625, -0.23800277709960938, -0.2241363525390625, -0.21026992797851562, -0.19640350341796875, -0.18253707885742188, -0.168670654296875, -0.15480422973632812, -0.14093780517578125, -0.12707138061523438, -0.1132049560546875, -0.09933853149414062, -0.08547210693359375, -0.07160568237304688, -0.0577392578125, -0.043872833251953125, -0.03000640869140625, -0.016139984130859375, -0.0022735595703125, 0.011592864990234375, 0.02545928955078125, 0.039325714111328125, 0.053192138671875, 0.06705856323242188, 0.08092498779296875, 0.09479141235351562, 0.1086578369140625, 0.12252426147460938, 0.13639068603515625, 0.15025711059570312, 0.16412353515625, 0.17798995971679688, 0.19185638427734375, 0.20572280883789062, 0.2195892333984375, 0.23345565795898438, 0.24732208251953125, 0.2611885070800781, 0.275054931640625, 0.2889213562011719, 0.30278778076171875, 0.3166542053222656, 0.3305206298828125, 0.3443870544433594, 0.35825347900390625, 0.3721199035644531, 0.385986328125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 12.0, 4.0, 4.0, 18.0, 13.0, 14.0, 21.0, 13.0, 19.0, 32.0, 35.0, 34.0, 33.0, 49.0, 59.0, 47.0, 47.0, 47.0, 62.0, 56.0, 38.0, 52.0, 35.0, 37.0, 29.0, 25.0, 26.0, 24.0, 18.0, 15.0, 15.0, 15.0, 10.0, 8.0, 9.0, 10.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.066650390625, -0.06474781036376953, -0.06284523010253906, -0.060942649841308594, -0.059040069580078125, -0.057137489318847656, -0.05523490905761719, -0.05333232879638672, -0.05142974853515625, -0.04952716827392578, -0.04762458801269531, -0.045722007751464844, -0.043819427490234375, -0.041916847229003906, -0.04001426696777344, -0.03811168670654297, -0.0362091064453125, -0.03430652618408203, -0.03240394592285156, -0.030501365661621094, -0.028598785400390625, -0.026696205139160156, -0.024793624877929688, -0.02289104461669922, -0.02098846435546875, -0.01908588409423828, -0.017183303833007812, -0.015280723571777344, -0.013378143310546875, -0.011475563049316406, -0.009572982788085938, -0.007670402526855469, -0.005767822265625, -0.0038652420043945312, -0.0019626617431640625, -6.008148193359375e-05, 0.001842498779296875, 0.0037450790405273438, 0.0056476593017578125, 0.007550239562988281, 0.00945281982421875, 0.011355400085449219, 0.013257980346679688, 0.015160560607910156, 0.017063140869140625, 0.018965721130371094, 0.020868301391601562, 0.02277088165283203, 0.0246734619140625, 0.02657604217529297, 0.028478622436523438, 0.030381202697753906, 0.032283782958984375, 0.034186363220214844, 0.03608894348144531, 0.03799152374267578, 0.03989410400390625, 0.04179668426513672, 0.04369926452636719, 0.045601844787597656, 0.047504425048828125, 0.049407005310058594, 0.05130958557128906, 0.05321216583251953, 0.05511474609375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 5.0, 4.0, 7.0, 8.0, 11.0, 11.0, 27.0, 34.0, 50.0, 61.0, 90.0, 137.0, 210.0, 366.0, 616.0, 1112.0, 2268.0, 4763.0, 11263.0, 37873.0, 279407.0, 617008.0, 64788.0, 16045.0, 6140.0, 2762.0, 1487.0, 795.0, 445.0, 267.0, 152.0, 93.0, 84.0, 57.0, 32.0, 31.0, 19.0, 13.0, 5.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005962371826171875, -0.00576472282409668, -0.005567073822021484, -0.005369424819946289, -0.005171775817871094, -0.0049741268157958984, -0.004776477813720703, -0.004578828811645508, -0.0043811798095703125, -0.004183530807495117, -0.003985881805419922, -0.0037882328033447266, -0.0035905838012695312, -0.003392934799194336, -0.0031952857971191406, -0.0029976367950439453, -0.00279998779296875, -0.0026023387908935547, -0.0024046897888183594, -0.002207040786743164, -0.0020093917846679688, -0.0018117427825927734, -0.0016140937805175781, -0.0014164447784423828, -0.0012187957763671875, -0.0010211467742919922, -0.0008234977722167969, -0.0006258487701416016, -0.00042819976806640625, -0.00023055076599121094, -3.2901763916015625e-05, 0.0001647472381591797, 0.000362396240234375, 0.0005600452423095703, 0.0007576942443847656, 0.0009553432464599609, 0.0011529922485351562, 0.0013506412506103516, 0.0015482902526855469, 0.0017459392547607422, 0.0019435882568359375, 0.002141237258911133, 0.002338886260986328, 0.0025365352630615234, 0.0027341842651367188, 0.002931833267211914, 0.0031294822692871094, 0.0033271312713623047, 0.0035247802734375, 0.0037224292755126953, 0.003920078277587891, 0.004117727279663086, 0.004315376281738281, 0.0045130252838134766, 0.004710674285888672, 0.004908323287963867, 0.0051059722900390625, 0.005303621292114258, 0.005501270294189453, 0.0056989192962646484, 0.005896568298339844, 0.006094217300415039, 0.006291866302490234, 0.00648951530456543, 0.006687164306640625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 14.0, 11.0, 14.0, 20.0, 20.0, 27.0, 34.0, 53.0, 67.0, 87.0, 93.0, 74.0, 95.0, 85.0, 68.0, 52.0, 32.0, 30.0, 31.0, 21.0, 12.0, 14.0, 3.0, 7.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.569789886474609e-06, -7.282942533493042e-06, -6.996095180511475e-06, -6.709247827529907e-06, -6.42240047454834e-06, -6.1355531215667725e-06, -5.848705768585205e-06, -5.561858415603638e-06, -5.27501106262207e-06, -4.988163709640503e-06, -4.7013163566589355e-06, -4.414469003677368e-06, -4.127621650695801e-06, -3.840774297714233e-06, -3.553926944732666e-06, -3.2670795917510986e-06, -2.9802322387695312e-06, -2.693384885787964e-06, -2.4065375328063965e-06, -2.119690179824829e-06, -1.8328428268432617e-06, -1.5459954738616943e-06, -1.259148120880127e-06, -9.723007678985596e-07, -6.854534149169922e-07, -3.986060619354248e-07, -1.1175870895385742e-07, 1.7508864402770996e-07, 4.6193599700927734e-07, 7.487833499908447e-07, 1.0356307029724121e-06, 1.3224780559539795e-06, 1.6093254089355469e-06, 1.8961727619171143e-06, 2.1830201148986816e-06, 2.469867467880249e-06, 2.7567148208618164e-06, 3.043562173843384e-06, 3.330409526824951e-06, 3.6172568798065186e-06, 3.904104232788086e-06, 4.190951585769653e-06, 4.477798938751221e-06, 4.764646291732788e-06, 5.0514936447143555e-06, 5.338340997695923e-06, 5.62518835067749e-06, 5.912035703659058e-06, 6.198883056640625e-06, 6.485730409622192e-06, 6.77257776260376e-06, 7.059425115585327e-06, 7.3462724685668945e-06, 7.633119821548462e-06, 7.91996717453003e-06, 8.206814527511597e-06, 8.493661880493164e-06, 8.780509233474731e-06, 9.067356586456299e-06, 9.354203939437866e-06, 9.641051292419434e-06, 9.927898645401001e-06, 1.0214745998382568e-05, 1.0501593351364136e-05, 1.0788440704345703e-05]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 11.0, 7.0, 25.0, 59.0, 122.0, 396.0, 1644.0, 9267.0, 952155.0, 79797.0, 3816.0, 799.0, 271.0, 107.0, 39.0, 9.0, 4.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0182952880859375, -0.017611980438232422, -0.016928672790527344, -0.016245365142822266, -0.015562057495117188, -0.01487874984741211, -0.014195442199707031, -0.013512134552001953, -0.012828826904296875, -0.012145519256591797, -0.011462211608886719, -0.01077890396118164, -0.010095596313476562, -0.009412288665771484, -0.008728981018066406, -0.008045673370361328, -0.00736236572265625, -0.006679058074951172, -0.005995750427246094, -0.005312442779541016, -0.0046291351318359375, -0.003945827484130859, -0.0032625198364257812, -0.002579212188720703, -0.001895904541015625, -0.0012125968933105469, -0.0005292892456054688, 0.00015401840209960938, 0.0008373260498046875, 0.0015206336975097656, 0.0022039413452148438, 0.002887248992919922, 0.003570556640625, 0.004253864288330078, 0.004937171936035156, 0.005620479583740234, 0.0063037872314453125, 0.006987094879150391, 0.007670402526855469, 0.008353710174560547, 0.009037017822265625, 0.009720325469970703, 0.010403633117675781, 0.01108694076538086, 0.011770248413085938, 0.012453556060791016, 0.013136863708496094, 0.013820171356201172, 0.01450347900390625, 0.015186786651611328, 0.015870094299316406, 0.016553401947021484, 0.017236709594726562, 0.01792001724243164, 0.01860332489013672, 0.019286632537841797, 0.019969940185546875, 0.020653247833251953, 0.02133655548095703, 0.02201986312866211, 0.022703170776367188, 0.023386478424072266, 0.024069786071777344, 0.024753093719482422, 0.0254364013671875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 4.0, 5.0, 6.0, 9.0, 17.0, 29.0, 34.0, 58.0, 83.0, 90.0, 98.0, 127.0, 127.0, 83.0, 70.0, 38.0, 35.0, 29.0, 11.0, 10.0, 9.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001300811767578125, -0.001253560185432434, -0.0012063086032867432, -0.0011590570211410522, -0.0011118054389953613, -0.0010645538568496704, -0.0010173022747039795, -0.0009700506925582886, -0.0009227991104125977, -0.0008755475282669067, -0.0008282959461212158, -0.0007810443639755249, -0.000733792781829834, -0.0006865411996841431, -0.0006392896175384521, -0.0005920380353927612, -0.0005447864532470703, -0.0004975348711013794, -0.0004502832889556885, -0.00040303170680999756, -0.00035578012466430664, -0.0003085285425186157, -0.0002612769603729248, -0.0002140253782272339, -0.00016677379608154297, -0.00011952221393585205, -7.227063179016113e-05, -2.5019049644470215e-05, 2.2232532501220703e-05, 6.948411464691162e-05, 0.00011673569679260254, 0.00016398727893829346, 0.00021123886108398438, 0.0002584904432296753, 0.0003057420253753662, 0.00035299360752105713, 0.00040024518966674805, 0.00044749677181243896, 0.0004947483539581299, 0.0005419999361038208, 0.0005892515182495117, 0.0006365031003952026, 0.0006837546825408936, 0.0007310062646865845, 0.0007782578468322754, 0.0008255094289779663, 0.0008727610111236572, 0.0009200125932693481, 0.0009672641754150391, 0.00101451575756073, 0.001061767339706421, 0.0011090189218521118, 0.0011562705039978027, 0.0012035220861434937, 0.0012507736682891846, 0.0012980252504348755, 0.0013452768325805664, 0.0013925284147262573, 0.0014397799968719482, 0.0014870315790176392, 0.00153428316116333, 0.001581534743309021, 0.001628786325454712, 0.0016760379076004028, 0.0017232894897460938]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 10.0, 21.0, 58.0, 97.0, 256.0, 305.0, 131.0, 70.0, 29.0, 21.0, 9.0, 4.0, 1.0], "bins": [-0.6100084185600281, -0.599139392375946, -0.588270366191864, -0.577401340007782, -0.5665322542190552, -0.5556632280349731, -0.5447942018508911, -0.5339251756668091, -0.523056149482727, -0.512187123298645, -0.501318097114563, -0.49044904112815857, -0.47958001494407654, -0.4687109887599945, -0.4578419327735901, -0.44697290658950806, -0.436103880405426, -0.425234854221344, -0.4143657982349396, -0.40349677205085754, -0.3926277458667755, -0.3817587196826935, -0.37088966369628906, -0.36002063751220703, -0.3491515815258026, -0.3382825553417206, -0.32741349935531616, -0.31654447317123413, -0.3056754469871521, -0.29480642080307007, -0.28393736481666565, -0.2730683386325836, -0.2621993124485016, -0.25133028626441956, -0.24046124517917633, -0.2295922040939331, -0.21872317790985107, -0.20785413682460785, -0.19698509573936462, -0.1861160695552826, -0.17524704337120056, -0.16437800228595734, -0.1535089761018753, -0.14263993501663208, -0.13177090883255005, -0.12090186774730682, -0.1100328341126442, -0.09916380047798157, -0.08829475939273834, -0.07742572575807571, -0.06655669212341309, -0.05568765476346016, -0.04481862112879753, -0.0339495874941349, -0.023080550134181976, -0.012211516499519348, -0.00134248286485672, 0.009526551701128483, 0.020395586267113686, 0.03126462176442146, 0.04213365539908409, 0.05300268903374672, 0.06387172639369965, 0.07474076002836227, 0.0856097936630249]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 6.0, 15.0, 15.0, 12.0, 16.0, 17.0, 21.0, 21.0, 14.0, 35.0, 41.0, 41.0, 32.0, 40.0, 33.0, 41.0, 37.0, 44.0, 48.0, 51.0, 50.0, 33.0, 35.0, 29.0, 41.0, 27.0, 31.0, 25.0, 19.0, 24.0, 18.0, 13.0, 10.0, 8.0, 9.0, 9.0, 8.0, 6.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08386777341365814, -0.08129160106182098, -0.07871542870998383, -0.07613926380872726, -0.0735630914568901, -0.07098691910505295, -0.06841075420379639, -0.06583458185195923, -0.06325840950012207, -0.06068223714828491, -0.05810606852173805, -0.05552989989519119, -0.052953727543354034, -0.050377555191516876, -0.047801386564970016, -0.04522521793842316, -0.042649045586586, -0.04007287323474884, -0.03749670460820198, -0.03492053598165512, -0.03234436362981796, -0.029768193140625954, -0.027192022651433945, -0.024615852162241936, -0.022039681673049927, -0.019463511183857918, -0.01688734069466591, -0.0143111702054739, -0.011734999716281891, -0.009158829227089882, -0.006582658737897873, -0.004006488248705864, -0.001430317759513855, 0.001145852729678154, 0.003722023218870163, 0.006298193708062172, 0.008874364197254181, 0.01145053468644619, 0.014026705175638199, 0.016602875664830208, 0.019179046154022217, 0.021755216643214226, 0.024331387132406235, 0.026907557621598244, 0.029483728110790253, 0.03205990046262741, 0.03463606908917427, 0.03721223771572113, 0.03978841006755829, 0.04236458241939545, 0.044940751045942307, 0.047516919672489166, 0.050093092024326324, 0.05266926437616348, 0.05524543300271034, 0.0578216016292572, 0.06039777398109436, 0.06297394633293152, 0.06555011868476868, 0.06812628358602524, 0.0707024559378624, 0.07327862828969955, 0.07585479319095612, 0.07843096554279327, 0.08100713789463043]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 7.0, 5.0, 8.0, 7.0, 14.0, 15.0, 21.0, 21.0, 29.0, 41.0, 40.0, 71.0, 100.0, 169.0, 290.0, 528.0, 1153.0, 3334.0, 23865.0, 3814288.0, 340691.0, 6094.0, 1693.0, 759.0, 356.0, 218.0, 128.0, 84.0, 59.0, 43.0, 36.0, 28.0, 20.0, 14.0, 8.0, 10.0, 5.0, 8.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.25244140625, -0.24365234375, -0.23486328125, -0.22607421875, -0.21728515625, -0.20849609375, -0.19970703125, -0.19091796875, -0.18212890625, -0.17333984375, -0.16455078125, -0.15576171875, -0.14697265625, -0.13818359375, -0.12939453125, -0.12060546875, -0.11181640625, -0.10302734375, -0.09423828125, -0.08544921875, -0.07666015625, -0.06787109375, -0.05908203125, -0.05029296875, -0.04150390625, -0.03271484375, -0.02392578125, -0.01513671875, -0.00634765625, 0.00244140625, 0.01123046875, 0.02001953125, 0.02880859375, 0.03759765625, 0.04638671875, 0.05517578125, 0.06396484375, 0.07275390625, 0.08154296875, 0.09033203125, 0.09912109375, 0.10791015625, 0.11669921875, 0.12548828125, 0.13427734375, 0.14306640625, 0.15185546875, 0.16064453125, 0.16943359375, 0.17822265625, 0.18701171875, 0.19580078125, 0.20458984375, 0.21337890625, 0.22216796875, 0.23095703125, 0.23974609375, 0.24853515625, 0.25732421875, 0.26611328125, 0.27490234375, 0.28369140625, 0.29248046875, 0.30126953125]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 4.0, 6.0, 8.0, 10.0, 17.0, 9.0, 16.0, 17.0, 10.0, 29.0, 28.0, 35.0, 31.0, 39.0, 29.0, 44.0, 38.0, 47.0, 37.0, 44.0, 40.0, 30.0, 45.0, 56.0, 43.0, 34.0, 21.0, 40.0, 30.0, 23.0, 14.0, 24.0, 18.0, 16.0, 16.0, 12.0, 7.0, 9.0, 7.0, 1.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0628662109375, -0.06094932556152344, -0.059032440185546875, -0.05711555480957031, -0.05519866943359375, -0.05328178405761719, -0.051364898681640625, -0.04944801330566406, -0.0475311279296875, -0.04561424255371094, -0.043697357177734375, -0.04178047180175781, -0.03986358642578125, -0.03794670104980469, -0.036029815673828125, -0.03411293029785156, -0.032196044921875, -0.030279159545898438, -0.028362274169921875, -0.026445388793945312, -0.02452850341796875, -0.022611618041992188, -0.020694732666015625, -0.018777847290039062, -0.0168609619140625, -0.014944076538085938, -0.013027191162109375, -0.011110305786132812, -0.00919342041015625, -0.0072765350341796875, -0.005359649658203125, -0.0034427642822265625, -0.00152587890625, 0.0003910064697265625, 0.002307891845703125, 0.0042247772216796875, 0.00614166259765625, 0.008058547973632812, 0.009975433349609375, 0.011892318725585938, 0.0138092041015625, 0.015726089477539062, 0.017642974853515625, 0.019559860229492188, 0.02147674560546875, 0.023393630981445312, 0.025310516357421875, 0.027227401733398438, 0.029144287109375, 0.031061172485351562, 0.032978057861328125, 0.03489494323730469, 0.03681182861328125, 0.03872871398925781, 0.040645599365234375, 0.04256248474121094, 0.0444793701171875, 0.04639625549316406, 0.048313140869140625, 0.05023002624511719, 0.05214691162109375, 0.05406379699707031, 0.055980682373046875, 0.05789756774902344, 0.059814453125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 4.0, 9.0, 10.0, 25.0, 71.0, 210.0, 1239.0, 45995.0, 4143385.0, 2806.0, 340.0, 90.0, 33.0, 16.0, 11.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.68359375, -1.6445999145507812, -1.6056060791015625, -1.5666122436523438, -1.527618408203125, -1.4886245727539062, -1.4496307373046875, -1.4106369018554688, -1.37164306640625, -1.3326492309570312, -1.2936553955078125, -1.2546615600585938, -1.215667724609375, -1.1766738891601562, -1.1376800537109375, -1.0986862182617188, -1.0596923828125, -1.0206985473632812, -0.9817047119140625, -0.9427108764648438, -0.903717041015625, -0.8647232055664062, -0.8257293701171875, -0.7867355346679688, -0.74774169921875, -0.7087478637695312, -0.6697540283203125, -0.6307601928710938, -0.591766357421875, -0.5527725219726562, -0.5137786865234375, -0.47478485107421875, -0.435791015625, -0.39679718017578125, -0.3578033447265625, -0.31880950927734375, -0.279815673828125, -0.24082183837890625, -0.2018280029296875, -0.16283416748046875, -0.12384033203125, -0.08484649658203125, -0.0458526611328125, -0.00685882568359375, 0.032135009765625, 0.07112884521484375, 0.1101226806640625, 0.14911651611328125, 0.1881103515625, 0.22710418701171875, 0.2660980224609375, 0.30509185791015625, 0.344085693359375, 0.38307952880859375, 0.4220733642578125, 0.46106719970703125, 0.50006103515625, 0.5390548706054688, 0.5780487060546875, 0.6170425415039062, 0.656036376953125, 0.6950302124023438, 0.7340240478515625, 0.7730178833007812, 0.81201171875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 8.0, 6.0, 5.0, 19.0, 21.0, 60.0, 110.0, 484.0, 1490.0, 1302.0, 377.0, 87.0, 50.0, 15.0, 8.0, 9.0, 5.0, 3.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041656494140625, -0.03975343704223633, -0.037850379943847656, -0.035947322845458984, -0.03404426574707031, -0.03214120864868164, -0.03023815155029297, -0.028335094451904297, -0.026432037353515625, -0.024528980255126953, -0.02262592315673828, -0.02072286605834961, -0.018819808959960938, -0.016916751861572266, -0.015013694763183594, -0.013110637664794922, -0.01120758056640625, -0.009304523468017578, -0.007401466369628906, -0.005498409271240234, -0.0035953521728515625, -0.0016922950744628906, 0.00021076202392578125, 0.002113819122314453, 0.004016876220703125, 0.005919933319091797, 0.007822990417480469, 0.00972604751586914, 0.011629104614257812, 0.013532161712646484, 0.015435218811035156, 0.017338275909423828, 0.0192413330078125, 0.021144390106201172, 0.023047447204589844, 0.024950504302978516, 0.026853561401367188, 0.02875661849975586, 0.03065967559814453, 0.0325627326965332, 0.034465789794921875, 0.03636884689331055, 0.03827190399169922, 0.04017496109008789, 0.04207801818847656, 0.043981075286865234, 0.045884132385253906, 0.04778718948364258, 0.04969024658203125, 0.05159330368041992, 0.053496360778808594, 0.055399417877197266, 0.05730247497558594, 0.05920553207397461, 0.06110858917236328, 0.06301164627075195, 0.06491470336914062, 0.0668177604675293, 0.06872081756591797, 0.07062387466430664, 0.07252693176269531, 0.07442998886108398, 0.07633304595947266, 0.07823610305786133, 0.08013916015625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 11.0, 24.0, 52.0, 148.0, 330.0, 294.0, 92.0, 41.0, 16.0, 6.0, 1.0], "bins": [-0.5692185759544373, -0.5593691468238831, -0.5495196580886841, -0.5396702289581299, -0.5298207998275757, -0.5199713706970215, -0.5101218819618225, -0.5002724528312683, -0.4904230237007141, -0.4805735647678375, -0.4707241356372833, -0.46087467670440674, -0.45102524757385254, -0.44117578864097595, -0.43132635951042175, -0.42147690057754517, -0.4116274416446686, -0.401777982711792, -0.3919285535812378, -0.3820790946483612, -0.372229665517807, -0.3623802065849304, -0.3525307774543762, -0.34268131852149963, -0.33283185958862305, -0.32298240065574646, -0.31313297152519226, -0.3032835125923157, -0.2934340834617615, -0.2835846245288849, -0.2737351953983307, -0.2638857364654541, -0.2540363073348999, -0.2441868633031845, -0.23433741927146912, -0.22448797523975372, -0.21463853120803833, -0.20478907227516174, -0.19493962824344635, -0.18509018421173096, -0.17524072527885437, -0.16539128124713898, -0.15554183721542358, -0.1456923931837082, -0.1358429491519928, -0.1259934902191162, -0.11614404618740082, -0.10629460215568542, -0.09644516557455063, -0.08659572154283524, -0.07674627006053925, -0.06689682602882385, -0.05704738199710846, -0.047197937965393066, -0.037348490208387375, -0.027499042451381683, -0.01764959841966629, -0.007800152525305748, 0.0020492933690547943, 0.011898739263415337, 0.02174818515777588, 0.03159762918949127, 0.041447076946496964, 0.051296524703502655, 0.06114596873521805]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 3.0, 10.0, 4.0, 10.0, 10.0, 7.0, 19.0, 17.0, 17.0, 30.0, 18.0, 35.0, 34.0, 28.0, 31.0, 28.0, 39.0, 47.0, 34.0, 50.0, 38.0, 41.0, 56.0, 40.0, 36.0, 35.0, 37.0, 22.0, 16.0, 34.0, 28.0, 24.0, 18.0, 18.0, 23.0, 9.0, 8.0, 11.0, 8.0, 4.0, 6.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0], "bins": [-0.07609716802835464, -0.0740557536482811, -0.07201433926820755, -0.0699729174375534, -0.06793150305747986, -0.06589008867740631, -0.06384867429733276, -0.061807259917259216, -0.05976584181189537, -0.05772442743182182, -0.05568300932645798, -0.05364159494638443, -0.05160018056631088, -0.04955876246094704, -0.04751734808087349, -0.045475929975509644, -0.043434515595436096, -0.04139310121536255, -0.0393516831099987, -0.037310268729925156, -0.03526885062456131, -0.03322743624448776, -0.031186021864414215, -0.02914460562169552, -0.027103189378976822, -0.025061773136258125, -0.02302035689353943, -0.02097894251346588, -0.018937526270747185, -0.016896110028028488, -0.014854694716632366, -0.012813279405236244, -0.010771870613098145, -0.008730454370379448, -0.006689039058983326, -0.004647623281925917, -0.0026062075048685074, -0.0005647912621498108, 0.0014766240492463112, 0.003518039360642433, 0.00555945560336113, 0.007600871380418539, 0.009642287157475948, 0.01168370246887207, 0.013725118711590767, 0.015766534954309464, 0.01780794933438301, 0.019849365577101707, 0.021890781819820404, 0.0239321980625391, 0.025973614305257797, 0.028015028685331345, 0.03005644492805004, 0.03209786117076874, 0.034139275550842285, 0.03618068993091583, 0.03822210803627968, 0.040263522416353226, 0.04230494052171707, 0.04434635490179062, 0.046387769281864166, 0.04842918738722801, 0.05047060176730156, 0.052512019872665405, 0.05455343425273895]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 11.0, 19.0, 30.0, 28.0, 56.0, 63.0, 110.0, 149.0, 256.0, 389.0, 569.0, 879.0, 1287.0, 1939.0, 2955.0, 4516.0, 7118.0, 11607.0, 18896.0, 32090.0, 56214.0, 104012.0, 196865.0, 259107.0, 154412.0, 81942.0, 44836.0, 25747.0, 15513.0, 9632.0, 6075.0, 3881.0, 2443.0, 1668.0, 1062.0, 732.0, 467.0, 313.0, 215.0, 139.0, 105.0, 60.0, 49.0, 26.0, 23.0, 15.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.037841796875, -0.03655052185058594, -0.035259246826171875, -0.03396797180175781, -0.03267669677734375, -0.03138542175292969, -0.030094146728515625, -0.028802871704101562, -0.0275115966796875, -0.026220321655273438, -0.024929046630859375, -0.023637771606445312, -0.02234649658203125, -0.021055221557617188, -0.019763946533203125, -0.018472671508789062, -0.017181396484375, -0.015890121459960938, -0.014598846435546875, -0.013307571411132812, -0.01201629638671875, -0.010725021362304688, -0.009433746337890625, -0.008142471313476562, -0.0068511962890625, -0.0055599212646484375, -0.004268646240234375, -0.0029773712158203125, -0.00168609619140625, -0.0003948211669921875, 0.000896453857421875, 0.0021877288818359375, 0.00347900390625, 0.0047702789306640625, 0.006061553955078125, 0.0073528289794921875, 0.00864410400390625, 0.009935379028320312, 0.011226654052734375, 0.012517929077148438, 0.0138092041015625, 0.015100479125976562, 0.016391754150390625, 0.017683029174804688, 0.01897430419921875, 0.020265579223632812, 0.021556854248046875, 0.022848129272460938, 0.024139404296875, 0.025430679321289062, 0.026721954345703125, 0.028013229370117188, 0.02930450439453125, 0.030595779418945312, 0.031887054443359375, 0.03317832946777344, 0.0344696044921875, 0.03576087951660156, 0.037052154541015625, 0.03834342956542969, 0.03963470458984375, 0.04092597961425781, 0.042217254638671875, 0.04350852966308594, 0.0447998046875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 7.0, 5.0, 11.0, 12.0, 9.0, 11.0, 15.0, 23.0, 25.0, 27.0, 32.0, 40.0, 37.0, 37.0, 32.0, 42.0, 43.0, 51.0, 51.0, 42.0, 33.0, 48.0, 34.0, 45.0, 38.0, 42.0, 23.0, 32.0, 27.0, 19.0, 14.0, 17.0, 23.0, 12.0, 6.0, 7.0, 6.0, 7.0, 0.0, 3.0, 2.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068359375, -0.06632328033447266, -0.06428718566894531, -0.06225109100341797, -0.060214996337890625, -0.05817890167236328, -0.05614280700683594, -0.054106712341308594, -0.05207061767578125, -0.050034523010253906, -0.04799842834472656, -0.04596233367919922, -0.043926239013671875, -0.04189014434814453, -0.03985404968261719, -0.037817955017089844, -0.0357818603515625, -0.033745765686035156, -0.03170967102050781, -0.02967357635498047, -0.027637481689453125, -0.02560138702392578, -0.023565292358398438, -0.021529197692871094, -0.01949310302734375, -0.017457008361816406, -0.015420913696289062, -0.013384819030761719, -0.011348724365234375, -0.009312629699707031, -0.0072765350341796875, -0.005240440368652344, -0.003204345703125, -0.0011682510375976562, 0.0008678436279296875, 0.0029039382934570312, 0.004940032958984375, 0.006976127624511719, 0.009012222290039062, 0.011048316955566406, 0.01308441162109375, 0.015120506286621094, 0.017156600952148438, 0.01919269561767578, 0.021228790283203125, 0.02326488494873047, 0.025300979614257812, 0.027337074279785156, 0.0293731689453125, 0.031409263610839844, 0.03344535827636719, 0.03548145294189453, 0.037517547607421875, 0.03955364227294922, 0.04158973693847656, 0.043625831604003906, 0.04566192626953125, 0.047698020935058594, 0.04973411560058594, 0.05177021026611328, 0.053806304931640625, 0.05584239959716797, 0.05787849426269531, 0.059914588928222656, 0.06195068359375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 9.0, 17.0, 10.0, 33.0, 36.0, 57.0, 62.0, 138.0, 163.0, 256.0, 378.0, 504.0, 727.0, 1098.0, 1727.0, 2544.0, 3813.0, 5904.0, 9550.0, 15225.0, 24652.0, 42954.0, 80069.0, 169858.0, 332944.0, 167651.0, 79015.0, 42542.0, 24760.0, 14974.0, 9332.0, 5945.0, 3877.0, 2482.0, 1694.0, 1144.0, 754.0, 509.0, 339.0, 245.0, 185.0, 126.0, 66.0, 59.0, 40.0, 27.0, 16.0, 18.0, 8.0, 5.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0379638671875, -0.0367584228515625, -0.035552978515625, -0.0343475341796875, -0.03314208984375, -0.0319366455078125, -0.030731201171875, -0.0295257568359375, -0.0283203125, -0.0271148681640625, -0.025909423828125, -0.0247039794921875, -0.02349853515625, -0.0222930908203125, -0.021087646484375, -0.0198822021484375, -0.0186767578125, -0.0174713134765625, -0.016265869140625, -0.0150604248046875, -0.01385498046875, -0.0126495361328125, -0.011444091796875, -0.0102386474609375, -0.009033203125, -0.0078277587890625, -0.006622314453125, -0.0054168701171875, -0.00421142578125, -0.0030059814453125, -0.001800537109375, -0.0005950927734375, 0.0006103515625, 0.0018157958984375, 0.003021240234375, 0.0042266845703125, 0.00543212890625, 0.0066375732421875, 0.007843017578125, 0.0090484619140625, 0.01025390625, 0.0114593505859375, 0.012664794921875, 0.0138702392578125, 0.01507568359375, 0.0162811279296875, 0.017486572265625, 0.0186920166015625, 0.0198974609375, 0.0211029052734375, 0.022308349609375, 0.0235137939453125, 0.02471923828125, 0.0259246826171875, 0.027130126953125, 0.0283355712890625, 0.029541015625, 0.0307464599609375, 0.031951904296875, 0.0331573486328125, 0.03436279296875, 0.0355682373046875, 0.036773681640625, 0.0379791259765625, 0.0391845703125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 8.0, 6.0, 3.0, 11.0, 13.0, 22.0, 17.0, 19.0, 19.0, 18.0, 21.0, 24.0, 28.0, 27.0, 23.0, 33.0, 39.0, 28.0, 63.0, 46.0, 37.0, 27.0, 52.0, 39.0, 39.0, 35.0, 21.0, 32.0, 37.0, 32.0, 27.0, 20.0, 27.0, 12.0, 8.0, 15.0, 11.0, 17.0, 6.0, 5.0, 7.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04376220703125, -0.0423130989074707, -0.040863990783691406, -0.03941488265991211, -0.03796577453613281, -0.036516666412353516, -0.03506755828857422, -0.03361845016479492, -0.032169342041015625, -0.030720233917236328, -0.02927112579345703, -0.027822017669677734, -0.026372909545898438, -0.02492380142211914, -0.023474693298339844, -0.022025585174560547, -0.02057647705078125, -0.019127368927001953, -0.017678260803222656, -0.01622915267944336, -0.014780044555664062, -0.013330936431884766, -0.011881828308105469, -0.010432720184326172, -0.008983612060546875, -0.007534503936767578, -0.006085395812988281, -0.004636287689208984, -0.0031871795654296875, -0.0017380714416503906, -0.00028896331787109375, 0.0011601448059082031, 0.0026092529296875, 0.004058361053466797, 0.005507469177246094, 0.006956577301025391, 0.008405685424804688, 0.009854793548583984, 0.011303901672363281, 0.012753009796142578, 0.014202117919921875, 0.015651226043701172, 0.01710033416748047, 0.018549442291259766, 0.019998550415039062, 0.02144765853881836, 0.022896766662597656, 0.024345874786376953, 0.02579498291015625, 0.027244091033935547, 0.028693199157714844, 0.03014230728149414, 0.03159141540527344, 0.033040523529052734, 0.03448963165283203, 0.03593873977661133, 0.037387847900390625, 0.03883695602416992, 0.04028606414794922, 0.041735172271728516, 0.04318428039550781, 0.04463338851928711, 0.046082496643066406, 0.0475316047668457, 0.048980712890625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 16.0, 17.0, 27.0, 31.0, 41.0, 62.0, 88.0, 135.0, 214.0, 233.0, 388.0, 524.0, 786.0, 1120.0, 1604.0, 2385.0, 3592.0, 5496.0, 8908.0, 15445.0, 30100.0, 73359.0, 270743.0, 452390.0, 96600.0, 37491.0, 17914.0, 10015.0, 6367.0, 4055.0, 2680.0, 1737.0, 1201.0, 827.0, 600.0, 399.0, 264.0, 216.0, 148.0, 99.0, 72.0, 52.0, 24.0, 24.0, 19.0, 15.0, 7.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0034847259521484375, -0.003372788429260254, -0.0032608509063720703, -0.0031489133834838867, -0.003036975860595703, -0.0029250383377075195, -0.002813100814819336, -0.0027011632919311523, -0.0025892257690429688, -0.002477288246154785, -0.0023653507232666016, -0.002253413200378418, -0.0021414756774902344, -0.0020295381546020508, -0.0019176006317138672, -0.0018056631088256836, -0.0016937255859375, -0.0015817880630493164, -0.0014698505401611328, -0.0013579130172729492, -0.0012459754943847656, -0.001134037971496582, -0.0010221004486083984, -0.0009101629257202148, -0.0007982254028320312, -0.0006862878799438477, -0.0005743503570556641, -0.00046241283416748047, -0.0003504753112792969, -0.00023853778839111328, -0.0001266002655029297, -1.4662742614746094e-05, 9.72747802734375e-05, 0.0002092123031616211, 0.0003211498260498047, 0.0004330873489379883, 0.0005450248718261719, 0.0006569623947143555, 0.0007688999176025391, 0.0008808374404907227, 0.0009927749633789062, 0.0011047124862670898, 0.0012166500091552734, 0.001328587532043457, 0.0014405250549316406, 0.0015524625778198242, 0.0016644001007080078, 0.0017763376235961914, 0.001888275146484375, 0.0020002126693725586, 0.002112150192260742, 0.0022240877151489258, 0.0023360252380371094, 0.002447962760925293, 0.0025599002838134766, 0.00267183780670166, 0.0027837753295898438, 0.0028957128524780273, 0.003007650375366211, 0.0031195878982543945, 0.003231525421142578, 0.0033434629440307617, 0.0034554004669189453, 0.003567337989807129, 0.0036792755126953125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 4.0, 5.0, 3.0, 5.0, 6.0, 5.0, 8.0, 6.0, 7.0, 4.0, 8.0, 7.0, 18.0, 10.0, 18.0, 28.0, 29.0, 57.0, 76.0, 109.0, 118.0, 117.0, 91.0, 54.0, 40.0, 21.0, 20.0, 11.0, 20.0, 16.0, 9.0, 4.0, 6.0, 9.0, 4.0, 5.0, 4.0, 3.0, 5.0, 8.0, 4.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-5.829334259033203e-05, -5.6507065892219543e-05, -5.4720789194107056e-05, -5.293451249599457e-05, -5.114823579788208e-05, -4.936195909976959e-05, -4.7575682401657104e-05, -4.578940570354462e-05, -4.400312900543213e-05, -4.221685230731964e-05, -4.043057560920715e-05, -3.8644298911094666e-05, -3.685802221298218e-05, -3.507174551486969e-05, -3.32854688167572e-05, -3.1499192118644714e-05, -2.9712915420532227e-05, -2.792663872241974e-05, -2.614036202430725e-05, -2.4354085326194763e-05, -2.2567808628082275e-05, -2.0781531929969788e-05, -1.89952552318573e-05, -1.7208978533744812e-05, -1.5422701835632324e-05, -1.3636425137519836e-05, -1.1850148439407349e-05, -1.006387174129486e-05, -8.277595043182373e-06, -6.491318345069885e-06, -4.7050416469573975e-06, -2.9187649488449097e-06, -1.1324882507324219e-06, 6.537884473800659e-07, 2.4400651454925537e-06, 4.2263418436050415e-06, 6.012618541717529e-06, 7.798895239830017e-06, 9.585171937942505e-06, 1.1371448636054993e-05, 1.315772533416748e-05, 1.4944002032279968e-05, 1.6730278730392456e-05, 1.8516555428504944e-05, 2.030283212661743e-05, 2.208910882472992e-05, 2.3875385522842407e-05, 2.5661662220954895e-05, 2.7447938919067383e-05, 2.923421561717987e-05, 3.102049231529236e-05, 3.2806769013404846e-05, 3.4593045711517334e-05, 3.637932240962982e-05, 3.816559910774231e-05, 3.99518758058548e-05, 4.1738152503967285e-05, 4.352442920207977e-05, 4.531070590019226e-05, 4.709698259830475e-05, 4.8883259296417236e-05, 5.0669535994529724e-05, 5.245581269264221e-05, 5.42420893907547e-05, 5.602836608886719e-05]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 6.0, 11.0, 8.0, 14.0, 14.0, 10.0, 25.0, 28.0, 34.0, 60.0, 82.0, 194.0, 391.0, 1001.0, 3193.0, 12852.0, 70902.0, 682069.0, 237272.0, 30868.0, 6387.0, 1821.0, 644.0, 271.0, 122.0, 76.0, 49.0, 27.0, 34.0, 17.0, 18.0, 8.0, 10.0, 7.0, 8.0, 3.0, 3.0, 1.0, 5.0, 1.0, 5.0, 0.0, 2.0, 3.0, 1.0], "bins": [-0.0125579833984375, -0.012216448783874512, -0.011874914169311523, -0.011533379554748535, -0.011191844940185547, -0.010850310325622559, -0.01050877571105957, -0.010167241096496582, -0.009825706481933594, -0.009484171867370605, -0.009142637252807617, -0.008801102638244629, -0.00845956802368164, -0.008118033409118652, -0.007776498794555664, -0.007434964179992676, -0.0070934295654296875, -0.006751894950866699, -0.006410360336303711, -0.006068825721740723, -0.005727291107177734, -0.005385756492614746, -0.005044221878051758, -0.0047026872634887695, -0.004361152648925781, -0.004019618034362793, -0.0036780834197998047, -0.0033365488052368164, -0.002995014190673828, -0.00265347957611084, -0.0023119449615478516, -0.0019704103469848633, -0.001628875732421875, -0.0012873411178588867, -0.0009458065032958984, -0.0006042718887329102, -0.0002627372741699219, 7.87973403930664e-05, 0.0004203319549560547, 0.000761866569519043, 0.0011034011840820312, 0.0014449357986450195, 0.0017864704132080078, 0.002128005027770996, 0.0024695396423339844, 0.0028110742568969727, 0.003152608871459961, 0.0034941434860229492, 0.0038356781005859375, 0.004177212715148926, 0.004518747329711914, 0.004860281944274902, 0.005201816558837891, 0.005543351173400879, 0.005884885787963867, 0.0062264204025268555, 0.006567955017089844, 0.006909489631652832, 0.00725102424621582, 0.007592558860778809, 0.007934093475341797, 0.008275628089904785, 0.008617162704467773, 0.008958697319030762, 0.00930023193359375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 3.0, 7.0, 7.0, 5.0, 17.0, 21.0, 24.0, 35.0, 25.0, 31.0, 47.0, 64.0, 104.0, 139.0, 99.0, 80.0, 53.0, 46.0, 33.0, 24.0, 20.0, 19.0, 18.0, 6.0, 10.0, 16.0, 8.0, 3.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.000713348388671875, -0.0006926953792572021, -0.0006720423698425293, -0.0006513893604278564, -0.0006307363510131836, -0.0006100833415985107, -0.0005894303321838379, -0.000568777322769165, -0.0005481243133544922, -0.0005274713039398193, -0.0005068182945251465, -0.00048616528511047363, -0.0004655122756958008, -0.00044485926628112793, -0.0004242062568664551, -0.0004035532474517822, -0.0003829002380371094, -0.0003622472286224365, -0.00034159421920776367, -0.0003209412097930908, -0.00030028820037841797, -0.0002796351909637451, -0.00025898218154907227, -0.00023832917213439941, -0.00021767616271972656, -0.0001970231533050537, -0.00017637014389038086, -0.000155717134475708, -0.00013506412506103516, -0.0001144111156463623, -9.375810623168945e-05, -7.31050968170166e-05, -5.245208740234375e-05, -3.17990779876709e-05, -1.1146068572998047e-05, 9.506940841674805e-06, 3.0159950256347656e-05, 5.081295967102051e-05, 7.146596908569336e-05, 9.211897850036621e-05, 0.00011277198791503906, 0.00013342499732971191, 0.00015407800674438477, 0.00017473101615905762, 0.00019538402557373047, 0.00021603703498840332, 0.00023669004440307617, 0.000257343053817749, 0.0002779960632324219, 0.0002986490726470947, 0.0003193020820617676, 0.00033995509147644043, 0.0003606081008911133, 0.00038126111030578613, 0.000401914119720459, 0.00042256712913513184, 0.0004432201385498047, 0.00046387314796447754, 0.0004845261573791504, 0.0005051791667938232, 0.0005258321762084961, 0.0005464851856231689, 0.0005671381950378418, 0.0005877912044525146, 0.0006084442138671875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 17.0, 24.0, 28.0, 56.0, 121.0, 194.0, 191.0, 176.0, 95.0, 42.0, 32.0, 10.0, 9.0, 5.0, 5.0, 2.0], "bins": [-0.34323030710220337, -0.3369091749191284, -0.33058807253837585, -0.3242669403553009, -0.31794580817222595, -0.3116247057914734, -0.30530357360839844, -0.2989824414253235, -0.2926613390445709, -0.28634020686149597, -0.2800191044807434, -0.27369797229766846, -0.2673768401145935, -0.26105573773384094, -0.254734605550766, -0.24841348826885223, -0.24209235608577728, -0.23577123880386353, -0.22945010662078857, -0.22312898933887482, -0.21680787205696106, -0.2104867398738861, -0.20416562259197235, -0.1978445053100586, -0.19152337312698364, -0.18520225584506989, -0.17888112366199493, -0.17256000638008118, -0.16623888909816742, -0.15991777181625366, -0.1535966396331787, -0.14727552235126495, -0.1409544050693512, -0.13463328778743744, -0.1283121556043625, -0.12199103832244873, -0.11566992104053497, -0.10934879630804062, -0.10302767157554626, -0.09670655429363251, -0.09038543701171875, -0.0840643122792244, -0.07774319499731064, -0.07142207026481628, -0.06510095298290253, -0.05877982825040817, -0.05245870351791382, -0.04613758251070976, -0.03981645777821541, -0.03349533677101135, -0.027174213901162148, -0.020853091031312943, -0.014531970024108887, -0.008210849016904831, -0.0018897242844104767, 0.004431396722793579, 0.010752517729997635, 0.01707363873720169, 0.023394761607050896, 0.0297158844769001, 0.036037005484104156, 0.04235812649130821, 0.048679251223802567, 0.05500037223100662, 0.06132149323821068]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 2.0, 9.0, 4.0, 12.0, 4.0, 13.0, 15.0, 19.0, 14.0, 28.0, 22.0, 24.0, 37.0, 30.0, 31.0, 23.0, 34.0, 51.0, 38.0, 36.0, 40.0, 43.0, 52.0, 41.0, 35.0, 32.0, 43.0, 25.0, 22.0, 21.0, 33.0, 29.0, 16.0, 16.0, 18.0, 20.0, 12.0, 9.0, 11.0, 5.0, 6.0, 8.0, 4.0, 1.0, 6.0, 2.0, 2.0, 2.0], "bins": [-0.06515493243932724, -0.06338705122470856, -0.061619170010089874, -0.05985128879547119, -0.05808341130614281, -0.056315530091524124, -0.05454764887690544, -0.05277976766228676, -0.051011890172958374, -0.04924400895833969, -0.04747612774372101, -0.045708246529102325, -0.04394036903977394, -0.04217248782515526, -0.040404606610536575, -0.03863672539591789, -0.03686884418129921, -0.03510096296668053, -0.033333081752061844, -0.03156520426273346, -0.029797323048114777, -0.028029441833496094, -0.02626156061887741, -0.024493679404258728, -0.022725800052285194, -0.02095791883766651, -0.019190039485692978, -0.017422158271074295, -0.015654277056455612, -0.013886397704482079, -0.012118516489863396, -0.010350636206567287, -0.00858275219798088, -0.0068148719146847725, -0.005046991165727377, -0.0032791104167699814, -0.0015112301334738731, 0.0002566501498222351, 0.002024531364440918, 0.003792411647737026, 0.0055602919310331345, 0.007328172214329243, 0.009096052497625351, 0.010863933712244034, 0.012631813995540142, 0.01439969427883625, 0.016167575493454933, 0.017935454845428467, 0.01970333606004715, 0.021471217274665833, 0.023239096626639366, 0.02500697784125805, 0.026774857193231583, 0.028542738407850266, 0.03031061962246895, 0.03207850083708763, 0.033846378326416016, 0.0356142595410347, 0.03738214075565338, 0.039150021970272064, 0.04091789945960045, 0.04268578067421913, 0.044453661888837814, 0.0462215431034565, 0.04798942431807518]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 13.0, 10.0, 20.0, 27.0, 66.0, 103.0, 135.0, 285.0, 595.0, 1133.0, 2297.0, 5045.0, 11294.0, 26377.0, 64978.0, 164536.0, 331791.0, 259030.0, 106287.0, 42181.0, 17611.0, 7616.0, 3567.0, 1681.0, 833.0, 444.0, 259.0, 128.0, 80.0, 51.0, 26.0, 19.0, 7.0, 10.0, 5.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15380859375, -0.14880943298339844, -0.14381027221679688, -0.1388111114501953, -0.13381195068359375, -0.1288127899169922, -0.12381362915039062, -0.11881446838378906, -0.1138153076171875, -0.10881614685058594, -0.10381698608398438, -0.09881782531738281, -0.09381866455078125, -0.08881950378417969, -0.08382034301757812, -0.07882118225097656, -0.073822021484375, -0.06882286071777344, -0.06382369995117188, -0.05882453918457031, -0.05382537841796875, -0.04882621765136719, -0.043827056884765625, -0.03882789611816406, -0.0338287353515625, -0.028829574584960938, -0.023830413818359375, -0.018831253051757812, -0.01383209228515625, -0.008832931518554688, -0.003833770751953125, 0.0011653900146484375, 0.00616455078125, 0.011163711547851562, 0.016162872314453125, 0.021162033081054688, 0.02616119384765625, 0.031160354614257812, 0.036159515380859375, 0.04115867614746094, 0.0461578369140625, 0.05115699768066406, 0.056156158447265625, 0.06115531921386719, 0.06615447998046875, 0.07115364074707031, 0.07615280151367188, 0.08115196228027344, 0.086151123046875, 0.09115028381347656, 0.09614944458007812, 0.10114860534667969, 0.10614776611328125, 0.11114692687988281, 0.11614608764648438, 0.12114524841308594, 0.1261444091796875, 0.13114356994628906, 0.13614273071289062, 0.1411418914794922, 0.14614105224609375, 0.1511402130126953, 0.15613937377929688, 0.16113853454589844, 0.1661376953125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 10.0, 7.0, 20.0, 25.0, 37.0, 33.0, 54.0, 50.0, 66.0, 54.0, 89.0, 62.0, 72.0, 72.0, 60.0, 59.0, 42.0, 36.0, 43.0, 25.0, 22.0, 14.0, 13.0, 9.0, 11.0, 1.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08929443359375, -0.087249755859375, -0.085205078125, -0.083160400390625, -0.08111572265625, -0.079071044921875, -0.0770263671875, -0.074981689453125, -0.07293701171875, -0.070892333984375, -0.06884765625, -0.066802978515625, -0.06475830078125, -0.062713623046875, -0.0606689453125, -0.058624267578125, -0.05657958984375, -0.054534912109375, -0.052490234375, -0.050445556640625, -0.04840087890625, -0.046356201171875, -0.0443115234375, -0.042266845703125, -0.04022216796875, -0.038177490234375, -0.0361328125, -0.034088134765625, -0.03204345703125, -0.029998779296875, -0.0279541015625, -0.025909423828125, -0.02386474609375, -0.021820068359375, -0.019775390625, -0.017730712890625, -0.01568603515625, -0.013641357421875, -0.0115966796875, -0.009552001953125, -0.00750732421875, -0.005462646484375, -0.00341796875, -0.001373291015625, 0.00067138671875, 0.002716064453125, 0.0047607421875, 0.006805419921875, 0.00885009765625, 0.010894775390625, 0.012939453125, 0.014984130859375, 0.01702880859375, 0.019073486328125, 0.0211181640625, 0.023162841796875, 0.02520751953125, 0.027252197265625, 0.029296875, 0.031341552734375, 0.03338623046875, 0.035430908203125, 0.0374755859375, 0.039520263671875, 0.04156494140625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 5.0, 13.0, 17.0, 16.0, 25.0, 22.0, 39.0, 64.0, 78.0, 137.0, 333.0, 1354.0, 8943.0, 87442.0, 695805.0, 229924.0, 20654.0, 2633.0, 526.0, 190.0, 99.0, 54.0, 38.0, 29.0, 28.0, 24.0, 16.0, 5.0, 9.0, 13.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302490234375, -0.2911567687988281, -0.27982330322265625, -0.2684898376464844, -0.2571563720703125, -0.24582290649414062, -0.23448944091796875, -0.22315597534179688, -0.211822509765625, -0.20048904418945312, -0.18915557861328125, -0.17782211303710938, -0.1664886474609375, -0.15515518188476562, -0.14382171630859375, -0.13248825073242188, -0.12115478515625, -0.10982131958007812, -0.09848785400390625, -0.08715438842773438, -0.0758209228515625, -0.06448745727539062, -0.05315399169921875, -0.041820526123046875, -0.030487060546875, -0.019153594970703125, -0.00782012939453125, 0.003513336181640625, 0.0148468017578125, 0.026180267333984375, 0.03751373291015625, 0.048847198486328125, 0.0601806640625, 0.07151412963867188, 0.08284759521484375, 0.09418106079101562, 0.1055145263671875, 0.11684799194335938, 0.12818145751953125, 0.13951492309570312, 0.150848388671875, 0.16218185424804688, 0.17351531982421875, 0.18484878540039062, 0.1961822509765625, 0.20751571655273438, 0.21884918212890625, 0.23018264770507812, 0.24151611328125, 0.2528495788574219, 0.26418304443359375, 0.2755165100097656, 0.2868499755859375, 0.2981834411621094, 0.30951690673828125, 0.3208503723144531, 0.332183837890625, 0.3435173034667969, 0.35485076904296875, 0.3661842346191406, 0.3775177001953125, 0.3888511657714844, 0.40018463134765625, 0.4115180969238281, 0.4228515625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 12.0, 9.0, 7.0, 8.0, 24.0, 27.0, 23.0, 25.0, 36.0, 42.0, 42.0, 50.0, 51.0, 64.0, 57.0, 68.0, 61.0, 38.0, 44.0, 49.0, 43.0, 42.0, 39.0, 36.0, 16.0, 26.0, 17.0, 11.0, 13.0, 10.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06024169921875, -0.058718204498291016, -0.05719470977783203, -0.05567121505737305, -0.05414772033691406, -0.05262422561645508, -0.051100730895996094, -0.04957723617553711, -0.048053741455078125, -0.04653024673461914, -0.045006752014160156, -0.04348325729370117, -0.04195976257324219, -0.0404362678527832, -0.03891277313232422, -0.037389278411865234, -0.03586578369140625, -0.034342288970947266, -0.03281879425048828, -0.0312952995300293, -0.029771804809570312, -0.028248310089111328, -0.026724815368652344, -0.02520132064819336, -0.023677825927734375, -0.02215433120727539, -0.020630836486816406, -0.019107341766357422, -0.017583847045898438, -0.016060352325439453, -0.014536857604980469, -0.013013362884521484, -0.0114898681640625, -0.009966373443603516, -0.008442878723144531, -0.006919384002685547, -0.0053958892822265625, -0.003872394561767578, -0.0023488998413085938, -0.0008254051208496094, 0.000698089599609375, 0.0022215843200683594, 0.0037450790405273438, 0.005268573760986328, 0.0067920684814453125, 0.008315563201904297, 0.009839057922363281, 0.011362552642822266, 0.01288604736328125, 0.014409542083740234, 0.01593303680419922, 0.017456531524658203, 0.018980026245117188, 0.020503520965576172, 0.022027015686035156, 0.02355051040649414, 0.025074005126953125, 0.02659749984741211, 0.028120994567871094, 0.029644489288330078, 0.031167984008789062, 0.03269147872924805, 0.03421497344970703, 0.035738468170166016, 0.037261962890625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 10.0, 2.0, 10.0, 13.0, 15.0, 22.0, 32.0, 33.0, 39.0, 75.0, 110.0, 136.0, 203.0, 275.0, 403.0, 579.0, 828.0, 1230.0, 1827.0, 2921.0, 4526.0, 8992.0, 21775.0, 390263.0, 568552.0, 23090.0, 9002.0, 4835.0, 2854.0, 1794.0, 1217.0, 870.0, 564.0, 428.0, 306.0, 205.0, 135.0, 84.0, 98.0, 53.0, 43.0, 36.0, 20.0, 15.0, 11.0, 9.0, 4.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.019866943359375, -0.019226551055908203, -0.018586158752441406, -0.01794576644897461, -0.017305374145507812, -0.016664981842041016, -0.01602458953857422, -0.015384197235107422, -0.014743804931640625, -0.014103412628173828, -0.013463020324707031, -0.012822628021240234, -0.012182235717773438, -0.01154184341430664, -0.010901451110839844, -0.010261058807373047, -0.00962066650390625, -0.008980274200439453, -0.008339881896972656, -0.007699489593505859, -0.0070590972900390625, -0.006418704986572266, -0.005778312683105469, -0.005137920379638672, -0.004497528076171875, -0.003857135772705078, -0.0032167434692382812, -0.0025763511657714844, -0.0019359588623046875, -0.0012955665588378906, -0.0006551742553710938, -1.4781951904296875e-05, 0.0006256103515625, 0.0012660026550292969, 0.0019063949584960938, 0.0025467872619628906, 0.0031871795654296875, 0.0038275718688964844, 0.004467964172363281, 0.005108356475830078, 0.005748748779296875, 0.006389141082763672, 0.007029533386230469, 0.007669925689697266, 0.008310317993164062, 0.00895071029663086, 0.009591102600097656, 0.010231494903564453, 0.01087188720703125, 0.011512279510498047, 0.012152671813964844, 0.01279306411743164, 0.013433456420898438, 0.014073848724365234, 0.014714241027832031, 0.015354633331298828, 0.015995025634765625, 0.016635417938232422, 0.01727581024169922, 0.017916202545166016, 0.018556594848632812, 0.01919698715209961, 0.019837379455566406, 0.020477771759033203, 0.0211181640625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 11.0, 13.0, 16.0, 19.0, 13.0, 35.0, 56.0, 57.0, 93.0, 81.0, 98.0, 115.0, 82.0, 80.0, 57.0, 49.0, 40.0, 28.0, 16.0, 8.0, 9.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4373016357421875e-06, -6.1998143792152405e-06, -5.9623271226882935e-06, -5.7248398661613464e-06, -5.487352609634399e-06, -5.249865353107452e-06, -5.012378096580505e-06, -4.774890840053558e-06, -4.537403583526611e-06, -4.299916326999664e-06, -4.062429070472717e-06, -3.82494181394577e-06, -3.5874545574188232e-06, -3.3499673008918762e-06, -3.112480044364929e-06, -2.874992787837982e-06, -2.637505531311035e-06, -2.400018274784088e-06, -2.162531018257141e-06, -1.925043761730194e-06, -1.687556505203247e-06, -1.4500692486763e-06, -1.212581992149353e-06, -9.75094735622406e-07, -7.37607479095459e-07, -5.00120222568512e-07, -2.6263296604156494e-07, -2.514570951461792e-08, 2.123415470123291e-07, 4.498288035392761e-07, 6.873160600662231e-07, 9.248033165931702e-07, 1.1622905731201172e-06, 1.3997778296470642e-06, 1.6372650861740112e-06, 1.8747523427009583e-06, 2.1122395992279053e-06, 2.3497268557548523e-06, 2.5872141122817993e-06, 2.8247013688087463e-06, 3.0621886253356934e-06, 3.2996758818626404e-06, 3.5371631383895874e-06, 3.7746503949165344e-06, 4.0121376514434814e-06, 4.2496249079704285e-06, 4.4871121644973755e-06, 4.7245994210243225e-06, 4.9620866775512695e-06, 5.1995739340782166e-06, 5.4370611906051636e-06, 5.674548447132111e-06, 5.912035703659058e-06, 6.149522960186005e-06, 6.387010216712952e-06, 6.624497473239899e-06, 6.861984729766846e-06, 7.099471986293793e-06, 7.33695924282074e-06, 7.574446499347687e-06, 7.811933755874634e-06, 8.04942101240158e-06, 8.286908268928528e-06, 8.524395525455475e-06, 8.761882781982422e-06]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 9.0, 6.0, 7.0, 23.0, 38.0, 102.0, 332.0, 1080.0, 4487.0, 52697.0, 980188.0, 7462.0, 1474.0, 385.0, 140.0, 47.0, 32.0, 19.0, 9.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09771728515625, -0.0941171646118164, -0.09051704406738281, -0.08691692352294922, -0.08331680297851562, -0.07971668243408203, -0.07611656188964844, -0.07251644134521484, -0.06891632080078125, -0.06531620025634766, -0.06171607971191406, -0.05811595916748047, -0.054515838623046875, -0.05091571807861328, -0.04731559753417969, -0.043715476989746094, -0.0401153564453125, -0.036515235900878906, -0.03291511535644531, -0.02931499481201172, -0.025714874267578125, -0.02211475372314453, -0.018514633178710938, -0.014914512634277344, -0.01131439208984375, -0.007714271545410156, -0.0041141510009765625, -0.0005140304565429688, 0.003086090087890625, 0.006686210632324219, 0.010286331176757812, 0.013886451721191406, 0.017486572265625, 0.021086692810058594, 0.024686813354492188, 0.02828693389892578, 0.031887054443359375, 0.03548717498779297, 0.03908729553222656, 0.042687416076660156, 0.04628753662109375, 0.049887657165527344, 0.05348777770996094, 0.05708789825439453, 0.060688018798828125, 0.06428813934326172, 0.06788825988769531, 0.0714883804321289, 0.0750885009765625, 0.0786886215209961, 0.08228874206542969, 0.08588886260986328, 0.08948898315429688, 0.09308910369873047, 0.09668922424316406, 0.10028934478759766, 0.10388946533203125, 0.10748958587646484, 0.11108970642089844, 0.11468982696533203, 0.11828994750976562, 0.12189006805419922, 0.1254901885986328, 0.1290903091430664, 0.1326904296875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 8.0, 9.0, 8.0, 17.0, 46.0, 585.0, 221.0, 26.0, 14.0, 9.0, 7.0, 6.0, 8.0, 4.0, 3.0, 6.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016937255859375, -0.016476869583129883, -0.016016483306884766, -0.015556097030639648, -0.015095710754394531, -0.014635324478149414, -0.014174938201904297, -0.01371455192565918, -0.013254165649414062, -0.012793779373168945, -0.012333393096923828, -0.011873006820678711, -0.011412620544433594, -0.010952234268188477, -0.01049184799194336, -0.010031461715698242, -0.009571075439453125, -0.009110689163208008, -0.00865030288696289, -0.008189916610717773, -0.007729530334472656, -0.007269144058227539, -0.006808757781982422, -0.006348371505737305, -0.0058879852294921875, -0.00542759895324707, -0.004967212677001953, -0.004506826400756836, -0.004046440124511719, -0.0035860538482666016, -0.0031256675720214844, -0.002665281295776367, -0.00220489501953125, -0.0017445087432861328, -0.0012841224670410156, -0.0008237361907958984, -0.00036334991455078125, 9.703636169433594e-05, 0.0005574226379394531, 0.0010178089141845703, 0.0014781951904296875, 0.0019385814666748047, 0.002398967742919922, 0.002859354019165039, 0.0033197402954101562, 0.0037801265716552734, 0.004240512847900391, 0.004700899124145508, 0.005161285400390625, 0.005621671676635742, 0.006082057952880859, 0.0065424442291259766, 0.007002830505371094, 0.007463216781616211, 0.007923603057861328, 0.008383989334106445, 0.008844375610351562, 0.00930476188659668, 0.009765148162841797, 0.010225534439086914, 0.010685920715332031, 0.011146306991577148, 0.011606693267822266, 0.012067079544067383, 0.0125274658203125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 12.0, 17.0, 24.0, 45.0, 82.0, 135.0, 223.0, 188.0, 110.0, 75.0, 43.0, 23.0, 14.0, 8.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16255216300487518, -0.15813568234443665, -0.1537192016839981, -0.14930272102355957, -0.14488624036312103, -0.1404697597026825, -0.13605327904224396, -0.13163679838180542, -0.12722033262252808, -0.12280385196208954, -0.118387371301651, -0.11397089064121246, -0.10955440998077393, -0.10513792932033539, -0.10072145611047745, -0.09630497545003891, -0.09188848733901978, -0.08747200667858124, -0.0830555260181427, -0.07863904535770416, -0.07422256469726562, -0.06980608403682709, -0.06538961082696915, -0.06097313016653061, -0.05655664950609207, -0.052140168845653534, -0.047723688185214996, -0.04330721125006676, -0.03889073058962822, -0.03447424992918968, -0.030057771131396294, -0.025641292333602905, -0.021224811673164368, -0.01680833101272583, -0.012391852214932442, -0.007975372485816479, -0.0035588927567005157, 0.0008575879037380219, 0.00527406670153141, 0.009690545499324799, 0.014107026159763336, 0.018523506820201874, 0.022939985617995262, 0.02735646441578865, 0.03177294507622719, 0.036189425736665726, 0.040605902671813965, 0.0450223833322525, 0.04943886399269104, 0.05385534465312958, 0.058271825313568115, 0.06268830597400665, 0.06710478663444519, 0.07152126729488373, 0.07593774050474167, 0.0803542211651802, 0.08477070182561874, 0.08918718248605728, 0.09360366314649582, 0.09802014380693436, 0.1024366170167923, 0.10685309767723083, 0.11126957833766937, 0.11568605899810791, 0.12010253965854645]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 9.0, 6.0, 9.0, 9.0, 8.0, 14.0, 22.0, 14.0, 19.0, 21.0, 34.0, 28.0, 29.0, 45.0, 29.0, 32.0, 45.0, 41.0, 42.0, 54.0, 49.0, 46.0, 39.0, 44.0, 32.0, 36.0, 29.0, 35.0, 24.0, 16.0, 18.0, 23.0, 21.0, 11.0, 11.0, 12.0, 8.0, 9.0, 9.0, 8.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.053438663482666016, -0.05171694979071617, -0.049995239824056625, -0.04827352613210678, -0.04655181244015694, -0.04483010247349739, -0.043108388781547546, -0.041386678814888, -0.039664965122938156, -0.03794325143098831, -0.036221541464328766, -0.03449982777237892, -0.03277811408042908, -0.03105640411376953, -0.029334690421819687, -0.027612978592514992, -0.025891264900565147, -0.024169553071260452, -0.022447839379310608, -0.020726127550005913, -0.019004415720701218, -0.017282702028751373, -0.015560990199446678, -0.013839278370141983, -0.012117565609514713, -0.010395852848887444, -0.008674141019582748, -0.006952428258955479, -0.005230715963989496, -0.003509003669023514, -0.001787290908396244, -6.557907909154892e-05, 0.0016561336815357208, 0.0033778459765017033, 0.005099558271467686, 0.0068212710320949554, 0.00854298286139965, 0.01026469562202692, 0.01198640838265419, 0.013708120211958885, 0.015429832972586155, 0.017151545733213425, 0.01887325756251812, 0.020594969391822815, 0.02231668308377266, 0.024038394913077354, 0.02576010674238205, 0.027481820434331894, 0.02920353226363659, 0.030925244092941284, 0.03264695778489113, 0.03436867147684097, 0.03609038144350052, 0.03781209513545036, 0.03953380882740021, 0.04125551879405975, 0.0429772324860096, 0.04469894617795944, 0.04642065614461899, 0.04814236983656883, 0.04986408352851868, 0.05158579349517822, 0.05330750718712807, 0.05502922087907791, 0.05675093084573746]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 8.0, 9.0, 8.0, 17.0, 23.0, 38.0, 56.0, 62.0, 105.0, 154.0, 225.0, 360.0, 573.0, 930.0, 1621.0, 3636.0, 10010.0, 63393.0, 3448092.0, 634781.0, 19240.0, 5513.0, 2261.0, 1139.0, 720.0, 449.0, 288.0, 176.0, 128.0, 68.0, 47.0, 33.0, 35.0, 24.0, 13.0, 11.0, 10.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11810302734375, -0.11426258087158203, -0.11042213439941406, -0.1065816879272461, -0.10274124145507812, -0.09890079498291016, -0.09506034851074219, -0.09121990203857422, -0.08737945556640625, -0.08353900909423828, -0.07969856262207031, -0.07585811614990234, -0.07201766967773438, -0.0681772232055664, -0.06433677673339844, -0.06049633026123047, -0.0566558837890625, -0.05281543731689453, -0.04897499084472656, -0.045134544372558594, -0.041294097900390625, -0.037453651428222656, -0.03361320495605469, -0.02977275848388672, -0.02593231201171875, -0.02209186553955078, -0.018251419067382812, -0.014410972595214844, -0.010570526123046875, -0.006730079650878906, -0.0028896331787109375, 0.0009508132934570312, 0.004791259765625, 0.008631706237792969, 0.012472152709960938, 0.016312599182128906, 0.020153045654296875, 0.023993492126464844, 0.027833938598632812, 0.03167438507080078, 0.03551483154296875, 0.03935527801513672, 0.04319572448730469, 0.047036170959472656, 0.050876617431640625, 0.054717063903808594, 0.05855751037597656, 0.06239795684814453, 0.0662384033203125, 0.07007884979248047, 0.07391929626464844, 0.0777597427368164, 0.08160018920898438, 0.08544063568115234, 0.08928108215332031, 0.09312152862548828, 0.09696197509765625, 0.10080242156982422, 0.10464286804199219, 0.10848331451416016, 0.11232376098632812, 0.1161642074584961, 0.12000465393066406, 0.12384510040283203, 0.127685546875]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 6.0, 6.0, 11.0, 7.0, 10.0, 15.0, 13.0, 23.0, 20.0, 24.0, 30.0, 19.0, 31.0, 32.0, 33.0, 49.0, 35.0, 35.0, 52.0, 61.0, 48.0, 48.0, 42.0, 44.0, 40.0, 45.0, 28.0, 23.0, 17.0, 22.0, 24.0, 18.0, 19.0, 10.0, 8.0, 9.0, 7.0, 6.0, 10.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036041259765625, -0.03482770919799805, -0.033614158630371094, -0.03240060806274414, -0.031187057495117188, -0.029973506927490234, -0.02875995635986328, -0.027546405792236328, -0.026332855224609375, -0.025119304656982422, -0.02390575408935547, -0.022692203521728516, -0.021478652954101562, -0.02026510238647461, -0.019051551818847656, -0.017838001251220703, -0.01662445068359375, -0.015410900115966797, -0.014197349548339844, -0.01298379898071289, -0.011770248413085938, -0.010556697845458984, -0.009343147277832031, -0.008129596710205078, -0.006916046142578125, -0.005702495574951172, -0.004488945007324219, -0.0032753944396972656, -0.0020618438720703125, -0.0008482933044433594, 0.00036525726318359375, 0.0015788078308105469, 0.0027923583984375, 0.004005908966064453, 0.005219459533691406, 0.006433010101318359, 0.0076465606689453125, 0.008860111236572266, 0.010073661804199219, 0.011287212371826172, 0.012500762939453125, 0.013714313507080078, 0.014927864074707031, 0.016141414642333984, 0.017354965209960938, 0.01856851577758789, 0.019782066345214844, 0.020995616912841797, 0.02220916748046875, 0.023422718048095703, 0.024636268615722656, 0.02584981918334961, 0.027063369750976562, 0.028276920318603516, 0.02949047088623047, 0.030704021453857422, 0.031917572021484375, 0.03313112258911133, 0.03434467315673828, 0.035558223724365234, 0.03677177429199219, 0.03798532485961914, 0.039198875427246094, 0.04041242599487305, 0.0416259765625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 8.0, 8.0, 9.0, 13.0, 34.0, 42.0, 93.0, 215.0, 1363.0, 422143.0, 3767971.0, 1801.0, 254.0, 98.0, 66.0, 44.0, 36.0, 23.0, 23.0, 8.0, 8.0, 6.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6962890625, -0.6752243041992188, -0.6541595458984375, -0.6330947875976562, -0.612030029296875, -0.5909652709960938, -0.5699005126953125, -0.5488357543945312, -0.52777099609375, -0.5067062377929688, -0.4856414794921875, -0.46457672119140625, -0.443511962890625, -0.42244720458984375, -0.4013824462890625, -0.38031768798828125, -0.3592529296875, -0.33818817138671875, -0.3171234130859375, -0.29605865478515625, -0.274993896484375, -0.25392913818359375, -0.2328643798828125, -0.21179962158203125, -0.19073486328125, -0.16967010498046875, -0.1486053466796875, -0.12754058837890625, -0.106475830078125, -0.08541107177734375, -0.0643463134765625, -0.04328155517578125, -0.022216796875, -0.00115203857421875, 0.0199127197265625, 0.04097747802734375, 0.062042236328125, 0.08310699462890625, 0.1041717529296875, 0.12523651123046875, 0.14630126953125, 0.16736602783203125, 0.1884307861328125, 0.20949554443359375, 0.230560302734375, 0.25162506103515625, 0.2726898193359375, 0.29375457763671875, 0.3148193359375, 0.33588409423828125, 0.3569488525390625, 0.37801361083984375, 0.399078369140625, 0.42014312744140625, 0.4412078857421875, 0.46227264404296875, 0.48333740234375, 0.5044021606445312, 0.5254669189453125, 0.5465316772460938, 0.567596435546875, 0.5886611938476562, 0.6097259521484375, 0.6307907104492188, 0.65185546875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 14.0, 23.0, 28.0, 26.0, 52.0, 83.0, 88.0, 256.0, 719.0, 1391.0, 821.0, 280.0, 109.0, 66.0, 38.0, 17.0, 12.0, 14.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02752685546875, -0.02656412124633789, -0.02560138702392578, -0.024638652801513672, -0.023675918579101562, -0.022713184356689453, -0.021750450134277344, -0.020787715911865234, -0.019824981689453125, -0.018862247467041016, -0.017899513244628906, -0.016936779022216797, -0.015974044799804688, -0.015011310577392578, -0.014048576354980469, -0.01308584213256836, -0.01212310791015625, -0.01116037368774414, -0.010197639465332031, -0.009234905242919922, -0.008272171020507812, -0.007309436798095703, -0.006346702575683594, -0.005383968353271484, -0.004421234130859375, -0.0034584999084472656, -0.0024957656860351562, -0.0015330314636230469, -0.0005702972412109375, 0.0003924369812011719, 0.0013551712036132812, 0.0023179054260253906, 0.0032806396484375, 0.004243373870849609, 0.005206108093261719, 0.006168842315673828, 0.0071315765380859375, 0.008094310760498047, 0.009057044982910156, 0.010019779205322266, 0.010982513427734375, 0.011945247650146484, 0.012907981872558594, 0.013870716094970703, 0.014833450317382812, 0.015796184539794922, 0.01675891876220703, 0.01772165298461914, 0.01868438720703125, 0.01964712142944336, 0.02060985565185547, 0.021572589874267578, 0.022535324096679688, 0.023498058319091797, 0.024460792541503906, 0.025423526763916016, 0.026386260986328125, 0.027348995208740234, 0.028311729431152344, 0.029274463653564453, 0.030237197875976562, 0.031199932098388672, 0.03216266632080078, 0.03312540054321289, 0.034088134765625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 16.0, 25.0, 34.0, 83.0, 190.0, 287.0, 205.0, 86.0, 49.0, 20.0, 17.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05477528274059296, -0.05002733692526817, -0.04527939110994339, -0.040531449019908905, -0.03578350320458412, -0.03103555738925934, -0.026287613436579704, -0.02153966948390007, -0.016791723668575287, -0.012043778784573078, -0.0072958339005708694, -0.0025478890165686607, 0.002200055867433548, 0.006948001682758331, 0.011695945635437965, 0.0164438895881176, 0.021191835403442383, 0.025939781218767166, 0.0306877251714468, 0.035435669124126434, 0.04018361493945122, 0.044931560754776, 0.049679502844810486, 0.05442744866013527, 0.05917539447546005, 0.06392333656549454, 0.06867128610610962, 0.0734192281961441, 0.07816717028617859, 0.08291511982679367, 0.08766306191682816, 0.09241101145744324, 0.09715896844863892, 0.1019069105386734, 0.10665486007928848, 0.11140280216932297, 0.11615075170993805, 0.12089869379997253, 0.12564663589000702, 0.1303945779800415, 0.13514253497123718, 0.13989047706127167, 0.14463841915130615, 0.14938637614250183, 0.15413431823253632, 0.1588822603225708, 0.16363020241260529, 0.16837814450263977, 0.17312608659267426, 0.17787402868270874, 0.18262197077274323, 0.1873699277639389, 0.1921178698539734, 0.19686581194400787, 0.20161375403404236, 0.20636169612407684, 0.21110963821411133, 0.2158575803041458, 0.2206055223941803, 0.22535347938537598, 0.23010142147541046, 0.23484936356544495, 0.23959730565547943, 0.24434524774551392, 0.2490932047367096]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 9.0, 12.0, 5.0, 9.0, 12.0, 5.0, 14.0, 12.0, 19.0, 21.0, 21.0, 32.0, 43.0, 44.0, 54.0, 30.0, 35.0, 31.0, 42.0, 48.0, 46.0, 39.0, 43.0, 42.0, 24.0, 33.0, 39.0, 34.0, 25.0, 23.0, 28.0, 24.0, 17.0, 22.0, 11.0, 11.0, 9.0, 3.0, 5.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.04379528760910034, -0.042463090270757675, -0.04113089293241501, -0.03979869186878204, -0.03846649453043938, -0.03713429719209671, -0.035802096128463745, -0.03446989879012108, -0.03313770145177841, -0.031805504113435745, -0.03047330491244793, -0.029141105711460114, -0.027808908373117447, -0.02647671103477478, -0.025144511833786964, -0.02381231263279915, -0.022480115294456482, -0.021147917956113815, -0.019815718755126, -0.018483519554138184, -0.017151322215795517, -0.01581912487745285, -0.014486925676465034, -0.013154727406799793, -0.011822529137134552, -0.01049033086746931, -0.00915813259780407, -0.007825934328138828, -0.006493736058473587, -0.005161537788808346, -0.0038293395191431046, -0.0024971412494778633, -0.0011649467051029205, 0.0001672515645623207, 0.001499449834227562, 0.002831648103892803, 0.004163846373558044, 0.005496044643223286, 0.006828242912888527, 0.008160441182553768, 0.00949263945221901, 0.01082483772188425, 0.012157035991549492, 0.013489234261214733, 0.014821432530879974, 0.01615362986922264, 0.017485829070210457, 0.018818028271198273, 0.02015022560954094, 0.021482422947883606, 0.022814622148871422, 0.024146821349859238, 0.025479018688201904, 0.02681121602654457, 0.028143415227532387, 0.029475614428520203, 0.03080781176686287, 0.032140009105205536, 0.0334722101688385, 0.03480440750718117, 0.036136604845523834, 0.0374688021838665, 0.03880099952220917, 0.04013320058584213, 0.0414653979241848]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 6.0, 12.0, 14.0, 29.0, 34.0, 54.0, 89.0, 130.0, 164.0, 241.0, 349.0, 526.0, 764.0, 1030.0, 1528.0, 2298.0, 3275.0, 4790.0, 7499.0, 11382.0, 17766.0, 28640.0, 48632.0, 86923.0, 169138.0, 273803.0, 171410.0, 88010.0, 48829.0, 28989.0, 17889.0, 11360.0, 7424.0, 4970.0, 3277.0, 2187.0, 1609.0, 1097.0, 756.0, 499.0, 323.0, 243.0, 183.0, 138.0, 79.0, 64.0, 32.0, 29.0, 19.0, 9.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0244140625, -0.023639202117919922, -0.022864341735839844, -0.022089481353759766, -0.021314620971679688, -0.02053976058959961, -0.01976490020751953, -0.018990039825439453, -0.018215179443359375, -0.017440319061279297, -0.01666545867919922, -0.01589059829711914, -0.015115737915039062, -0.014340877532958984, -0.013566017150878906, -0.012791156768798828, -0.01201629638671875, -0.011241436004638672, -0.010466575622558594, -0.009691715240478516, -0.008916854858398438, -0.00814199447631836, -0.007367134094238281, -0.006592273712158203, -0.005817413330078125, -0.005042552947998047, -0.004267692565917969, -0.0034928321838378906, -0.0027179718017578125, -0.0019431114196777344, -0.0011682510375976562, -0.0003933906555175781, 0.0003814697265625, 0.0011563301086425781, 0.0019311904907226562, 0.0027060508728027344, 0.0034809112548828125, 0.004255771636962891, 0.005030632019042969, 0.005805492401123047, 0.006580352783203125, 0.007355213165283203, 0.008130073547363281, 0.00890493392944336, 0.009679794311523438, 0.010454654693603516, 0.011229515075683594, 0.012004375457763672, 0.01277923583984375, 0.013554096221923828, 0.014328956604003906, 0.015103816986083984, 0.015878677368164062, 0.01665353775024414, 0.01742839813232422, 0.018203258514404297, 0.018978118896484375, 0.019752979278564453, 0.02052783966064453, 0.02130270004272461, 0.022077560424804688, 0.022852420806884766, 0.023627281188964844, 0.024402141571044922, 0.025177001953125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 5.0, 3.0, 8.0, 5.0, 10.0, 14.0, 14.0, 20.0, 20.0, 22.0, 34.0, 43.0, 42.0, 50.0, 47.0, 34.0, 51.0, 40.0, 55.0, 45.0, 28.0, 40.0, 55.0, 35.0, 35.0, 41.0, 23.0, 31.0, 25.0, 20.0, 18.0, 19.0, 10.0, 8.0, 8.0, 7.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04150390625, -0.040189266204833984, -0.03887462615966797, -0.03755998611450195, -0.03624534606933594, -0.03493070602416992, -0.033616065979003906, -0.03230142593383789, -0.030986785888671875, -0.02967214584350586, -0.028357505798339844, -0.027042865753173828, -0.025728225708007812, -0.024413585662841797, -0.02309894561767578, -0.021784305572509766, -0.02046966552734375, -0.019155025482177734, -0.01784038543701172, -0.016525745391845703, -0.015211105346679688, -0.013896465301513672, -0.012581825256347656, -0.01126718521118164, -0.009952545166015625, -0.00863790512084961, -0.007323265075683594, -0.006008625030517578, -0.0046939849853515625, -0.003379344940185547, -0.0020647048950195312, -0.0007500648498535156, 0.0005645751953125, 0.0018792152404785156, 0.0031938552856445312, 0.004508495330810547, 0.0058231353759765625, 0.007137775421142578, 0.008452415466308594, 0.00976705551147461, 0.011081695556640625, 0.01239633560180664, 0.013710975646972656, 0.015025615692138672, 0.016340255737304688, 0.017654895782470703, 0.01896953582763672, 0.020284175872802734, 0.02159881591796875, 0.022913455963134766, 0.02422809600830078, 0.025542736053466797, 0.026857376098632812, 0.028172016143798828, 0.029486656188964844, 0.03080129623413086, 0.032115936279296875, 0.03343057632446289, 0.034745216369628906, 0.03605985641479492, 0.03737449645996094, 0.03868913650512695, 0.04000377655029297, 0.041318416595458984, 0.042633056640625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 10.0, 9.0, 16.0, 20.0, 32.0, 35.0, 76.0, 94.0, 143.0, 230.0, 274.0, 470.0, 653.0, 1044.0, 1649.0, 2358.0, 3694.0, 5887.0, 9367.0, 15279.0, 25455.0, 45239.0, 87655.0, 209723.0, 351903.0, 134988.0, 63924.0, 34697.0, 20177.0, 12128.0, 7665.0, 4846.0, 2952.0, 1954.0, 1312.0, 856.0, 583.0, 377.0, 265.0, 154.0, 121.0, 74.0, 59.0, 42.0, 28.0, 20.0, 6.0, 9.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0275421142578125, -0.026661396026611328, -0.025780677795410156, -0.024899959564208984, -0.024019241333007812, -0.02313852310180664, -0.02225780487060547, -0.021377086639404297, -0.020496368408203125, -0.019615650177001953, -0.01873493194580078, -0.01785421371459961, -0.016973495483398438, -0.016092777252197266, -0.015212059020996094, -0.014331340789794922, -0.01345062255859375, -0.012569904327392578, -0.011689186096191406, -0.010808467864990234, -0.009927749633789062, -0.00904703140258789, -0.008166313171386719, -0.007285594940185547, -0.006404876708984375, -0.005524158477783203, -0.004643440246582031, -0.0037627220153808594, -0.0028820037841796875, -0.0020012855529785156, -0.0011205673217773438, -0.00023984909057617188, 0.000640869140625, 0.0015215873718261719, 0.0024023056030273438, 0.0032830238342285156, 0.0041637420654296875, 0.005044460296630859, 0.005925178527832031, 0.006805896759033203, 0.007686614990234375, 0.008567333221435547, 0.009448051452636719, 0.01032876968383789, 0.011209487915039062, 0.012090206146240234, 0.012970924377441406, 0.013851642608642578, 0.01473236083984375, 0.015613079071044922, 0.016493797302246094, 0.017374515533447266, 0.018255233764648438, 0.01913595199584961, 0.02001667022705078, 0.020897388458251953, 0.021778106689453125, 0.022658824920654297, 0.02353954315185547, 0.02442026138305664, 0.025300979614257812, 0.026181697845458984, 0.027062416076660156, 0.027943134307861328, 0.0288238525390625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 14.0, 7.0, 13.0, 14.0, 23.0, 19.0, 21.0, 14.0, 31.0, 45.0, 28.0, 32.0, 37.0, 38.0, 41.0, 47.0, 41.0, 35.0, 63.0, 51.0, 36.0, 42.0, 35.0, 37.0, 34.0, 25.0, 26.0, 30.0, 24.0, 16.0, 14.0, 16.0, 12.0, 10.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032806396484375, -0.03175067901611328, -0.030694961547851562, -0.029639244079589844, -0.028583526611328125, -0.027527809143066406, -0.026472091674804688, -0.02541637420654297, -0.02436065673828125, -0.02330493927001953, -0.022249221801757812, -0.021193504333496094, -0.020137786865234375, -0.019082069396972656, -0.018026351928710938, -0.01697063446044922, -0.0159149169921875, -0.014859199523925781, -0.013803482055664062, -0.012747764587402344, -0.011692047119140625, -0.010636329650878906, -0.009580612182617188, -0.008524894714355469, -0.00746917724609375, -0.006413459777832031, -0.0053577423095703125, -0.004302024841308594, -0.003246307373046875, -0.0021905899047851562, -0.0011348724365234375, -7.915496826171875e-05, 0.0009765625, 0.0020322799682617188, 0.0030879974365234375, 0.004143714904785156, 0.005199432373046875, 0.006255149841308594, 0.0073108673095703125, 0.008366584777832031, 0.00942230224609375, 0.010478019714355469, 0.011533737182617188, 0.012589454650878906, 0.013645172119140625, 0.014700889587402344, 0.015756607055664062, 0.01681232452392578, 0.0178680419921875, 0.01892375946044922, 0.019979476928710938, 0.021035194396972656, 0.022090911865234375, 0.023146629333496094, 0.024202346801757812, 0.02525806427001953, 0.02631378173828125, 0.02736949920654297, 0.028425216674804688, 0.029480934143066406, 0.030536651611328125, 0.031592369079589844, 0.03264808654785156, 0.03370380401611328, 0.034759521484375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 6.0, 6.0, 14.0, 15.0, 14.0, 23.0, 43.0, 41.0, 89.0, 117.0, 183.0, 294.0, 529.0, 921.0, 1807.0, 4405.0, 14882.0, 96444.0, 849509.0, 60777.0, 11283.0, 3574.0, 1518.0, 781.0, 485.0, 245.0, 193.0, 117.0, 71.0, 38.0, 47.0, 29.0, 12.0, 17.0, 8.0, 5.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005901336669921875, -0.005713403224945068, -0.005525469779968262, -0.005337536334991455, -0.0051496028900146484, -0.004961669445037842, -0.004773736000061035, -0.0045858025550842285, -0.004397869110107422, -0.004209935665130615, -0.004022002220153809, -0.003834068775177002, -0.0036461353302001953, -0.0034582018852233887, -0.003270268440246582, -0.0030823349952697754, -0.0028944015502929688, -0.002706468105316162, -0.0025185346603393555, -0.002330601215362549, -0.002142667770385742, -0.0019547343254089355, -0.001766800880432129, -0.0015788674354553223, -0.0013909339904785156, -0.001203000545501709, -0.0010150671005249023, -0.0008271336555480957, -0.0006392002105712891, -0.0004512667655944824, -0.0002633333206176758, -7.539987564086914e-05, 0.0001125335693359375, 0.00030046701431274414, 0.0004884004592895508, 0.0006763339042663574, 0.0008642673492431641, 0.0010522007942199707, 0.0012401342391967773, 0.001428067684173584, 0.0016160011291503906, 0.0018039345741271973, 0.001991868019104004, 0.0021798014640808105, 0.002367734909057617, 0.002555668354034424, 0.0027436017990112305, 0.002931535243988037, 0.0031194686889648438, 0.0033074021339416504, 0.003495335578918457, 0.0036832690238952637, 0.0038712024688720703, 0.004059135913848877, 0.004247069358825684, 0.00443500280380249, 0.004622936248779297, 0.0048108696937561035, 0.00499880313873291, 0.005186736583709717, 0.0053746700286865234, 0.00556260347366333, 0.005750536918640137, 0.005938470363616943, 0.00612640380859375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 3.0, 4.0, 7.0, 7.0, 9.0, 9.0, 16.0, 43.0, 70.0, 156.0, 247.0, 178.0, 107.0, 51.0, 24.0, 11.0, 11.0, 11.0, 3.0, 4.0, 3.0, 7.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.285045623779297e-05, -8.015893399715424e-05, -7.74674117565155e-05, -7.477588951587677e-05, -7.208436727523804e-05, -6.93928450345993e-05, -6.670132279396057e-05, -6.400980055332184e-05, -6.13182783126831e-05, -5.862675607204437e-05, -5.593523383140564e-05, -5.324371159076691e-05, -5.0552189350128174e-05, -4.786066710948944e-05, -4.516914486885071e-05, -4.2477622628211975e-05, -3.978610038757324e-05, -3.709457814693451e-05, -3.4403055906295776e-05, -3.1711533665657043e-05, -2.902001142501831e-05, -2.6328489184379578e-05, -2.3636966943740845e-05, -2.0945444703102112e-05, -1.825392246246338e-05, -1.5562400221824646e-05, -1.2870877981185913e-05, -1.017935574054718e-05, -7.487833499908447e-06, -4.796311259269714e-06, -2.1047890186309814e-06, 5.867332220077515e-07, 3.2782554626464844e-06, 5.969777703285217e-06, 8.66129994392395e-06, 1.1352822184562683e-05, 1.4044344425201416e-05, 1.673586666584015e-05, 1.9427388906478882e-05, 2.2118911147117615e-05, 2.4810433387756348e-05, 2.750195562839508e-05, 3.0193477869033813e-05, 3.2885000109672546e-05, 3.557652235031128e-05, 3.826804459095001e-05, 4.0959566831588745e-05, 4.365108907222748e-05, 4.634261131286621e-05, 4.9034133553504944e-05, 5.172565579414368e-05, 5.441717803478241e-05, 5.710870027542114e-05, 5.9800222516059875e-05, 6.249174475669861e-05, 6.518326699733734e-05, 6.787478923797607e-05, 7.056631147861481e-05, 7.325783371925354e-05, 7.594935595989227e-05, 7.8640878200531e-05, 8.133240044116974e-05, 8.402392268180847e-05, 8.67154449224472e-05, 8.940696716308594e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 13.0, 74.0, 360.0, 1613.0, 10264.0, 1028169.0, 6550.0, 1130.0, 273.0, 64.0, 15.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06683349609375, -0.06483221054077148, -0.06283092498779297, -0.06082963943481445, -0.05882835388183594, -0.05682706832885742, -0.054825782775878906, -0.05282449722290039, -0.050823211669921875, -0.04882192611694336, -0.046820640563964844, -0.04481935501098633, -0.04281806945800781, -0.0408167839050293, -0.03881549835205078, -0.036814212799072266, -0.03481292724609375, -0.032811641693115234, -0.03081035614013672, -0.028809070587158203, -0.026807785034179688, -0.024806499481201172, -0.022805213928222656, -0.02080392837524414, -0.018802642822265625, -0.01680135726928711, -0.014800071716308594, -0.012798786163330078, -0.010797500610351562, -0.008796215057373047, -0.006794929504394531, -0.004793643951416016, -0.0027923583984375, -0.0007910728454589844, 0.0012102127075195312, 0.003211498260498047, 0.0052127838134765625, 0.007214069366455078, 0.009215354919433594, 0.01121664047241211, 0.013217926025390625, 0.01521921157836914, 0.017220497131347656, 0.019221782684326172, 0.021223068237304688, 0.023224353790283203, 0.02522563934326172, 0.027226924896240234, 0.02922821044921875, 0.031229496002197266, 0.03323078155517578, 0.0352320671081543, 0.03723335266113281, 0.03923463821411133, 0.041235923767089844, 0.04323720932006836, 0.045238494873046875, 0.04723978042602539, 0.049241065979003906, 0.05124235153198242, 0.05324363708496094, 0.05524492263793945, 0.05724620819091797, 0.059247493743896484, 0.061248779296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 17.0, 73.0, 708.0, 154.0, 16.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003681182861328125, -0.003560960292816162, -0.0034407377243041992, -0.0033205151557922363, -0.0032002925872802734, -0.0030800700187683105, -0.0029598474502563477, -0.0028396248817443848, -0.002719402313232422, -0.002599179744720459, -0.002478957176208496, -0.002358734607696533, -0.0022385120391845703, -0.0021182894706726074, -0.0019980669021606445, -0.0018778443336486816, -0.0017576217651367188, -0.0016373991966247559, -0.001517176628112793, -0.00139695405960083, -0.0012767314910888672, -0.0011565089225769043, -0.0010362863540649414, -0.0009160637855529785, -0.0007958412170410156, -0.0006756186485290527, -0.0005553960800170898, -0.00043517351150512695, -0.00031495094299316406, -0.00019472837448120117, -7.450580596923828e-05, 4.571676254272461e-05, 0.0001659393310546875, 0.0002861618995666504, 0.0004063844680786133, 0.0005266070365905762, 0.0006468296051025391, 0.000767052173614502, 0.0008872747421264648, 0.0010074973106384277, 0.0011277198791503906, 0.0012479424476623535, 0.0013681650161743164, 0.0014883875846862793, 0.0016086101531982422, 0.001728832721710205, 0.001849055290222168, 0.001969277858734131, 0.0020895004272460938, 0.0022097229957580566, 0.0023299455642700195, 0.0024501681327819824, 0.0025703907012939453, 0.002690613269805908, 0.002810835838317871, 0.002931058406829834, 0.003051280975341797, 0.0031715035438537598, 0.0032917261123657227, 0.0034119486808776855, 0.0035321712493896484, 0.0036523938179016113, 0.0037726163864135742, 0.003892838954925537, 0.0040130615234375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 9.0, 7.0, 16.0, 15.0, 23.0, 19.0, 37.0, 56.0, 81.0, 109.0, 164.0, 142.0, 108.0, 86.0, 42.0, 42.0, 19.0, 13.0, 9.0, 4.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05504005402326584, -0.05243833363056183, -0.04983661323785782, -0.04723489657044411, -0.0446331761777401, -0.04203145578503609, -0.039429739117622375, -0.036828018724918365, -0.034226298332214355, -0.031624577939510345, -0.029022859409451485, -0.026421140879392624, -0.023819420486688614, -0.021217700093984604, -0.018615981563925743, -0.016014263033866882, -0.013412542641162872, -0.010810823179781437, -0.008209103718400002, -0.005607384257018566, -0.0030056647956371307, -0.00040394533425569534, 0.00219777412712574, 0.004799492657184601, 0.007401213049888611, 0.010002932511270046, 0.012604651972651482, 0.015206371434032917, 0.017808090895414352, 0.020409811288118362, 0.023011529818177223, 0.025613248348236084, 0.028214968740940094, 0.030816689133644104, 0.033418409526348114, 0.036020126193761826, 0.038621846586465836, 0.041223566979169846, 0.04382528364658356, 0.04642700403928757, 0.04902872443199158, 0.05163044482469559, 0.0542321652173996, 0.05683388188481331, 0.05943560227751732, 0.06203732267022133, 0.06463903933763504, 0.06724075973033905, 0.06984248012304306, 0.07244420051574707, 0.07504592090845108, 0.07764764130115509, 0.0802493542432785, 0.08285107463598251, 0.08545279502868652, 0.08805451542139053, 0.09065623581409454, 0.09325795620679855, 0.09585967659950256, 0.09846139699220657, 0.10106311738491058, 0.103664830327034, 0.106266550719738, 0.10886827111244202, 0.11146999150514603]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 5.0, 5.0, 6.0, 7.0, 12.0, 5.0, 7.0, 11.0, 13.0, 13.0, 13.0, 23.0, 25.0, 22.0, 36.0, 46.0, 50.0, 39.0, 34.0, 37.0, 45.0, 40.0, 43.0, 47.0, 48.0, 41.0, 26.0, 27.0, 40.0, 35.0, 27.0, 24.0, 25.0, 34.0, 14.0, 16.0, 18.0, 4.0, 12.0, 10.0, 3.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03933930769562721, -0.038151662796735764, -0.03696402162313461, -0.035776376724243164, -0.034588731825351715, -0.033401090651750565, -0.032213445752859116, -0.031025802716612816, -0.029838159680366516, -0.028650516644120216, -0.027462871745228767, -0.026275228708982468, -0.025087585672736168, -0.023899942636489868, -0.02271229773759842, -0.02152465470135212, -0.02033700980246067, -0.01914936676621437, -0.017961721867322922, -0.016774078831076622, -0.015586435794830322, -0.014398791827261448, -0.013211147859692574, -0.012023504823446274, -0.0108358608558774, -0.009648216888308525, -0.008460573852062225, -0.007272929884493351, -0.006085286382585764, -0.004897642880678177, -0.0037099989131093025, -0.0025223558768630028, -0.0013347119092941284, -0.00014706829097121954, 0.0010405753273516893, 0.00222821906208992, 0.003415862563997507, 0.004603506065905094, 0.0057911500334739685, 0.006978793069720268, 0.008166437037289143, 0.009354081004858017, 0.010541724041104317, 0.011729368008673191, 0.012917011976242065, 0.014104655012488365, 0.01529229898005724, 0.016479942947626114, 0.017667585983872414, 0.018855229020118713, 0.020042873919010162, 0.021230516955256462, 0.022418159991502762, 0.02360580489039421, 0.02479344792664051, 0.02598109096288681, 0.02716873586177826, 0.02835637889802456, 0.029544023796916008, 0.030731666833162308, 0.03191931173205376, 0.03310695290565491, 0.034294597804546356, 0.035482242703437805, 0.036669883877038956]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 13.0, 12.0, 18.0, 31.0, 51.0, 85.0, 143.0, 193.0, 289.0, 448.0, 767.0, 1284.0, 2132.0, 3834.0, 7316.0, 14385.0, 29746.0, 64983.0, 150561.0, 301824.0, 256351.0, 114747.0, 50296.0, 23595.0, 11643.0, 5883.0, 3223.0, 1796.0, 1093.0, 620.0, 436.0, 252.0, 194.0, 109.0, 64.0, 52.0, 23.0, 20.0, 16.0, 10.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10736083984375, -0.1042795181274414, -0.10119819641113281, -0.09811687469482422, -0.09503555297851562, -0.09195423126220703, -0.08887290954589844, -0.08579158782958984, -0.08271026611328125, -0.07962894439697266, -0.07654762268066406, -0.07346630096435547, -0.07038497924804688, -0.06730365753173828, -0.06422233581542969, -0.061141014099121094, -0.0580596923828125, -0.054978370666503906, -0.05189704895019531, -0.04881572723388672, -0.045734405517578125, -0.04265308380126953, -0.03957176208496094, -0.036490440368652344, -0.03340911865234375, -0.030327796936035156, -0.027246475219726562, -0.02416515350341797, -0.021083831787109375, -0.01800251007080078, -0.014921188354492188, -0.011839866638183594, -0.008758544921875, -0.005677223205566406, -0.0025959014892578125, 0.00048542022705078125, 0.003566741943359375, 0.006648063659667969, 0.009729385375976562, 0.012810707092285156, 0.01589202880859375, 0.018973350524902344, 0.022054672241210938, 0.02513599395751953, 0.028217315673828125, 0.03129863739013672, 0.03437995910644531, 0.037461280822753906, 0.0405426025390625, 0.043623924255371094, 0.04670524597167969, 0.04978656768798828, 0.052867889404296875, 0.05594921112060547, 0.05903053283691406, 0.062111854553222656, 0.06519317626953125, 0.06827449798583984, 0.07135581970214844, 0.07443714141845703, 0.07751846313476562, 0.08059978485107422, 0.08368110656738281, 0.0867624282836914, 0.08984375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 3.0, 7.0, 10.0, 12.0, 14.0, 12.0, 15.0, 14.0, 24.0, 42.0, 40.0, 57.0, 44.0, 50.0, 47.0, 46.0, 52.0, 56.0, 52.0, 56.0, 38.0, 46.0, 47.0, 34.0, 36.0, 17.0, 23.0, 18.0, 24.0, 14.0, 19.0, 12.0, 3.0, 9.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04888916015625, -0.047446250915527344, -0.04600334167480469, -0.04456043243408203, -0.043117523193359375, -0.04167461395263672, -0.04023170471191406, -0.038788795471191406, -0.03734588623046875, -0.035902976989746094, -0.03446006774902344, -0.03301715850830078, -0.031574249267578125, -0.03013134002685547, -0.028688430786132812, -0.027245521545410156, -0.0258026123046875, -0.024359703063964844, -0.022916793823242188, -0.02147388458251953, -0.020030975341796875, -0.01858806610107422, -0.017145156860351562, -0.015702247619628906, -0.01425933837890625, -0.012816429138183594, -0.011373519897460938, -0.009930610656738281, -0.008487701416015625, -0.007044792175292969, -0.0056018829345703125, -0.004158973693847656, -0.002716064453125, -0.0012731552124023438, 0.0001697540283203125, 0.0016126632690429688, 0.003055572509765625, 0.004498481750488281, 0.0059413909912109375, 0.007384300231933594, 0.00882720947265625, 0.010270118713378906, 0.011713027954101562, 0.013155937194824219, 0.014598846435546875, 0.01604175567626953, 0.017484664916992188, 0.018927574157714844, 0.0203704833984375, 0.021813392639160156, 0.023256301879882812, 0.02469921112060547, 0.026142120361328125, 0.02758502960205078, 0.029027938842773438, 0.030470848083496094, 0.03191375732421875, 0.033356666564941406, 0.03479957580566406, 0.03624248504638672, 0.037685394287109375, 0.03912830352783203, 0.04057121276855469, 0.042014122009277344, 0.04345703125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 6.0, 1.0, 11.0, 8.0, 6.0, 7.0, 15.0, 20.0, 18.0, 19.0, 30.0, 24.0, 51.0, 52.0, 99.0, 174.0, 589.0, 4165.0, 53430.0, 655004.0, 312715.0, 19457.0, 1812.0, 348.0, 123.0, 60.0, 56.0, 45.0, 34.0, 31.0, 22.0, 21.0, 16.0, 16.0, 13.0, 6.0, 12.0, 9.0, 2.0, 5.0, 7.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.25244140625, -0.2430267333984375, -0.233612060546875, -0.2241973876953125, -0.21478271484375, -0.2053680419921875, -0.195953369140625, -0.1865386962890625, -0.1771240234375, -0.1677093505859375, -0.158294677734375, -0.1488800048828125, -0.13946533203125, -0.1300506591796875, -0.120635986328125, -0.1112213134765625, -0.101806640625, -0.0923919677734375, -0.082977294921875, -0.0735626220703125, -0.06414794921875, -0.0547332763671875, -0.045318603515625, -0.0359039306640625, -0.0264892578125, -0.0170745849609375, -0.007659912109375, 0.0017547607421875, 0.01116943359375, 0.0205841064453125, 0.029998779296875, 0.0394134521484375, 0.048828125, 0.0582427978515625, 0.067657470703125, 0.0770721435546875, 0.08648681640625, 0.0959014892578125, 0.105316162109375, 0.1147308349609375, 0.1241455078125, 0.1335601806640625, 0.142974853515625, 0.1523895263671875, 0.16180419921875, 0.1712188720703125, 0.180633544921875, 0.1900482177734375, 0.199462890625, 0.2088775634765625, 0.218292236328125, 0.2277069091796875, 0.23712158203125, 0.2465362548828125, 0.255950927734375, 0.2653656005859375, 0.2747802734375, 0.2841949462890625, 0.293609619140625, 0.3030242919921875, 0.31243896484375, 0.3218536376953125, 0.331268310546875, 0.3406829833984375, 0.35009765625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 5.0, 11.0, 9.0, 10.0, 18.0, 20.0, 20.0, 23.0, 30.0, 38.0, 27.0, 35.0, 31.0, 30.0, 54.0, 46.0, 41.0, 45.0, 44.0, 48.0, 47.0, 47.0, 45.0, 43.0, 33.0, 24.0, 26.0, 28.0, 22.0, 17.0, 13.0, 10.0, 9.0, 11.0, 9.0, 4.0, 5.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.036224365234375, -0.03518271446228027, -0.03414106369018555, -0.03309941291809082, -0.032057762145996094, -0.031016111373901367, -0.02997446060180664, -0.028932809829711914, -0.027891159057617188, -0.02684950828552246, -0.025807857513427734, -0.024766206741333008, -0.02372455596923828, -0.022682905197143555, -0.021641254425048828, -0.0205996036529541, -0.019557952880859375, -0.01851630210876465, -0.017474651336669922, -0.016433000564575195, -0.015391349792480469, -0.014349699020385742, -0.013308048248291016, -0.012266397476196289, -0.011224746704101562, -0.010183095932006836, -0.00914144515991211, -0.008099794387817383, -0.007058143615722656, -0.00601649284362793, -0.004974842071533203, -0.0039331912994384766, -0.00289154052734375, -0.0018498897552490234, -0.0008082389831542969, 0.0002334117889404297, 0.0012750625610351562, 0.002316713333129883, 0.0033583641052246094, 0.004400014877319336, 0.0054416656494140625, 0.006483316421508789, 0.007524967193603516, 0.008566617965698242, 0.009608268737792969, 0.010649919509887695, 0.011691570281982422, 0.012733221054077148, 0.013774871826171875, 0.014816522598266602, 0.015858173370361328, 0.016899824142456055, 0.01794147491455078, 0.018983125686645508, 0.020024776458740234, 0.02106642723083496, 0.022108078002929688, 0.023149728775024414, 0.02419137954711914, 0.025233030319213867, 0.026274681091308594, 0.02731633186340332, 0.028357982635498047, 0.029399633407592773, 0.0304412841796875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 7.0, 13.0, 16.0, 28.0, 51.0, 61.0, 73.0, 108.0, 144.0, 265.0, 363.0, 534.0, 833.0, 1217.0, 1909.0, 3061.0, 5174.0, 9030.0, 20707.0, 144954.0, 794478.0, 36340.0, 12199.0, 6419.0, 3844.0, 2270.0, 1469.0, 971.0, 659.0, 449.0, 279.0, 185.0, 132.0, 81.0, 80.0, 48.0, 24.0, 19.0, 21.0, 13.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.008209228515625, -0.007969260215759277, -0.007729291915893555, -0.007489323616027832, -0.007249355316162109, -0.007009387016296387, -0.006769418716430664, -0.006529450416564941, -0.006289482116699219, -0.006049513816833496, -0.0058095455169677734, -0.005569577217102051, -0.005329608917236328, -0.0050896406173706055, -0.004849672317504883, -0.00460970401763916, -0.0043697357177734375, -0.004129767417907715, -0.003889799118041992, -0.0036498308181762695, -0.003409862518310547, -0.0031698942184448242, -0.0029299259185791016, -0.002689957618713379, -0.0024499893188476562, -0.0022100210189819336, -0.001970052719116211, -0.0017300844192504883, -0.0014901161193847656, -0.001250147819519043, -0.0010101795196533203, -0.0007702112197875977, -0.000530242919921875, -0.00029027462005615234, -5.030632019042969e-05, 0.00018966197967529297, 0.0004296302795410156, 0.0006695985794067383, 0.0009095668792724609, 0.0011495351791381836, 0.0013895034790039062, 0.001629471778869629, 0.0018694400787353516, 0.0021094083786010742, 0.002349376678466797, 0.0025893449783325195, 0.002829313278198242, 0.003069281578063965, 0.0033092498779296875, 0.00354921817779541, 0.003789186477661133, 0.0040291547775268555, 0.004269123077392578, 0.004509091377258301, 0.0047490596771240234, 0.004989027976989746, 0.005228996276855469, 0.005468964576721191, 0.005708932876586914, 0.005948901176452637, 0.006188869476318359, 0.006428837776184082, 0.006668806076049805, 0.006908774375915527, 0.00714874267578125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 5.0, 4.0, 5.0, 7.0, 7.0, 2.0, 8.0, 22.0, 17.0, 23.0, 34.0, 44.0, 64.0, 75.0, 83.0, 90.0, 87.0, 83.0, 75.0, 52.0, 56.0, 43.0, 25.0, 15.0, 20.0, 9.0, 14.0, 6.0, 9.0, 2.0, 3.0, 9.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.67572021484375e-06, -6.4373016357421875e-06, -6.198883056640625e-06, -5.9604644775390625e-06, -5.7220458984375e-06, -5.4836273193359375e-06, -5.245208740234375e-06, -5.0067901611328125e-06, -4.76837158203125e-06, -4.5299530029296875e-06, -4.291534423828125e-06, -4.0531158447265625e-06, -3.814697265625e-06, -3.5762786865234375e-06, -3.337860107421875e-06, -3.0994415283203125e-06, -2.86102294921875e-06, -2.6226043701171875e-06, -2.384185791015625e-06, -2.1457672119140625e-06, -1.9073486328125e-06, -1.6689300537109375e-06, -1.430511474609375e-06, -1.1920928955078125e-06, -9.5367431640625e-07, -7.152557373046875e-07, -4.76837158203125e-07, -2.384185791015625e-07, 0.0, 2.384185791015625e-07, 4.76837158203125e-07, 7.152557373046875e-07, 9.5367431640625e-07, 1.1920928955078125e-06, 1.430511474609375e-06, 1.6689300537109375e-06, 1.9073486328125e-06, 2.1457672119140625e-06, 2.384185791015625e-06, 2.6226043701171875e-06, 2.86102294921875e-06, 3.0994415283203125e-06, 3.337860107421875e-06, 3.5762786865234375e-06, 3.814697265625e-06, 4.0531158447265625e-06, 4.291534423828125e-06, 4.5299530029296875e-06, 4.76837158203125e-06, 5.0067901611328125e-06, 5.245208740234375e-06, 5.4836273193359375e-06, 5.7220458984375e-06, 5.9604644775390625e-06, 6.198883056640625e-06, 6.4373016357421875e-06, 6.67572021484375e-06, 6.9141387939453125e-06, 7.152557373046875e-06, 7.3909759521484375e-06, 7.62939453125e-06, 7.867813110351562e-06, 8.106231689453125e-06, 8.344650268554688e-06, 8.58306884765625e-06]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 19.0, 5.0, 33.0, 117.0, 958.0, 11331.0, 1026657.0, 8426.0, 797.0, 109.0, 22.0, 10.0, 13.0, 9.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07012939453125, -0.06789970397949219, -0.06567001342773438, -0.06344032287597656, -0.06121063232421875, -0.05898094177246094, -0.056751251220703125, -0.05452156066894531, -0.0522918701171875, -0.05006217956542969, -0.047832489013671875, -0.04560279846191406, -0.04337310791015625, -0.04114341735839844, -0.038913726806640625, -0.03668403625488281, -0.034454345703125, -0.03222465515136719, -0.029994964599609375, -0.027765274047851562, -0.02553558349609375, -0.023305892944335938, -0.021076202392578125, -0.018846511840820312, -0.0166168212890625, -0.014387130737304688, -0.012157440185546875, -0.009927749633789062, -0.00769805908203125, -0.0054683685302734375, -0.003238677978515625, -0.0010089874267578125, 0.001220703125, 0.0034503936767578125, 0.005680084228515625, 0.007909774780273438, 0.01013946533203125, 0.012369155883789062, 0.014598846435546875, 0.016828536987304688, 0.0190582275390625, 0.021287918090820312, 0.023517608642578125, 0.025747299194335938, 0.02797698974609375, 0.030206680297851562, 0.032436370849609375, 0.03466606140136719, 0.036895751953125, 0.03912544250488281, 0.041355133056640625, 0.04358482360839844, 0.04581451416015625, 0.04804420471191406, 0.050273895263671875, 0.05250358581542969, 0.0547332763671875, 0.05696296691894531, 0.059192657470703125, 0.06142234802246094, 0.06365203857421875, 0.06588172912597656, 0.06811141967773438, 0.07034111022949219, 0.07257080078125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 8.0, 8.0, 5.0, 7.0, 12.0, 23.0, 153.0, 621.0, 77.0, 19.0, 6.0, 10.0, 2.0, 11.0, 2.0, 2.0, 6.0, 3.0, 1.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.006458282470703125, -0.006258726119995117, -0.006059169769287109, -0.0058596134185791016, -0.005660057067871094, -0.005460500717163086, -0.005260944366455078, -0.00506138801574707, -0.0048618316650390625, -0.004662275314331055, -0.004462718963623047, -0.004263162612915039, -0.004063606262207031, -0.0038640499114990234, -0.0036644935607910156, -0.003464937210083008, -0.003265380859375, -0.003065824508666992, -0.0028662681579589844, -0.0026667118072509766, -0.0024671554565429688, -0.002267599105834961, -0.002068042755126953, -0.0018684864044189453, -0.0016689300537109375, -0.0014693737030029297, -0.0012698173522949219, -0.001070261001586914, -0.0008707046508789062, -0.0006711483001708984, -0.0004715919494628906, -0.0002720355987548828, -7.2479248046875e-05, 0.0001270771026611328, 0.0003266334533691406, 0.0005261898040771484, 0.0007257461547851562, 0.0009253025054931641, 0.0011248588562011719, 0.0013244152069091797, 0.0015239715576171875, 0.0017235279083251953, 0.0019230842590332031, 0.002122640609741211, 0.0023221969604492188, 0.0025217533111572266, 0.0027213096618652344, 0.002920866012573242, 0.00312042236328125, 0.003319978713989258, 0.0035195350646972656, 0.0037190914154052734, 0.003918647766113281, 0.004118204116821289, 0.004317760467529297, 0.004517316818237305, 0.0047168731689453125, 0.00491642951965332, 0.005115985870361328, 0.005315542221069336, 0.005515098571777344, 0.0057146549224853516, 0.005914211273193359, 0.006113767623901367, 0.006313323974609375]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 52.0, 694.0, 260.0, 11.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04605269059538841, -0.029511824250221252, -0.012970957905054092, 0.0035699084401130676, 0.020110774785280228, 0.036651644855737686, 0.05319250747561455, 0.06973336637020111, 0.08627423644065857, 0.10281510651111603, 0.11935596913099289, 0.13589683175086975, 0.1524377018213272, 0.16897857189178467, 0.18551942706108093, 0.2020602971315384, 0.21860116720199585, 0.2351420372724533, 0.25168290734291077, 0.26822376251220703, 0.2847646474838257, 0.30130550265312195, 0.3178463578224182, 0.33438724279403687, 0.35092809796333313, 0.3674689531326294, 0.38400983810424805, 0.4005506932735443, 0.4170915484428406, 0.43363243341445923, 0.4501732885837555, 0.46671414375305176, 0.4832550287246704, 0.4997958838939667, 0.5163367390632629, 0.5328776240348816, 0.5494185090065002, 0.5659593343734741, 0.5825002193450928, 0.5990411043167114, 0.6155819892883301, 0.6321228742599487, 0.6486636996269226, 0.6652045845985413, 0.6817454695701599, 0.6982862949371338, 0.7148271799087524, 0.7313680648803711, 0.747908890247345, 0.7644497752189636, 0.7809906005859375, 0.7975314855575562, 0.8140723705291748, 0.8306132555007935, 0.8471540808677673, 0.863694965839386, 0.8802357912063599, 0.8967766761779785, 0.9133175015449524, 0.929858386516571, 0.9463992714881897, 0.9629400968551636, 0.9794809818267822, 0.9960218667984009, 1.0125627517700195]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 5.0, 10.0, 9.0, 8.0, 6.0, 16.0, 14.0, 13.0, 18.0, 32.0, 21.0, 24.0, 30.0, 39.0, 33.0, 34.0, 36.0, 39.0, 37.0, 37.0, 52.0, 46.0, 42.0, 42.0, 28.0, 35.0, 36.0, 30.0, 41.0, 33.0, 27.0, 11.0, 27.0, 10.0, 16.0, 15.0, 7.0, 7.0, 8.0, 3.0, 3.0, 4.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.04708774387836456, -0.04564499482512474, -0.04420224204659462, -0.0427594929933548, -0.041316743940114975, -0.03987399488687515, -0.03843124210834503, -0.03698849305510521, -0.03554574400186539, -0.034102994948625565, -0.032660242170095444, -0.03121749311685562, -0.0297747440636158, -0.028331993147730827, -0.026889242231845856, -0.025446493178606033, -0.02400374226272106, -0.02256099134683609, -0.021118242293596268, -0.019675491377711296, -0.018232742324471474, -0.016789991408586502, -0.015347241424024105, -0.013904491439461708, -0.012461741454899311, -0.011018991470336914, -0.009576241485774517, -0.00813349150121212, -0.006690741050988436, -0.005247991066426039, -0.0038052406162023544, -0.0023624906316399574, -0.0009197406470775604, 0.0005230094539001584, 0.0019657595548778772, 0.003408509772270918, 0.004851259756833315, 0.006294009741395712, 0.007736760191619396, 0.009179510176181793, 0.01062226016074419, 0.012065010145306587, 0.013507760129868984, 0.014950510114431381, 0.016393261030316353, 0.017836010083556175, 0.019278760999441147, 0.02072151005268097, 0.02216426096856594, 0.023607011884450912, 0.025049760937690735, 0.026492511853575706, 0.02793526090681553, 0.0293780118227005, 0.030820760875940323, 0.032263509929180145, 0.033706262707710266, 0.03514901176095009, 0.03659176453948021, 0.03803451359272003, 0.039477262645959854, 0.040920011699199677, 0.0423627644777298, 0.04380551353096962, 0.04524826258420944]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 11.0, 9.0, 13.0, 14.0, 12.0, 30.0, 18.0, 44.0, 40.0, 45.0, 53.0, 79.0, 76.0, 129.0, 159.0, 228.0, 290.0, 421.0, 625.0, 988.0, 1594.0, 3446.0, 24038.0, 1552035.0, 2557620.0, 42682.0, 4087.0, 1928.0, 1080.0, 655.0, 451.0, 337.0, 255.0, 176.0, 134.0, 101.0, 74.0, 57.0, 54.0, 43.0, 32.0, 23.0, 23.0, 19.0, 15.0, 10.0, 3.0, 6.0, 3.0, 4.0, 4.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0838623046875, -0.08107566833496094, -0.07828903198242188, -0.07550239562988281, -0.07271575927734375, -0.06992912292480469, -0.06714248657226562, -0.06435585021972656, -0.0615692138671875, -0.05878257751464844, -0.055995941162109375, -0.05320930480957031, -0.05042266845703125, -0.04763603210449219, -0.044849395751953125, -0.04206275939941406, -0.039276123046875, -0.03648948669433594, -0.033702850341796875, -0.030916213989257812, -0.02812957763671875, -0.025342941284179688, -0.022556304931640625, -0.019769668579101562, -0.0169830322265625, -0.014196395874023438, -0.011409759521484375, -0.008623123168945312, -0.00583648681640625, -0.0030498504638671875, -0.000263214111328125, 0.0025234222412109375, 0.00531005859375, 0.008096694946289062, 0.010883331298828125, 0.013669967651367188, 0.01645660400390625, 0.019243240356445312, 0.022029876708984375, 0.024816513061523438, 0.0276031494140625, 0.030389785766601562, 0.033176422119140625, 0.03596305847167969, 0.03874969482421875, 0.04153633117675781, 0.044322967529296875, 0.04710960388183594, 0.049896240234375, 0.05268287658691406, 0.055469512939453125, 0.05825614929199219, 0.06104278564453125, 0.06382942199707031, 0.06661605834960938, 0.06940269470214844, 0.0721893310546875, 0.07497596740722656, 0.07776260375976562, 0.08054924011230469, 0.08333587646484375, 0.08612251281738281, 0.08890914916992188, 0.09169578552246094, 0.094482421875]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 5.0, 6.0, 21.0, 15.0, 18.0, 24.0, 20.0, 21.0, 23.0, 27.0, 29.0, 31.0, 36.0, 44.0, 44.0, 36.0, 52.0, 54.0, 44.0, 37.0, 49.0, 36.0, 37.0, 38.0, 29.0, 37.0, 37.0, 20.0, 27.0, 17.0, 17.0, 12.0, 11.0, 4.0, 5.0, 7.0, 3.0, 5.0, 2.0, 1.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032073974609375, -0.031026363372802734, -0.02997875213623047, -0.028931140899658203, -0.027883529663085938, -0.026835918426513672, -0.025788307189941406, -0.02474069595336914, -0.023693084716796875, -0.02264547348022461, -0.021597862243652344, -0.020550251007080078, -0.019502639770507812, -0.018455028533935547, -0.01740741729736328, -0.016359806060791016, -0.01531219482421875, -0.014264583587646484, -0.013216972351074219, -0.012169361114501953, -0.011121749877929688, -0.010074138641357422, -0.009026527404785156, -0.00797891616821289, -0.006931304931640625, -0.005883693695068359, -0.004836082458496094, -0.003788471221923828, -0.0027408599853515625, -0.0016932487487792969, -0.0006456375122070312, 0.0004019737243652344, 0.0014495849609375, 0.0024971961975097656, 0.0035448074340820312, 0.004592418670654297, 0.0056400299072265625, 0.006687641143798828, 0.007735252380371094, 0.00878286361694336, 0.009830474853515625, 0.01087808609008789, 0.011925697326660156, 0.012973308563232422, 0.014020919799804688, 0.015068531036376953, 0.01611614227294922, 0.017163753509521484, 0.01821136474609375, 0.019258975982666016, 0.02030658721923828, 0.021354198455810547, 0.022401809692382812, 0.023449420928955078, 0.024497032165527344, 0.02554464340209961, 0.026592254638671875, 0.02763986587524414, 0.028687477111816406, 0.029735088348388672, 0.030782699584960938, 0.0318303108215332, 0.03287792205810547, 0.033925533294677734, 0.03497314453125]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 13.0, 13.0, 25.0, 21.0, 50.0, 62.0, 138.0, 603.0, 87092.0, 4105012.0, 991.0, 141.0, 44.0, 23.0, 14.0, 3.0, 9.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9846267700195312, -0.9565582275390625, -0.9284896850585938, -0.900421142578125, -0.8723526000976562, -0.8442840576171875, -0.8162155151367188, -0.78814697265625, -0.7600784301757812, -0.7320098876953125, -0.7039413452148438, -0.675872802734375, -0.6478042602539062, -0.6197357177734375, -0.5916671752929688, -0.5635986328125, -0.5355300903320312, -0.5074615478515625, -0.47939300537109375, -0.451324462890625, -0.42325592041015625, -0.3951873779296875, -0.36711883544921875, -0.33905029296875, -0.31098175048828125, -0.2829132080078125, -0.25484466552734375, -0.226776123046875, -0.19870758056640625, -0.1706390380859375, -0.14257049560546875, -0.114501953125, -0.08643341064453125, -0.0583648681640625, -0.03029632568359375, -0.002227783203125, 0.02584075927734375, 0.0539093017578125, 0.08197784423828125, 0.11004638671875, 0.13811492919921875, 0.1661834716796875, 0.19425201416015625, 0.222320556640625, 0.25038909912109375, 0.2784576416015625, 0.30652618408203125, 0.3345947265625, 0.36266326904296875, 0.3907318115234375, 0.41880035400390625, 0.446868896484375, 0.47493743896484375, 0.5030059814453125, 0.5310745239257812, 0.55914306640625, 0.5872116088867188, 0.6152801513671875, 0.6433486938476562, 0.671417236328125, 0.6994857788085938, 0.7275543212890625, 0.7556228637695312, 0.78369140625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 11.0, 5.0, 18.0, 35.0, 71.0, 329.0, 1210.0, 1457.0, 541.0, 157.0, 80.0, 50.0, 18.0, 23.0, 19.0, 14.0, 6.0, 4.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0273895263671875, -0.02630162239074707, -0.02521371841430664, -0.02412581443786621, -0.02303791046142578, -0.02195000648498535, -0.020862102508544922, -0.019774198532104492, -0.018686294555664062, -0.017598390579223633, -0.016510486602783203, -0.015422582626342773, -0.014334678649902344, -0.013246774673461914, -0.012158870697021484, -0.011070966720581055, -0.009983062744140625, -0.008895158767700195, -0.007807254791259766, -0.006719350814819336, -0.005631446838378906, -0.0045435428619384766, -0.003455638885498047, -0.002367734909057617, -0.0012798309326171875, -0.0001919269561767578, 0.0008959770202636719, 0.0019838809967041016, 0.0030717849731445312, 0.004159688949584961, 0.005247592926025391, 0.00633549690246582, 0.00742340087890625, 0.00851130485534668, 0.00959920883178711, 0.010687112808227539, 0.011775016784667969, 0.012862920761108398, 0.013950824737548828, 0.015038728713989258, 0.016126632690429688, 0.017214536666870117, 0.018302440643310547, 0.019390344619750977, 0.020478248596191406, 0.021566152572631836, 0.022654056549072266, 0.023741960525512695, 0.024829864501953125, 0.025917768478393555, 0.027005672454833984, 0.028093576431274414, 0.029181480407714844, 0.030269384384155273, 0.0313572883605957, 0.03244519233703613, 0.03353309631347656, 0.03462100028991699, 0.03570890426635742, 0.03679680824279785, 0.03788471221923828, 0.03897261619567871, 0.04006052017211914, 0.04114842414855957, 0.042236328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 8.0, 15.0, 13.0, 32.0, 53.0, 68.0, 85.0, 127.0, 126.0, 116.0, 101.0, 88.0, 63.0, 33.0, 26.0, 16.0, 10.0, 8.0, 8.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02572374790906906, -0.024058040231466293, -0.022392334416508675, -0.020726626738905907, -0.019060920923948288, -0.01739521324634552, -0.015729505568742752, -0.014063798822462559, -0.012398092076182365, -0.010732385329902172, -0.009066678583621979, -0.007400970906019211, -0.0057352641597390175, -0.004069557413458824, -0.002403849735856056, -0.0007381429895758629, 0.0009275637567043304, 0.0025932707358151674, 0.004258977714926004, 0.005924684926867485, 0.007590391673147678, 0.009256098419427872, 0.01092180609703064, 0.012587512843310833, 0.014253219589591026, 0.015918927267193794, 0.017584633082151413, 0.01925034075975418, 0.02091604843735695, 0.022581754252314568, 0.024247461929917336, 0.025913167744874954, 0.027578875422477722, 0.02924458310008049, 0.03091028891503811, 0.03257599472999573, 0.034241702407598495, 0.03590741008520126, 0.03757311776280403, 0.0392388254404068, 0.04090452939271927, 0.04257023707032204, 0.044235944747924805, 0.045901648700237274, 0.04756735637784004, 0.04923306405544281, 0.05089877173304558, 0.052564479410648346, 0.054230187088251114, 0.05589589476585388, 0.05756160244345665, 0.05922731012105942, 0.06089301407337189, 0.06255872547626495, 0.06422442942857742, 0.06589013338088989, 0.06755584478378296, 0.06922154873609543, 0.0708872601389885, 0.07255296409130096, 0.07421867549419403, 0.0758843794465065, 0.07755008339881897, 0.07921579480171204, 0.0808814987540245]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 2.0, 5.0, 3.0, 2.0, 6.0, 8.0, 10.0, 12.0, 8.0, 13.0, 25.0, 24.0, 15.0, 15.0, 29.0, 25.0, 24.0, 30.0, 30.0, 37.0, 32.0, 44.0, 37.0, 44.0, 38.0, 40.0, 37.0, 41.0, 31.0, 35.0, 38.0, 31.0, 37.0, 22.0, 30.0, 23.0, 14.0, 14.0, 18.0, 13.0, 11.0, 7.0, 8.0, 7.0, 7.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03306492790579796, -0.03201434761285782, -0.030963771045207977, -0.029913192614912987, -0.028862614184617996, -0.027812035754323006, -0.026761457324028015, -0.025710877031087875, -0.024660300463438034, -0.023609722033143044, -0.022559143602848053, -0.021508565172553062, -0.020457986742258072, -0.01940740831196308, -0.01835682988166809, -0.01730624958872795, -0.01625567115843296, -0.01520509272813797, -0.01415451429784298, -0.013103935867547989, -0.012053357437252998, -0.011002779006958008, -0.009952199645340443, -0.008901621215045452, -0.007851042784750462, -0.006800464354455471, -0.0057498859241604805, -0.004699307028204203, -0.003648728597909212, -0.0025981501676142216, -0.0015475712716579437, -0.0004969928413629532, 0.0005535855889320374, 0.0016041641356423497, 0.002654742682352662, 0.0037053213454782963, 0.004755899775773287, 0.005806478206068277, 0.006857057102024555, 0.007907635532319546, 0.008958213962614536, 0.010008792392909527, 0.011059370823204517, 0.012109950184822083, 0.013160528615117073, 0.014211107045412064, 0.015261685475707054, 0.016312263906002045, 0.017362842336297035, 0.018413420766592026, 0.019463999196887016, 0.020514577627182007, 0.021565156057476997, 0.022615734487771988, 0.023666314780712128, 0.02471689134836197, 0.02576747164130211, 0.0268180500715971, 0.02786862850189209, 0.02891920693218708, 0.02996978536248207, 0.03102036379277706, 0.03207094222307205, 0.03312152251601219, 0.03417209908366203]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 15.0, 19.0, 23.0, 35.0, 54.0, 93.0, 150.0, 200.0, 309.0, 446.0, 693.0, 1063.0, 1705.0, 2751.0, 4493.0, 6865.0, 11271.0, 18864.0, 32391.0, 58652.0, 113452.0, 234364.0, 268383.0, 133537.0, 67076.0, 37026.0, 20966.0, 12832.0, 7671.0, 4772.0, 3012.0, 1906.0, 1225.0, 752.0, 498.0, 346.0, 219.0, 142.0, 104.0, 60.0, 42.0, 28.0, 9.0, 18.0, 10.0, 3.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0186614990234375, -0.018097877502441406, -0.017534255981445312, -0.01697063446044922, -0.016407012939453125, -0.01584339141845703, -0.015279769897460938, -0.014716148376464844, -0.01415252685546875, -0.013588905334472656, -0.013025283813476562, -0.012461662292480469, -0.011898040771484375, -0.011334419250488281, -0.010770797729492188, -0.010207176208496094, -0.0096435546875, -0.009079933166503906, -0.008516311645507812, -0.007952690124511719, -0.007389068603515625, -0.006825447082519531, -0.0062618255615234375, -0.005698204040527344, -0.00513458251953125, -0.004570960998535156, -0.0040073394775390625, -0.0034437179565429688, -0.002880096435546875, -0.0023164749145507812, -0.0017528533935546875, -0.0011892318725585938, -0.0006256103515625, -6.198883056640625e-05, 0.0005016326904296875, 0.0010652542114257812, 0.001628875732421875, 0.0021924972534179688, 0.0027561187744140625, 0.0033197402954101562, 0.00388336181640625, 0.004446983337402344, 0.0050106048583984375, 0.005574226379394531, 0.006137847900390625, 0.006701469421386719, 0.0072650909423828125, 0.007828712463378906, 0.008392333984375, 0.008955955505371094, 0.009519577026367188, 0.010083198547363281, 0.010646820068359375, 0.011210441589355469, 0.011774063110351562, 0.012337684631347656, 0.01290130615234375, 0.013464927673339844, 0.014028549194335938, 0.014592170715332031, 0.015155792236328125, 0.01571941375732422, 0.016283035278320312, 0.016846656799316406, 0.0174102783203125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 9.0, 8.0, 8.0, 9.0, 9.0, 9.0, 26.0, 26.0, 20.0, 21.0, 37.0, 30.0, 35.0, 41.0, 30.0, 44.0, 41.0, 43.0, 31.0, 43.0, 38.0, 52.0, 49.0, 32.0, 40.0, 33.0, 31.0, 31.0, 25.0, 22.0, 24.0, 23.0, 8.0, 13.0, 8.0, 10.0, 7.0, 10.0, 3.0, 2.0, 2.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.027801513671875, -0.02690410614013672, -0.026006698608398438, -0.025109291076660156, -0.024211883544921875, -0.023314476013183594, -0.022417068481445312, -0.02151966094970703, -0.02062225341796875, -0.01972484588623047, -0.018827438354492188, -0.017930030822753906, -0.017032623291015625, -0.016135215759277344, -0.015237808227539062, -0.014340400695800781, -0.0134429931640625, -0.012545585632324219, -0.011648178100585938, -0.010750770568847656, -0.009853363037109375, -0.008955955505371094, -0.008058547973632812, -0.007161140441894531, -0.00626373291015625, -0.005366325378417969, -0.0044689178466796875, -0.0035715103149414062, -0.002674102783203125, -0.0017766952514648438, -0.0008792877197265625, 1.811981201171875e-05, 0.00091552734375, 0.0018129348754882812, 0.0027103424072265625, 0.0036077499389648438, 0.004505157470703125, 0.005402565002441406, 0.0062999725341796875, 0.007197380065917969, 0.00809478759765625, 0.008992195129394531, 0.009889602661132812, 0.010787010192871094, 0.011684417724609375, 0.012581825256347656, 0.013479232788085938, 0.014376640319824219, 0.0152740478515625, 0.01617145538330078, 0.017068862915039062, 0.017966270446777344, 0.018863677978515625, 0.019761085510253906, 0.020658493041992188, 0.02155590057373047, 0.02245330810546875, 0.02335071563720703, 0.024248123168945312, 0.025145530700683594, 0.026042938232421875, 0.026940345764160156, 0.027837753295898438, 0.02873516082763672, 0.029632568359375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 10.0, 9.0, 18.0, 30.0, 25.0, 55.0, 66.0, 89.0, 146.0, 259.0, 359.0, 531.0, 781.0, 1291.0, 2031.0, 3220.0, 5233.0, 8700.0, 14757.0, 25245.0, 46871.0, 97593.0, 266498.0, 334884.0, 116287.0, 53633.0, 28641.0, 16182.0, 9669.0, 5792.0, 3499.0, 2175.0, 1387.0, 866.0, 581.0, 351.0, 266.0, 164.0, 118.0, 80.0, 53.0, 36.0, 29.0, 15.0, 9.0, 6.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.019500732421875, -0.01891160011291504, -0.018322467803955078, -0.017733335494995117, -0.017144203186035156, -0.016555070877075195, -0.015965938568115234, -0.015376806259155273, -0.014787673950195312, -0.014198541641235352, -0.01360940933227539, -0.01302027702331543, -0.012431144714355469, -0.011842012405395508, -0.011252880096435547, -0.010663747787475586, -0.010074615478515625, -0.009485483169555664, -0.008896350860595703, -0.008307218551635742, -0.007718086242675781, -0.00712895393371582, -0.006539821624755859, -0.0059506893157958984, -0.0053615570068359375, -0.0047724246978759766, -0.004183292388916016, -0.0035941600799560547, -0.0030050277709960938, -0.002415895462036133, -0.0018267631530761719, -0.001237630844116211, -0.00064849853515625, -5.936622619628906e-05, 0.0005297660827636719, 0.0011188983917236328, 0.0017080307006835938, 0.0022971630096435547, 0.0028862953186035156, 0.0034754276275634766, 0.0040645599365234375, 0.0046536922454833984, 0.005242824554443359, 0.00583195686340332, 0.006421089172363281, 0.007010221481323242, 0.007599353790283203, 0.008188486099243164, 0.008777618408203125, 0.009366750717163086, 0.009955883026123047, 0.010545015335083008, 0.011134147644042969, 0.01172327995300293, 0.01231241226196289, 0.012901544570922852, 0.013490676879882812, 0.014079809188842773, 0.014668941497802734, 0.015258073806762695, 0.015847206115722656, 0.016436338424682617, 0.017025470733642578, 0.01761460304260254, 0.0182037353515625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 9.0, 5.0, 4.0, 11.0, 7.0, 14.0, 18.0, 20.0, 12.0, 24.0, 30.0, 25.0, 31.0, 28.0, 42.0, 35.0, 52.0, 41.0, 49.0, 41.0, 38.0, 38.0, 54.0, 40.0, 37.0, 38.0, 41.0, 37.0, 42.0, 21.0, 23.0, 19.0, 19.0, 10.0, 12.0, 13.0, 7.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0213165283203125, -0.020636796951293945, -0.01995706558227539, -0.019277334213256836, -0.01859760284423828, -0.017917871475219727, -0.017238140106201172, -0.016558408737182617, -0.015878677368164062, -0.015198945999145508, -0.014519214630126953, -0.013839483261108398, -0.013159751892089844, -0.012480020523071289, -0.011800289154052734, -0.01112055778503418, -0.010440826416015625, -0.00976109504699707, -0.009081363677978516, -0.008401632308959961, -0.007721900939941406, -0.0070421695709228516, -0.006362438201904297, -0.005682706832885742, -0.0050029754638671875, -0.004323244094848633, -0.003643512725830078, -0.0029637813568115234, -0.0022840499877929688, -0.001604318618774414, -0.0009245872497558594, -0.0002448558807373047, 0.00043487548828125, 0.0011146068572998047, 0.0017943382263183594, 0.002474069595336914, 0.0031538009643554688, 0.0038335323333740234, 0.004513263702392578, 0.005192995071411133, 0.0058727264404296875, 0.006552457809448242, 0.007232189178466797, 0.007911920547485352, 0.008591651916503906, 0.009271383285522461, 0.009951114654541016, 0.01063084602355957, 0.011310577392578125, 0.01199030876159668, 0.012670040130615234, 0.013349771499633789, 0.014029502868652344, 0.014709234237670898, 0.015388965606689453, 0.016068696975708008, 0.016748428344726562, 0.017428159713745117, 0.018107891082763672, 0.018787622451782227, 0.01946735382080078, 0.020147085189819336, 0.02082681655883789, 0.021506547927856445, 0.022186279296875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 5.0, 1.0, 2.0, 3.0, 8.0, 9.0, 17.0, 16.0, 26.0, 40.0, 42.0, 65.0, 110.0, 153.0, 235.0, 355.0, 513.0, 787.0, 1109.0, 1827.0, 2839.0, 4633.0, 7606.0, 13739.0, 27111.0, 60904.0, 255980.0, 519455.0, 78732.0, 32647.0, 16380.0, 8895.0, 5296.0, 3230.0, 1955.0, 1258.0, 802.0, 566.0, 352.0, 246.0, 178.0, 140.0, 92.0, 62.0, 41.0, 30.0, 22.0, 16.0, 13.0, 7.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0027618408203125, -0.0026701688766479492, -0.0025784969329833984, -0.0024868249893188477, -0.002395153045654297, -0.002303481101989746, -0.0022118091583251953, -0.0021201372146606445, -0.0020284652709960938, -0.001936793327331543, -0.0018451213836669922, -0.0017534494400024414, -0.0016617774963378906, -0.0015701055526733398, -0.001478433609008789, -0.0013867616653442383, -0.0012950897216796875, -0.0012034177780151367, -0.001111745834350586, -0.0010200738906860352, -0.0009284019470214844, -0.0008367300033569336, -0.0007450580596923828, -0.000653386116027832, -0.0005617141723632812, -0.00047004222869873047, -0.0003783702850341797, -0.0002866983413696289, -0.00019502639770507812, -0.00010335445404052734, -1.1682510375976562e-05, 7.998943328857422e-05, 0.000171661376953125, 0.0002633333206176758, 0.00035500526428222656, 0.00044667720794677734, 0.0005383491516113281, 0.0006300210952758789, 0.0007216930389404297, 0.0008133649826049805, 0.0009050369262695312, 0.000996708869934082, 0.0010883808135986328, 0.0011800527572631836, 0.0012717247009277344, 0.0013633966445922852, 0.001455068588256836, 0.0015467405319213867, 0.0016384124755859375, 0.0017300844192504883, 0.001821756362915039, 0.0019134283065795898, 0.0020051002502441406, 0.0020967721939086914, 0.002188444137573242, 0.002280116081237793, 0.0023717880249023438, 0.0024634599685668945, 0.0025551319122314453, 0.002646803855895996, 0.002738475799560547, 0.0028301477432250977, 0.0029218196868896484, 0.0030134916305541992, 0.00310516357421875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 5.0, 5.0, 8.0, 13.0, 13.0, 12.0, 14.0, 28.0, 22.0, 75.0, 132.0, 204.0, 169.0, 97.0, 65.0, 25.0, 25.0, 17.0, 12.0, 11.0, 10.0, 5.0, 3.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.128715515136719e-05, -6.872136145830154e-05, -6.61555677652359e-05, -6.358977407217026e-05, -6.1023980379104614e-05, -5.845818668603897e-05, -5.589239299297333e-05, -5.3326599299907684e-05, -5.076080560684204e-05, -4.81950119137764e-05, -4.5629218220710754e-05, -4.306342452764511e-05, -4.049763083457947e-05, -3.7931837141513824e-05, -3.536604344844818e-05, -3.280024975538254e-05, -3.0234456062316895e-05, -2.766866236925125e-05, -2.5102868676185608e-05, -2.2537074983119965e-05, -1.997128129005432e-05, -1.7405487596988678e-05, -1.4839693903923035e-05, -1.2273900210857391e-05, -9.708106517791748e-06, -7.142312824726105e-06, -4.5765191316604614e-06, -2.010725438594818e-06, 5.550682544708252e-07, 3.1208619475364685e-06, 5.686655640602112e-06, 8.252449333667755e-06, 1.0818243026733398e-05, 1.3384036719799042e-05, 1.5949830412864685e-05, 1.851562410593033e-05, 2.108141779899597e-05, 2.3647211492061615e-05, 2.6213005185127258e-05, 2.87787988781929e-05, 3.1344592571258545e-05, 3.391038626432419e-05, 3.647617995738983e-05, 3.9041973650455475e-05, 4.160776734352112e-05, 4.417356103658676e-05, 4.6739354729652405e-05, 4.930514842271805e-05, 5.187094211578369e-05, 5.4436735808849335e-05, 5.700252950191498e-05, 5.956832319498062e-05, 6.213411688804626e-05, 6.469991058111191e-05, 6.726570427417755e-05, 6.98314979672432e-05, 7.239729166030884e-05, 7.496308535337448e-05, 7.752887904644012e-05, 8.009467273950577e-05, 8.266046643257141e-05, 8.522626012563705e-05, 8.77920538187027e-05, 9.035784751176834e-05, 9.292364120483398e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 2.0, 4.0, 7.0, 9.0, 15.0, 19.0, 24.0, 24.0, 52.0, 70.0, 312.0, 2638.0, 108624.0, 927910.0, 7868.0, 631.0, 113.0, 61.0, 34.0, 27.0, 24.0, 15.0, 13.0, 7.0, 8.0, 4.0, 7.0, 2.0, 3.0, 3.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0191802978515625, -0.018619298934936523, -0.018058300018310547, -0.01749730110168457, -0.016936302185058594, -0.016375303268432617, -0.01581430435180664, -0.015253305435180664, -0.014692306518554688, -0.014131307601928711, -0.013570308685302734, -0.013009309768676758, -0.012448310852050781, -0.011887311935424805, -0.011326313018798828, -0.010765314102172852, -0.010204315185546875, -0.009643316268920898, -0.009082317352294922, -0.008521318435668945, -0.007960319519042969, -0.007399320602416992, -0.006838321685791016, -0.006277322769165039, -0.0057163238525390625, -0.005155324935913086, -0.004594326019287109, -0.004033327102661133, -0.0034723281860351562, -0.0029113292694091797, -0.002350330352783203, -0.0017893314361572266, -0.00122833251953125, -0.0006673336029052734, -0.00010633468627929688, 0.0004546642303466797, 0.0010156631469726562, 0.0015766620635986328, 0.0021376609802246094, 0.002698659896850586, 0.0032596588134765625, 0.003820657730102539, 0.004381656646728516, 0.004942655563354492, 0.005503654479980469, 0.006064653396606445, 0.006625652313232422, 0.0071866512298583984, 0.007747650146484375, 0.008308649063110352, 0.008869647979736328, 0.009430646896362305, 0.009991645812988281, 0.010552644729614258, 0.011113643646240234, 0.011674642562866211, 0.012235641479492188, 0.012796640396118164, 0.01335763931274414, 0.013918638229370117, 0.014479637145996094, 0.01504063606262207, 0.015601634979248047, 0.016162633895874023, 0.0167236328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 9.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 2.0, 9.0, 5.0, 14.0, 14.0, 16.0, 25.0, 41.0, 52.0, 92.0, 151.0, 170.0, 123.0, 93.0, 50.0, 39.0, 21.0, 20.0, 19.0, 6.0, 5.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008416175842285156, -0.0008129552006721497, -0.0007842928171157837, -0.0007556304335594177, -0.0007269680500030518, -0.0006983056664466858, -0.0006696432828903198, -0.0006409808993339539, -0.0006123185157775879, -0.0005836561322212219, -0.000554993748664856, -0.00052633136510849, -0.000497668981552124, -0.00046900659799575806, -0.0004403442144393921, -0.0004116818308830261, -0.00038301944732666016, -0.0003543570637702942, -0.0003256946802139282, -0.00029703229665756226, -0.0002683699131011963, -0.00023970752954483032, -0.00021104514598846436, -0.0001823827624320984, -0.00015372037887573242, -0.00012505799531936646, -9.639561176300049e-05, -6.773322820663452e-05, -3.9070844650268555e-05, -1.0408461093902588e-05, 1.825392246246338e-05, 4.6916306018829346e-05, 7.557868957519531e-05, 0.00010424107313156128, 0.00013290345668792725, 0.0001615658402442932, 0.00019022822380065918, 0.00021889060735702515, 0.0002475529909133911, 0.0002762153744697571, 0.00030487775802612305, 0.000333540141582489, 0.000362202525138855, 0.00039086490869522095, 0.0004195272922515869, 0.0004481896758079529, 0.00047685205936431885, 0.0005055144429206848, 0.0005341768264770508, 0.0005628392100334167, 0.0005915015935897827, 0.0006201639771461487, 0.0006488263607025146, 0.0006774887442588806, 0.0007061511278152466, 0.0007348135113716125, 0.0007634758949279785, 0.0007921382784843445, 0.0008208006620407104, 0.0008494630455970764, 0.0008781254291534424, 0.0009067878127098083, 0.0009354501962661743, 0.0009641125798225403, 0.0009927749633789062]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 29.0, 89.0, 245.0, 323.0, 214.0, 78.0, 19.0, 10.0, 5.0, 1.0, 1.0], "bins": [-0.2711053192615509, -0.2662927806377411, -0.2614802420139313, -0.25666770339012146, -0.25185516476631165, -0.24704262614250183, -0.24223008751869202, -0.2374175488948822, -0.2326050102710724, -0.22779247164726257, -0.22297993302345276, -0.21816739439964294, -0.21335485577583313, -0.20854231715202332, -0.2037297785282135, -0.1989172399044037, -0.19410470128059387, -0.18929216265678406, -0.18447962403297424, -0.17966708540916443, -0.17485454678535461, -0.1700420081615448, -0.16522946953773499, -0.16041693091392517, -0.15560440719127655, -0.15079186856746674, -0.14597932994365692, -0.1411667913198471, -0.1363542526960373, -0.13154171407222748, -0.12672917544841766, -0.12191663682460785, -0.11710409820079803, -0.11229155957698822, -0.1074790209531784, -0.10266648232936859, -0.09785394370555878, -0.09304140508174896, -0.08822886645793915, -0.08341632783412933, -0.07860378921031952, -0.0737912505865097, -0.06897871196269989, -0.06416617333889008, -0.05935363471508026, -0.05454109609127045, -0.04972856119275093, -0.044916022568941116, -0.0401034876704216, -0.035290949046611786, -0.03047841042280197, -0.025665873661637306, -0.020853335037827492, -0.016040796414017677, -0.011228259652853012, -0.006415721029043198, -0.0016031824052333832, 0.003209355752915144, 0.008021893911063671, 0.012834431603550911, 0.017646970227360725, 0.02245950885117054, 0.027272045612335205, 0.03208458423614502, 0.036897122859954834]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 9.0, 7.0, 13.0, 12.0, 29.0, 26.0, 20.0, 19.0, 20.0, 33.0, 30.0, 33.0, 33.0, 34.0, 30.0, 35.0, 48.0, 27.0, 31.0, 37.0, 45.0, 38.0, 32.0, 36.0, 40.0, 27.0, 25.0, 29.0, 30.0, 23.0, 21.0, 14.0, 17.0, 6.0, 10.0, 15.0, 9.0, 8.0, 7.0, 3.0, 4.0, 4.0, 1.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.02550448663532734, -0.02473812736570835, -0.023971768096089363, -0.023205408826470375, -0.022439049556851387, -0.0216726902872324, -0.02090633288025856, -0.020139973610639572, -0.019373614341020584, -0.018607255071401596, -0.017840895801782608, -0.01707453653216362, -0.016308177262544632, -0.015541817992925644, -0.01477545965462923, -0.014009100385010242, -0.01324274018406868, -0.012476380914449692, -0.011710021644830704, -0.010943662375211716, -0.010177303105592728, -0.00941094383597374, -0.008644585497677326, -0.007878226228058338, -0.00711186695843935, -0.006345507688820362, -0.005579148419201374, -0.004812789615243673, -0.004046430345624685, -0.0032800710760056973, -0.0025137122720479965, -0.0017473530024290085, -0.0009809918701648712, -0.000214632716961205, 0.0005517264362424612, 0.0013180854730308056, 0.0020844447426497936, 0.0028508040122687817, 0.0036171628162264824, 0.00438352208584547, 0.0051498813554644585, 0.0059162406250834465, 0.0066825998947024345, 0.007448958698660135, 0.008215317502617836, 0.008981676772236824, 0.009748036041855812, 0.0105143953114748, 0.011280754581093788, 0.012047113850712776, 0.012813473120331764, 0.013579832389950752, 0.01434619165956974, 0.015112550929188728, 0.015878908336162567, 0.016645267605781555, 0.017411626875400543, 0.01817798614501953, 0.01894434541463852, 0.019710704684257507, 0.020477063953876495, 0.021243423223495483, 0.02200978249311447, 0.02277614176273346, 0.023542501032352448]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 14.0, 15.0, 35.0, 23.0, 45.0, 96.0, 106.0, 171.0, 250.0, 341.0, 557.0, 882.0, 1372.0, 2280.0, 3757.0, 6125.0, 10701.0, 18079.0, 32459.0, 58603.0, 104763.0, 178024.0, 224634.0, 172935.0, 101770.0, 56537.0, 30930.0, 17482.0, 10017.0, 5848.0, 3628.0, 2171.0, 1391.0, 882.0, 561.0, 390.0, 228.0, 143.0, 99.0, 59.0, 40.0, 34.0, 24.0, 8.0, 15.0, 9.0, 10.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.048736572265625, -0.04718780517578125, -0.0456390380859375, -0.04409027099609375, -0.04254150390625, -0.04099273681640625, -0.0394439697265625, -0.03789520263671875, -0.036346435546875, -0.03479766845703125, -0.0332489013671875, -0.03170013427734375, -0.0301513671875, -0.02860260009765625, -0.0270538330078125, -0.02550506591796875, -0.023956298828125, -0.02240753173828125, -0.0208587646484375, -0.01930999755859375, -0.01776123046875, -0.01621246337890625, -0.0146636962890625, -0.01311492919921875, -0.011566162109375, -0.01001739501953125, -0.0084686279296875, -0.00691986083984375, -0.00537109375, -0.00382232666015625, -0.0022735595703125, -0.00072479248046875, 0.000823974609375, 0.00237274169921875, 0.0039215087890625, 0.00547027587890625, 0.00701904296875, 0.00856781005859375, 0.0101165771484375, 0.01166534423828125, 0.013214111328125, 0.01476287841796875, 0.0163116455078125, 0.01786041259765625, 0.0194091796875, 0.02095794677734375, 0.0225067138671875, 0.02405548095703125, 0.025604248046875, 0.02715301513671875, 0.0287017822265625, 0.03025054931640625, 0.03179931640625, 0.03334808349609375, 0.0348968505859375, 0.03644561767578125, 0.037994384765625, 0.03954315185546875, 0.0410919189453125, 0.04264068603515625, 0.044189453125, 0.04573822021484375, 0.0472869873046875, 0.04883575439453125, 0.050384521484375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 11.0, 13.0, 14.0, 19.0, 20.0, 26.0, 28.0, 27.0, 49.0, 40.0, 43.0, 57.0, 67.0, 58.0, 51.0, 67.0, 56.0, 55.0, 52.0, 35.0, 39.0, 47.0, 28.0, 17.0, 20.0, 16.0, 8.0, 10.0, 7.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028564453125, -0.027347087860107422, -0.026129722595214844, -0.024912357330322266, -0.023694992065429688, -0.02247762680053711, -0.02126026153564453, -0.020042896270751953, -0.018825531005859375, -0.017608165740966797, -0.01639080047607422, -0.01517343521118164, -0.013956069946289062, -0.012738704681396484, -0.011521339416503906, -0.010303974151611328, -0.00908660888671875, -0.007869243621826172, -0.006651878356933594, -0.005434513092041016, -0.0042171478271484375, -0.0029997825622558594, -0.0017824172973632812, -0.0005650520324707031, 0.000652313232421875, 0.0018696784973144531, 0.0030870437622070312, 0.004304409027099609, 0.0055217742919921875, 0.006739139556884766, 0.007956504821777344, 0.009173870086669922, 0.0103912353515625, 0.011608600616455078, 0.012825965881347656, 0.014043331146240234, 0.015260696411132812, 0.01647806167602539, 0.01769542694091797, 0.018912792205810547, 0.020130157470703125, 0.021347522735595703, 0.02256488800048828, 0.02378225326538086, 0.024999618530273438, 0.026216983795166016, 0.027434349060058594, 0.028651714324951172, 0.02986907958984375, 0.031086444854736328, 0.032303810119628906, 0.033521175384521484, 0.03473854064941406, 0.03595590591430664, 0.03717327117919922, 0.0383906364440918, 0.039608001708984375, 0.04082536697387695, 0.04204273223876953, 0.04326009750366211, 0.04447746276855469, 0.045694828033447266, 0.046912193298339844, 0.04812955856323242, 0.049346923828125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 12.0, 27.0, 27.0, 46.0, 58.0, 64.0, 109.0, 319.0, 5926.0, 1014770.0, 26352.0, 449.0, 142.0, 71.0, 51.0, 38.0, 22.0, 24.0, 10.0, 12.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8818359375, -0.8620681762695312, -0.8423004150390625, -0.8225326538085938, -0.802764892578125, -0.7829971313476562, -0.7632293701171875, -0.7434616088867188, -0.72369384765625, -0.7039260864257812, -0.6841583251953125, -0.6643905639648438, -0.644622802734375, -0.6248550415039062, -0.6050872802734375, -0.5853195190429688, -0.5655517578125, -0.5457839965820312, -0.5260162353515625, -0.5062484741210938, -0.486480712890625, -0.46671295166015625, -0.4469451904296875, -0.42717742919921875, -0.40740966796875, -0.38764190673828125, -0.3678741455078125, -0.34810638427734375, -0.328338623046875, -0.30857086181640625, -0.2888031005859375, -0.26903533935546875, -0.249267578125, -0.22949981689453125, -0.2097320556640625, -0.18996429443359375, -0.170196533203125, -0.15042877197265625, -0.1306610107421875, -0.11089324951171875, -0.09112548828125, -0.07135772705078125, -0.0515899658203125, -0.03182220458984375, -0.012054443359375, 0.00771331787109375, 0.0274810791015625, 0.04724884033203125, 0.0670166015625, 0.08678436279296875, 0.1065521240234375, 0.12631988525390625, 0.146087646484375, 0.16585540771484375, 0.1856231689453125, 0.20539093017578125, 0.22515869140625, 0.24492645263671875, 0.2646942138671875, 0.28446197509765625, 0.304229736328125, 0.32399749755859375, 0.3437652587890625, 0.36353302001953125, 0.38330078125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 5.0, 10.0, 14.0, 24.0, 28.0, 41.0, 41.0, 51.0, 56.0, 73.0, 72.0, 81.0, 92.0, 74.0, 69.0, 76.0, 48.0, 43.0, 33.0, 20.0, 20.0, 8.0, 11.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03375244140625, -0.03218555450439453, -0.030618667602539062, -0.029051780700683594, -0.027484893798828125, -0.025918006896972656, -0.024351119995117188, -0.02278423309326172, -0.02121734619140625, -0.01965045928955078, -0.018083572387695312, -0.016516685485839844, -0.014949798583984375, -0.013382911682128906, -0.011816024780273438, -0.010249137878417969, -0.0086822509765625, -0.007115364074707031, -0.0055484771728515625, -0.003981590270996094, -0.002414703369140625, -0.0008478164672851562, 0.0007190704345703125, 0.0022859573364257812, 0.00385284423828125, 0.005419731140136719, 0.0069866180419921875, 0.008553504943847656, 0.010120391845703125, 0.011687278747558594, 0.013254165649414062, 0.014821052551269531, 0.016387939453125, 0.01795482635498047, 0.019521713256835938, 0.021088600158691406, 0.022655487060546875, 0.024222373962402344, 0.025789260864257812, 0.02735614776611328, 0.02892303466796875, 0.03048992156982422, 0.03205680847167969, 0.033623695373535156, 0.035190582275390625, 0.036757469177246094, 0.03832435607910156, 0.03989124298095703, 0.0414581298828125, 0.04302501678466797, 0.04459190368652344, 0.046158790588378906, 0.047725677490234375, 0.049292564392089844, 0.05085945129394531, 0.05242633819580078, 0.05399322509765625, 0.05556011199951172, 0.05712699890136719, 0.058693885803222656, 0.060260772705078125, 0.061827659606933594, 0.06339454650878906, 0.06496143341064453, 0.0665283203125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 7.0, 6.0, 11.0, 16.0, 35.0, 52.0, 100.0, 218.0, 375.0, 967.0, 2593.0, 9882.0, 81829.0, 884884.0, 55929.0, 7815.0, 2186.0, 864.0, 378.0, 183.0, 88.0, 54.0, 30.0, 21.0, 8.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021820068359375, -0.0021167397499084473, -0.0020514726638793945, -0.001986205577850342, -0.001920938491821289, -0.0018556714057922363, -0.0017904043197631836, -0.0017251372337341309, -0.0016598701477050781, -0.0015946030616760254, -0.0015293359756469727, -0.00146406888961792, -0.0013988018035888672, -0.0013335347175598145, -0.0012682676315307617, -0.001203000545501709, -0.0011377334594726562, -0.0010724663734436035, -0.0010071992874145508, -0.000941932201385498, -0.0008766651153564453, -0.0008113980293273926, -0.0007461309432983398, -0.0006808638572692871, -0.0006155967712402344, -0.0005503296852111816, -0.0004850625991821289, -0.00041979551315307617, -0.00035452842712402344, -0.0002892613410949707, -0.00022399425506591797, -0.00015872716903686523, -9.34600830078125e-05, -2.8192996978759766e-05, 3.707408905029297e-05, 0.0001023411750793457, 0.00016760826110839844, 0.00023287534713745117, 0.0002981424331665039, 0.00036340951919555664, 0.0004286766052246094, 0.0004939436912536621, 0.0005592107772827148, 0.0006244778633117676, 0.0006897449493408203, 0.000755012035369873, 0.0008202791213989258, 0.0008855462074279785, 0.0009508132934570312, 0.001016080379486084, 0.0010813474655151367, 0.0011466145515441895, 0.0012118816375732422, 0.001277148723602295, 0.0013424158096313477, 0.0014076828956604004, 0.0014729499816894531, 0.0015382170677185059, 0.0016034841537475586, 0.0016687512397766113, 0.001734018325805664, 0.0017992854118347168, 0.0018645524978637695, 0.0019298195838928223, 0.001995086669921875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 5.0, 6.0, 11.0, 7.0, 9.0, 22.0, 21.0, 25.0, 46.0, 42.0, 66.0, 77.0, 95.0, 112.0, 76.0, 84.0, 89.0, 42.0, 55.0, 22.0, 21.0, 20.0, 7.0, 7.0, 5.0, 3.0, 6.0, 3.0, 0.0, 6.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.569789886474609e-06, -7.368624210357666e-06, -7.167458534240723e-06, -6.966292858123779e-06, -6.765127182006836e-06, -6.563961505889893e-06, -6.362795829772949e-06, -6.161630153656006e-06, -5.9604644775390625e-06, -5.759298801422119e-06, -5.558133125305176e-06, -5.356967449188232e-06, -5.155801773071289e-06, -4.954636096954346e-06, -4.753470420837402e-06, -4.552304744720459e-06, -4.351139068603516e-06, -4.149973392486572e-06, -3.948807716369629e-06, -3.7476420402526855e-06, -3.546476364135742e-06, -3.345310688018799e-06, -3.1441450119018555e-06, -2.942979335784912e-06, -2.7418136596679688e-06, -2.5406479835510254e-06, -2.339482307434082e-06, -2.1383166313171387e-06, -1.9371509552001953e-06, -1.735985279083252e-06, -1.5348196029663086e-06, -1.3336539268493652e-06, -1.1324882507324219e-06, -9.313225746154785e-07, -7.301568984985352e-07, -5.289912223815918e-07, -3.2782554626464844e-07, -1.2665987014770508e-07, 7.450580596923828e-08, 2.7567148208618164e-07, 4.76837158203125e-07, 6.780028343200684e-07, 8.791685104370117e-07, 1.080334186553955e-06, 1.2814998626708984e-06, 1.4826655387878418e-06, 1.6838312149047852e-06, 1.8849968910217285e-06, 2.086162567138672e-06, 2.2873282432556152e-06, 2.4884939193725586e-06, 2.689659595489502e-06, 2.8908252716064453e-06, 3.0919909477233887e-06, 3.293156623840332e-06, 3.4943222999572754e-06, 3.6954879760742188e-06, 3.896653652191162e-06, 4.0978193283081055e-06, 4.298985004425049e-06, 4.500150680541992e-06, 4.7013163566589355e-06, 4.902482032775879e-06, 5.103647708892822e-06, 5.304813385009766e-06]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 12.0, 18.0, 18.0, 21.0, 31.0, 56.0, 68.0, 99.0, 347.0, 6893.0, 1010356.0, 29419.0, 803.0, 131.0, 60.0, 45.0, 37.0, 33.0, 18.0, 9.0, 10.0, 7.0, 4.0, 6.0, 3.0, 4.0, 6.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.003662109375, -0.003562241792678833, -0.003462374210357666, -0.003362506628036499, -0.003262639045715332, -0.003162771463394165, -0.003062903881072998, -0.002963036298751831, -0.002863168716430664, -0.002763301134109497, -0.00266343355178833, -0.002563565969467163, -0.002463698387145996, -0.002363830804824829, -0.002263963222503662, -0.002164095640182495, -0.002064228057861328, -0.001964360475540161, -0.0018644928932189941, -0.0017646253108978271, -0.0016647577285766602, -0.0015648901462554932, -0.0014650225639343262, -0.0013651549816131592, -0.0012652873992919922, -0.0011654198169708252, -0.0010655522346496582, -0.0009656846523284912, -0.0008658170700073242, -0.0007659494876861572, -0.0006660819053649902, -0.0005662143230438232, -0.00046634674072265625, -0.00036647915840148926, -0.00026661157608032227, -0.00016674399375915527, -6.687641143798828e-05, 3.299117088317871e-05, 0.0001328587532043457, 0.0002327263355255127, 0.0003325939178466797, 0.0004324615001678467, 0.0005323290824890137, 0.0006321966648101807, 0.0007320642471313477, 0.0008319318294525146, 0.0009317994117736816, 0.0010316669940948486, 0.0011315345764160156, 0.0012314021587371826, 0.0013312697410583496, 0.0014311373233795166, 0.0015310049057006836, 0.0016308724880218506, 0.0017307400703430176, 0.0018306076526641846, 0.0019304752349853516, 0.0020303428173065186, 0.0021302103996276855, 0.0022300779819488525, 0.0023299455642700195, 0.0024298131465911865, 0.0025296807289123535, 0.0026295483112335205, 0.0027294158935546875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 1.0, 4.0, 8.0, 2.0, 6.0, 4.0, 5.0, 4.0, 13.0, 10.0, 25.0, 28.0, 31.0, 39.0, 71.0, 73.0, 85.0, 99.0, 102.0, 86.0, 64.0, 62.0, 51.0, 26.0, 20.0, 15.0, 11.0, 12.0, 9.0, 5.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021696090698242188, -0.00020913034677505493, -0.000201299786567688, -0.00019346922636032104, -0.0001856386661529541, -0.00017780810594558716, -0.00016997754573822021, -0.00016214698553085327, -0.00015431642532348633, -0.00014648586511611938, -0.00013865530490875244, -0.0001308247447013855, -0.00012299418449401855, -0.00011516362428665161, -0.00010733306407928467, -9.950250387191772e-05, -9.167194366455078e-05, -8.384138345718384e-05, -7.60108232498169e-05, -6.818026304244995e-05, -6.034970283508301e-05, -5.2519142627716064e-05, -4.468858242034912e-05, -3.685802221298218e-05, -2.9027462005615234e-05, -2.119690179824829e-05, -1.3366341590881348e-05, -5.535781383514404e-06, 2.294778823852539e-06, 1.0125339031219482e-05, 1.7955899238586426e-05, 2.578645944595337e-05, 3.361701965332031e-05, 4.1447579860687256e-05, 4.92781400680542e-05, 5.710870027542114e-05, 6.493926048278809e-05, 7.276982069015503e-05, 8.060038089752197e-05, 8.843094110488892e-05, 9.626150131225586e-05, 0.0001040920615196228, 0.00011192262172698975, 0.00011975318193435669, 0.00012758374214172363, 0.00013541430234909058, 0.00014324486255645752, 0.00015107542276382446, 0.0001589059829711914, 0.00016673654317855835, 0.0001745671033859253, 0.00018239766359329224, 0.00019022822380065918, 0.00019805878400802612, 0.00020588934421539307, 0.00021371990442276, 0.00022155046463012695, 0.0002293810248374939, 0.00023721158504486084, 0.0002450421452522278, 0.0002528727054595947, 0.00026070326566696167, 0.0002685338258743286, 0.00027636438608169556, 0.0002841949462890625]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 203.0, 802.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1936591863632202, -1.1720291376113892, -1.150399088859558, -1.128769040107727, -1.107138991355896, -1.085508942604065, -1.0638788938522339, -1.0422488451004028, -1.0206187963485718, -0.9989887475967407, -0.9773586988449097, -0.9557286500930786, -0.9340986013412476, -0.9124685525894165, -0.8908385038375854, -0.8692083954811096, -0.8475782871246338, -0.8259482383728027, -0.8043181896209717, -0.7826881408691406, -0.7610580921173096, -0.7394280433654785, -0.7177979946136475, -0.6961678862571716, -0.6745378971099854, -0.6529078483581543, -0.6312777996063232, -0.6096477508544922, -0.5880177021026611, -0.5663876533508301, -0.544757604598999, -0.5231274962425232, -0.5014974474906921, -0.4798673987388611, -0.45823734998703003, -0.436607301235199, -0.41497722268104553, -0.3933471739292145, -0.3717171251773834, -0.35008704662323, -0.3284569978713989, -0.30682694911956787, -0.2851969003677368, -0.26356685161590576, -0.24193677306175232, -0.22030672430992126, -0.1986766755580902, -0.17704661190509796, -0.1554165631532669, -0.13378651440143585, -0.1121564507484436, -0.09052640199661255, -0.0688963457942009, -0.047266289591789246, -0.02563624083995819, -0.004006177186965942, 0.017623871564865112, 0.039253927767276764, 0.06088398024439812, 0.08251403272151947, 0.10414408892393112, 0.12577414512634277, 0.14740419387817383, 0.16903425753116608, 0.19066430628299713]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 8.0, 7.0, 9.0, 6.0, 10.0, 12.0, 13.0, 11.0, 13.0, 27.0, 20.0, 29.0, 25.0, 30.0, 48.0, 47.0, 46.0, 44.0, 38.0, 39.0, 43.0, 49.0, 50.0, 51.0, 38.0, 31.0, 40.0, 32.0, 34.0, 23.0, 27.0, 15.0, 16.0, 16.0, 12.0, 9.0, 6.0, 10.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0373009592294693, -0.035971395671367645, -0.03464183211326599, -0.03331226855516434, -0.03198270872235298, -0.030653145164251328, -0.029323581606149673, -0.02799401804804802, -0.026664456352591515, -0.02533489279448986, -0.024005331099033356, -0.0226757675409317, -0.021346203982830048, -0.020016642287373543, -0.01868707872927189, -0.017357517033815384, -0.01602795347571373, -0.01469839084893465, -0.013368828222155571, -0.012039264664053917, -0.010709702037274837, -0.009380139410495758, -0.008050575852394104, -0.006721013225615025, -0.005391450598835945, -0.004061887972056866, -0.002732324879616499, -0.0014027617871761322, -7.319916039705276e-05, 0.0012563634663820267, 0.0025859270244836807, 0.00391548965126276, 0.005245048552751541, 0.006574611179530621, 0.0079041738063097, 0.009233737364411354, 0.010563299991190434, 0.011892862617969513, 0.013222426176071167, 0.014551988802850246, 0.015881551429629326, 0.01721111498773098, 0.018540676683187485, 0.01987024024128914, 0.021199803799390793, 0.022529365494847298, 0.02385892905294895, 0.025188490748405457, 0.02651805430650711, 0.027847617864608765, 0.02917717956006527, 0.030506743118166924, 0.03183630481362343, 0.03316586837172508, 0.034495431929826736, 0.03582499548792839, 0.037154555320739746, 0.0384841188788414, 0.039813682436943054, 0.04114324599504471, 0.042472805827856064, 0.04380236938595772, 0.04513193294405937, 0.046461496502161026, 0.04779106006026268]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 3.0, 7.0, 4.0, 6.0, 12.0, 16.0, 17.0, 23.0, 26.0, 31.0, 36.0, 40.0, 54.0, 74.0, 119.0, 148.0, 215.0, 488.0, 1260.0, 4265.0, 172544.0, 3867362.0, 140850.0, 4130.0, 1245.0, 490.0, 224.0, 140.0, 91.0, 77.0, 60.0, 40.0, 26.0, 36.0, 19.0, 24.0, 15.0, 14.0, 12.0, 8.0, 5.0, 2.0, 8.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07989501953125, -0.07709026336669922, -0.07428550720214844, -0.07148075103759766, -0.06867599487304688, -0.0658712387084961, -0.06306648254394531, -0.06026172637939453, -0.05745697021484375, -0.05465221405029297, -0.05184745788574219, -0.049042701721191406, -0.046237945556640625, -0.043433189392089844, -0.04062843322753906, -0.03782367706298828, -0.0350189208984375, -0.03221416473388672, -0.029409408569335938, -0.026604652404785156, -0.023799896240234375, -0.020995140075683594, -0.018190383911132812, -0.015385627746582031, -0.01258087158203125, -0.009776115417480469, -0.0069713592529296875, -0.004166603088378906, -0.001361846923828125, 0.0014429092407226562, 0.0042476654052734375, 0.007052421569824219, 0.009857177734375, 0.012661933898925781, 0.015466690063476562, 0.018271446228027344, 0.021076202392578125, 0.023880958557128906, 0.026685714721679688, 0.02949047088623047, 0.03229522705078125, 0.03509998321533203, 0.03790473937988281, 0.040709495544433594, 0.043514251708984375, 0.046319007873535156, 0.04912376403808594, 0.05192852020263672, 0.0547332763671875, 0.05753803253173828, 0.06034278869628906, 0.06314754486083984, 0.06595230102539062, 0.0687570571899414, 0.07156181335449219, 0.07436656951904297, 0.07717132568359375, 0.07997608184814453, 0.08278083801269531, 0.0855855941772461, 0.08839035034179688, 0.09119510650634766, 0.09399986267089844, 0.09680461883544922, 0.099609375]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 7.0, 11.0, 6.0, 9.0, 15.0, 15.0, 18.0, 21.0, 21.0, 27.0, 28.0, 29.0, 39.0, 35.0, 51.0, 35.0, 43.0, 38.0, 38.0, 36.0, 43.0, 45.0, 43.0, 45.0, 36.0, 35.0, 23.0, 18.0, 29.0, 26.0, 25.0, 16.0, 15.0, 11.0, 10.0, 6.0, 9.0, 5.0, 8.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 6.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.02581787109375, -0.025032997131347656, -0.024248123168945312, -0.02346324920654297, -0.022678375244140625, -0.02189350128173828, -0.021108627319335938, -0.020323753356933594, -0.01953887939453125, -0.018754005432128906, -0.017969131469726562, -0.01718425750732422, -0.016399383544921875, -0.015614509582519531, -0.014829635620117188, -0.014044761657714844, -0.0132598876953125, -0.012475013732910156, -0.011690139770507812, -0.010905265808105469, -0.010120391845703125, -0.009335517883300781, -0.008550643920898438, -0.007765769958496094, -0.00698089599609375, -0.006196022033691406, -0.0054111480712890625, -0.004626274108886719, -0.003841400146484375, -0.0030565261840820312, -0.0022716522216796875, -0.0014867782592773438, -0.000701904296875, 8.296966552734375e-05, 0.0008678436279296875, 0.0016527175903320312, 0.002437591552734375, 0.0032224655151367188, 0.0040073394775390625, 0.004792213439941406, 0.00557708740234375, 0.006361961364746094, 0.0071468353271484375, 0.007931709289550781, 0.008716583251953125, 0.009501457214355469, 0.010286331176757812, 0.011071205139160156, 0.0118560791015625, 0.012640953063964844, 0.013425827026367188, 0.014210700988769531, 0.014995574951171875, 0.01578044891357422, 0.016565322875976562, 0.017350196838378906, 0.01813507080078125, 0.018919944763183594, 0.019704818725585938, 0.02048969268798828, 0.021274566650390625, 0.02205944061279297, 0.022844314575195312, 0.023629188537597656, 0.0244140625]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 10.0, 22.0, 69.0, 825.0, 4186040.0, 6996.0, 204.0, 47.0, 23.0, 16.0, 7.0, 10.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90185546875, -0.8725204467773438, -0.8431854248046875, -0.8138504028320312, -0.784515380859375, -0.7551803588867188, -0.7258453369140625, -0.6965103149414062, -0.66717529296875, -0.6378402709960938, -0.6085052490234375, -0.5791702270507812, -0.549835205078125, -0.5205001831054688, -0.4911651611328125, -0.46183013916015625, -0.4324951171875, -0.40316009521484375, -0.3738250732421875, -0.34449005126953125, -0.315155029296875, -0.28582000732421875, -0.2564849853515625, -0.22714996337890625, -0.19781494140625, -0.16847991943359375, -0.1391448974609375, -0.10980987548828125, -0.080474853515625, -0.05113983154296875, -0.0218048095703125, 0.00753021240234375, 0.036865234375, 0.06620025634765625, 0.0955352783203125, 0.12487030029296875, 0.154205322265625, 0.18354034423828125, 0.2128753662109375, 0.24221038818359375, 0.27154541015625, 0.30088043212890625, 0.3302154541015625, 0.35955047607421875, 0.388885498046875, 0.41822052001953125, 0.4475555419921875, 0.47689056396484375, 0.5062255859375, 0.5355606079101562, 0.5648956298828125, 0.5942306518554688, 0.623565673828125, 0.6529006958007812, 0.6822357177734375, 0.7115707397460938, 0.74090576171875, 0.7702407836914062, 0.7995758056640625, 0.8289108276367188, 0.858245849609375, 0.8875808715820312, 0.9169158935546875, 0.9462509155273438, 0.9755859375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 10.0, 10.0, 14.0, 30.0, 42.0, 129.0, 784.0, 2217.0, 715.0, 83.0, 22.0, 7.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038360595703125, -0.03721427917480469, -0.036067962646484375, -0.03492164611816406, -0.03377532958984375, -0.03262901306152344, -0.031482696533203125, -0.030336380004882812, -0.0291900634765625, -0.028043746948242188, -0.026897430419921875, -0.025751113891601562, -0.02460479736328125, -0.023458480834960938, -0.022312164306640625, -0.021165847778320312, -0.02001953125, -0.018873214721679688, -0.017726898193359375, -0.016580581665039062, -0.01543426513671875, -0.014287948608398438, -0.013141632080078125, -0.011995315551757812, -0.0108489990234375, -0.009702682495117188, -0.008556365966796875, -0.0074100494384765625, -0.00626373291015625, -0.0051174163818359375, -0.003971099853515625, -0.0028247833251953125, -0.001678466796875, -0.0005321502685546875, 0.000614166259765625, 0.0017604827880859375, 0.00290679931640625, 0.0040531158447265625, 0.005199432373046875, 0.0063457489013671875, 0.0074920654296875, 0.008638381958007812, 0.009784698486328125, 0.010931015014648438, 0.01207733154296875, 0.013223648071289062, 0.014369964599609375, 0.015516281127929688, 0.01666259765625, 0.017808914184570312, 0.018955230712890625, 0.020101547241210938, 0.02124786376953125, 0.022394180297851562, 0.023540496826171875, 0.024686813354492188, 0.0258331298828125, 0.026979446411132812, 0.028125762939453125, 0.029272079467773438, 0.03041839599609375, 0.03156471252441406, 0.032711029052734375, 0.03385734558105469, 0.035003662109375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 14.0, 27.0, 75.0, 208.0, 353.0, 227.0, 73.0, 27.0, 10.0, 1.0, 4.0], "bins": [-0.2061588317155838, -0.2025785595178604, -0.19899830222129822, -0.19541803002357483, -0.19183775782585144, -0.18825748562812805, -0.18467721343040466, -0.18109695613384247, -0.17751668393611908, -0.1739364117383957, -0.1703561544418335, -0.1667758822441101, -0.16319561004638672, -0.15961533784866333, -0.15603506565093994, -0.15245480835437775, -0.14887453615665436, -0.14529426395893097, -0.14171400666236877, -0.13813373446464539, -0.134553462266922, -0.1309731900691986, -0.12739291787147522, -0.12381266057491302, -0.12023238837718964, -0.11665211617946625, -0.11307185143232346, -0.10949158668518066, -0.10591131448745728, -0.10233104228973389, -0.0987507775425911, -0.0951705127954483, -0.09159024804830551, -0.08800998330116272, -0.08442971110343933, -0.08084943890571594, -0.07726917415857315, -0.07368890941143036, -0.07010863721370697, -0.06652836501598358, -0.06294810026884079, -0.0593678317964077, -0.05578756332397461, -0.05220729485154152, -0.04862702637910843, -0.04504675790667534, -0.04146648943424225, -0.03788622096180916, -0.03430595248937607, -0.030725684016942978, -0.027145415544509888, -0.023565147072076797, -0.019984878599643707, -0.016404610127210617, -0.012824341654777527, -0.009244073182344437, -0.005663802847266197, -0.002083534374833107, 0.0014967340975999832, 0.005077002570033073, 0.008657271042466164, 0.012237539514899254, 0.015817807987332344, 0.019398076459765434, 0.022978344932198524]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 2.0, 3.0, 5.0, 4.0, 8.0, 4.0, 14.0, 20.0, 12.0, 21.0, 30.0, 27.0, 28.0, 22.0, 28.0, 35.0, 40.0, 30.0, 44.0, 55.0, 46.0, 39.0, 39.0, 48.0, 45.0, 44.0, 38.0, 32.0, 26.0, 33.0, 25.0, 23.0, 21.0, 17.0, 19.0, 15.0, 13.0, 7.0, 6.0, 6.0, 8.0, 3.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.026735950261354446, -0.025954922661185265, -0.025173895061016083, -0.0243928674608469, -0.02361183986067772, -0.022830812260508537, -0.022049784660339355, -0.021268757060170174, -0.020487729460000992, -0.01970670185983181, -0.018925674259662628, -0.018144646659493446, -0.017363619059324265, -0.016582591459155083, -0.0158015638589859, -0.015020536258816719, -0.014239508658647537, -0.013458481058478355, -0.012677453458309174, -0.011896425858139992, -0.01111539825797081, -0.010334370657801628, -0.009553343057632446, -0.008772315457463264, -0.007991287857294083, -0.007210260257124901, -0.006429232656955719, -0.005648205056786537, -0.004867177456617355, -0.0040861498564481735, -0.0033051222562789917, -0.00252409465610981, -0.0017430689185857773, -0.0009620413184165955, -0.00018101371824741364, 0.0006000138819217682, 0.00138104148209095, 0.002162069082260132, 0.0029430966824293137, 0.0037241242825984955, 0.004505151882767677, 0.005286179482936859, 0.006067207083106041, 0.006848234683275223, 0.007629262283444405, 0.008410289883613586, 0.009191317483782768, 0.00997234508395195, 0.010753372684121132, 0.011534400284290314, 0.012315427884459496, 0.013096455484628677, 0.01387748308479786, 0.014658510684967041, 0.015439538285136223, 0.016220565885305405, 0.017001593485474586, 0.01778262108564377, 0.01856364868581295, 0.019344676285982132, 0.020125703886151314, 0.020906731486320496, 0.021687759086489677, 0.02246878668665886, 0.02324981428682804]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 6.0, 11.0, 17.0, 27.0, 28.0, 61.0, 57.0, 107.0, 135.0, 217.0, 301.0, 454.0, 656.0, 928.0, 1428.0, 2037.0, 3070.0, 4595.0, 7252.0, 11419.0, 18565.0, 31596.0, 54811.0, 103915.0, 212672.0, 277427.0, 141271.0, 72262.0, 40052.0, 23335.0, 13982.0, 8855.0, 5646.0, 3665.0, 2523.0, 1586.0, 1158.0, 720.0, 507.0, 341.0, 270.0, 195.0, 104.0, 102.0, 45.0, 44.0, 32.0, 27.0, 12.0, 12.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0], "bins": [-0.01161956787109375, -0.011258959770202637, -0.010898351669311523, -0.01053774356842041, -0.010177135467529297, -0.009816527366638184, -0.00945591926574707, -0.009095311164855957, -0.008734703063964844, -0.00837409496307373, -0.008013486862182617, -0.007652878761291504, -0.007292270660400391, -0.006931662559509277, -0.006571054458618164, -0.006210446357727051, -0.0058498382568359375, -0.005489230155944824, -0.005128622055053711, -0.004768013954162598, -0.004407405853271484, -0.004046797752380371, -0.003686189651489258, -0.0033255815505981445, -0.0029649734497070312, -0.002604365348815918, -0.0022437572479248047, -0.0018831491470336914, -0.0015225410461425781, -0.0011619329452514648, -0.0008013248443603516, -0.0004407167434692383, -8.0108642578125e-05, 0.0002804994583129883, 0.0006411075592041016, 0.0010017156600952148, 0.0013623237609863281, 0.0017229318618774414, 0.0020835399627685547, 0.002444148063659668, 0.0028047561645507812, 0.0031653642654418945, 0.003525972366333008, 0.003886580467224121, 0.004247188568115234, 0.004607796669006348, 0.004968404769897461, 0.005329012870788574, 0.0056896209716796875, 0.006050229072570801, 0.006410837173461914, 0.006771445274353027, 0.007132053375244141, 0.007492661476135254, 0.007853269577026367, 0.00821387767791748, 0.008574485778808594, 0.008935093879699707, 0.00929570198059082, 0.009656310081481934, 0.010016918182373047, 0.01037752628326416, 0.010738134384155273, 0.011098742485046387, 0.0114593505859375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 8.0, 5.0, 10.0, 8.0, 13.0, 17.0, 24.0, 14.0, 25.0, 24.0, 29.0, 30.0, 28.0, 30.0, 35.0, 38.0, 42.0, 37.0, 54.0, 48.0, 50.0, 35.0, 42.0, 32.0, 50.0, 29.0, 30.0, 32.0, 23.0, 19.0, 23.0, 18.0, 17.0, 9.0, 9.0, 12.0, 9.0, 9.0, 4.0, 4.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0], "bins": [-0.02276611328125, -0.022116661071777344, -0.021467208862304688, -0.02081775665283203, -0.020168304443359375, -0.01951885223388672, -0.018869400024414062, -0.018219947814941406, -0.01757049560546875, -0.016921043395996094, -0.016271591186523438, -0.015622138977050781, -0.014972686767578125, -0.014323234558105469, -0.013673782348632812, -0.013024330139160156, -0.0123748779296875, -0.011725425720214844, -0.011075973510742188, -0.010426521301269531, -0.009777069091796875, -0.009127616882324219, -0.008478164672851562, -0.007828712463378906, -0.00717926025390625, -0.006529808044433594, -0.0058803558349609375, -0.005230903625488281, -0.004581451416015625, -0.003931999206542969, -0.0032825469970703125, -0.0026330947875976562, -0.001983642578125, -0.0013341903686523438, -0.0006847381591796875, -3.528594970703125e-05, 0.000614166259765625, 0.0012636184692382812, 0.0019130706787109375, 0.0025625228881835938, 0.00321197509765625, 0.0038614273071289062, 0.0045108795166015625, 0.005160331726074219, 0.005809783935546875, 0.006459236145019531, 0.0071086883544921875, 0.007758140563964844, 0.0084075927734375, 0.009057044982910156, 0.009706497192382812, 0.010355949401855469, 0.011005401611328125, 0.011654853820800781, 0.012304306030273438, 0.012953758239746094, 0.01360321044921875, 0.014252662658691406, 0.014902114868164062, 0.015551567077636719, 0.016201019287109375, 0.01685047149658203, 0.017499923706054688, 0.018149375915527344, 0.018798828125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 4.0, 8.0, 12.0, 9.0, 8.0, 17.0, 36.0, 46.0, 49.0, 76.0, 116.0, 140.0, 230.0, 311.0, 448.0, 547.0, 894.0, 1311.0, 1854.0, 2948.0, 4441.0, 6902.0, 10709.0, 17017.0, 28411.0, 48918.0, 93128.0, 207388.0, 318522.0, 137198.0, 67760.0, 37916.0, 22065.0, 13636.0, 8778.0, 5551.0, 3603.0, 2337.0, 1611.0, 1114.0, 720.0, 491.0, 395.0, 267.0, 179.0, 108.0, 99.0, 65.0, 62.0, 28.0, 21.0, 22.0, 10.0, 4.0, 10.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0100555419921875, -0.009733915328979492, -0.009412288665771484, -0.009090662002563477, -0.008769035339355469, -0.008447408676147461, -0.008125782012939453, -0.007804155349731445, -0.0074825286865234375, -0.00716090202331543, -0.006839275360107422, -0.006517648696899414, -0.006196022033691406, -0.0058743953704833984, -0.005552768707275391, -0.005231142044067383, -0.004909515380859375, -0.004587888717651367, -0.004266262054443359, -0.0039446353912353516, -0.0036230087280273438, -0.003301382064819336, -0.002979755401611328, -0.0026581287384033203, -0.0023365020751953125, -0.0020148754119873047, -0.0016932487487792969, -0.001371622085571289, -0.0010499954223632812, -0.0007283687591552734, -0.0004067420959472656, -8.511543273925781e-05, 0.00023651123046875, 0.0005581378936767578, 0.0008797645568847656, 0.0012013912200927734, 0.0015230178833007812, 0.001844644546508789, 0.002166271209716797, 0.0024878978729248047, 0.0028095245361328125, 0.0031311511993408203, 0.003452777862548828, 0.003774404525756836, 0.004096031188964844, 0.0044176578521728516, 0.004739284515380859, 0.005060911178588867, 0.005382537841796875, 0.005704164505004883, 0.006025791168212891, 0.0063474178314208984, 0.006669044494628906, 0.006990671157836914, 0.007312297821044922, 0.00763392448425293, 0.007955551147460938, 0.008277177810668945, 0.008598804473876953, 0.008920431137084961, 0.009242057800292969, 0.009563684463500977, 0.009885311126708984, 0.010206937789916992, 0.010528564453125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 9.0, 2.0, 8.0, 5.0, 12.0, 11.0, 15.0, 14.0, 17.0, 20.0, 24.0, 36.0, 29.0, 34.0, 31.0, 45.0, 36.0, 35.0, 45.0, 46.0, 43.0, 47.0, 54.0, 28.0, 32.0, 34.0, 38.0, 39.0, 29.0, 35.0, 21.0, 21.0, 18.0, 20.0, 12.0, 11.0, 14.0, 5.0, 2.0, 13.0, 7.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0142364501953125, -0.013787627220153809, -0.013338804244995117, -0.012889981269836426, -0.012441158294677734, -0.011992335319519043, -0.011543512344360352, -0.01109468936920166, -0.010645866394042969, -0.010197043418884277, -0.009748220443725586, -0.009299397468566895, -0.008850574493408203, -0.008401751518249512, -0.00795292854309082, -0.007504105567932129, -0.0070552825927734375, -0.006606459617614746, -0.006157636642456055, -0.005708813667297363, -0.005259990692138672, -0.0048111677169799805, -0.004362344741821289, -0.003913521766662598, -0.0034646987915039062, -0.003015875816345215, -0.0025670528411865234, -0.002118229866027832, -0.0016694068908691406, -0.0012205839157104492, -0.0007717609405517578, -0.0003229379653930664, 0.000125885009765625, 0.0005747079849243164, 0.0010235309600830078, 0.0014723539352416992, 0.0019211769104003906, 0.002369999885559082, 0.0028188228607177734, 0.003267645835876465, 0.0037164688110351562, 0.004165291786193848, 0.004614114761352539, 0.0050629377365112305, 0.005511760711669922, 0.005960583686828613, 0.006409406661987305, 0.006858229637145996, 0.0073070526123046875, 0.007755875587463379, 0.00820469856262207, 0.008653521537780762, 0.009102344512939453, 0.009551167488098145, 0.009999990463256836, 0.010448813438415527, 0.010897636413574219, 0.01134645938873291, 0.011795282363891602, 0.012244105339050293, 0.012692928314208984, 0.013141751289367676, 0.013590574264526367, 0.014039397239685059, 0.01448822021484375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 6.0, 6.0, 17.0, 14.0, 19.0, 40.0, 55.0, 88.0, 103.0, 149.0, 241.0, 341.0, 513.0, 785.0, 1266.0, 2100.0, 3441.0, 5995.0, 10990.0, 21026.0, 43864.0, 121349.0, 584515.0, 150476.0, 49848.0, 22963.0, 11816.0, 6565.0, 3822.0, 2247.0, 1345.0, 851.0, 583.0, 363.0, 242.0, 154.0, 110.0, 61.0, 57.0, 33.0, 23.0, 15.0, 15.0, 12.0, 8.0, 5.0, 4.0, 3.0, 4.0, 0.0, 3.0, 1.0, 3.0], "bins": [-0.0014848709106445312, -0.0014406442642211914, -0.0013964176177978516, -0.0013521909713745117, -0.0013079643249511719, -0.001263737678527832, -0.0012195110321044922, -0.0011752843856811523, -0.0011310577392578125, -0.0010868310928344727, -0.0010426044464111328, -0.000998377799987793, -0.0009541511535644531, -0.0009099245071411133, -0.0008656978607177734, -0.0008214712142944336, -0.0007772445678710938, -0.0007330179214477539, -0.0006887912750244141, -0.0006445646286010742, -0.0006003379821777344, -0.0005561113357543945, -0.0005118846893310547, -0.00046765804290771484, -0.000423431396484375, -0.00037920475006103516, -0.0003349781036376953, -0.00029075145721435547, -0.0002465248107910156, -0.00020229816436767578, -0.00015807151794433594, -0.0001138448715209961, -6.961822509765625e-05, -2.5391578674316406e-05, 1.8835067749023438e-05, 6.306171417236328e-05, 0.00010728836059570312, 0.00015151500701904297, 0.0001957416534423828, 0.00023996829986572266, 0.0002841949462890625, 0.00032842159271240234, 0.0003726482391357422, 0.00041687488555908203, 0.0004611015319824219, 0.0005053281784057617, 0.0005495548248291016, 0.0005937814712524414, 0.0006380081176757812, 0.0006822347640991211, 0.0007264614105224609, 0.0007706880569458008, 0.0008149147033691406, 0.0008591413497924805, 0.0009033679962158203, 0.0009475946426391602, 0.0009918212890625, 0.0010360479354858398, 0.0010802745819091797, 0.0011245012283325195, 0.0011687278747558594, 0.0012129545211791992, 0.001257181167602539, 0.001301407814025879, 0.0013456344604492188]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 4.0, 3.0, 6.0, 5.0, 6.0, 5.0, 7.0, 12.0, 16.0, 15.0, 22.0, 28.0, 33.0, 53.0, 69.0, 103.0, 117.0, 129.0, 104.0, 71.0, 31.0, 40.0, 22.0, 21.0, 16.0, 11.0, 11.0, 9.0, 4.0, 7.0, 8.0, 3.0, 2.0, 1.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.682209014892578e-05, -2.598203718662262e-05, -2.5141984224319458e-05, -2.4301931262016296e-05, -2.3461878299713135e-05, -2.2621825337409973e-05, -2.178177237510681e-05, -2.094171941280365e-05, -2.0101666450500488e-05, -1.9261613488197327e-05, -1.8421560525894165e-05, -1.7581507563591003e-05, -1.6741454601287842e-05, -1.590140163898468e-05, -1.5061348676681519e-05, -1.4221295714378357e-05, -1.3381242752075195e-05, -1.2541189789772034e-05, -1.1701136827468872e-05, -1.086108386516571e-05, -1.0021030902862549e-05, -9.180977940559387e-06, -8.340924978256226e-06, -7.500872015953064e-06, -6.660819053649902e-06, -5.820766091346741e-06, -4.980713129043579e-06, -4.1406601667404175e-06, -3.300607204437256e-06, -2.4605542421340942e-06, -1.6205012798309326e-06, -7.80448317527771e-07, 5.960464477539063e-08, 8.996576070785522e-07, 1.7397105693817139e-06, 2.5797635316848755e-06, 3.419816493988037e-06, 4.259869456291199e-06, 5.09992241859436e-06, 5.939975380897522e-06, 6.780028343200684e-06, 7.620081305503845e-06, 8.460134267807007e-06, 9.300187230110168e-06, 1.014024019241333e-05, 1.0980293154716492e-05, 1.1820346117019653e-05, 1.2660399079322815e-05, 1.3500452041625977e-05, 1.4340505003929138e-05, 1.51805579662323e-05, 1.602061092853546e-05, 1.6860663890838623e-05, 1.7700716853141785e-05, 1.8540769815444946e-05, 1.9380822777748108e-05, 2.022087574005127e-05, 2.106092870235443e-05, 2.1900981664657593e-05, 2.2741034626960754e-05, 2.3581087589263916e-05, 2.4421140551567078e-05, 2.526119351387024e-05, 2.61012464761734e-05, 2.6941299438476562e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 5.0, 8.0, 12.0, 24.0, 32.0, 57.0, 108.0, 359.0, 1970.0, 34503.0, 973104.0, 35646.0, 2030.0, 394.0, 132.0, 51.0, 41.0, 23.0, 13.0, 12.0, 6.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00638580322265625, -0.006169378757476807, -0.005952954292297363, -0.00573652982711792, -0.0055201053619384766, -0.005303680896759033, -0.00508725643157959, -0.0048708319664001465, -0.004654407501220703, -0.00443798303604126, -0.004221558570861816, -0.004005134105682373, -0.0037887096405029297, -0.0035722851753234863, -0.003355860710144043, -0.0031394362449645996, -0.0029230117797851562, -0.002706587314605713, -0.0024901628494262695, -0.002273738384246826, -0.002057313919067383, -0.0018408894538879395, -0.001624464988708496, -0.0014080405235290527, -0.0011916160583496094, -0.000975191593170166, -0.0007587671279907227, -0.0005423426628112793, -0.00032591819763183594, -0.00010949373245239258, 0.00010693073272705078, 0.00032335519790649414, 0.0005397796630859375, 0.0007562041282653809, 0.0009726285934448242, 0.0011890530586242676, 0.001405477523803711, 0.0016219019889831543, 0.0018383264541625977, 0.002054750919342041, 0.0022711753845214844, 0.0024875998497009277, 0.002704024314880371, 0.0029204487800598145, 0.003136873245239258, 0.003353297710418701, 0.0035697221755981445, 0.003786146640777588, 0.004002571105957031, 0.004218995571136475, 0.004435420036315918, 0.004651844501495361, 0.004868268966674805, 0.005084693431854248, 0.005301117897033691, 0.005517542362213135, 0.005733966827392578, 0.0059503912925720215, 0.006166815757751465, 0.006383240222930908, 0.0065996646881103516, 0.006816089153289795, 0.007032513618469238, 0.007248938083648682, 0.007465362548828125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 9.0, 9.0, 6.0, 18.0, 14.0, 17.0, 35.0, 46.0, 65.0, 92.0, 116.0, 164.0, 127.0, 81.0, 60.0, 24.0, 26.0, 22.0, 16.0, 8.0, 13.0, 7.0, 5.0, 6.0, 2.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00046825408935546875, -0.0004546418786048889, -0.0004410296678543091, -0.00042741745710372925, -0.0004138052463531494, -0.0004001930356025696, -0.00038658082485198975, -0.0003729686141014099, -0.0003593564033508301, -0.00034574419260025024, -0.0003321319818496704, -0.0003185197710990906, -0.00030490756034851074, -0.0002912953495979309, -0.0002776831388473511, -0.00026407092809677124, -0.0002504587173461914, -0.00023684650659561157, -0.00022323429584503174, -0.0002096220850944519, -0.00019600987434387207, -0.00018239766359329224, -0.0001687854528427124, -0.00015517324209213257, -0.00014156103134155273, -0.0001279488205909729, -0.00011433660984039307, -0.00010072439908981323, -8.71121883392334e-05, -7.349997758865356e-05, -5.988776683807373e-05, -4.6275556087493896e-05, -3.266334533691406e-05, -1.905113458633423e-05, -5.4389238357543945e-06, 8.17328691482544e-06, 2.1785497665405273e-05, 3.539770841598511e-05, 4.900991916656494e-05, 6.262212991714478e-05, 7.623434066772461e-05, 8.984655141830444e-05, 0.00010345876216888428, 0.00011707097291946411, 0.00013068318367004395, 0.00014429539442062378, 0.0001579076051712036, 0.00017151981592178345, 0.00018513202667236328, 0.00019874423742294312, 0.00021235644817352295, 0.00022596865892410278, 0.00023958086967468262, 0.00025319308042526245, 0.0002668052911758423, 0.0002804175019264221, 0.00029402971267700195, 0.0003076419234275818, 0.0003212541341781616, 0.00033486634492874146, 0.0003484785556793213, 0.0003620907664299011, 0.00037570297718048096, 0.0003893151879310608, 0.0004029273986816406]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [5.0, 6.0, 3.0, 3.0, 8.0, 7.0, 9.0, 17.0, 19.0, 33.0, 33.0, 46.0, 62.0, 83.0, 108.0, 115.0, 104.0, 97.0, 65.0, 61.0, 40.0, 29.0, 25.0, 9.0, 9.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018370749428868294, -0.017210042104125023, -0.016049334779381752, -0.014888627454638481, -0.01372792012989521, -0.01256721280515194, -0.011406506411731243, -0.010245799086987972, -0.009085091762244701, -0.00792438443750143, -0.00676367711275816, -0.005602970253676176, -0.004442262928932905, -0.0032815556041896343, -0.0021208487451076508, -0.0009601414203643799, 0.000200565904378891, 0.00136127311270684, 0.002521980321034789, 0.0036826874129474163, 0.004843394737690687, 0.006004102062433958, 0.007164808921515942, 0.008325516246259212, 0.009486223571002483, 0.010646930895745754, 0.011807638220489025, 0.012968344613909721, 0.014129051938652992, 0.015289759263396263, 0.016450466588139534, 0.017611173912882805, 0.018771879374980927, 0.019932586699724197, 0.021093294024467468, 0.02225400134921074, 0.02341470867395401, 0.02457541599869728, 0.025736123323440552, 0.026896830648183823, 0.028057537972927094, 0.029218245297670364, 0.030378952622413635, 0.031539659947156906, 0.03270036727190018, 0.03386107459664345, 0.03502178192138672, 0.03618248924612999, 0.03734319657087326, 0.03850390389561653, 0.0396646112203598, 0.04082531854510307, 0.041986025869846344, 0.043146733194589615, 0.044307440519332886, 0.04546814784407616, 0.04662885144352913, 0.0477895587682724, 0.04895026609301567, 0.05011097341775894, 0.05127168074250221, 0.05243238806724548, 0.053593095391988754, 0.054753802716732025, 0.055914510041475296]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 5.0, 13.0, 11.0, 15.0, 15.0, 21.0, 22.0, 21.0, 28.0, 27.0, 37.0, 34.0, 28.0, 39.0, 37.0, 39.0, 51.0, 37.0, 38.0, 35.0, 43.0, 46.0, 41.0, 41.0, 37.0, 30.0, 29.0, 20.0, 18.0, 19.0, 30.0, 10.0, 9.0, 9.0, 10.0, 11.0, 4.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.02115490660071373, -0.02054668590426445, -0.01993846707046032, -0.01933024823665619, -0.01872202754020691, -0.01811380684375763, -0.0175055880099535, -0.01689736917614937, -0.01628914847970009, -0.01568092778325081, -0.015072708949446678, -0.014464489184319973, -0.013856269419193268, -0.013248049654066563, -0.012639829888939857, -0.012031610123813152, -0.011423390358686447, -0.010815170593559742, -0.010206950828433037, -0.009598731063306332, -0.008990511298179626, -0.008382291533052921, -0.007774071767926216, -0.007165852002799511, -0.006557632237672806, -0.005949412472546101, -0.0053411927074193954, -0.00473297294229269, -0.004124753177165985, -0.00351653341203928, -0.0029083136469125748, -0.0023000938817858696, -0.0016918741166591644, -0.0010836543515324593, -0.0004754345864057541, 0.00013278517872095108, 0.0007410049438476562, 0.0013492247089743614, 0.0019574444741010666, 0.0025656642392277718, 0.003173884004354477, 0.003782103769481182, 0.004390323534607887, 0.0049985432997345924, 0.005606763064861298, 0.006214982829988003, 0.006823202595114708, 0.007431422360241413, 0.008039642125368118, 0.008647861890494823, 0.009256081655621529, 0.009864301420748234, 0.010472521185874939, 0.011080740951001644, 0.01168896071612835, 0.012297180481255054, 0.01290540024638176, 0.013513620011508465, 0.01412183977663517, 0.014730059541761875, 0.01533827930688858, 0.01594650000333786, 0.01655471883714199, 0.01716293767094612, 0.0177711583673954]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 6.0, 8.0, 19.0, 21.0, 28.0, 41.0, 63.0, 109.0, 155.0, 227.0, 340.0, 599.0, 904.0, 1457.0, 2448.0, 3947.0, 6891.0, 11950.0, 21622.0, 39486.0, 73278.0, 130028.0, 199727.0, 212909.0, 149818.0, 85999.0, 47200.0, 25382.0, 14142.0, 8056.0, 4523.0, 2745.0, 1614.0, 1023.0, 644.0, 406.0, 264.0, 163.0, 113.0, 73.0, 46.0, 26.0, 21.0, 12.0, 9.0, 8.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038360595703125, -0.03704404830932617, -0.035727500915527344, -0.034410953521728516, -0.03309440612792969, -0.03177785873413086, -0.03046131134033203, -0.029144763946533203, -0.027828216552734375, -0.026511669158935547, -0.02519512176513672, -0.02387857437133789, -0.022562026977539062, -0.021245479583740234, -0.019928932189941406, -0.018612384796142578, -0.01729583740234375, -0.015979290008544922, -0.014662742614746094, -0.013346195220947266, -0.012029647827148438, -0.01071310043334961, -0.009396553039550781, -0.008080005645751953, -0.006763458251953125, -0.005446910858154297, -0.004130363464355469, -0.0028138160705566406, -0.0014972686767578125, -0.00018072128295898438, 0.0011358261108398438, 0.002452373504638672, 0.0037689208984375, 0.005085468292236328, 0.006402015686035156, 0.007718563079833984, 0.009035110473632812, 0.01035165786743164, 0.011668205261230469, 0.012984752655029297, 0.014301300048828125, 0.015617847442626953, 0.01693439483642578, 0.01825094223022461, 0.019567489624023438, 0.020884037017822266, 0.022200584411621094, 0.023517131805419922, 0.02483367919921875, 0.026150226593017578, 0.027466773986816406, 0.028783321380615234, 0.030099868774414062, 0.03141641616821289, 0.03273296356201172, 0.03404951095581055, 0.035366058349609375, 0.0366826057434082, 0.03799915313720703, 0.03931570053100586, 0.04063224792480469, 0.041948795318603516, 0.043265342712402344, 0.04458189010620117, 0.0458984375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 0.0, 2.0, 6.0, 5.0, 9.0, 11.0, 12.0, 14.0, 18.0, 14.0, 21.0, 24.0, 30.0, 23.0, 33.0, 32.0, 42.0, 35.0, 37.0, 45.0, 41.0, 42.0, 41.0, 32.0, 40.0, 40.0, 53.0, 37.0, 30.0, 32.0, 21.0, 30.0, 15.0, 16.0, 20.0, 16.0, 16.0, 13.0, 12.0, 9.0, 6.0, 4.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.020416259765625, -0.01985955238342285, -0.019302845001220703, -0.018746137619018555, -0.018189430236816406, -0.017632722854614258, -0.01707601547241211, -0.01651930809020996, -0.015962600708007812, -0.015405893325805664, -0.014849185943603516, -0.014292478561401367, -0.013735771179199219, -0.01317906379699707, -0.012622356414794922, -0.012065649032592773, -0.011508941650390625, -0.010952234268188477, -0.010395526885986328, -0.00983881950378418, -0.009282112121582031, -0.008725404739379883, -0.008168697357177734, -0.007611989974975586, -0.0070552825927734375, -0.006498575210571289, -0.005941867828369141, -0.005385160446166992, -0.004828453063964844, -0.004271745681762695, -0.003715038299560547, -0.0031583309173583984, -0.00260162353515625, -0.0020449161529541016, -0.0014882087707519531, -0.0009315013885498047, -0.00037479400634765625, 0.0001819133758544922, 0.0007386207580566406, 0.001295328140258789, 0.0018520355224609375, 0.002408742904663086, 0.0029654502868652344, 0.003522157669067383, 0.004078865051269531, 0.00463557243347168, 0.005192279815673828, 0.0057489871978759766, 0.006305694580078125, 0.0068624019622802734, 0.007419109344482422, 0.00797581672668457, 0.008532524108886719, 0.009089231491088867, 0.009645938873291016, 0.010202646255493164, 0.010759353637695312, 0.011316061019897461, 0.01187276840209961, 0.012429475784301758, 0.012986183166503906, 0.013542890548706055, 0.014099597930908203, 0.014656305313110352, 0.0152130126953125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 6.0, 11.0, 15.0, 19.0, 15.0, 25.0, 29.0, 27.0, 38.0, 47.0, 70.0, 97.0, 145.0, 426.0, 2513.0, 25835.0, 338187.0, 614040.0, 60354.0, 5221.0, 739.0, 221.0, 92.0, 71.0, 57.0, 50.0, 39.0, 17.0, 18.0, 25.0, 10.0, 21.0, 12.0, 8.0, 12.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.1805419921875, -0.17509841918945312, -0.16965484619140625, -0.16421127319335938, -0.1587677001953125, -0.15332412719726562, -0.14788055419921875, -0.14243698120117188, -0.136993408203125, -0.13154983520507812, -0.12610626220703125, -0.12066268920898438, -0.1152191162109375, -0.10977554321289062, -0.10433197021484375, -0.09888839721679688, -0.09344482421875, -0.08800125122070312, -0.08255767822265625, -0.07711410522460938, -0.0716705322265625, -0.06622695922851562, -0.06078338623046875, -0.055339813232421875, -0.049896240234375, -0.044452667236328125, -0.03900909423828125, -0.033565521240234375, -0.0281219482421875, -0.022678375244140625, -0.01723480224609375, -0.011791229248046875, -0.00634765625, -0.000904083251953125, 0.00453948974609375, 0.009983062744140625, 0.0154266357421875, 0.020870208740234375, 0.02631378173828125, 0.031757354736328125, 0.037200927734375, 0.042644500732421875, 0.04808807373046875, 0.053531646728515625, 0.0589752197265625, 0.06441879272460938, 0.06986236572265625, 0.07530593872070312, 0.08074951171875, 0.08619308471679688, 0.09163665771484375, 0.09708023071289062, 0.1025238037109375, 0.10796737670898438, 0.11341094970703125, 0.11885452270507812, 0.124298095703125, 0.12974166870117188, 0.13518524169921875, 0.14062881469726562, 0.1460723876953125, 0.15151596069335938, 0.15695953369140625, 0.16240310668945312, 0.1678466796875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 3.0, 8.0, 12.0, 10.0, 9.0, 21.0, 9.0, 13.0, 20.0, 27.0, 34.0, 25.0, 34.0, 31.0, 39.0, 47.0, 34.0, 55.0, 50.0, 47.0, 40.0, 52.0, 41.0, 30.0, 41.0, 30.0, 31.0, 31.0, 23.0, 29.0, 14.0, 19.0, 19.0, 16.0, 11.0, 11.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.01837158203125, -0.01783132553100586, -0.01729106903076172, -0.016750812530517578, -0.016210556030273438, -0.015670299530029297, -0.015130043029785156, -0.014589786529541016, -0.014049530029296875, -0.013509273529052734, -0.012969017028808594, -0.012428760528564453, -0.011888504028320312, -0.011348247528076172, -0.010807991027832031, -0.01026773452758789, -0.00972747802734375, -0.00918722152709961, -0.008646965026855469, -0.008106708526611328, -0.0075664520263671875, -0.007026195526123047, -0.006485939025878906, -0.005945682525634766, -0.005405426025390625, -0.004865169525146484, -0.004324913024902344, -0.003784656524658203, -0.0032444000244140625, -0.002704143524169922, -0.0021638870239257812, -0.0016236305236816406, -0.0010833740234375, -0.0005431175231933594, -2.86102294921875e-06, 0.0005373954772949219, 0.0010776519775390625, 0.0016179084777832031, 0.0021581649780273438, 0.0026984214782714844, 0.003238677978515625, 0.0037789344787597656, 0.004319190979003906, 0.004859447479248047, 0.0053997039794921875, 0.005939960479736328, 0.006480216979980469, 0.007020473480224609, 0.00756072998046875, 0.00810098648071289, 0.008641242980957031, 0.009181499481201172, 0.009721755981445312, 0.010262012481689453, 0.010802268981933594, 0.011342525482177734, 0.011882781982421875, 0.012423038482666016, 0.012963294982910156, 0.013503551483154297, 0.014043807983398438, 0.014584064483642578, 0.015124320983886719, 0.01566457748413086, 0.016204833984375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 9.0, 6.0, 8.0, 15.0, 19.0, 22.0, 35.0, 55.0, 76.0, 109.0, 143.0, 209.0, 362.0, 544.0, 865.0, 1516.0, 2597.0, 5329.0, 11372.0, 28412.0, 91074.0, 452403.0, 338615.0, 70967.0, 23467.0, 9607.0, 4668.0, 2416.0, 1331.0, 840.0, 459.0, 323.0, 242.0, 118.0, 99.0, 77.0, 44.0, 35.0, 18.0, 10.0, 8.0, 11.0, 6.0, 5.0, 8.0, 1.0, 2.0, 4.0, 2.0], "bins": [-0.00090789794921875, -0.0008832961320877075, -0.000858694314956665, -0.0008340924978256226, -0.0008094906806945801, -0.0007848888635635376, -0.0007602870464324951, -0.0007356852293014526, -0.0007110834121704102, -0.0006864815950393677, -0.0006618797779083252, -0.0006372779607772827, -0.0006126761436462402, -0.0005880743265151978, -0.0005634725093841553, -0.0005388706922531128, -0.0005142688751220703, -0.0004896670579910278, -0.00046506524085998535, -0.00044046342372894287, -0.0004158616065979004, -0.0003912597894668579, -0.00036665797233581543, -0.00034205615520477295, -0.00031745433807373047, -0.000292852520942688, -0.0002682507038116455, -0.00024364888668060303, -0.00021904706954956055, -0.00019444525241851807, -0.00016984343528747559, -0.0001452416181564331, -0.00012063980102539062, -9.603798389434814e-05, -7.143616676330566e-05, -4.6834349632263184e-05, -2.2232532501220703e-05, 2.3692846298217773e-06, 2.6971101760864258e-05, 5.157291889190674e-05, 7.617473602294922e-05, 0.0001007765531539917, 0.00012537837028503418, 0.00014998018741607666, 0.00017458200454711914, 0.00019918382167816162, 0.0002237856388092041, 0.0002483874559402466, 0.00027298927307128906, 0.00029759109020233154, 0.000322192907333374, 0.0003467947244644165, 0.000371396541595459, 0.00039599835872650146, 0.00042060017585754395, 0.0004452019929885864, 0.0004698038101196289, 0.0004944056272506714, 0.0005190074443817139, 0.0005436092615127563, 0.0005682110786437988, 0.0005928128957748413, 0.0006174147129058838, 0.0006420165300369263, 0.0006666183471679688]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 11.0, 13.0, 4.0, 16.0, 46.0, 39.0, 53.0, 103.0, 174.0, 175.0, 135.0, 81.0, 56.0, 39.0, 24.0, 7.0, 9.0, 6.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4722347259521484e-05, -1.4291144907474518e-05, -1.3859942555427551e-05, -1.3428740203380585e-05, -1.2997537851333618e-05, -1.2566335499286652e-05, -1.2135133147239685e-05, -1.1703930795192719e-05, -1.1272728443145752e-05, -1.0841526091098785e-05, -1.0410323739051819e-05, -9.979121387004852e-06, -9.547919034957886e-06, -9.11671668291092e-06, -8.685514330863953e-06, -8.254311978816986e-06, -7.82310962677002e-06, -7.391907274723053e-06, -6.9607049226760864e-06, -6.52950257062912e-06, -6.098300218582153e-06, -5.667097866535187e-06, -5.23589551448822e-06, -4.804693162441254e-06, -4.373490810394287e-06, -3.9422884583473206e-06, -3.511086106300354e-06, -3.0798837542533875e-06, -2.648681402206421e-06, -2.2174790501594543e-06, -1.7862766981124878e-06, -1.3550743460655212e-06, -9.238719940185547e-07, -4.926696419715881e-07, -6.146728992462158e-08, 3.6973506212234497e-07, 8.009374141693115e-07, 1.232139766216278e-06, 1.6633421182632446e-06, 2.094544470310211e-06, 2.5257468223571777e-06, 2.9569491744041443e-06, 3.388151526451111e-06, 3.819353878498077e-06, 4.250556230545044e-06, 4.6817585825920105e-06, 5.112960934638977e-06, 5.544163286685944e-06, 5.97536563873291e-06, 6.406567990779877e-06, 6.837770342826843e-06, 7.26897269487381e-06, 7.700175046920776e-06, 8.131377398967743e-06, 8.56257975101471e-06, 8.993782103061676e-06, 9.424984455108643e-06, 9.856186807155609e-06, 1.0287389159202576e-05, 1.0718591511249542e-05, 1.1149793863296509e-05, 1.1580996215343475e-05, 1.2012198567390442e-05, 1.2443400919437408e-05, 1.2874603271484375e-05]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 8.0, 3.0, 6.0, 7.0, 16.0, 16.0, 26.0, 29.0, 30.0, 29.0, 47.0, 68.0, 96.0, 212.0, 982.0, 20258.0, 929717.0, 93745.0, 2526.0, 287.0, 115.0, 80.0, 49.0, 41.0, 25.0, 26.0, 24.0, 17.0, 18.0, 7.0, 11.0, 12.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0018291473388671875, -0.0017653703689575195, -0.0017015933990478516, -0.0016378164291381836, -0.0015740394592285156, -0.0015102624893188477, -0.0014464855194091797, -0.0013827085494995117, -0.0013189315795898438, -0.0012551546096801758, -0.0011913776397705078, -0.0011276006698608398, -0.0010638236999511719, -0.001000046730041504, -0.0009362697601318359, -0.000872492790222168, -0.0008087158203125, -0.000744938850402832, -0.0006811618804931641, -0.0006173849105834961, -0.0005536079406738281, -0.0004898309707641602, -0.0004260540008544922, -0.0003622770309448242, -0.00029850006103515625, -0.00023472309112548828, -0.0001709461212158203, -0.00010716915130615234, -4.3392181396484375e-05, 2.0384788513183594e-05, 8.416175842285156e-05, 0.00014793872833251953, 0.0002117156982421875, 0.00027549266815185547, 0.00033926963806152344, 0.0004030466079711914, 0.0004668235778808594, 0.0005306005477905273, 0.0005943775177001953, 0.0006581544876098633, 0.0007219314575195312, 0.0007857084274291992, 0.0008494853973388672, 0.0009132623672485352, 0.0009770393371582031, 0.001040816307067871, 0.001104593276977539, 0.001168370246887207, 0.001232147216796875, 0.001295924186706543, 0.001359701156616211, 0.001423478126525879, 0.0014872550964355469, 0.0015510320663452148, 0.0016148090362548828, 0.0016785860061645508, 0.0017423629760742188, 0.0018061399459838867, 0.0018699169158935547, 0.0019336938858032227, 0.0019974708557128906, 0.0020612478256225586, 0.0021250247955322266, 0.0021888017654418945, 0.0022525787353515625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 10.0, 8.0, 6.0, 11.0, 19.0, 16.0, 23.0, 23.0, 33.0, 23.0, 43.0, 43.0, 50.0, 55.0, 53.0, 47.0, 62.0, 47.0, 63.0, 68.0, 41.0, 46.0, 33.0, 32.0, 24.0, 30.0, 14.0, 22.0, 13.0, 7.0, 4.0, 6.0, 3.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0001571178436279297, -0.00015252269804477692, -0.00014792755246162415, -0.00014333240687847137, -0.0001387372612953186, -0.00013414211571216583, -0.00012954697012901306, -0.0001249518245458603, -0.00012035667896270752, -0.00011576153337955475, -0.00011116638779640198, -0.0001065712422132492, -0.00010197609663009644, -9.738095104694366e-05, -9.27858054637909e-05, -8.819065988063812e-05, -8.359551429748535e-05, -7.900036871433258e-05, -7.440522313117981e-05, -6.981007754802704e-05, -6.521493196487427e-05, -6.0619786381721497e-05, -5.6024640798568726e-05, -5.1429495215415955e-05, -4.6834349632263184e-05, -4.223920404911041e-05, -3.764405846595764e-05, -3.304891288280487e-05, -2.84537672996521e-05, -2.385862171649933e-05, -1.9263476133346558e-05, -1.4668330550193787e-05, -1.0073184967041016e-05, -5.478039383888245e-06, -8.828938007354736e-07, 3.7122517824172974e-06, 8.307397365570068e-06, 1.290254294872284e-05, 1.749768853187561e-05, 2.209283411502838e-05, 2.6687979698181152e-05, 3.128312528133392e-05, 3.5878270864486694e-05, 4.0473416447639465e-05, 4.5068562030792236e-05, 4.966370761394501e-05, 5.425885319709778e-05, 5.885399878025055e-05, 6.344914436340332e-05, 6.804428994655609e-05, 7.263943552970886e-05, 7.723458111286163e-05, 8.18297266960144e-05, 8.642487227916718e-05, 9.102001786231995e-05, 9.561516344547272e-05, 0.00010021030902862549, 0.00010480545461177826, 0.00010940060019493103, 0.0001139957457780838, 0.00011859089136123657, 0.00012318603694438934, 0.00012778118252754211, 0.00013237632811069489, 0.00013697147369384766]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 13.0, 37.0, 109.0, 226.0, 321.0, 176.0, 80.0, 27.0, 9.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053385574370622635, -0.05032176896929741, -0.04725796356797218, -0.04419415816664696, -0.04113035276532173, -0.038066547363996506, -0.03500274196267128, -0.031938936561346054, -0.028875131160020828, -0.025811325758695602, -0.022747520357370377, -0.01968371495604515, -0.016619909554719925, -0.013556104153394699, -0.010492298752069473, -0.0074284933507442474, -0.004364687949419022, -0.0013008825480937958, 0.00176292285323143, 0.004826728254556656, 0.007890533655881882, 0.010954339057207108, 0.014018144458532333, 0.01708194985985756, 0.020145755261182785, 0.02320956066250801, 0.026273366063833237, 0.029337171465158463, 0.03240097686648369, 0.035464782267808914, 0.03852858766913414, 0.041592393070459366, 0.04465620219707489, 0.047720007598400116, 0.05078381299972534, 0.05384761840105057, 0.05691142380237579, 0.05997522920370102, 0.06303903460502625, 0.06610284000635147, 0.0691666454076767, 0.07223045080900192, 0.07529425621032715, 0.07835806161165237, 0.0814218670129776, 0.08448567241430283, 0.08754947781562805, 0.09061328321695328, 0.0936770886182785, 0.09674089401960373, 0.09980469942092896, 0.10286850482225418, 0.1059323102235794, 0.10899611562490463, 0.11205992102622986, 0.11512372642755508, 0.11818753182888031, 0.12125133723020554, 0.12431514263153076, 0.1273789405822754, 0.1304427534341812, 0.13350656628608704, 0.13657036423683167, 0.1396341621875763, 0.14269797503948212]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 4.0, 5.0, 3.0, 6.0, 8.0, 9.0, 13.0, 8.0, 11.0, 15.0, 15.0, 17.0, 19.0, 21.0, 20.0, 26.0, 34.0, 24.0, 39.0, 43.0, 33.0, 29.0, 32.0, 40.0, 42.0, 43.0, 25.0, 48.0, 26.0, 34.0, 32.0, 35.0, 36.0, 27.0, 25.0, 12.0, 20.0, 26.0, 16.0, 18.0, 15.0, 8.0, 9.0, 5.0, 12.0, 6.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.020291706547141075, -0.019664447754621506, -0.019037187099456787, -0.018409928306937218, -0.01778266951441765, -0.01715540885925293, -0.01652815006673336, -0.01590089127421379, -0.015273630619049072, -0.014646370895206928, -0.014019111171364784, -0.013391852378845215, -0.01276459265500307, -0.012137332931160927, -0.011510074138641357, -0.010882814414799213, -0.01025555469095707, -0.009628294967114925, -0.009001035243272781, -0.008373776450753212, -0.007746516726911068, -0.007119257003068924, -0.006491997744888067, -0.0058647384867072105, -0.0052374787628650665, -0.0046102190390229225, -0.003982959780842066, -0.0033557002898305655, -0.002728440798819065, -0.0021011813078075647, -0.0014739218167960644, -0.0008466625586152077, -0.0002194046974182129, 0.00040785479359328747, 0.0010351142846047878, 0.0016623737756162882, 0.0022896332666277885, 0.002916892757639289, 0.0035441522486507893, 0.004171411506831646, 0.00479867123067379, 0.005425930954515934, 0.006053190212696791, 0.006680449470877647, 0.007307709194719791, 0.007934968918561935, 0.008562227711081505, 0.009189487434923649, 0.009816747158765793, 0.010444006882607937, 0.011071266606450081, 0.01169852539896965, 0.012325785122811794, 0.012953044846653938, 0.013580303639173508, 0.014207563363015652, 0.014834823086857796, 0.01546208281069994, 0.016089342534542084, 0.016716601327061653, 0.017343860119581223, 0.01797112077474594, 0.01859837956726551, 0.01922563835978508, 0.0198528990149498]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 8.0, 11.0, 9.0, 13.0, 20.0, 28.0, 31.0, 55.0, 72.0, 100.0, 115.0, 163.0, 219.0, 353.0, 530.0, 840.0, 1441.0, 2546.0, 4905.0, 13133.0, 112304.0, 2126191.0, 1802284.0, 104289.0, 13394.0, 4864.0, 2428.0, 1373.0, 799.0, 526.0, 390.0, 238.0, 160.0, 121.0, 87.0, 54.0, 44.0, 38.0, 30.0, 23.0, 16.0, 5.0, 8.0, 6.0, 3.0, 8.0, 2.0, 1.0, 1.0, 2.0, 4.0], "bins": [-0.03314208984375, -0.03219461441040039, -0.03124713897705078, -0.030299663543701172, -0.029352188110351562, -0.028404712677001953, -0.027457237243652344, -0.026509761810302734, -0.025562286376953125, -0.024614810943603516, -0.023667335510253906, -0.022719860076904297, -0.021772384643554688, -0.020824909210205078, -0.01987743377685547, -0.01892995834350586, -0.01798248291015625, -0.01703500747680664, -0.01608753204345703, -0.015140056610107422, -0.014192581176757812, -0.013245105743408203, -0.012297630310058594, -0.011350154876708984, -0.010402679443359375, -0.009455204010009766, -0.008507728576660156, -0.007560253143310547, -0.0066127777099609375, -0.005665302276611328, -0.004717826843261719, -0.0037703514099121094, -0.0028228759765625, -0.0018754005432128906, -0.0009279251098632812, 1.9550323486328125e-05, 0.0009670257568359375, 0.0019145011901855469, 0.0028619766235351562, 0.0038094520568847656, 0.004756927490234375, 0.005704402923583984, 0.006651878356933594, 0.007599353790283203, 0.008546829223632812, 0.009494304656982422, 0.010441780090332031, 0.01138925552368164, 0.01233673095703125, 0.01328420639038086, 0.014231681823730469, 0.015179157257080078, 0.016126632690429688, 0.017074108123779297, 0.018021583557128906, 0.018969058990478516, 0.019916534423828125, 0.020864009857177734, 0.021811485290527344, 0.022758960723876953, 0.023706436157226562, 0.024653911590576172, 0.02560138702392578, 0.02654886245727539, 0.027496337890625]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 11.0, 3.0, 4.0, 2.0, 12.0, 13.0, 10.0, 9.0, 9.0, 19.0, 19.0, 14.0, 36.0, 30.0, 28.0, 28.0, 28.0, 39.0, 36.0, 33.0, 34.0, 44.0, 41.0, 49.0, 39.0, 32.0, 34.0, 38.0, 33.0, 32.0, 31.0, 32.0, 22.0, 22.0, 19.0, 15.0, 22.0, 21.0, 6.0, 12.0, 14.0, 10.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.015228271484375, -0.014733076095581055, -0.01423788070678711, -0.013742685317993164, -0.013247489929199219, -0.012752294540405273, -0.012257099151611328, -0.011761903762817383, -0.011266708374023438, -0.010771512985229492, -0.010276317596435547, -0.009781122207641602, -0.009285926818847656, -0.008790731430053711, -0.008295536041259766, -0.00780034065246582, -0.007305145263671875, -0.00680994987487793, -0.006314754486083984, -0.005819559097290039, -0.005324363708496094, -0.0048291683197021484, -0.004333972930908203, -0.003838777542114258, -0.0033435821533203125, -0.002848386764526367, -0.002353191375732422, -0.0018579959869384766, -0.0013628005981445312, -0.0008676052093505859, -0.0003724098205566406, 0.0001227855682373047, 0.00061798095703125, 0.0011131763458251953, 0.0016083717346191406, 0.002103567123413086, 0.0025987625122070312, 0.0030939579010009766, 0.003589153289794922, 0.004084348678588867, 0.0045795440673828125, 0.005074739456176758, 0.005569934844970703, 0.0060651302337646484, 0.006560325622558594, 0.007055521011352539, 0.007550716400146484, 0.00804591178894043, 0.008541107177734375, 0.00903630256652832, 0.009531497955322266, 0.010026693344116211, 0.010521888732910156, 0.011017084121704102, 0.011512279510498047, 0.012007474899291992, 0.012502670288085938, 0.012997865676879883, 0.013493061065673828, 0.013988256454467773, 0.014483451843261719, 0.014978647232055664, 0.01547384262084961, 0.015969038009643555, 0.0164642333984375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 4.0, 3.0, 10.0, 7.0, 8.0, 17.0, 15.0, 25.0, 29.0, 43.0, 89.0, 218.0, 461.0, 1561.0, 7522.0, 232501.0, 3932008.0, 15928.0, 2638.0, 675.0, 257.0, 116.0, 50.0, 20.0, 14.0, 15.0, 12.0, 6.0, 3.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1556396484375, -0.15064620971679688, -0.14565277099609375, -0.14065933227539062, -0.1356658935546875, -0.13067245483398438, -0.12567901611328125, -0.12068557739257812, -0.115692138671875, -0.11069869995117188, -0.10570526123046875, -0.10071182250976562, -0.0957183837890625, -0.09072494506835938, -0.08573150634765625, -0.08073806762695312, -0.07574462890625, -0.07075119018554688, -0.06575775146484375, -0.060764312744140625, -0.0557708740234375, -0.050777435302734375, -0.04578399658203125, -0.040790557861328125, -0.035797119140625, -0.030803680419921875, -0.02581024169921875, -0.020816802978515625, -0.0158233642578125, -0.010829925537109375, -0.00583648681640625, -0.000843048095703125, 0.004150390625, 0.009143829345703125, 0.01413726806640625, 0.019130706787109375, 0.0241241455078125, 0.029117584228515625, 0.03411102294921875, 0.039104461669921875, 0.044097900390625, 0.049091339111328125, 0.05408477783203125, 0.059078216552734375, 0.0640716552734375, 0.06906509399414062, 0.07405853271484375, 0.07905197143554688, 0.08404541015625, 0.08903884887695312, 0.09403228759765625, 0.09902572631835938, 0.1040191650390625, 0.10901260375976562, 0.11400604248046875, 0.11899948120117188, 0.123992919921875, 0.12898635864257812, 0.13397979736328125, 0.13897323608398438, 0.1439666748046875, 0.14896011352539062, 0.15395355224609375, 0.15894699096679688, 0.1639404296875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 3.0, 8.0, 8.0, 18.0, 28.0, 46.0, 119.0, 371.0, 965.0, 1309.0, 675.0, 238.0, 99.0, 58.0, 33.0, 22.0, 16.0, 10.0, 7.0, 8.0, 7.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0141448974609375, -0.01372063159942627, -0.013296365737915039, -0.012872099876403809, -0.012447834014892578, -0.012023568153381348, -0.011599302291870117, -0.011175036430358887, -0.010750770568847656, -0.010326504707336426, -0.009902238845825195, -0.009477972984313965, -0.009053707122802734, -0.008629441261291504, -0.008205175399780273, -0.007780909538269043, -0.0073566436767578125, -0.006932377815246582, -0.0065081119537353516, -0.006083846092224121, -0.005659580230712891, -0.00523531436920166, -0.00481104850769043, -0.004386782646179199, -0.003962516784667969, -0.0035382509231567383, -0.003113985061645508, -0.0026897192001342773, -0.002265453338623047, -0.0018411874771118164, -0.001416921615600586, -0.0009926557540893555, -0.000568389892578125, -0.00014412403106689453, 0.00028014183044433594, 0.0007044076919555664, 0.0011286735534667969, 0.0015529394149780273, 0.001977205276489258, 0.0024014711380004883, 0.0028257369995117188, 0.0032500028610229492, 0.0036742687225341797, 0.00409853458404541, 0.004522800445556641, 0.004947066307067871, 0.0053713321685791016, 0.005795598030090332, 0.0062198638916015625, 0.006644129753112793, 0.0070683956146240234, 0.007492661476135254, 0.007916927337646484, 0.008341193199157715, 0.008765459060668945, 0.009189724922180176, 0.009613990783691406, 0.010038256645202637, 0.010462522506713867, 0.010886788368225098, 0.011311054229736328, 0.011735320091247559, 0.012159585952758789, 0.01258385181427002, 0.01300811767578125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 22.0, 34.0, 77.0, 142.0, 216.0, 237.0, 143.0, 66.0, 39.0, 14.0, 12.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030383160337805748, -0.028347738087177277, -0.026312315836548805, -0.024276893585920334, -0.022241471335291862, -0.02020604908466339, -0.01817062683403492, -0.01613520458340645, -0.014099782332777977, -0.012064360082149506, -0.010028937831521034, -0.007993515580892563, -0.0059580933302640915, -0.00392267107963562, -0.0018872488290071487, 0.00014817342162132263, 0.002183595672249794, 0.004219017922878265, 0.006254440173506737, 0.008289862424135208, 0.01032528467476368, 0.012360706925392151, 0.014396129176020622, 0.016431551426649094, 0.018466973677277565, 0.020502395927906036, 0.022537818178534508, 0.02457324042916298, 0.02660866267979145, 0.028644084930419922, 0.030679507181048393, 0.032714929431676865, 0.03475034981966019, 0.03678577393293381, 0.03882119432091713, 0.04085661470890045, 0.04289203882217407, 0.04492746293544769, 0.046962883323431015, 0.04899830371141434, 0.05103372782468796, 0.05306915193796158, 0.0551045723259449, 0.05713999271392822, 0.05917541682720184, 0.061210840940475464, 0.06324626505374908, 0.06528168171644211, 0.06731710582971573, 0.06935252994298935, 0.07138794660568237, 0.073423370718956, 0.07545879483222961, 0.07749421894550323, 0.07952964305877686, 0.08156505972146988, 0.0836004838347435, 0.08563590794801712, 0.08767132461071014, 0.08970674872398376, 0.09174217283725739, 0.093777596950531, 0.09581302106380463, 0.09784843772649765, 0.09988386183977127]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 6.0, 6.0, 11.0, 8.0, 7.0, 15.0, 12.0, 16.0, 18.0, 25.0, 11.0, 29.0, 27.0, 27.0, 26.0, 24.0, 27.0, 30.0, 34.0, 45.0, 43.0, 36.0, 31.0, 35.0, 36.0, 35.0, 34.0, 40.0, 30.0, 34.0, 26.0, 22.0, 28.0, 21.0, 19.0, 20.0, 17.0, 19.0, 11.0, 10.0, 9.0, 15.0, 3.0, 4.0, 3.0, 7.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.015698859468102455, -0.015224277973175049, -0.014749695546925068, -0.014275114051997662, -0.01380053162574768, -0.013325950130820274, -0.012851368635892868, -0.012376786209642887, -0.011902203783392906, -0.0114276222884655, -0.010953039862215519, -0.010478458367288113, -0.010003875941038132, -0.009529294446110725, -0.009054712951183319, -0.008580130524933338, -0.008105549030005932, -0.007630967069417238, -0.007156385108828545, -0.006681803613901138, -0.006207221187651157, -0.005732639692723751, -0.0052580577321350574, -0.004783475771546364, -0.00430889381095767, -0.0038343118503689766, -0.003359729889780283, -0.002885148162022233, -0.0024105662014335394, -0.0019359842408448458, -0.0014614025130867958, -0.0009868205524981022, -0.000512237660586834, -3.765575820580125e-05, 0.00043692614417523146, 0.0009115079883486032, 0.0013860899489372969, 0.0018606719095259905, 0.0023352536372840405, 0.002809835597872734, 0.0032844175584614277, 0.0037589995190501213, 0.004233581479638815, 0.0047081634402275085, 0.005182744935154915, 0.005657327361404896, 0.006131908856332302, 0.006606490816920996, 0.007081072777509689, 0.007555654738098383, 0.008030236698687077, 0.008504818193614483, 0.008979400619864464, 0.00945398211479187, 0.009928563609719276, 0.010403146035969257, 0.010877728462219238, 0.011352309957146645, 0.011826892383396626, 0.012301473878324032, 0.012776056304574013, 0.013250637799501419, 0.013725219294428825, 0.014199801720678806, 0.014674383215606213]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 8.0, 6.0, 9.0, 9.0, 17.0, 18.0, 25.0, 48.0, 55.0, 81.0, 111.0, 123.0, 218.0, 303.0, 420.0, 642.0, 935.0, 1354.0, 2014.0, 3192.0, 4765.0, 7579.0, 11879.0, 19903.0, 33828.0, 60732.0, 120316.0, 246504.0, 254896.0, 125426.0, 63035.0, 34979.0, 20349.0, 12320.0, 7653.0, 4993.0, 3226.0, 2120.0, 1440.0, 966.0, 624.0, 382.0, 304.0, 229.0, 156.0, 119.0, 79.0, 49.0, 28.0, 20.0, 30.0, 15.0, 11.0, 8.0, 5.0, 4.0, 2.0, 2.0], "bins": [-0.00972747802734375, -0.009441614151000977, -0.009155750274658203, -0.00886988639831543, -0.008584022521972656, -0.008298158645629883, -0.00801229476928711, -0.007726430892944336, -0.0074405670166015625, -0.007154703140258789, -0.006868839263916016, -0.006582975387573242, -0.006297111511230469, -0.006011247634887695, -0.005725383758544922, -0.0054395198822021484, -0.005153656005859375, -0.0048677921295166016, -0.004581928253173828, -0.004296064376831055, -0.004010200500488281, -0.003724336624145508, -0.0034384727478027344, -0.003152608871459961, -0.0028667449951171875, -0.002580881118774414, -0.0022950172424316406, -0.002009153366088867, -0.0017232894897460938, -0.0014374256134033203, -0.0011515617370605469, -0.0008656978607177734, -0.000579833984375, -0.00029397010803222656, -8.106231689453125e-06, 0.0002777576446533203, 0.0005636215209960938, 0.0008494853973388672, 0.0011353492736816406, 0.001421213150024414, 0.0017070770263671875, 0.001992940902709961, 0.0022788047790527344, 0.002564668655395508, 0.0028505325317382812, 0.0031363964080810547, 0.003422260284423828, 0.0037081241607666016, 0.003993988037109375, 0.0042798519134521484, 0.004565715789794922, 0.004851579666137695, 0.005137443542480469, 0.005423307418823242, 0.005709171295166016, 0.005995035171508789, 0.0062808990478515625, 0.006566762924194336, 0.006852626800537109, 0.007138490676879883, 0.007424354553222656, 0.00771021842956543, 0.007996082305908203, 0.008281946182250977, 0.00856781005859375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 9.0, 6.0, 6.0, 7.0, 11.0, 11.0, 19.0, 11.0, 20.0, 11.0, 21.0, 20.0, 19.0, 19.0, 39.0, 25.0, 38.0, 18.0, 28.0, 27.0, 40.0, 39.0, 37.0, 31.0, 34.0, 24.0, 36.0, 41.0, 34.0, 36.0, 38.0, 27.0, 29.0, 27.0, 24.0, 16.0, 16.0, 15.0, 11.0, 15.0, 17.0, 9.0, 5.0, 6.0, 10.0, 3.0, 4.0, 2.0, 5.0, 0.0, 5.0, 2.0], "bins": [-0.016448974609375, -0.015978455543518066, -0.015507936477661133, -0.0150374174118042, -0.014566898345947266, -0.014096379280090332, -0.013625860214233398, -0.013155341148376465, -0.012684822082519531, -0.012214303016662598, -0.011743783950805664, -0.01127326488494873, -0.010802745819091797, -0.010332226753234863, -0.00986170768737793, -0.009391188621520996, -0.008920669555664062, -0.008450150489807129, -0.007979631423950195, -0.007509112358093262, -0.007038593292236328, -0.0065680742263793945, -0.006097555160522461, -0.005627036094665527, -0.005156517028808594, -0.00468599796295166, -0.0042154788970947266, -0.003744959831237793, -0.0032744407653808594, -0.0028039216995239258, -0.002333402633666992, -0.0018628835678100586, -0.001392364501953125, -0.0009218454360961914, -0.0004513263702392578, 1.919269561767578e-05, 0.0004897117614746094, 0.000960230827331543, 0.0014307498931884766, 0.0019012689590454102, 0.0023717880249023438, 0.0028423070907592773, 0.003312826156616211, 0.0037833452224731445, 0.004253864288330078, 0.004724383354187012, 0.005194902420043945, 0.005665421485900879, 0.0061359405517578125, 0.006606459617614746, 0.00707697868347168, 0.007547497749328613, 0.008018016815185547, 0.00848853588104248, 0.008959054946899414, 0.009429574012756348, 0.009900093078613281, 0.010370612144470215, 0.010841131210327148, 0.011311650276184082, 0.011782169342041016, 0.01225268840789795, 0.012723207473754883, 0.013193726539611816, 0.01366424560546875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 3.0, 10.0, 9.0, 9.0, 15.0, 22.0, 38.0, 46.0, 60.0, 99.0, 136.0, 179.0, 262.0, 362.0, 529.0, 803.0, 1107.0, 1644.0, 2586.0, 3662.0, 5864.0, 8874.0, 14563.0, 23792.0, 41430.0, 79088.0, 184510.0, 360498.0, 153433.0, 68830.0, 37056.0, 21659.0, 13011.0, 8319.0, 5304.0, 3453.0, 2329.0, 1526.0, 1045.0, 705.0, 519.0, 360.0, 223.0, 164.0, 138.0, 95.0, 57.0, 36.0, 27.0, 20.0, 20.0, 17.0, 6.0, 6.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.00885772705078125, -0.008575677871704102, -0.008293628692626953, -0.008011579513549805, -0.007729530334472656, -0.007447481155395508, -0.007165431976318359, -0.006883382797241211, -0.0066013336181640625, -0.006319284439086914, -0.006037235260009766, -0.005755186080932617, -0.005473136901855469, -0.00519108772277832, -0.004909038543701172, -0.0046269893646240234, -0.004344940185546875, -0.0040628910064697266, -0.003780841827392578, -0.0034987926483154297, -0.0032167434692382812, -0.002934694290161133, -0.0026526451110839844, -0.002370595932006836, -0.0020885467529296875, -0.001806497573852539, -0.0015244483947753906, -0.0012423992156982422, -0.0009603500366210938, -0.0006783008575439453, -0.0003962516784667969, -0.00011420249938964844, 0.0001678466796875, 0.00044989585876464844, 0.0007319450378417969, 0.0010139942169189453, 0.0012960433959960938, 0.0015780925750732422, 0.0018601417541503906, 0.002142190933227539, 0.0024242401123046875, 0.002706289291381836, 0.0029883384704589844, 0.003270387649536133, 0.0035524368286132812, 0.0038344860076904297, 0.004116535186767578, 0.0043985843658447266, 0.004680633544921875, 0.0049626827239990234, 0.005244731903076172, 0.00552678108215332, 0.005808830261230469, 0.006090879440307617, 0.006372928619384766, 0.006654977798461914, 0.0069370269775390625, 0.007219076156616211, 0.007501125335693359, 0.007783174514770508, 0.008065223693847656, 0.008347272872924805, 0.008629322052001953, 0.008911371231079102, 0.00919342041015625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 6.0, 2.0, 9.0, 10.0, 7.0, 17.0, 12.0, 16.0, 21.0, 22.0, 30.0, 26.0, 28.0, 29.0, 28.0, 39.0, 47.0, 41.0, 57.0, 40.0, 34.0, 39.0, 43.0, 53.0, 38.0, 40.0, 32.0, 35.0, 23.0, 28.0, 24.0, 18.0, 17.0, 16.0, 9.0, 11.0, 13.0, 9.0, 9.0, 3.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0119476318359375, -0.011577010154724121, -0.011206388473510742, -0.010835766792297363, -0.010465145111083984, -0.010094523429870605, -0.009723901748657227, -0.009353280067443848, -0.008982658386230469, -0.00861203670501709, -0.008241415023803711, -0.007870793342590332, -0.007500171661376953, -0.007129549980163574, -0.006758928298950195, -0.006388306617736816, -0.0060176849365234375, -0.005647063255310059, -0.00527644157409668, -0.004905819892883301, -0.004535198211669922, -0.004164576530456543, -0.003793954849243164, -0.003423333168029785, -0.0030527114868164062, -0.0026820898056030273, -0.0023114681243896484, -0.0019408464431762695, -0.0015702247619628906, -0.0011996030807495117, -0.0008289813995361328, -0.0004583597183227539, -8.7738037109375e-05, 0.0002828836441040039, 0.0006535053253173828, 0.0010241270065307617, 0.0013947486877441406, 0.0017653703689575195, 0.0021359920501708984, 0.0025066137313842773, 0.0028772354125976562, 0.003247857093811035, 0.003618478775024414, 0.003989100456237793, 0.004359722137451172, 0.004730343818664551, 0.00510096549987793, 0.005471587181091309, 0.0058422088623046875, 0.006212830543518066, 0.006583452224731445, 0.006954073905944824, 0.007324695587158203, 0.007695317268371582, 0.008065938949584961, 0.00843656063079834, 0.008807182312011719, 0.009177803993225098, 0.009548425674438477, 0.009919047355651855, 0.010289669036865234, 0.010660290718078613, 0.011030912399291992, 0.011401534080505371, 0.01177215576171875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 10.0, 14.0, 19.0, 20.0, 26.0, 49.0, 61.0, 96.0, 156.0, 236.0, 384.0, 608.0, 1022.0, 1553.0, 2700.0, 4792.0, 9205.0, 18873.0, 43119.0, 135313.0, 605601.0, 139983.0, 44256.0, 19043.0, 9413.0, 4934.0, 2716.0, 1625.0, 1006.0, 627.0, 361.0, 232.0, 174.0, 105.0, 74.0, 55.0, 31.0, 18.0, 14.0, 9.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010881423950195312, -0.0010546743869781494, -0.0010212063789367676, -0.0009877383708953857, -0.0009542703628540039, -0.0009208023548126221, -0.0008873343467712402, -0.0008538663387298584, -0.0008203983306884766, -0.0007869303226470947, -0.0007534623146057129, -0.0007199943065643311, -0.0006865262985229492, -0.0006530582904815674, -0.0006195902824401855, -0.0005861222743988037, -0.0005526542663574219, -0.00051918625831604, -0.0004857182502746582, -0.00045225024223327637, -0.00041878223419189453, -0.0003853142261505127, -0.00035184621810913086, -0.000318378210067749, -0.0002849102020263672, -0.00025144219398498535, -0.00021797418594360352, -0.00018450617790222168, -0.00015103816986083984, -0.00011757016181945801, -8.410215377807617e-05, -5.0634145736694336e-05, -1.71661376953125e-05, 1.6301870346069336e-05, 4.976987838745117e-05, 8.323788642883301e-05, 0.00011670589447021484, 0.00015017390251159668, 0.00018364191055297852, 0.00021710991859436035, 0.0002505779266357422, 0.000284045934677124, 0.00031751394271850586, 0.0003509819507598877, 0.00038444995880126953, 0.00041791796684265137, 0.0004513859748840332, 0.00048485398292541504, 0.0005183219909667969, 0.0005517899990081787, 0.0005852580070495605, 0.0006187260150909424, 0.0006521940231323242, 0.0006856620311737061, 0.0007191300392150879, 0.0007525980472564697, 0.0007860660552978516, 0.0008195340633392334, 0.0008530020713806152, 0.0008864700794219971, 0.0009199380874633789, 0.0009534060955047607, 0.0009868741035461426, 0.0010203421115875244, 0.0010538101196289062]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 9.0, 7.0, 8.0, 8.0, 11.0, 13.0, 14.0, 21.0, 31.0, 31.0, 52.0, 70.0, 69.0, 90.0, 63.0, 75.0, 86.0, 75.0, 60.0, 42.0, 39.0, 39.0, 18.0, 22.0, 8.0, 9.0, 7.0, 9.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7344951629638672e-05, -1.6862526535987854e-05, -1.6380101442337036e-05, -1.5897676348686218e-05, -1.54152512550354e-05, -1.4932826161384583e-05, -1.4450401067733765e-05, -1.3967975974082947e-05, -1.3485550880432129e-05, -1.3003125786781311e-05, -1.2520700693130493e-05, -1.2038275599479675e-05, -1.1555850505828857e-05, -1.107342541217804e-05, -1.0591000318527222e-05, -1.0108575224876404e-05, -9.626150131225586e-06, -9.143725037574768e-06, -8.66129994392395e-06, -8.178874850273132e-06, -7.696449756622314e-06, -7.214024662971497e-06, -6.731599569320679e-06, -6.249174475669861e-06, -5.766749382019043e-06, -5.284324288368225e-06, -4.801899194717407e-06, -4.319474101066589e-06, -3.8370490074157715e-06, -3.3546239137649536e-06, -2.8721988201141357e-06, -2.389773726463318e-06, -1.9073486328125e-06, -1.4249235391616821e-06, -9.424984455108643e-07, -4.600733518600464e-07, 2.2351741790771484e-08, 5.047768354415894e-07, 9.872019290924072e-07, 1.469627022743225e-06, 1.952052116394043e-06, 2.434477210044861e-06, 2.9169023036956787e-06, 3.3993273973464966e-06, 3.8817524909973145e-06, 4.364177584648132e-06, 4.84660267829895e-06, 5.329027771949768e-06, 5.811452865600586e-06, 6.293877959251404e-06, 6.776303052902222e-06, 7.2587281465530396e-06, 7.741153240203857e-06, 8.223578333854675e-06, 8.706003427505493e-06, 9.188428521156311e-06, 9.670853614807129e-06, 1.0153278708457947e-05, 1.0635703802108765e-05, 1.1118128895759583e-05, 1.16005539894104e-05, 1.2082979083061218e-05, 1.2565404176712036e-05, 1.3047829270362854e-05, 1.3530254364013672e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 6.0, 3.0, 7.0, 9.0, 12.0, 22.0, 26.0, 35.0, 61.0, 65.0, 139.0, 331.0, 922.0, 3484.0, 20068.0, 313257.0, 673609.0, 29823.0, 4733.0, 1152.0, 365.0, 165.0, 82.0, 51.0, 32.0, 24.0, 14.0, 13.0, 12.0, 11.0, 4.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021800994873046875, -0.002102494239807129, -0.0020248889923095703, -0.0019472837448120117, -0.0018696784973144531, -0.0017920732498168945, -0.001714468002319336, -0.0016368627548217773, -0.0015592575073242188, -0.0014816522598266602, -0.0014040470123291016, -0.001326441764831543, -0.0012488365173339844, -0.0011712312698364258, -0.0010936260223388672, -0.0010160207748413086, -0.00093841552734375, -0.0008608102798461914, -0.0007832050323486328, -0.0007055997848510742, -0.0006279945373535156, -0.000550389289855957, -0.00047278404235839844, -0.00039517879486083984, -0.00031757354736328125, -0.00023996829986572266, -0.00016236305236816406, -8.475780487060547e-05, -7.152557373046875e-06, 7.045269012451172e-05, 0.0001480579376220703, 0.0002256631851196289, 0.0003032684326171875, 0.0003808736801147461, 0.0004584789276123047, 0.0005360841751098633, 0.0006136894226074219, 0.0006912946701049805, 0.0007688999176025391, 0.0008465051651000977, 0.0009241104125976562, 0.0010017156600952148, 0.0010793209075927734, 0.001156926155090332, 0.0012345314025878906, 0.0013121366500854492, 0.0013897418975830078, 0.0014673471450805664, 0.001544952392578125, 0.0016225576400756836, 0.0017001628875732422, 0.0017777681350708008, 0.0018553733825683594, 0.001932978630065918, 0.0020105838775634766, 0.002088189125061035, 0.0021657943725585938, 0.0022433996200561523, 0.002321004867553711, 0.0023986101150512695, 0.002476215362548828, 0.0025538206100463867, 0.0026314258575439453, 0.002709031105041504, 0.0027866363525390625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 4.0, 7.0, 5.0, 8.0, 9.0, 6.0, 14.0, 24.0, 19.0, 34.0, 31.0, 42.0, 58.0, 72.0, 109.0, 112.0, 96.0, 58.0, 61.0, 46.0, 39.0, 30.0, 20.0, 23.0, 18.0, 11.0, 14.0, 8.0, 4.0, 4.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000263214111328125, -0.00025580450892448425, -0.0002483949065208435, -0.00024098530411720276, -0.000233575701713562, -0.00022616609930992126, -0.00021875649690628052, -0.00021134689450263977, -0.00020393729209899902, -0.00019652768969535828, -0.00018911808729171753, -0.00018170848488807678, -0.00017429888248443604, -0.0001668892800807953, -0.00015947967767715454, -0.0001520700752735138, -0.00014466047286987305, -0.0001372508704662323, -0.00012984126806259155, -0.0001224316656589508, -0.00011502206325531006, -0.00010761246085166931, -0.00010020285844802856, -9.279325604438782e-05, -8.538365364074707e-05, -7.797405123710632e-05, -7.056444883346558e-05, -6.315484642982483e-05, -5.574524402618408e-05, -4.8335641622543335e-05, -4.092603921890259e-05, -3.351643681526184e-05, -2.6106834411621094e-05, -1.8697232007980347e-05, -1.12876296043396e-05, -3.8780272006988525e-06, 3.5315752029418945e-06, 1.0941177606582642e-05, 1.835078001022339e-05, 2.5760382413864136e-05, 3.316998481750488e-05, 4.057958722114563e-05, 4.798918962478638e-05, 5.5398792028427124e-05, 6.280839443206787e-05, 7.021799683570862e-05, 7.762759923934937e-05, 8.503720164299011e-05, 9.244680404663086e-05, 9.98564064502716e-05, 0.00010726600885391235, 0.0001146756112575531, 0.00012208521366119385, 0.0001294948160648346, 0.00013690441846847534, 0.0001443140208721161, 0.00015172362327575684, 0.00015913322567939758, 0.00016654282808303833, 0.00017395243048667908, 0.00018136203289031982, 0.00018877163529396057, 0.00019618123769760132, 0.00020359084010124207, 0.0002110004425048828]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 12.0, 17.0, 20.0, 31.0, 43.0, 73.0, 99.0, 113.0, 152.0, 131.0, 108.0, 69.0, 46.0, 30.0, 22.0, 14.0, 11.0, 4.0, 7.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05490463599562645, -0.053613971918821335, -0.05232330784201622, -0.051032643765211105, -0.04974197596311569, -0.04845131188631058, -0.04716064780950546, -0.04586998373270035, -0.04457931965589523, -0.04328865557909012, -0.041997991502285004, -0.04070732742547989, -0.039416663348674774, -0.03812599554657936, -0.036835331469774246, -0.03554466739296913, -0.03425400331616402, -0.0329633392393589, -0.03167267516255379, -0.030382009223103523, -0.02909134514629841, -0.027800681069493294, -0.02651001513004303, -0.025219351053237915, -0.0239286869764328, -0.022638022899627686, -0.02134735882282257, -0.020056692883372307, -0.018766028806567192, -0.017475364729762077, -0.016184698790311813, -0.014894034713506699, -0.013603366911411285, -0.01231270283460617, -0.011022037826478481, -0.009731372818350792, -0.008440708741545677, -0.007150044199079275, -0.005859379656612873, -0.004568714648485184, -0.003278050571680069, -0.001987386029213667, -0.0006967214867472649, 0.0005939430557191372, 0.0018846075981855392, 0.0031752721406519413, 0.004465936683118343, 0.005756601691246033, 0.0070472657680511475, 0.008337929844856262, 0.009628594852983952, 0.010919259861111641, 0.012209923937916756, 0.01350058801472187, 0.01479125302284956, 0.01608191803097725, 0.017372582107782364, 0.01866324618458748, 0.019953910261392593, 0.021244576200842857, 0.022535240277647972, 0.023825904354453087, 0.02511657029390335, 0.026407234370708466, 0.02769789844751358]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 6.0, 8.0, 11.0, 10.0, 12.0, 14.0, 11.0, 15.0, 26.0, 16.0, 22.0, 28.0, 24.0, 33.0, 17.0, 28.0, 30.0, 35.0, 36.0, 37.0, 43.0, 35.0, 36.0, 28.0, 30.0, 34.0, 31.0, 47.0, 26.0, 25.0, 24.0, 24.0, 33.0, 18.0, 17.0, 21.0, 18.0, 12.0, 13.0, 8.0, 9.0, 10.0, 9.0, 4.0, 7.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0], "bins": [-0.01538625918328762, -0.014942603185772896, -0.014498948119580746, -0.014055292122066021, -0.01361163705587387, -0.013167981058359146, -0.012724325060844421, -0.012280669994652271, -0.011837014928460121, -0.011393358930945396, -0.010949703864753246, -0.010506047867238522, -0.010062392801046371, -0.009618736803531647, -0.009175080806016922, -0.008731425739824772, -0.008287769742310047, -0.007844113744795322, -0.007400458678603172, -0.006956802681088448, -0.0065131476148962975, -0.006069491617381573, -0.005625836085528135, -0.005182180553674698, -0.0047385250218212605, -0.004294869489967823, -0.0038512139581143856, -0.0034075581934303045, -0.002963902661576867, -0.0025202471297234297, -0.0020765913650393486, -0.0016329358331859112, -0.0011892812326550484, -0.00074562564259395, -0.0003019700525328517, 0.00014168559573590755, 0.000585341127589345, 0.0010289966594427824, 0.0014726524241268635, 0.001916307955980301, 0.0023599634878337383, 0.0028036190196871758, 0.003247274551540613, 0.0036909303162246943, 0.004134586080908775, 0.0045782411471009254, 0.00502189714461565, 0.005465552676469088, 0.005909208208322525, 0.0063528637401759624, 0.0067965192720294, 0.007240175269544125, 0.007683830335736275, 0.008127486333251, 0.008571142330765724, 0.009014797396957874, 0.009458452463150024, 0.00990210846066475, 0.0103457635268569, 0.010789419524371624, 0.011233074590563774, 0.011676730588078499, 0.012120386585593224, 0.012564041651785374, 0.013007697649300098]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 10.0, 24.0, 24.0, 51.0, 50.0, 74.0, 113.0, 156.0, 202.0, 310.0, 442.0, 602.0, 857.0, 1328.0, 1825.0, 2677.0, 3741.0, 5627.0, 8024.0, 12118.0, 18078.0, 26671.0, 39802.0, 59225.0, 85912.0, 116118.0, 139936.0, 139716.0, 116359.0, 86182.0, 58908.0, 39997.0, 26764.0, 18011.0, 12079.0, 8249.0, 5593.0, 3823.0, 2700.0, 1894.0, 1317.0, 867.0, 629.0, 469.0, 338.0, 193.0, 148.0, 102.0, 78.0, 59.0, 23.0, 14.0, 14.0, 10.0, 9.0, 9.0, 1.0, 3.0], "bins": [-0.0268096923828125, -0.025997400283813477, -0.025185108184814453, -0.02437281608581543, -0.023560523986816406, -0.022748231887817383, -0.02193593978881836, -0.021123647689819336, -0.020311355590820312, -0.01949906349182129, -0.018686771392822266, -0.017874479293823242, -0.01706218719482422, -0.016249895095825195, -0.015437602996826172, -0.014625310897827148, -0.013813018798828125, -0.013000726699829102, -0.012188434600830078, -0.011376142501831055, -0.010563850402832031, -0.009751558303833008, -0.008939266204833984, -0.008126974105834961, -0.0073146820068359375, -0.006502389907836914, -0.005690097808837891, -0.004877805709838867, -0.004065513610839844, -0.0032532215118408203, -0.002440929412841797, -0.0016286373138427734, -0.00081634521484375, -4.0531158447265625e-06, 0.0008082389831542969, 0.0016205310821533203, 0.0024328231811523438, 0.003245115280151367, 0.004057407379150391, 0.004869699478149414, 0.0056819915771484375, 0.006494283676147461, 0.007306575775146484, 0.008118867874145508, 0.008931159973144531, 0.009743452072143555, 0.010555744171142578, 0.011368036270141602, 0.012180328369140625, 0.012992620468139648, 0.013804912567138672, 0.014617204666137695, 0.015429496765136719, 0.016241788864135742, 0.017054080963134766, 0.01786637306213379, 0.018678665161132812, 0.019490957260131836, 0.02030324935913086, 0.021115541458129883, 0.021927833557128906, 0.02274012565612793, 0.023552417755126953, 0.024364709854125977, 0.025177001953125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 10.0, 5.0, 3.0, 4.0, 9.0, 7.0, 11.0, 9.0, 11.0, 16.0, 20.0, 20.0, 21.0, 18.0, 29.0, 30.0, 24.0, 32.0, 39.0, 35.0, 38.0, 40.0, 36.0, 29.0, 46.0, 39.0, 37.0, 39.0, 36.0, 30.0, 31.0, 36.0, 27.0, 18.0, 28.0, 16.0, 20.0, 13.0, 16.0, 16.0, 10.0, 14.0, 7.0, 7.0, 4.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.012725830078125, -0.01231241226196289, -0.011898994445800781, -0.011485576629638672, -0.011072158813476562, -0.010658740997314453, -0.010245323181152344, -0.009831905364990234, -0.009418487548828125, -0.009005069732666016, -0.008591651916503906, -0.008178234100341797, -0.0077648162841796875, -0.007351398468017578, -0.006937980651855469, -0.006524562835693359, -0.00611114501953125, -0.005697727203369141, -0.005284309387207031, -0.004870891571044922, -0.0044574737548828125, -0.004044055938720703, -0.0036306381225585938, -0.0032172203063964844, -0.002803802490234375, -0.0023903846740722656, -0.0019769668579101562, -0.0015635490417480469, -0.0011501312255859375, -0.0007367134094238281, -0.00032329559326171875, 9.012222290039062e-05, 0.0005035400390625, 0.0009169578552246094, 0.0013303756713867188, 0.0017437934875488281, 0.0021572113037109375, 0.002570629119873047, 0.0029840469360351562, 0.0033974647521972656, 0.003810882568359375, 0.004224300384521484, 0.004637718200683594, 0.005051136016845703, 0.0054645538330078125, 0.005877971649169922, 0.006291389465332031, 0.006704807281494141, 0.00711822509765625, 0.007531642913818359, 0.007945060729980469, 0.008358478546142578, 0.008771896362304688, 0.009185314178466797, 0.009598731994628906, 0.010012149810791016, 0.010425567626953125, 0.010838985443115234, 0.011252403259277344, 0.011665821075439453, 0.012079238891601562, 0.012492656707763672, 0.012906074523925781, 0.01331949234008789, 0.01373291015625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 11.0, 8.0, 11.0, 8.0, 14.0, 12.0, 34.0, 53.0, 56.0, 88.0, 173.0, 375.0, 1142.0, 4458.0, 23842.0, 154208.0, 577746.0, 240439.0, 36835.0, 6457.0, 1522.0, 471.0, 216.0, 126.0, 63.0, 45.0, 30.0, 28.0, 25.0, 17.0, 10.0, 9.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12420654296875, -0.12061882019042969, -0.11703109741210938, -0.11344337463378906, -0.10985565185546875, -0.10626792907714844, -0.10268020629882812, -0.09909248352050781, -0.0955047607421875, -0.09191703796386719, -0.08832931518554688, -0.08474159240722656, -0.08115386962890625, -0.07756614685058594, -0.07397842407226562, -0.07039070129394531, -0.066802978515625, -0.06321525573730469, -0.059627532958984375, -0.05603981018066406, -0.05245208740234375, -0.04886436462402344, -0.045276641845703125, -0.04168891906738281, -0.0381011962890625, -0.03451347351074219, -0.030925750732421875, -0.027338027954101562, -0.02375030517578125, -0.020162582397460938, -0.016574859619140625, -0.012987136840820312, -0.0093994140625, -0.0058116912841796875, -0.002223968505859375, 0.0013637542724609375, 0.00495147705078125, 0.008539199829101562, 0.012126922607421875, 0.015714645385742188, 0.0193023681640625, 0.022890090942382812, 0.026477813720703125, 0.030065536499023438, 0.03365325927734375, 0.03724098205566406, 0.040828704833984375, 0.04441642761230469, 0.048004150390625, 0.05159187316894531, 0.055179595947265625, 0.05876731872558594, 0.06235504150390625, 0.06594276428222656, 0.06953048706054688, 0.07311820983886719, 0.0767059326171875, 0.08029365539550781, 0.08388137817382812, 0.08746910095214844, 0.09105682373046875, 0.09464454650878906, 0.09823226928710938, 0.10181999206542969, 0.10540771484375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 8.0, 12.0, 11.0, 22.0, 20.0, 21.0, 25.0, 30.0, 44.0, 50.0, 52.0, 63.0, 60.0, 49.0, 47.0, 60.0, 47.0, 28.0, 42.0, 53.0, 43.0, 31.0, 39.0, 25.0, 26.0, 14.0, 13.0, 10.0, 11.0, 11.0, 2.0, 6.0, 7.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01485443115234375, -0.014327406883239746, -0.013800382614135742, -0.013273358345031738, -0.012746334075927734, -0.01221930980682373, -0.011692285537719727, -0.011165261268615723, -0.010638236999511719, -0.010111212730407715, -0.009584188461303711, -0.009057164192199707, -0.008530139923095703, -0.0080031156539917, -0.007476091384887695, -0.006949067115783691, -0.0064220428466796875, -0.005895018577575684, -0.00536799430847168, -0.004840970039367676, -0.004313945770263672, -0.003786921501159668, -0.003259897232055664, -0.00273287296295166, -0.0022058486938476562, -0.0016788244247436523, -0.0011518001556396484, -0.0006247758865356445, -9.775161743164062e-05, 0.0004292726516723633, 0.0009562969207763672, 0.001483321189880371, 0.002010345458984375, 0.002537369728088379, 0.003064393997192383, 0.0035914182662963867, 0.004118442535400391, 0.0046454668045043945, 0.0051724910736083984, 0.005699515342712402, 0.006226539611816406, 0.00675356388092041, 0.007280588150024414, 0.007807612419128418, 0.008334636688232422, 0.008861660957336426, 0.00938868522644043, 0.009915709495544434, 0.010442733764648438, 0.010969758033752441, 0.011496782302856445, 0.01202380657196045, 0.012550830841064453, 0.013077855110168457, 0.013604879379272461, 0.014131903648376465, 0.014658927917480469, 0.015185952186584473, 0.015712976455688477, 0.01624000072479248, 0.016767024993896484, 0.01729404926300049, 0.017821073532104492, 0.018348097801208496, 0.0188751220703125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 3.0, 3.0, 4.0, 8.0, 17.0, 27.0, 26.0, 43.0, 42.0, 64.0, 113.0, 154.0, 235.0, 373.0, 599.0, 967.0, 1763.0, 3060.0, 5822.0, 12079.0, 27186.0, 74906.0, 285250.0, 440565.0, 122439.0, 39299.0, 16374.0, 7730.0, 3970.0, 2136.0, 1186.0, 762.0, 430.0, 288.0, 218.0, 133.0, 79.0, 57.0, 37.0, 26.0, 25.0, 18.0, 13.0, 8.0, 2.0, 4.0, 7.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0008330345153808594, -0.0008079409599304199, -0.0007828474044799805, -0.000757753849029541, -0.0007326602935791016, -0.0007075667381286621, -0.0006824731826782227, -0.0006573796272277832, -0.0006322860717773438, -0.0006071925163269043, -0.0005820989608764648, -0.0005570054054260254, -0.0005319118499755859, -0.0005068182945251465, -0.00048172473907470703, -0.0004566311836242676, -0.0004315376281738281, -0.00040644407272338867, -0.0003813505172729492, -0.00035625696182250977, -0.0003311634063720703, -0.00030606985092163086, -0.0002809762954711914, -0.00025588274002075195, -0.0002307891845703125, -0.00020569562911987305, -0.0001806020736694336, -0.00015550851821899414, -0.0001304149627685547, -0.00010532140731811523, -8.022785186767578e-05, -5.513429641723633e-05, -3.0040740966796875e-05, -4.947185516357422e-06, 2.014636993408203e-05, 4.5239925384521484e-05, 7.033348083496094e-05, 9.542703628540039e-05, 0.00012052059173583984, 0.0001456141471862793, 0.00017070770263671875, 0.0001958012580871582, 0.00022089481353759766, 0.0002459883689880371, 0.00027108192443847656, 0.000296175479888916, 0.00032126903533935547, 0.0003463625907897949, 0.0003714561462402344, 0.00039654970169067383, 0.0004216432571411133, 0.00044673681259155273, 0.0004718303680419922, 0.0004969239234924316, 0.0005220174789428711, 0.0005471110343933105, 0.00057220458984375, 0.0005972981452941895, 0.0006223917007446289, 0.0006474852561950684, 0.0006725788116455078, 0.0006976723670959473, 0.0007227659225463867, 0.0007478594779968262, 0.0007729530334472656]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 4.0, 3.0, 9.0, 5.0, 8.0, 8.0, 9.0, 11.0, 18.0, 29.0, 22.0, 32.0, 46.0, 47.0, 57.0, 68.0, 67.0, 69.0, 106.0, 57.0, 63.0, 46.0, 38.0, 41.0, 21.0, 15.0, 20.0, 18.0, 12.0, 14.0, 8.0, 5.0, 2.0, 8.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.7220458984375e-06, -5.539506673812866e-06, -5.356967449188232e-06, -5.174428224563599e-06, -4.991888999938965e-06, -4.809349775314331e-06, -4.626810550689697e-06, -4.4442713260650635e-06, -4.26173210144043e-06, -4.079192876815796e-06, -3.896653652191162e-06, -3.7141144275665283e-06, -3.5315752029418945e-06, -3.3490359783172607e-06, -3.166496753692627e-06, -2.983957529067993e-06, -2.8014183044433594e-06, -2.6188790798187256e-06, -2.436339855194092e-06, -2.253800630569458e-06, -2.0712614059448242e-06, -1.8887221813201904e-06, -1.7061829566955566e-06, -1.5236437320709229e-06, -1.341104507446289e-06, -1.1585652828216553e-06, -9.760260581970215e-07, -7.934868335723877e-07, -6.109476089477539e-07, -4.284083843231201e-07, -2.4586915969848633e-07, -6.332993507385254e-08, 1.1920928955078125e-07, 3.0174851417541504e-07, 4.842877388000488e-07, 6.668269634246826e-07, 8.493661880493164e-07, 1.0319054126739502e-06, 1.214444637298584e-06, 1.3969838619232178e-06, 1.5795230865478516e-06, 1.7620623111724854e-06, 1.944601535797119e-06, 2.127140760421753e-06, 2.3096799850463867e-06, 2.4922192096710205e-06, 2.6747584342956543e-06, 2.857297658920288e-06, 3.039836883544922e-06, 3.2223761081695557e-06, 3.4049153327941895e-06, 3.5874545574188232e-06, 3.769993782043457e-06, 3.952533006668091e-06, 4.135072231292725e-06, 4.317611455917358e-06, 4.500150680541992e-06, 4.682689905166626e-06, 4.86522912979126e-06, 5.0477683544158936e-06, 5.230307579040527e-06, 5.412846803665161e-06, 5.595386028289795e-06, 5.777925252914429e-06, 5.9604644775390625e-06]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 6.0, 3.0, 8.0, 13.0, 17.0, 39.0, 61.0, 128.0, 238.0, 547.0, 1614.0, 8651.0, 153914.0, 845959.0, 32088.0, 3550.0, 965.0, 365.0, 168.0, 87.0, 37.0, 37.0, 21.0, 10.0, 8.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00254058837890625, -0.002461850643157959, -0.002383112907409668, -0.002304375171661377, -0.002225637435913086, -0.002146899700164795, -0.002068161964416504, -0.001989424228668213, -0.0019106864929199219, -0.0018319487571716309, -0.0017532110214233398, -0.0016744732856750488, -0.0015957355499267578, -0.0015169978141784668, -0.0014382600784301758, -0.0013595223426818848, -0.0012807846069335938, -0.0012020468711853027, -0.0011233091354370117, -0.0010445713996887207, -0.0009658336639404297, -0.0008870959281921387, -0.0008083581924438477, -0.0007296204566955566, -0.0006508827209472656, -0.0005721449851989746, -0.0004934072494506836, -0.0004146695137023926, -0.00033593177795410156, -0.00025719404220581055, -0.00017845630645751953, -9.971857070922852e-05, -2.09808349609375e-05, 5.7756900787353516e-05, 0.00013649463653564453, 0.00021523237228393555, 0.00029397010803222656, 0.0003727078437805176, 0.0004514455795288086, 0.0005301833152770996, 0.0006089210510253906, 0.0006876587867736816, 0.0007663965225219727, 0.0008451342582702637, 0.0009238719940185547, 0.0010026097297668457, 0.0010813474655151367, 0.0011600852012634277, 0.0012388229370117188, 0.0013175606727600098, 0.0013962984085083008, 0.0014750361442565918, 0.0015537738800048828, 0.0016325116157531738, 0.0017112493515014648, 0.0017899870872497559, 0.0018687248229980469, 0.0019474625587463379, 0.002026200294494629, 0.00210493803024292, 0.002183675765991211, 0.002262413501739502, 0.002341151237487793, 0.002419888973236084, 0.002498626708984375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 10.0, 8.0, 15.0, 14.0, 18.0, 31.0, 38.0, 57.0, 83.0, 91.0, 91.0, 101.0, 95.0, 85.0, 57.0, 46.0, 34.0, 36.0, 20.0, 16.0, 15.0, 9.0, 7.0, 2.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003159046173095703, -0.0003065057098865509, -0.0002971068024635315, -0.0002877078950405121, -0.0002783089876174927, -0.00026891008019447327, -0.00025951117277145386, -0.00025011226534843445, -0.00024071335792541504, -0.00023131445050239563, -0.00022191554307937622, -0.0002125166356563568, -0.0002031177282333374, -0.000193718820810318, -0.00018431991338729858, -0.00017492100596427917, -0.00016552209854125977, -0.00015612319111824036, -0.00014672428369522095, -0.00013732537627220154, -0.00012792646884918213, -0.00011852756142616272, -0.00010912865400314331, -9.97297465801239e-05, -9.033083915710449e-05, -8.093193173408508e-05, -7.153302431106567e-05, -6.213411688804626e-05, -5.2735209465026855e-05, -4.3336302042007446e-05, -3.393739461898804e-05, -2.4538487195968628e-05, -1.5139579772949219e-05, -5.7406723499298096e-06, 3.6582350730895996e-06, 1.3057142496109009e-05, 2.2456049919128418e-05, 3.185495734214783e-05, 4.1253864765167236e-05, 5.0652772188186646e-05, 6.0051679611206055e-05, 6.945058703422546e-05, 7.884949445724487e-05, 8.824840188026428e-05, 9.764730930328369e-05, 0.0001070462167263031, 0.00011644512414932251, 0.00012584403157234192, 0.00013524293899536133, 0.00014464184641838074, 0.00015404075384140015, 0.00016343966126441956, 0.00017283856868743896, 0.00018223747611045837, 0.00019163638353347778, 0.0002010352909564972, 0.0002104341983795166, 0.000219833105802536, 0.00022923201322555542, 0.00023863092064857483, 0.00024802982807159424, 0.00025742873549461365, 0.00026682764291763306, 0.00027622655034065247, 0.0002856254577636719]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 14.0, 30.0, 105.0, 220.0, 334.0, 180.0, 90.0, 29.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.147277370095253, -0.14451964199543, -0.1417619287967682, -0.1390042006969452, -0.1362464725971222, -0.1334887444972992, -0.1307310312986374, -0.1279733031988144, -0.1252155750989914, -0.12245785444974899, -0.119700126349926, -0.1169424057006836, -0.1141846776008606, -0.1114269569516182, -0.1086692363023758, -0.1059115082025528, -0.10315379500389099, -0.10039607435464859, -0.09763834625482559, -0.09488062560558319, -0.09212289750576019, -0.08936517685651779, -0.08660745620727539, -0.08384972810745239, -0.0810920000076294, -0.078334279358387, -0.075576551258564, -0.0728188306093216, -0.0700611025094986, -0.0673033818602562, -0.0645456612110138, -0.061787933111190796, -0.059030212461948395, -0.056272488087415695, -0.053514763712882996, -0.050757043063640594, -0.047999318689107895, -0.045241594314575195, -0.042483869940042496, -0.039726145565509796, -0.036968424916267395, -0.034210700541734695, -0.031452976167201996, -0.028695253655314445, -0.025937531143426895, -0.023179806768894196, -0.020422082394361496, -0.017664359882473946, -0.014906635507941246, -0.012148912064731121, -0.009391188621520996, -0.0066334642469882965, -0.0038757408037781715, -0.0011180173605680466, 0.001639707013964653, 0.004397429525852203, 0.007155153900384903, 0.009912877343595028, 0.012670600786805153, 0.015428325161337852, 0.018186047673225403, 0.020943772047758102, 0.023701496422290802, 0.026459218934178352, 0.029216943308711052]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 8.0, 6.0, 13.0, 11.0, 7.0, 17.0, 14.0, 21.0, 26.0, 20.0, 15.0, 26.0, 26.0, 30.0, 42.0, 19.0, 43.0, 40.0, 41.0, 45.0, 47.0, 42.0, 47.0, 35.0, 28.0, 43.0, 38.0, 31.0, 29.0, 30.0, 24.0, 18.0, 20.0, 12.0, 15.0, 13.0, 13.0, 9.0, 7.0, 8.0, 9.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.018080241978168488, -0.017533646896481514, -0.01698705181479454, -0.016440454870462418, -0.015893859788775444, -0.01534726470708847, -0.014800669625401497, -0.014254074543714523, -0.013707478530704975, -0.013160883449018002, -0.012614287436008453, -0.01206769235432148, -0.011521097272634506, -0.010974501259624958, -0.010427906177937984, -0.009881310164928436, -0.009334715083241463, -0.00878812000155449, -0.008241523988544941, -0.007694928906857967, -0.0071483333595097065, -0.006601737812161446, -0.006055142730474472, -0.005508547183126211, -0.00496195163577795, -0.004415356088429689, -0.003868760773912072, -0.003322165459394455, -0.002775569912046194, -0.002228974364697933, -0.001682379050180316, -0.0011357837356626987, -0.0005891900509595871, -4.2594620026648045e-05, 0.000504000810906291, 0.00105059624183923, 0.0015971916727721691, 0.00214378722012043, 0.0026903825346380472, 0.0032369778491556644, 0.0037835733965039253, 0.004330168943852186, 0.004876764491200447, 0.005423359572887421, 0.0059699551202356815, 0.006516550667583942, 0.007063145749270916, 0.007609741296619177, 0.008156336843967438, 0.008702931925654411, 0.00924952793866396, 0.009796123020350933, 0.010342719033360481, 0.010889314115047455, 0.011435909196734428, 0.011982504278421402, 0.01252910029143095, 0.013075695373117924, 0.013622291386127472, 0.014168886467814445, 0.014715481549501419, 0.015262077562510967, 0.015808673575520515, 0.01635526865720749, 0.016901863738894463]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 6.0, 14.0, 12.0, 24.0, 28.0, 43.0, 60.0, 84.0, 106.0, 137.0, 178.0, 200.0, 357.0, 475.0, 768.0, 1292.0, 2535.0, 6292.0, 23866.0, 488660.0, 3489245.0, 156291.0, 13900.0, 4467.0, 2012.0, 1114.0, 634.0, 371.0, 266.0, 203.0, 170.0, 121.0, 87.0, 67.0, 51.0, 36.0, 38.0, 16.0, 16.0, 10.0, 8.0, 7.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031463623046875, -0.030312538146972656, -0.029161453247070312, -0.02801036834716797, -0.026859283447265625, -0.02570819854736328, -0.024557113647460938, -0.023406028747558594, -0.02225494384765625, -0.021103858947753906, -0.019952774047851562, -0.01880168914794922, -0.017650604248046875, -0.01649951934814453, -0.015348434448242188, -0.014197349548339844, -0.0130462646484375, -0.011895179748535156, -0.010744094848632812, -0.009593009948730469, -0.008441925048828125, -0.007290840148925781, -0.0061397552490234375, -0.004988670349121094, -0.00383758544921875, -0.0026865005493164062, -0.0015354156494140625, -0.00038433074951171875, 0.000766754150390625, 0.0019178390502929688, 0.0030689239501953125, 0.004220008850097656, 0.00537109375, 0.006522178649902344, 0.0076732635498046875, 0.008824348449707031, 0.009975433349609375, 0.011126518249511719, 0.012277603149414062, 0.013428688049316406, 0.01457977294921875, 0.015730857849121094, 0.016881942749023438, 0.01803302764892578, 0.019184112548828125, 0.02033519744873047, 0.021486282348632812, 0.022637367248535156, 0.0237884521484375, 0.024939537048339844, 0.026090621948242188, 0.02724170684814453, 0.028392791748046875, 0.02954387664794922, 0.030694961547851562, 0.031846046447753906, 0.03299713134765625, 0.034148216247558594, 0.03529930114746094, 0.03645038604736328, 0.037601470947265625, 0.03875255584716797, 0.03990364074707031, 0.041054725646972656, 0.042205810546875]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 5.0, 11.0, 15.0, 8.0, 12.0, 17.0, 20.0, 25.0, 16.0, 16.0, 33.0, 14.0, 27.0, 38.0, 44.0, 43.0, 30.0, 56.0, 43.0, 36.0, 41.0, 42.0, 37.0, 45.0, 42.0, 27.0, 30.0, 26.0, 22.0, 19.0, 23.0, 15.0, 12.0, 17.0, 9.0, 14.0, 16.0, 6.0, 5.0, 6.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.01409149169921875, -0.013666152954101562, -0.013240814208984375, -0.012815475463867188, -0.01239013671875, -0.011964797973632812, -0.011539459228515625, -0.011114120483398438, -0.01068878173828125, -0.010263442993164062, -0.009838104248046875, -0.009412765502929688, -0.0089874267578125, -0.008562088012695312, -0.008136749267578125, -0.0077114105224609375, -0.00728607177734375, -0.0068607330322265625, -0.006435394287109375, -0.0060100555419921875, -0.005584716796875, -0.0051593780517578125, -0.004734039306640625, -0.0043087005615234375, -0.00388336181640625, -0.0034580230712890625, -0.003032684326171875, -0.0026073455810546875, -0.0021820068359375, -0.0017566680908203125, -0.001331329345703125, -0.0009059906005859375, -0.00048065185546875, -5.53131103515625e-05, 0.000370025634765625, 0.0007953643798828125, 0.001220703125, 0.0016460418701171875, 0.002071380615234375, 0.0024967193603515625, 0.00292205810546875, 0.0033473968505859375, 0.003772735595703125, 0.0041980743408203125, 0.0046234130859375, 0.0050487518310546875, 0.005474090576171875, 0.0058994293212890625, 0.00632476806640625, 0.0067501068115234375, 0.007175445556640625, 0.0076007843017578125, 0.008026123046875, 0.008451461791992188, 0.008876800537109375, 0.009302139282226562, 0.00972747802734375, 0.010152816772460938, 0.010578155517578125, 0.011003494262695312, 0.0114288330078125, 0.011854171752929688, 0.012279510498046875, 0.012704849243164062, 0.01313018798828125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 7.0, 3.0, 10.0, 15.0, 38.0, 69.0, 120.0, 275.0, 858.0, 5282.0, 211319.0, 3961435.0, 12641.0, 1469.0, 416.0, 144.0, 74.0, 26.0, 23.0, 17.0, 14.0, 8.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13818359375, -0.132904052734375, -0.12762451171875, -0.122344970703125, -0.1170654296875, -0.111785888671875, -0.10650634765625, -0.101226806640625, -0.095947265625, -0.090667724609375, -0.08538818359375, -0.080108642578125, -0.0748291015625, -0.069549560546875, -0.06427001953125, -0.058990478515625, -0.0537109375, -0.048431396484375, -0.04315185546875, -0.037872314453125, -0.0325927734375, -0.027313232421875, -0.02203369140625, -0.016754150390625, -0.011474609375, -0.006195068359375, -0.00091552734375, 0.004364013671875, 0.0096435546875, 0.014923095703125, 0.02020263671875, 0.025482177734375, 0.03076171875, 0.036041259765625, 0.04132080078125, 0.046600341796875, 0.0518798828125, 0.057159423828125, 0.06243896484375, 0.067718505859375, 0.072998046875, 0.078277587890625, 0.08355712890625, 0.088836669921875, 0.0941162109375, 0.099395751953125, 0.10467529296875, 0.109954833984375, 0.115234375, 0.120513916015625, 0.12579345703125, 0.131072998046875, 0.1363525390625, 0.141632080078125, 0.14691162109375, 0.152191162109375, 0.157470703125, 0.162750244140625, 0.16802978515625, 0.173309326171875, 0.1785888671875, 0.183868408203125, 0.18914794921875, 0.194427490234375, 0.19970703125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 11.0, 11.0, 22.0, 27.0, 25.0, 45.0, 104.0, 229.0, 677.0, 1725.0, 780.0, 221.0, 97.0, 34.0, 24.0, 13.0, 8.0, 10.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01654052734375, -0.01608717441558838, -0.015633821487426758, -0.015180468559265137, -0.014727115631103516, -0.014273762702941895, -0.013820409774780273, -0.013367056846618652, -0.012913703918457031, -0.01246035099029541, -0.012006998062133789, -0.011553645133972168, -0.011100292205810547, -0.010646939277648926, -0.010193586349487305, -0.009740233421325684, -0.009286880493164062, -0.008833527565002441, -0.00838017463684082, -0.0079268217086792, -0.007473468780517578, -0.007020115852355957, -0.006566762924194336, -0.006113409996032715, -0.005660057067871094, -0.005206704139709473, -0.0047533512115478516, -0.0042999982833862305, -0.0038466453552246094, -0.0033932924270629883, -0.002939939498901367, -0.002486586570739746, -0.002033233642578125, -0.001579880714416504, -0.0011265277862548828, -0.0006731748580932617, -0.00021982192993164062, 0.00023353099822998047, 0.0006868839263916016, 0.0011402368545532227, 0.0015935897827148438, 0.002046942710876465, 0.002500295639038086, 0.002953648567199707, 0.003407001495361328, 0.0038603544235229492, 0.00431370735168457, 0.004767060279846191, 0.0052204132080078125, 0.005673766136169434, 0.006127119064331055, 0.006580471992492676, 0.007033824920654297, 0.007487177848815918, 0.007940530776977539, 0.00839388370513916, 0.008847236633300781, 0.009300589561462402, 0.009753942489624023, 0.010207295417785645, 0.010660648345947266, 0.011114001274108887, 0.011567354202270508, 0.012020707130432129, 0.01247406005859375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 6.0, 6.0, 13.0, 15.0, 25.0, 32.0, 48.0, 79.0, 93.0, 102.0, 114.0, 124.0, 109.0, 93.0, 37.0, 34.0, 34.0, 18.0, 12.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0373913012444973, -0.036518990993499756, -0.03564668074250221, -0.03477436676621437, -0.03390205651521683, -0.033029746264219284, -0.03215743601322174, -0.0312851257622242, -0.030412813648581505, -0.02954050339758396, -0.02866819128394127, -0.027795881032943726, -0.026923568919301033, -0.02605125866830349, -0.025178946554660797, -0.024306636303663254, -0.02343432605266571, -0.022562015801668167, -0.021689703688025475, -0.02081739343702793, -0.01994508132338524, -0.019072771072387695, -0.018200460821390152, -0.01732814870774746, -0.016455836594104767, -0.015583525411784649, -0.014711214229464531, -0.013838903978466988, -0.01296659279614687, -0.012094281613826752, -0.011221970431506634, -0.010349659249186516, -0.009477348998188972, -0.008605037815868855, -0.007732727099210024, -0.006860415916889906, -0.005988105200231075, -0.005115794017910957, -0.004243482835590839, -0.0033711721189320087, -0.002498860936611891, -0.0016265499871224165, -0.0007542389212176204, 0.00011807214468717575, 0.00099038309417665, 0.0018626940436661243, 0.0027350052259862423, 0.003607315942645073, 0.004479627124965191, 0.005351938307285309, 0.0062242490239441395, 0.007096560206264257, 0.007968870922923088, 0.008841182105243206, 0.009713493287563324, 0.010585803538560867, 0.01145811565220356, 0.012330426834523678, 0.013202738016843796, 0.014075048267841339, 0.014947359450161457, 0.015819670632481575, 0.016691982746124268, 0.01756429299712181, 0.018436603248119354]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 7.0, 2.0, 1.0, 3.0, 9.0, 7.0, 8.0, 9.0, 6.0, 10.0, 4.0, 17.0, 8.0, 11.0, 14.0, 26.0, 24.0, 17.0, 20.0, 40.0, 29.0, 26.0, 32.0, 30.0, 41.0, 48.0, 39.0, 41.0, 38.0, 31.0, 26.0, 28.0, 36.0, 35.0, 26.0, 36.0, 29.0, 25.0, 28.0, 21.0, 20.0, 16.0, 16.0, 10.0, 11.0, 13.0, 7.0, 5.0, 6.0, 6.0, 2.0, 2.0, 6.0, 0.0, 3.0, 3.0], "bins": [-0.014495215378701687, -0.01408306136727333, -0.0136709064245224, -0.013258752413094044, -0.012846598401665688, -0.012434444390237331, -0.012022290378808975, -0.011610135436058044, -0.011197981424629688, -0.010785827413201332, -0.010373672470450401, -0.009961518459022045, -0.009549364447593689, -0.009137210436165333, -0.008725056424736977, -0.008312901481986046, -0.00790074747055769, -0.0074885934591293335, -0.00707643898203969, -0.0066642845049500465, -0.00625213049352169, -0.005839976482093334, -0.005427822005003691, -0.005015667527914047, -0.004603513516485691, -0.004191359505057335, -0.0037792050279676914, -0.0033670507837086916, -0.0029548965394496918, -0.002542742295190692, -0.002130588050931692, -0.0017184338066726923, -0.001306280493736267, -0.0008941262494772673, -0.00048197200521826744, -6.981776095926762e-05, 0.0003423364832997322, 0.000754490727558732, 0.0011666449718177319, 0.0015787992160767317, 0.0019909534603357315, 0.0024031077045947313, 0.002815261948853731, 0.003227416193112731, 0.003639570437371731, 0.004051724448800087, 0.0044638789258897305, 0.004876033402979374, 0.00528818741440773, 0.005700341425836086, 0.00611249590292573, 0.006524650380015373, 0.006936804391443729, 0.007348958402872086, 0.007761112879961729, 0.008173267357051373, 0.008585421368479729, 0.008997575379908085, 0.009409729391336441, 0.009821884334087372, 0.010234038345515728, 0.010646192356944084, 0.011058347299695015, 0.011470501311123371, 0.011882655322551727]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 7.0, 10.0, 14.0, 32.0, 22.0, 44.0, 86.0, 115.0, 158.0, 234.0, 385.0, 572.0, 841.0, 1251.0, 1754.0, 2789.0, 4153.0, 6303.0, 9834.0, 15771.0, 25845.0, 43724.0, 79201.0, 157910.0, 292373.0, 186730.0, 91426.0, 49187.0, 28724.0, 17345.0, 10907.0, 6926.0, 4706.0, 3062.0, 2045.0, 1357.0, 883.0, 619.0, 390.0, 267.0, 185.0, 112.0, 90.0, 64.0, 35.0, 21.0, 19.0, 6.0, 9.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007564544677734375, -0.007325232028961182, -0.007085919380187988, -0.006846606731414795, -0.0066072940826416016, -0.006367981433868408, -0.006128668785095215, -0.0058893561363220215, -0.005650043487548828, -0.005410730838775635, -0.005171418190002441, -0.004932105541229248, -0.004692792892456055, -0.004453480243682861, -0.004214167594909668, -0.003974854946136475, -0.0037355422973632812, -0.003496229648590088, -0.0032569169998168945, -0.003017604351043701, -0.002778291702270508, -0.0025389790534973145, -0.002299666404724121, -0.0020603537559509277, -0.0018210411071777344, -0.001581728458404541, -0.0013424158096313477, -0.0011031031608581543, -0.0008637905120849609, -0.0006244778633117676, -0.0003851652145385742, -0.00014585256576538086, 9.34600830078125e-05, 0.00033277273178100586, 0.0005720853805541992, 0.0008113980293273926, 0.001050710678100586, 0.0012900233268737793, 0.0015293359756469727, 0.001768648624420166, 0.0020079612731933594, 0.0022472739219665527, 0.002486586570739746, 0.0027258992195129395, 0.002965211868286133, 0.003204524517059326, 0.0034438371658325195, 0.003683149814605713, 0.003922462463378906, 0.0041617751121521, 0.004401087760925293, 0.004640400409698486, 0.00487971305847168, 0.005119025707244873, 0.005358338356018066, 0.00559765100479126, 0.005836963653564453, 0.0060762763023376465, 0.00631558895111084, 0.006554901599884033, 0.0067942142486572266, 0.00703352689743042, 0.007272839546203613, 0.007512152194976807, 0.00775146484375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 1.0, 13.0, 10.0, 6.0, 9.0, 15.0, 6.0, 8.0, 8.0, 13.0, 20.0, 16.0, 21.0, 17.0, 25.0, 31.0, 31.0, 33.0, 32.0, 37.0, 44.0, 35.0, 47.0, 41.0, 37.0, 41.0, 42.0, 33.0, 32.0, 29.0, 29.0, 20.0, 28.0, 23.0, 23.0, 21.0, 22.0, 11.0, 10.0, 13.0, 11.0, 15.0, 12.0, 8.0, 5.0, 2.0, 3.0, 1.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.01444244384765625, -0.01400601863861084, -0.01356959342956543, -0.01313316822052002, -0.01269674301147461, -0.0122603178024292, -0.011823892593383789, -0.011387467384338379, -0.010951042175292969, -0.010514616966247559, -0.010078191757202148, -0.009641766548156738, -0.009205341339111328, -0.008768916130065918, -0.008332490921020508, -0.007896065711975098, -0.0074596405029296875, -0.007023215293884277, -0.006586790084838867, -0.006150364875793457, -0.005713939666748047, -0.005277514457702637, -0.0048410892486572266, -0.004404664039611816, -0.003968238830566406, -0.003531813621520996, -0.003095388412475586, -0.0026589632034301758, -0.0022225379943847656, -0.0017861127853393555, -0.0013496875762939453, -0.0009132623672485352, -0.000476837158203125, -4.0411949157714844e-05, 0.0003960132598876953, 0.0008324384689331055, 0.0012688636779785156, 0.0017052888870239258, 0.002141714096069336, 0.002578139305114746, 0.0030145645141601562, 0.0034509897232055664, 0.0038874149322509766, 0.004323840141296387, 0.004760265350341797, 0.005196690559387207, 0.005633115768432617, 0.006069540977478027, 0.0065059661865234375, 0.006942391395568848, 0.007378816604614258, 0.007815241813659668, 0.008251667022705078, 0.008688092231750488, 0.009124517440795898, 0.009560942649841309, 0.009997367858886719, 0.010433793067932129, 0.010870218276977539, 0.01130664348602295, 0.01174306869506836, 0.01217949390411377, 0.01261591911315918, 0.01305234432220459, 0.01348876953125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 12.0, 14.0, 13.0, 29.0, 33.0, 65.0, 72.0, 100.0, 155.0, 233.0, 305.0, 486.0, 722.0, 1007.0, 1570.0, 2373.0, 3537.0, 5533.0, 8402.0, 13354.0, 21086.0, 35992.0, 65126.0, 134406.0, 329312.0, 210929.0, 91583.0, 47335.0, 27565.0, 16695.0, 10622.0, 6707.0, 4384.0, 2885.0, 1904.0, 1258.0, 837.0, 577.0, 397.0, 269.0, 203.0, 127.0, 105.0, 59.0, 56.0, 40.0, 19.0, 27.0, 5.0, 6.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.00740814208984375, -0.007181942462921143, -0.006955742835998535, -0.006729543209075928, -0.00650334358215332, -0.006277143955230713, -0.0060509443283081055, -0.005824744701385498, -0.005598545074462891, -0.005372345447540283, -0.005146145820617676, -0.004919946193695068, -0.004693746566772461, -0.0044675469398498535, -0.004241347312927246, -0.004015147686004639, -0.0037889480590820312, -0.003562748432159424, -0.0033365488052368164, -0.003110349178314209, -0.0028841495513916016, -0.002657949924468994, -0.0024317502975463867, -0.0022055506706237793, -0.001979351043701172, -0.0017531514167785645, -0.001526951789855957, -0.0013007521629333496, -0.0010745525360107422, -0.0008483529090881348, -0.0006221532821655273, -0.0003959536552429199, -0.0001697540283203125, 5.644559860229492e-05, 0.00028264522552490234, 0.0005088448524475098, 0.0007350444793701172, 0.0009612441062927246, 0.001187443733215332, 0.0014136433601379395, 0.0016398429870605469, 0.0018660426139831543, 0.0020922422409057617, 0.002318441867828369, 0.0025446414947509766, 0.002770841121673584, 0.0029970407485961914, 0.003223240375518799, 0.0034494400024414062, 0.0036756396293640137, 0.003901839256286621, 0.0041280388832092285, 0.004354238510131836, 0.004580438137054443, 0.004806637763977051, 0.005032837390899658, 0.005259037017822266, 0.005485236644744873, 0.0057114362716674805, 0.005937635898590088, 0.006163835525512695, 0.006390035152435303, 0.00661623477935791, 0.006842434406280518, 0.007068634033203125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 9.0, 9.0, 4.0, 12.0, 15.0, 23.0, 18.0, 16.0, 23.0, 24.0, 21.0, 42.0, 28.0, 32.0, 37.0, 39.0, 41.0, 42.0, 48.0, 57.0, 51.0, 42.0, 44.0, 46.0, 53.0, 25.0, 35.0, 17.0, 31.0, 20.0, 16.0, 14.0, 16.0, 10.0, 9.0, 3.0, 5.0, 3.0, 3.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0098419189453125, -0.009508013725280762, -0.009174108505249023, -0.008840203285217285, -0.008506298065185547, -0.008172392845153809, -0.00783848762512207, -0.007504582405090332, -0.007170677185058594, -0.0068367719650268555, -0.006502866744995117, -0.006168961524963379, -0.005835056304931641, -0.005501151084899902, -0.005167245864868164, -0.004833340644836426, -0.0044994354248046875, -0.004165530204772949, -0.003831624984741211, -0.0034977197647094727, -0.0031638145446777344, -0.002829909324645996, -0.002496004104614258, -0.0021620988845825195, -0.0018281936645507812, -0.001494288444519043, -0.0011603832244873047, -0.0008264780044555664, -0.0004925727844238281, -0.00015866756439208984, 0.00017523765563964844, 0.0005091428756713867, 0.000843048095703125, 0.0011769533157348633, 0.0015108585357666016, 0.0018447637557983398, 0.002178668975830078, 0.0025125741958618164, 0.0028464794158935547, 0.003180384635925293, 0.0035142898559570312, 0.0038481950759887695, 0.004182100296020508, 0.004516005516052246, 0.004849910736083984, 0.005183815956115723, 0.005517721176147461, 0.005851626396179199, 0.0061855316162109375, 0.006519436836242676, 0.006853342056274414, 0.007187247276306152, 0.007521152496337891, 0.007855057716369629, 0.008188962936401367, 0.008522868156433105, 0.008856773376464844, 0.009190678596496582, 0.00952458381652832, 0.009858489036560059, 0.010192394256591797, 0.010526299476623535, 0.010860204696655273, 0.011194109916687012, 0.01152801513671875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 3.0, 6.0, 13.0, 14.0, 20.0, 41.0, 44.0, 57.0, 84.0, 140.0, 188.0, 291.0, 446.0, 616.0, 1078.0, 1820.0, 3001.0, 5749.0, 11012.0, 24337.0, 63852.0, 298065.0, 501433.0, 79701.0, 28754.0, 12687.0, 6304.0, 3460.0, 1925.0, 1204.0, 768.0, 461.0, 292.0, 211.0, 148.0, 105.0, 61.0, 41.0, 38.0, 23.0, 21.0, 10.0, 9.0, 6.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007190704345703125, -0.0006959438323974609, -0.0006728172302246094, -0.0006496906280517578, -0.0006265640258789062, -0.0006034374237060547, -0.0005803108215332031, -0.0005571842193603516, -0.0005340576171875, -0.0005109310150146484, -0.0004878044128417969, -0.0004646778106689453, -0.00044155120849609375, -0.0004184246063232422, -0.0003952980041503906, -0.00037217140197753906, -0.0003490447998046875, -0.00032591819763183594, -0.0003027915954589844, -0.0002796649932861328, -0.00025653839111328125, -0.0002334117889404297, -0.00021028518676757812, -0.00018715858459472656, -0.000164031982421875, -0.00014090538024902344, -0.00011777877807617188, -9.465217590332031e-05, -7.152557373046875e-05, -4.839897155761719e-05, -2.5272369384765625e-05, -2.1457672119140625e-06, 2.09808349609375e-05, 4.410743713378906e-05, 6.723403930664062e-05, 9.036064147949219e-05, 0.00011348724365234375, 0.0001366138458251953, 0.00015974044799804688, 0.00018286705017089844, 0.00020599365234375, 0.00022912025451660156, 0.0002522468566894531, 0.0002753734588623047, 0.00029850006103515625, 0.0003216266632080078, 0.0003447532653808594, 0.00036787986755371094, 0.0003910064697265625, 0.00041413307189941406, 0.0004372596740722656, 0.0004603862762451172, 0.00048351287841796875, 0.0005066394805908203, 0.0005297660827636719, 0.0005528926849365234, 0.000576019287109375, 0.0005991458892822266, 0.0006222724914550781, 0.0006453990936279297, 0.0006685256958007812, 0.0006916522979736328, 0.0007147789001464844, 0.0007379055023193359, 0.0007610321044921875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 3.0, 8.0, 9.0, 16.0, 18.0, 23.0, 29.0, 34.0, 38.0, 57.0, 76.0, 85.0, 117.0, 99.0, 78.0, 77.0, 57.0, 46.0, 31.0, 20.0, 9.0, 10.0, 9.0, 8.0, 5.0, 5.0, 11.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1755695343017578e-05, -2.109445631504059e-05, -2.04332172870636e-05, -1.977197825908661e-05, -1.911073923110962e-05, -1.844950020313263e-05, -1.778826117515564e-05, -1.712702214717865e-05, -1.646578311920166e-05, -1.580454409122467e-05, -1.514330506324768e-05, -1.4482066035270691e-05, -1.3820827007293701e-05, -1.3159587979316711e-05, -1.2498348951339722e-05, -1.1837109923362732e-05, -1.1175870895385742e-05, -1.0514631867408752e-05, -9.853392839431763e-06, -9.192153811454773e-06, -8.530914783477783e-06, -7.869675755500793e-06, -7.208436727523804e-06, -6.547197699546814e-06, -5.885958671569824e-06, -5.2247196435928345e-06, -4.563480615615845e-06, -3.902241587638855e-06, -3.2410025596618652e-06, -2.5797635316848755e-06, -1.9185245037078857e-06, -1.257285475730896e-06, -5.960464477539062e-07, 6.51925802230835e-08, 7.264316082000732e-07, 1.387670636177063e-06, 2.0489096641540527e-06, 2.7101486921310425e-06, 3.3713877201080322e-06, 4.032626748085022e-06, 4.693865776062012e-06, 5.3551048040390015e-06, 6.016343832015991e-06, 6.677582859992981e-06, 7.338821887969971e-06, 8.00006091594696e-06, 8.66129994392395e-06, 9.32253897190094e-06, 9.98377799987793e-06, 1.064501702785492e-05, 1.130625605583191e-05, 1.1967495083808899e-05, 1.2628734111785889e-05, 1.3289973139762878e-05, 1.3951212167739868e-05, 1.4612451195716858e-05, 1.5273690223693848e-05, 1.5934929251670837e-05, 1.6596168279647827e-05, 1.7257407307624817e-05, 1.7918646335601807e-05, 1.8579885363578796e-05, 1.9241124391555786e-05, 1.9902363419532776e-05, 2.0563602447509766e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 6.0, 9.0, 6.0, 12.0, 15.0, 22.0, 19.0, 40.0, 55.0, 178.0, 630.0, 2433.0, 16437.0, 647944.0, 364843.0, 12853.0, 2198.0, 508.0, 149.0, 58.0, 35.0, 30.0, 17.0, 13.0, 9.0, 4.0, 5.0, 6.0, 3.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0025177001953125, -0.0024412870407104492, -0.0023648738861083984, -0.0022884607315063477, -0.002212047576904297, -0.002135634422302246, -0.0020592212677001953, -0.0019828081130981445, -0.0019063949584960938, -0.001829981803894043, -0.0017535686492919922, -0.0016771554946899414, -0.0016007423400878906, -0.0015243291854858398, -0.001447916030883789, -0.0013715028762817383, -0.0012950897216796875, -0.0012186765670776367, -0.001142263412475586, -0.0010658502578735352, -0.0009894371032714844, -0.0009130239486694336, -0.0008366107940673828, -0.000760197639465332, -0.0006837844848632812, -0.0006073713302612305, -0.0005309581756591797, -0.0004545450210571289, -0.0003781318664550781, -0.00030171871185302734, -0.00022530555725097656, -0.00014889240264892578, -7.2479248046875e-05, 3.933906555175781e-06, 8.034706115722656e-05, 0.00015676021575927734, 0.00023317337036132812, 0.0003095865249633789, 0.0003859996795654297, 0.00046241283416748047, 0.0005388259887695312, 0.000615239143371582, 0.0006916522979736328, 0.0007680654525756836, 0.0008444786071777344, 0.0009208917617797852, 0.000997304916381836, 0.0010737180709838867, 0.0011501312255859375, 0.0012265443801879883, 0.001302957534790039, 0.0013793706893920898, 0.0014557838439941406, 0.0015321969985961914, 0.0016086101531982422, 0.001685023307800293, 0.0017614364624023438, 0.0018378496170043945, 0.0019142627716064453, 0.001990675926208496, 0.002067089080810547, 0.0021435022354125977, 0.0022199153900146484, 0.0022963285446166992, 0.00237274169921875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 5.0, 7.0, 2.0, 12.0, 10.0, 16.0, 17.0, 24.0, 29.0, 43.0, 35.0, 70.0, 88.0, 172.0, 142.0, 63.0, 64.0, 47.0, 34.0, 20.0, 23.0, 16.0, 7.0, 9.0, 7.0, 8.0, 3.0, 7.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00017118453979492188, -0.00016560964286327362, -0.00016003474593162537, -0.0001544598489999771, -0.00014888495206832886, -0.0001433100551366806, -0.00013773515820503235, -0.0001321602612733841, -0.00012658536434173584, -0.00012101046741008759, -0.00011543557047843933, -0.00010986067354679108, -0.00010428577661514282, -9.871087968349457e-05, -9.313598275184631e-05, -8.756108582019806e-05, -8.19861888885498e-05, -7.641129195690155e-05, -7.08363950252533e-05, -6.526149809360504e-05, -5.968660116195679e-05, -5.411170423030853e-05, -4.853680729866028e-05, -4.2961910367012024e-05, -3.738701343536377e-05, -3.1812116503715515e-05, -2.623721957206726e-05, -2.0662322640419006e-05, -1.5087425708770752e-05, -9.512528777122498e-06, -3.937631845474243e-06, 1.6372650861740112e-06, 7.212162017822266e-06, 1.278705894947052e-05, 1.8361955881118774e-05, 2.393685281276703e-05, 2.9511749744415283e-05, 3.508664667606354e-05, 4.066154360771179e-05, 4.6236440539360046e-05, 5.18113374710083e-05, 5.7386234402656555e-05, 6.296113133430481e-05, 6.853602826595306e-05, 7.411092519760132e-05, 7.968582212924957e-05, 8.526071906089783e-05, 9.083561599254608e-05, 9.641051292419434e-05, 0.00010198540985584259, 0.00010756030678749084, 0.0001131352037191391, 0.00011871010065078735, 0.0001242849975824356, 0.00012985989451408386, 0.00013543479144573212, 0.00014100968837738037, 0.00014658458530902863, 0.00015215948224067688, 0.00015773437917232513, 0.0001633092761039734, 0.00016888417303562164, 0.0001744590699672699, 0.00018003396689891815, 0.0001856088638305664]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 9.0, 9.0, 9.0, 6.0, 10.0, 14.0, 26.0, 24.0, 24.0, 48.0, 41.0, 59.0, 53.0, 62.0, 78.0, 63.0, 72.0, 70.0, 60.0, 55.0, 42.0, 30.0, 27.0, 17.0, 21.0, 17.0, 15.0, 10.0, 5.0, 6.0, 4.0, 5.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01665581949055195, -0.01610550656914711, -0.015555194579064846, -0.015004882588982582, -0.014454569667577744, -0.01390425767749548, -0.013353945687413216, -0.012803632766008377, -0.012253320775926113, -0.01170300878584385, -0.01115269586443901, -0.010602383874356747, -0.010052071884274483, -0.009501758962869644, -0.00895144697278738, -0.008401134982705116, -0.007850822061300278, -0.0073005096055567265, -0.006750197149813175, -0.006199885159730911, -0.00564957270398736, -0.005099260248243809, -0.004548948258161545, -0.0039986358024179935, -0.0034483233466744423, -0.002898010890930891, -0.0023476986680179834, -0.001797386328689754, -0.0012470739893615246, -0.0006967615336179733, -0.00014644931070506573, 0.0004038629122078419, 0.0009541753679513931, 0.0015044877072796226, 0.002054800046607852, 0.0026051122695207596, 0.003155424725264311, 0.003705737181007862, 0.004256049171090126, 0.004806361626833677, 0.0053566740825772285, 0.00590698653832078, 0.006457298994064331, 0.007007610984146595, 0.007557923439890146, 0.008108235895633698, 0.008658547885715961, 0.009208859875798225, 0.009759172797203064, 0.010309484787285328, 0.010859797708690166, 0.01141010969877243, 0.011960422620177269, 0.012510734610259533, 0.013061046600341797, 0.013611359521746635, 0.0141616715118289, 0.014711983501911163, 0.015262296423316002, 0.01581260934472084, 0.01636292040348053, 0.01691323332488537, 0.017463546246290207, 0.018013857305049896, 0.018564170226454735]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 3.0, 6.0, 8.0, 4.0, 10.0, 10.0, 10.0, 5.0, 13.0, 9.0, 10.0, 16.0, 19.0, 18.0, 19.0, 26.0, 37.0, 28.0, 30.0, 30.0, 33.0, 37.0, 37.0, 59.0, 40.0, 29.0, 39.0, 22.0, 29.0, 33.0, 38.0, 29.0, 36.0, 34.0, 18.0, 37.0, 17.0, 20.0, 18.0, 17.0, 9.0, 19.0, 7.0, 7.0, 6.0, 2.0, 6.0, 2.0, 6.0, 2.0, 1.0, 3.0, 3.0], "bins": [-0.014845266938209534, -0.014428218826651573, -0.014011169783771038, -0.013594121672213078, -0.013177073560655117, -0.012760024517774582, -0.012342976406216621, -0.011925928294658661, -0.0115088801831007, -0.01109183207154274, -0.010674783028662205, -0.010257734917104244, -0.009840686805546284, -0.009423637762665749, -0.009006589651107788, -0.008589541539549828, -0.008172493427991867, -0.007755444850772619, -0.007338396739214659, -0.006921348161995411, -0.00650430005043745, -0.006087251473218203, -0.005670202895998955, -0.005253154784440994, -0.004836105741560459, -0.004419057164341211, -0.004002009052783251, -0.003584960475564003, -0.0031679123640060425, -0.0027508637867867947, -0.0023338154423981905, -0.0019167670980095863, -0.0014997189864516258, -0.0010826706420630217, -0.0006656222394667566, -0.0002485738368704915, 0.00016847450751811266, 0.0005855229683220387, 0.0010025713127106428, 0.001419619657099247, 0.0018366680014878511, 0.0022537163458764553, 0.0026707646902650595, 0.0030878130346536636, 0.0035048616118729115, 0.003921910189092159, 0.00433895830065012, 0.00475600641220808, 0.005173054989427328, 0.005590103566646576, 0.0060071516782045364, 0.006424200255423784, 0.006841248366981745, 0.007258296944200993, 0.007675345055758953, 0.008092394098639488, 0.008509442210197449, 0.00892649032175541, 0.009343539364635944, 0.009760587476193905, 0.010177635587751865, 0.0105946846306324, 0.011011732742190361, 0.011428780853748322, 0.011845828965306282]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 6.0, 9.0, 15.0, 11.0, 26.0, 38.0, 43.0, 67.0, 80.0, 144.0, 200.0, 299.0, 458.0, 670.0, 967.0, 1375.0, 2119.0, 3285.0, 4968.0, 7695.0, 11915.0, 18535.0, 29052.0, 46240.0, 74160.0, 114429.0, 159890.0, 174159.0, 140564.0, 93975.0, 59466.0, 37211.0, 23347.0, 14993.0, 9561.0, 6266.0, 4113.0, 2647.0, 1804.0, 1197.0, 808.0, 582.0, 374.0, 247.0, 166.0, 130.0, 76.0, 54.0, 39.0, 31.0, 19.0, 10.0, 12.0, 7.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.0247039794921875, -0.023913860321044922, -0.023123741149902344, -0.022333621978759766, -0.021543502807617188, -0.02075338363647461, -0.01996326446533203, -0.019173145294189453, -0.018383026123046875, -0.017592906951904297, -0.01680278778076172, -0.01601266860961914, -0.015222549438476562, -0.014432430267333984, -0.013642311096191406, -0.012852191925048828, -0.01206207275390625, -0.011271953582763672, -0.010481834411621094, -0.009691715240478516, -0.008901596069335938, -0.00811147689819336, -0.007321357727050781, -0.006531238555908203, -0.005741119384765625, -0.004951000213623047, -0.004160881042480469, -0.0033707618713378906, -0.0025806427001953125, -0.0017905235290527344, -0.0010004043579101562, -0.00021028518676757812, 0.000579833984375, 0.0013699531555175781, 0.0021600723266601562, 0.0029501914978027344, 0.0037403106689453125, 0.004530429840087891, 0.005320549011230469, 0.006110668182373047, 0.006900787353515625, 0.007690906524658203, 0.008481025695800781, 0.00927114486694336, 0.010061264038085938, 0.010851383209228516, 0.011641502380371094, 0.012431621551513672, 0.01322174072265625, 0.014011859893798828, 0.014801979064941406, 0.015592098236083984, 0.016382217407226562, 0.01717233657836914, 0.01796245574951172, 0.018752574920654297, 0.019542694091796875, 0.020332813262939453, 0.02112293243408203, 0.02191305160522461, 0.022703170776367188, 0.023493289947509766, 0.024283409118652344, 0.025073528289794922, 0.0258636474609375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 9.0, 7.0, 8.0, 8.0, 11.0, 5.0, 9.0, 11.0, 18.0, 17.0, 22.0, 17.0, 19.0, 15.0, 41.0, 25.0, 26.0, 37.0, 40.0, 42.0, 39.0, 41.0, 41.0, 42.0, 40.0, 34.0, 34.0, 40.0, 32.0, 27.0, 25.0, 29.0, 29.0, 22.0, 25.0, 15.0, 20.0, 11.0, 10.0, 8.0, 10.0, 9.0, 3.0, 5.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.01152801513671875, -0.011190176010131836, -0.010852336883544922, -0.010514497756958008, -0.010176658630371094, -0.00983881950378418, -0.009500980377197266, -0.009163141250610352, -0.008825302124023438, -0.008487462997436523, -0.00814962387084961, -0.007811784744262695, -0.007473945617675781, -0.007136106491088867, -0.006798267364501953, -0.006460428237915039, -0.006122589111328125, -0.005784749984741211, -0.005446910858154297, -0.005109071731567383, -0.004771232604980469, -0.004433393478393555, -0.004095554351806641, -0.0037577152252197266, -0.0034198760986328125, -0.0030820369720458984, -0.0027441978454589844, -0.0024063587188720703, -0.0020685195922851562, -0.0017306804656982422, -0.0013928413391113281, -0.001055002212524414, -0.0007171630859375, -0.00037932395935058594, -4.1484832763671875e-05, 0.0002963542938232422, 0.0006341934204101562, 0.0009720325469970703, 0.0013098716735839844, 0.0016477108001708984, 0.0019855499267578125, 0.0023233890533447266, 0.0026612281799316406, 0.0029990673065185547, 0.0033369064331054688, 0.003674745559692383, 0.004012584686279297, 0.004350423812866211, 0.004688262939453125, 0.005026102066040039, 0.005363941192626953, 0.005701780319213867, 0.006039619445800781, 0.006377458572387695, 0.006715297698974609, 0.0070531368255615234, 0.0073909759521484375, 0.0077288150787353516, 0.008066654205322266, 0.00840449333190918, 0.008742332458496094, 0.009080171585083008, 0.009418010711669922, 0.009755849838256836, 0.01009368896484375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 8.0, 5.0, 8.0, 14.0, 27.0, 14.0, 26.0, 26.0, 33.0, 46.0, 83.0, 215.0, 900.0, 4373.0, 23254.0, 130725.0, 502694.0, 312929.0, 59481.0, 10684.0, 2101.0, 454.0, 160.0, 68.0, 37.0, 31.0, 23.0, 23.0, 24.0, 11.0, 11.0, 13.0, 10.0, 10.0, 7.0, 4.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06768798828125, -0.06506156921386719, -0.062435150146484375, -0.05980873107910156, -0.05718231201171875, -0.05455589294433594, -0.051929473876953125, -0.04930305480957031, -0.0466766357421875, -0.04405021667480469, -0.041423797607421875, -0.03879737854003906, -0.03617095947265625, -0.03354454040527344, -0.030918121337890625, -0.028291702270507812, -0.025665283203125, -0.023038864135742188, -0.020412445068359375, -0.017786026000976562, -0.01515960693359375, -0.012533187866210938, -0.009906768798828125, -0.0072803497314453125, -0.0046539306640625, -0.0020275115966796875, 0.000598907470703125, 0.0032253265380859375, 0.00585174560546875, 0.008478164672851562, 0.011104583740234375, 0.013731002807617188, 0.016357421875, 0.018983840942382812, 0.021610260009765625, 0.024236679077148438, 0.02686309814453125, 0.029489517211914062, 0.032115936279296875, 0.03474235534667969, 0.0373687744140625, 0.03999519348144531, 0.042621612548828125, 0.04524803161621094, 0.04787445068359375, 0.05050086975097656, 0.053127288818359375, 0.05575370788574219, 0.058380126953125, 0.06100654602050781, 0.06363296508789062, 0.06625938415527344, 0.06888580322265625, 0.07151222229003906, 0.07413864135742188, 0.07676506042480469, 0.0793914794921875, 0.08201789855957031, 0.08464431762695312, 0.08727073669433594, 0.08989715576171875, 0.09252357482910156, 0.09514999389648438, 0.09777641296386719, 0.10040283203125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 1.0, 3.0, 6.0, 9.0, 8.0, 7.0, 14.0, 20.0, 22.0, 20.0, 21.0, 32.0, 38.0, 29.0, 24.0, 40.0, 35.0, 43.0, 53.0, 38.0, 55.0, 47.0, 41.0, 51.0, 48.0, 30.0, 33.0, 26.0, 34.0, 37.0, 24.0, 19.0, 16.0, 17.0, 12.0, 14.0, 12.0, 7.0, 3.0, 3.0, 3.0, 3.0, 4.0, 0.0, 4.0], "bins": [-0.013671875, -0.013327717781066895, -0.012983560562133789, -0.012639403343200684, -0.012295246124267578, -0.011951088905334473, -0.011606931686401367, -0.011262774467468262, -0.010918617248535156, -0.01057446002960205, -0.010230302810668945, -0.00988614559173584, -0.009541988372802734, -0.009197831153869629, -0.008853673934936523, -0.008509516716003418, -0.008165359497070312, -0.007821202278137207, -0.0074770450592041016, -0.007132887840270996, -0.006788730621337891, -0.006444573402404785, -0.00610041618347168, -0.005756258964538574, -0.005412101745605469, -0.005067944526672363, -0.004723787307739258, -0.004379630088806152, -0.004035472869873047, -0.0036913156509399414, -0.003347158432006836, -0.0030030012130737305, -0.002658843994140625, -0.0023146867752075195, -0.001970529556274414, -0.0016263723373413086, -0.0012822151184082031, -0.0009380578994750977, -0.0005939006805419922, -0.0002497434616088867, 9.441375732421875e-05, 0.0004385709762573242, 0.0007827281951904297, 0.0011268854141235352, 0.0014710426330566406, 0.001815199851989746, 0.0021593570709228516, 0.002503514289855957, 0.0028476715087890625, 0.003191828727722168, 0.0035359859466552734, 0.003880143165588379, 0.004224300384521484, 0.00456845760345459, 0.004912614822387695, 0.005256772041320801, 0.005600929260253906, 0.005945086479187012, 0.006289243698120117, 0.006633400917053223, 0.006977558135986328, 0.007321715354919434, 0.007665872573852539, 0.008010029792785645, 0.00835418701171875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 5.0, 14.0, 12.0, 12.0, 31.0, 53.0, 58.0, 94.0, 135.0, 156.0, 274.0, 340.0, 511.0, 785.0, 1239.0, 2046.0, 3324.0, 5959.0, 20552.0, 834708.0, 155821.0, 10376.0, 4562.0, 2652.0, 1640.0, 1052.0, 700.0, 432.0, 295.0, 236.0, 116.0, 108.0, 83.0, 58.0, 34.0, 22.0, 16.0, 19.0, 8.0, 9.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.004558563232421875, -0.004423677921295166, -0.004288792610168457, -0.004153907299041748, -0.004019021987915039, -0.00388413667678833, -0.003749251365661621, -0.003614366054534912, -0.003479480743408203, -0.003344595432281494, -0.003209710121154785, -0.003074824810028076, -0.002939939498901367, -0.002805054187774658, -0.0026701688766479492, -0.0025352835655212402, -0.0024003982543945312, -0.0022655129432678223, -0.0021306276321411133, -0.0019957423210144043, -0.0018608570098876953, -0.0017259716987609863, -0.0015910863876342773, -0.0014562010765075684, -0.0013213157653808594, -0.0011864304542541504, -0.0010515451431274414, -0.0009166598320007324, -0.0007817745208740234, -0.0006468892097473145, -0.0005120038986206055, -0.0003771185874938965, -0.0002422332763671875, -0.00010734796524047852, 2.753734588623047e-05, 0.00016242265701293945, 0.00029730796813964844, 0.0004321932792663574, 0.0005670785903930664, 0.0007019639015197754, 0.0008368492126464844, 0.0009717345237731934, 0.0011066198348999023, 0.0012415051460266113, 0.0013763904571533203, 0.0015112757682800293, 0.0016461610794067383, 0.0017810463905334473, 0.0019159317016601562, 0.0020508170127868652, 0.0021857023239135742, 0.002320587635040283, 0.002455472946166992, 0.002590358257293701, 0.00272524356842041, 0.002860128879547119, 0.002995014190673828, 0.003129899501800537, 0.003264784812927246, 0.003399670124053955, 0.003534555435180664, 0.003669440746307373, 0.003804326057434082, 0.003939211368560791, 0.0040740966796875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 8.0, 2.0, 13.0, 15.0, 14.0, 23.0, 27.0, 46.0, 58.0, 68.0, 82.0, 80.0, 90.0, 105.0, 74.0, 61.0, 47.0, 48.0, 38.0, 23.0, 16.0, 14.0, 6.0, 14.0, 4.0, 4.0, 9.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.233816146850586e-05, -1.2033618986606598e-05, -1.1729076504707336e-05, -1.1424534022808075e-05, -1.1119991540908813e-05, -1.0815449059009552e-05, -1.051090657711029e-05, -1.0206364095211029e-05, -9.901821613311768e-06, -9.597279131412506e-06, -9.292736649513245e-06, -8.988194167613983e-06, -8.683651685714722e-06, -8.37910920381546e-06, -8.074566721916199e-06, -7.770024240016937e-06, -7.465481758117676e-06, -7.160939276218414e-06, -6.856396794319153e-06, -6.551854312419891e-06, -6.24731183052063e-06, -5.942769348621368e-06, -5.638226866722107e-06, -5.3336843848228455e-06, -5.029141902923584e-06, -4.7245994210243225e-06, -4.420056939125061e-06, -4.1155144572257996e-06, -3.810971975326538e-06, -3.5064294934272766e-06, -3.201887011528015e-06, -2.8973445296287537e-06, -2.592802047729492e-06, -2.2882595658302307e-06, -1.9837170839309692e-06, -1.6791746020317078e-06, -1.3746321201324463e-06, -1.0700896382331848e-06, -7.655471563339233e-07, -4.6100467443466187e-07, -1.564621925354004e-07, 1.4808028936386108e-07, 4.5262277126312256e-07, 7.57165253162384e-07, 1.0617077350616455e-06, 1.366250216960907e-06, 1.6707926988601685e-06, 1.97533518075943e-06, 2.2798776626586914e-06, 2.584420144557953e-06, 2.8889626264572144e-06, 3.193505108356476e-06, 3.4980475902557373e-06, 3.8025900721549988e-06, 4.10713255405426e-06, 4.411675035953522e-06, 4.716217517852783e-06, 5.020759999752045e-06, 5.325302481651306e-06, 5.629844963550568e-06, 5.934387445449829e-06, 6.2389299273490906e-06, 6.543472409248352e-06, 6.8480148911476135e-06, 7.152557373046875e-06]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 18.0, 34.0, 101.0, 314.0, 1044.0, 4023.0, 45183.0, 989263.0, 6307.0, 1579.0, 465.0, 129.0, 49.0, 22.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01349639892578125, -0.013048768043518066, -0.012601137161254883, -0.0121535062789917, -0.011705875396728516, -0.011258244514465332, -0.010810613632202148, -0.010362982749938965, -0.009915351867675781, -0.009467720985412598, -0.009020090103149414, -0.00857245922088623, -0.008124828338623047, -0.007677197456359863, -0.00722956657409668, -0.006781935691833496, -0.0063343048095703125, -0.005886673927307129, -0.005439043045043945, -0.004991412162780762, -0.004543781280517578, -0.0040961503982543945, -0.003648519515991211, -0.0032008886337280273, -0.0027532577514648438, -0.00230562686920166, -0.0018579959869384766, -0.001410365104675293, -0.0009627342224121094, -0.0005151033401489258, -6.747245788574219e-05, 0.0003801584243774414, 0.000827789306640625, 0.0012754201889038086, 0.0017230510711669922, 0.0021706819534301758, 0.0026183128356933594, 0.003065943717956543, 0.0035135746002197266, 0.00396120548248291, 0.004408836364746094, 0.004856467247009277, 0.005304098129272461, 0.0057517290115356445, 0.006199359893798828, 0.006646990776062012, 0.007094621658325195, 0.007542252540588379, 0.007989883422851562, 0.008437514305114746, 0.00888514518737793, 0.009332776069641113, 0.009780406951904297, 0.01022803783416748, 0.010675668716430664, 0.011123299598693848, 0.011570930480957031, 0.012018561363220215, 0.012466192245483398, 0.012913823127746582, 0.013361454010009766, 0.01380908489227295, 0.014256715774536133, 0.014704346656799316, 0.0151519775390625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 20.0, 102.0, 394.0, 353.0, 72.0, 23.0, 7.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016489028930664062, -0.0015988051891326904, -0.0015487074851989746, -0.0014986097812652588, -0.001448512077331543, -0.0013984143733978271, -0.0013483166694641113, -0.0012982189655303955, -0.0012481212615966797, -0.0011980235576629639, -0.001147925853729248, -0.0010978281497955322, -0.0010477304458618164, -0.0009976327419281006, -0.0009475350379943848, -0.0008974373340606689, -0.0008473396301269531, -0.0007972419261932373, -0.0007471442222595215, -0.0006970465183258057, -0.0006469488143920898, -0.000596851110458374, -0.0005467534065246582, -0.0004966557025909424, -0.00044655799865722656, -0.00039646029472351074, -0.0003463625907897949, -0.0002962648868560791, -0.0002461671829223633, -0.00019606947898864746, -0.00014597177505493164, -9.587407112121582e-05, -4.57763671875e-05, 4.32133674621582e-06, 5.441904067993164e-05, 0.00010451674461364746, 0.00015461444854736328, 0.0002047121524810791, 0.0002548098564147949, 0.00030490756034851074, 0.00035500526428222656, 0.0004051029682159424, 0.0004552006721496582, 0.000505298376083374, 0.0005553960800170898, 0.0006054937839508057, 0.0006555914878845215, 0.0007056891918182373, 0.0007557868957519531, 0.0008058845996856689, 0.0008559823036193848, 0.0009060800075531006, 0.0009561777114868164, 0.0010062754154205322, 0.001056373119354248, 0.0011064708232879639, 0.0011565685272216797, 0.0012066662311553955, 0.0012567639350891113, 0.0013068616390228271, 0.001356959342956543, 0.0014070570468902588, 0.0014571547508239746, 0.0015072524547576904, 0.0015573501586914062]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 1.0, 4.0, 7.0, 7.0, 10.0, 8.0, 15.0, 18.0, 18.0, 27.0, 27.0, 54.0, 57.0, 70.0, 68.0, 93.0, 81.0, 77.0, 76.0, 60.0, 51.0, 51.0, 34.0, 21.0, 18.0, 6.0, 12.0, 11.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019766420125961304, -0.01911001466214657, -0.018453609198331833, -0.017797203734517097, -0.017140798270702362, -0.016484392806887627, -0.01582798734307289, -0.01517158281058073, -0.014515177346765995, -0.01385877188295126, -0.013202366419136524, -0.012545961886644363, -0.011889556422829628, -0.011233150959014893, -0.010576745495200157, -0.009920340031385422, -0.009263934567570686, -0.008607529103755951, -0.007951123639941216, -0.007294718641787767, -0.006638313177973032, -0.005981907714158297, -0.0053255027160048485, -0.004669097252190113, -0.004012691788375378, -0.0033562863245606422, -0.0026998810935765505, -0.0020434758625924587, -0.0013870703987777233, -0.0007306649349629879, -7.42599368095398e-05, 0.0005821455270051956, 0.001238550990819931, 0.0018949563382193446, 0.002551361685618758, 0.00320776691660285, 0.0038641723804175854, 0.004520577844232321, 0.005176982842385769, 0.005833388306200504, 0.00648979377001524, 0.007146199233829975, 0.0078026046976447105, 0.008459009230136871, 0.009115414693951607, 0.009771820157766342, 0.010428225621581078, 0.011084631085395813, 0.011741036549210548, 0.012397442013025284, 0.01305384747684002, 0.013710252940654755, 0.01436665840446949, 0.015023063868284225, 0.01567946746945381, 0.016335874795913696, 0.016992278397083282, 0.017648683860898018, 0.018305089324712753, 0.01896149478852749, 0.019617900252342224, 0.02027430571615696, 0.020930711179971695, 0.02158711478114128, 0.022243522107601166]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 7.0, 6.0, 10.0, 12.0, 8.0, 12.0, 14.0, 15.0, 13.0, 27.0, 27.0, 27.0, 27.0, 29.0, 34.0, 32.0, 32.0, 40.0, 30.0, 36.0, 40.0, 49.0, 47.0, 42.0, 47.0, 33.0, 39.0, 34.0, 30.0, 32.0, 25.0, 21.0, 20.0, 21.0, 20.0, 13.0, 16.0, 5.0, 9.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.013522660359740257, -0.013048499822616577, -0.012574338354170322, -0.012100177817046642, -0.011626017279922962, -0.011151855811476707, -0.010677695274353027, -0.010203534737229347, -0.009729374200105667, -0.009255213662981987, -0.008781052194535732, -0.008306891657412052, -0.007832731120288372, -0.007358570117503405, -0.006884409114718437, -0.006410248577594757, -0.00593608757480979, -0.005461926572024822, -0.004987766034901142, -0.004513605032116175, -0.004039444494992495, -0.003565283492207527, -0.0030911227222532034, -0.0026169619522988796, -0.002142801182344556, -0.001668640412390232, -0.0011944796424359083, -0.0007203187560662627, -0.00024615798611193895, 0.00022800290025770664, 0.0007021636702120304, 0.0011763244401663542, 0.001650485210120678, 0.0021246459800750017, 0.0025988067500293255, 0.003072967752814293, 0.003547128289937973, 0.0040212892927229404, 0.004495450295507908, 0.004969610832631588, 0.005443771369755268, 0.0059179323725402355, 0.006392092909663916, 0.006866253912448883, 0.007340414449572563, 0.007814574986696243, 0.008288736455142498, 0.008762896992266178, 0.009237058460712433, 0.009711218997836113, 0.010185380466282368, 0.010659541003406048, 0.011133701540529728, 0.011607863008975983, 0.012082023546099663, 0.012556184083223343, 0.013030344620347023, 0.013504505157470703, 0.013978666625916958, 0.014452827163040638, 0.014926987700164318, 0.015401149168610573, 0.015875309705734253, 0.016349470242857933, 0.016823630779981613]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 9.0, 8.0, 17.0, 15.0, 21.0, 23.0, 30.0, 49.0, 65.0, 136.0, 206.0, 332.0, 566.0, 1231.0, 2450.0, 6132.0, 18557.0, 122141.0, 3941883.0, 75774.0, 14786.0, 5285.0, 2161.0, 1052.0, 536.0, 310.0, 159.0, 101.0, 65.0, 42.0, 31.0, 28.0, 24.0, 11.0, 11.0, 4.0, 4.0, 8.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.07159423828125, -0.06938648223876953, -0.06717872619628906, -0.0649709701538086, -0.06276321411132812, -0.060555458068847656, -0.05834770202636719, -0.05613994598388672, -0.05393218994140625, -0.05172443389892578, -0.04951667785644531, -0.047308921813964844, -0.045101165771484375, -0.042893409729003906, -0.04068565368652344, -0.03847789764404297, -0.0362701416015625, -0.03406238555908203, -0.03185462951660156, -0.029646873474121094, -0.027439117431640625, -0.025231361389160156, -0.023023605346679688, -0.02081584930419922, -0.01860809326171875, -0.01640033721923828, -0.014192581176757812, -0.011984825134277344, -0.009777069091796875, -0.007569313049316406, -0.0053615570068359375, -0.0031538009643554688, -0.000946044921875, 0.0012617111206054688, 0.0034694671630859375, 0.005677223205566406, 0.007884979248046875, 0.010092735290527344, 0.012300491333007812, 0.014508247375488281, 0.01671600341796875, 0.01892375946044922, 0.021131515502929688, 0.023339271545410156, 0.025547027587890625, 0.027754783630371094, 0.029962539672851562, 0.03217029571533203, 0.0343780517578125, 0.03658580780029297, 0.03879356384277344, 0.041001319885253906, 0.043209075927734375, 0.045416831970214844, 0.04762458801269531, 0.04983234405517578, 0.05204010009765625, 0.05424785614013672, 0.05645561218261719, 0.058663368225097656, 0.060871124267578125, 0.0630788803100586, 0.06528663635253906, 0.06749439239501953, 0.0697021484375]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 3.0, 11.0, 7.0, 7.0, 13.0, 18.0, 18.0, 17.0, 18.0, 21.0, 27.0, 37.0, 33.0, 37.0, 41.0, 47.0, 44.0, 61.0, 46.0, 50.0, 44.0, 36.0, 39.0, 38.0, 39.0, 39.0, 35.0, 32.0, 27.0, 19.0, 19.0, 15.0, 12.0, 16.0, 9.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01318359375, -0.012754321098327637, -0.012325048446655273, -0.01189577579498291, -0.011466503143310547, -0.011037230491638184, -0.01060795783996582, -0.010178685188293457, -0.009749412536621094, -0.00932013988494873, -0.008890867233276367, -0.008461594581604004, -0.00803232192993164, -0.007603049278259277, -0.007173776626586914, -0.006744503974914551, -0.0063152313232421875, -0.005885958671569824, -0.005456686019897461, -0.005027413368225098, -0.004598140716552734, -0.004168868064880371, -0.003739595413208008, -0.0033103227615356445, -0.0028810501098632812, -0.002451777458190918, -0.0020225048065185547, -0.0015932321548461914, -0.0011639595031738281, -0.0007346868515014648, -0.00030541419982910156, 0.00012385845184326172, 0.000553131103515625, 0.0009824037551879883, 0.0014116764068603516, 0.0018409490585327148, 0.002270221710205078, 0.0026994943618774414, 0.0031287670135498047, 0.003558039665222168, 0.003987312316894531, 0.0044165849685668945, 0.004845857620239258, 0.005275130271911621, 0.005704402923583984, 0.006133675575256348, 0.006562948226928711, 0.006992220878601074, 0.0074214935302734375, 0.0078507661819458, 0.008280038833618164, 0.008709311485290527, 0.00913858413696289, 0.009567856788635254, 0.009997129440307617, 0.01042640209197998, 0.010855674743652344, 0.011284947395324707, 0.01171422004699707, 0.012143492698669434, 0.012572765350341797, 0.01300203800201416, 0.013431310653686523, 0.013860583305358887, 0.01428985595703125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 11.0, 18.0, 39.0, 103.0, 351.0, 1723.0, 14945.0, 2159046.0, 2000822.0, 14838.0, 1807.0, 353.0, 106.0, 36.0, 27.0, 12.0, 11.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.173828125, -0.16886138916015625, -0.1638946533203125, -0.15892791748046875, -0.153961181640625, -0.14899444580078125, -0.1440277099609375, -0.13906097412109375, -0.13409423828125, -0.12912750244140625, -0.1241607666015625, -0.11919403076171875, -0.114227294921875, -0.10926055908203125, -0.1042938232421875, -0.09932708740234375, -0.0943603515625, -0.08939361572265625, -0.0844268798828125, -0.07946014404296875, -0.074493408203125, -0.06952667236328125, -0.0645599365234375, -0.05959320068359375, -0.05462646484375, -0.04965972900390625, -0.0446929931640625, -0.03972625732421875, -0.034759521484375, -0.02979278564453125, -0.0248260498046875, -0.01985931396484375, -0.014892578125, -0.00992584228515625, -0.0049591064453125, 7.62939453125e-06, 0.004974365234375, 0.00994110107421875, 0.0149078369140625, 0.01987457275390625, 0.02484130859375, 0.02980804443359375, 0.0347747802734375, 0.03974151611328125, 0.044708251953125, 0.04967498779296875, 0.0546417236328125, 0.05960845947265625, 0.0645751953125, 0.06954193115234375, 0.0745086669921875, 0.07947540283203125, 0.084442138671875, 0.08940887451171875, 0.0943756103515625, 0.09934234619140625, 0.10430908203125, 0.10927581787109375, 0.1142425537109375, 0.11920928955078125, 0.124176025390625, 0.12914276123046875, 0.1341094970703125, 0.13907623291015625, 0.14404296875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 2.0, 12.0, 10.0, 18.0, 33.0, 24.0, 36.0, 52.0, 84.0, 161.0, 391.0, 1092.0, 1225.0, 462.0, 186.0, 89.0, 54.0, 35.0, 30.0, 19.0, 8.0, 10.0, 9.0, 11.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00894927978515625, -0.008577227592468262, -0.008205175399780273, -0.007833123207092285, -0.007461071014404297, -0.007089018821716309, -0.00671696662902832, -0.006344914436340332, -0.005972862243652344, -0.0056008100509643555, -0.005228757858276367, -0.004856705665588379, -0.004484653472900391, -0.004112601280212402, -0.003740549087524414, -0.0033684968948364258, -0.0029964447021484375, -0.0026243925094604492, -0.002252340316772461, -0.0018802881240844727, -0.0015082359313964844, -0.001136183738708496, -0.0007641315460205078, -0.00039207935333251953, -2.002716064453125e-05, 0.00035202503204345703, 0.0007240772247314453, 0.0010961294174194336, 0.0014681816101074219, 0.0018402338027954102, 0.0022122859954833984, 0.0025843381881713867, 0.002956390380859375, 0.0033284425735473633, 0.0037004947662353516, 0.00407254695892334, 0.004444599151611328, 0.004816651344299316, 0.005188703536987305, 0.005560755729675293, 0.005932807922363281, 0.0063048601150512695, 0.006676912307739258, 0.007048964500427246, 0.007421016693115234, 0.007793068885803223, 0.008165121078491211, 0.0085371732711792, 0.008909225463867188, 0.009281277656555176, 0.009653329849243164, 0.010025382041931152, 0.01039743423461914, 0.010769486427307129, 0.011141538619995117, 0.011513590812683105, 0.011885643005371094, 0.012257695198059082, 0.01262974739074707, 0.013001799583435059, 0.013373851776123047, 0.013745903968811035, 0.014117956161499023, 0.014490008354187012, 0.014862060546875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 4.0, 5.0, 17.0, 15.0, 19.0, 22.0, 36.0, 29.0, 39.0, 56.0, 63.0, 69.0, 84.0, 92.0, 69.0, 67.0, 68.0, 56.0, 38.0, 36.0, 30.0, 14.0, 16.0, 12.0, 8.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017624402418732643, -0.01703825406730175, -0.016452105715870857, -0.015865957364439964, -0.015279809013009071, -0.014693660661578178, -0.014107512310147285, -0.013521363958716393, -0.0129352156072855, -0.012349067255854607, -0.011762918904423714, -0.01117677055299282, -0.010590622201561928, -0.010004473850131035, -0.009418325498700142, -0.008832177147269249, -0.008246028795838356, -0.007659880444407463, -0.00707373209297657, -0.006487583741545677, -0.005901435390114784, -0.005315287038683891, -0.004729138687252998, -0.004142990335822105, -0.0035568419843912125, -0.0029706936329603195, -0.0023845452815294266, -0.0017983969300985336, -0.0012122485786676407, -0.0006261002272367477, -3.99518758058548e-05, 0.0005461964756250381, 0.001132344827055931, 0.001718493178486824, 0.002304641529917717, 0.00289078988134861, 0.003476938232779503, 0.004063086584210396, 0.004649234935641289, 0.005235383287072182, 0.005821531638503075, 0.006407679989933968, 0.0069938283413648605, 0.0075799766927957535, 0.008166125044226646, 0.00875227339565754, 0.009338421747088432, 0.009924570098519325, 0.010510718449950218, 0.011096866801381111, 0.011683015152812004, 0.012269163504242897, 0.01285531185567379, 0.013441460207104683, 0.014027608558535576, 0.014613756909966469, 0.015199905261397362, 0.015786053612828255, 0.016372201964259148, 0.01695835031569004, 0.017544498667120934, 0.018130647018551826, 0.01871679536998272, 0.019302943721413612, 0.019889092072844505]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 15.0, 4.0, 5.0, 6.0, 7.0, 14.0, 12.0, 19.0, 18.0, 20.0, 30.0, 24.0, 43.0, 43.0, 47.0, 48.0, 45.0, 45.0, 45.0, 47.0, 38.0, 44.0, 38.0, 43.0, 43.0, 37.0, 42.0, 24.0, 29.0, 30.0, 15.0, 21.0, 20.0, 13.0, 7.0, 9.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014208605512976646, -0.013705836609005928, -0.013203066773712635, -0.012700297869741917, -0.012197528034448624, -0.011694759130477905, -0.011191990226507187, -0.010689220391213894, -0.010186450555920601, -0.009683681651949883, -0.00918091181665659, -0.008678142912685871, -0.008175373077392578, -0.00767260417342186, -0.007169834803789854, -0.006667065434157848, -0.00616429653018713, -0.005661527160555124, -0.005158757790923119, -0.0046559888869524, -0.004153219051659107, -0.003650449914857745, -0.003147680778056383, -0.0026449114084243774, -0.0021421420387923717, -0.001639372669160366, -0.0011366034159436822, -0.0006338341627269983, -0.00013106479309499264, 0.00037170457653701305, 0.0008744737133383751, 0.0013772430829703808, 0.0018800124526023865, 0.002382781822234392, 0.002885551191866398, 0.00338832032866776, 0.0038910896982997656, 0.004393858835101128, 0.004896628204733133, 0.005399397574365139, 0.005902166943997145, 0.00640493631362915, 0.006907705683261156, 0.007410475052893162, 0.00791324395686388, 0.008416013792157173, 0.008918782696127892, 0.00942155160009861, 0.009924321435391903, 0.010427090339362621, 0.010929860174655914, 0.011432629078626633, 0.011935398913919926, 0.012438167817890644, 0.012940937653183937, 0.013443706557154655, 0.013946475461125374, 0.014449244365096092, 0.014952014200389385, 0.015454783104360104, 0.015957552939653397, 0.016460321843624115, 0.016963090747594833, 0.017465859651565552, 0.01796863041818142]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 8.0, 12.0, 17.0, 22.0, 42.0, 41.0, 58.0, 90.0, 129.0, 165.0, 267.0, 367.0, 468.0, 760.0, 1031.0, 1424.0, 2031.0, 2967.0, 4169.0, 6075.0, 8810.0, 13277.0, 20234.0, 32013.0, 51896.0, 89160.0, 167049.0, 260838.0, 158468.0, 85606.0, 49804.0, 31114.0, 19319.0, 12588.0, 8659.0, 5769.0, 4053.0, 2798.0, 2001.0, 1503.0, 1008.0, 677.0, 539.0, 354.0, 254.0, 193.0, 120.0, 101.0, 78.0, 38.0, 29.0, 21.0, 18.0, 14.0, 5.0, 8.0, 2.0, 3.0], "bins": [-0.0066375732421875, -0.006439208984375, -0.0062408447265625, -0.00604248046875, -0.0058441162109375, -0.005645751953125, -0.0054473876953125, -0.0052490234375, -0.0050506591796875, -0.004852294921875, -0.0046539306640625, -0.00445556640625, -0.0042572021484375, -0.004058837890625, -0.0038604736328125, -0.003662109375, -0.0034637451171875, -0.003265380859375, -0.0030670166015625, -0.00286865234375, -0.0026702880859375, -0.002471923828125, -0.0022735595703125, -0.0020751953125, -0.0018768310546875, -0.001678466796875, -0.0014801025390625, -0.00128173828125, -0.0010833740234375, -0.000885009765625, -0.0006866455078125, -0.00048828125, -0.0002899169921875, -9.1552734375e-05, 0.0001068115234375, 0.00030517578125, 0.0005035400390625, 0.000701904296875, 0.0009002685546875, 0.0010986328125, 0.0012969970703125, 0.001495361328125, 0.0016937255859375, 0.00189208984375, 0.0020904541015625, 0.002288818359375, 0.0024871826171875, 0.002685546875, 0.0028839111328125, 0.003082275390625, 0.0032806396484375, 0.00347900390625, 0.0036773681640625, 0.003875732421875, 0.0040740966796875, 0.0042724609375, 0.0044708251953125, 0.004669189453125, 0.0048675537109375, 0.00506591796875, 0.0052642822265625, 0.005462646484375, 0.0056610107421875, 0.005859375, 0.0060577392578125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 6.0, 6.0, 1.0, 7.0, 5.0, 7.0, 6.0, 14.0, 13.0, 18.0, 10.0, 14.0, 25.0, 23.0, 41.0, 34.0, 56.0, 39.0, 38.0, 50.0, 43.0, 35.0, 52.0, 51.0, 56.0, 44.0, 37.0, 41.0, 42.0, 33.0, 25.0, 28.0, 21.0, 17.0, 19.0, 9.0, 14.0, 8.0, 10.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0162200927734375, -0.015692472457885742, -0.015164852142333984, -0.014637231826782227, -0.014109611511230469, -0.013581991195678711, -0.013054370880126953, -0.012526750564575195, -0.011999130249023438, -0.01147150993347168, -0.010943889617919922, -0.010416269302368164, -0.009888648986816406, -0.009361028671264648, -0.00883340835571289, -0.008305788040161133, -0.007778167724609375, -0.007250547409057617, -0.006722927093505859, -0.0061953067779541016, -0.005667686462402344, -0.005140066146850586, -0.004612445831298828, -0.00408482551574707, -0.0035572052001953125, -0.0030295848846435547, -0.002501964569091797, -0.001974344253540039, -0.0014467239379882812, -0.0009191036224365234, -0.0003914833068847656, 0.0001361370086669922, 0.00066375732421875, 0.0011913776397705078, 0.0017189979553222656, 0.0022466182708740234, 0.0027742385864257812, 0.003301858901977539, 0.003829479217529297, 0.004357099533081055, 0.0048847198486328125, 0.00541234016418457, 0.005939960479736328, 0.006467580795288086, 0.006995201110839844, 0.0075228214263916016, 0.00805044174194336, 0.008578062057495117, 0.009105682373046875, 0.009633302688598633, 0.01016092300415039, 0.010688543319702148, 0.011216163635253906, 0.011743783950805664, 0.012271404266357422, 0.01279902458190918, 0.013326644897460938, 0.013854265213012695, 0.014381885528564453, 0.014909505844116211, 0.015437126159667969, 0.015964746475219727, 0.016492366790771484, 0.017019987106323242, 0.017547607421875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 12.0, 17.0, 13.0, 28.0, 24.0, 34.0, 64.0, 86.0, 155.0, 182.0, 249.0, 371.0, 535.0, 728.0, 1142.0, 1595.0, 2352.0, 3425.0, 5267.0, 7950.0, 12004.0, 18481.0, 30856.0, 51442.0, 95997.0, 216042.0, 302658.0, 129435.0, 64920.0, 37330.0, 22749.0, 14309.0, 9354.0, 5956.0, 4043.0, 2816.0, 1810.0, 1267.0, 848.0, 611.0, 400.0, 296.0, 219.0, 154.0, 114.0, 66.0, 43.0, 32.0, 27.0, 18.0, 13.0, 8.0, 8.0, 4.0, 3.0, 1.0, 3.0], "bins": [-0.006717681884765625, -0.006515324115753174, -0.006312966346740723, -0.0061106085777282715, -0.00590825080871582, -0.005705893039703369, -0.005503535270690918, -0.005301177501678467, -0.005098819732666016, -0.0048964619636535645, -0.004694104194641113, -0.004491746425628662, -0.004289388656616211, -0.00408703088760376, -0.0038846731185913086, -0.0036823153495788574, -0.0034799575805664062, -0.003277599811553955, -0.003075242042541504, -0.0028728842735290527, -0.0026705265045166016, -0.0024681687355041504, -0.0022658109664916992, -0.002063453197479248, -0.0018610954284667969, -0.0016587376594543457, -0.0014563798904418945, -0.0012540221214294434, -0.0010516643524169922, -0.000849306583404541, -0.0006469488143920898, -0.00044459104537963867, -0.0002422332763671875, -3.987550735473633e-05, 0.00016248226165771484, 0.000364840030670166, 0.0005671977996826172, 0.0007695555686950684, 0.0009719133377075195, 0.0011742711067199707, 0.0013766288757324219, 0.001578986644744873, 0.0017813444137573242, 0.0019837021827697754, 0.0021860599517822266, 0.0023884177207946777, 0.002590775489807129, 0.00279313325881958, 0.0029954910278320312, 0.0031978487968444824, 0.0034002065658569336, 0.0036025643348693848, 0.003804922103881836, 0.004007279872894287, 0.004209637641906738, 0.0044119954109191895, 0.004614353179931641, 0.004816710948944092, 0.005019068717956543, 0.005221426486968994, 0.005423784255981445, 0.0056261420249938965, 0.005828499794006348, 0.006030857563018799, 0.00623321533203125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 4.0, 6.0, 13.0, 10.0, 24.0, 10.0, 25.0, 16.0, 23.0, 34.0, 29.0, 37.0, 34.0, 33.0, 39.0, 45.0, 50.0, 37.0, 47.0, 42.0, 32.0, 50.0, 39.0, 44.0, 31.0, 33.0, 33.0, 24.0, 24.0, 14.0, 25.0, 15.0, 14.0, 11.0, 14.0, 7.0, 8.0, 7.0, 3.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00838470458984375, -0.008086204528808594, -0.0077877044677734375, -0.007489204406738281, -0.007190704345703125, -0.006892204284667969, -0.0065937042236328125, -0.006295204162597656, -0.0059967041015625, -0.005698204040527344, -0.0053997039794921875, -0.005101203918457031, -0.004802703857421875, -0.004504203796386719, -0.0042057037353515625, -0.003907203674316406, -0.00360870361328125, -0.0033102035522460938, -0.0030117034912109375, -0.0027132034301757812, -0.002414703369140625, -0.0021162033081054688, -0.0018177032470703125, -0.0015192031860351562, -0.001220703125, -0.0009222030639648438, -0.0006237030029296875, -0.00032520294189453125, -2.6702880859375e-05, 0.00027179718017578125, 0.0005702972412109375, 0.0008687973022460938, 0.00116729736328125, 0.0014657974243164062, 0.0017642974853515625, 0.0020627975463867188, 0.002361297607421875, 0.0026597976684570312, 0.0029582977294921875, 0.0032567977905273438, 0.0035552978515625, 0.0038537979125976562, 0.0041522979736328125, 0.004450798034667969, 0.004749298095703125, 0.005047798156738281, 0.0053462982177734375, 0.005644798278808594, 0.00594329833984375, 0.006241798400878906, 0.0065402984619140625, 0.006838798522949219, 0.007137298583984375, 0.007435798645019531, 0.0077342987060546875, 0.008032798767089844, 0.008331298828125, 0.008629798889160156, 0.008928298950195312, 0.009226799011230469, 0.009525299072265625, 0.009823799133300781, 0.010122299194335938, 0.010420799255371094, 0.01071929931640625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 9.0, 10.0, 13.0, 18.0, 27.0, 41.0, 48.0, 85.0, 115.0, 202.0, 274.0, 383.0, 631.0, 970.0, 1467.0, 2477.0, 4092.0, 7154.0, 12757.0, 24146.0, 50399.0, 130771.0, 518185.0, 171926.0, 59589.0, 28026.0, 14715.0, 8045.0, 4558.0, 2666.0, 1633.0, 1050.0, 652.0, 445.0, 316.0, 223.0, 120.0, 92.0, 72.0, 39.0, 36.0, 23.0, 13.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0005750656127929688, -0.0005568712949752808, -0.0005386769771575928, -0.0005204826593399048, -0.0005022883415222168, -0.0004840940237045288, -0.0004658997058868408, -0.00044770538806915283, -0.00042951107025146484, -0.00041131675243377686, -0.00039312243461608887, -0.0003749281167984009, -0.0003567337989807129, -0.0003385394811630249, -0.0003203451633453369, -0.0003021508455276489, -0.00028395652770996094, -0.00026576220989227295, -0.00024756789207458496, -0.00022937357425689697, -0.00021117925643920898, -0.000192984938621521, -0.000174790620803833, -0.00015659630298614502, -0.00013840198516845703, -0.00012020766735076904, -0.00010201334953308105, -8.381903171539307e-05, -6.562471389770508e-05, -4.743039608001709e-05, -2.92360782623291e-05, -1.1041760444641113e-05, 7.152557373046875e-06, 2.5346875190734863e-05, 4.354119300842285e-05, 6.173551082611084e-05, 7.992982864379883e-05, 9.812414646148682e-05, 0.0001163184642791748, 0.0001345127820968628, 0.00015270709991455078, 0.00017090141773223877, 0.00018909573554992676, 0.00020729005336761475, 0.00022548437118530273, 0.00024367868900299072, 0.0002618730068206787, 0.0002800673246383667, 0.0002982616424560547, 0.0003164559602737427, 0.00033465027809143066, 0.00035284459590911865, 0.00037103891372680664, 0.00038923323154449463, 0.0004074275493621826, 0.0004256218671798706, 0.0004438161849975586, 0.0004620105028152466, 0.00048020482063293457, 0.0004983991384506226, 0.0005165934562683105, 0.0005347877740859985, 0.0005529820919036865, 0.0005711764097213745, 0.0005893707275390625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 7.0, 7.0, 2.0, 10.0, 6.0, 9.0, 7.0, 19.0, 16.0, 15.0, 23.0, 32.0, 33.0, 42.0, 40.0, 53.0, 78.0, 84.0, 67.0, 67.0, 63.0, 58.0, 49.0, 47.0, 33.0, 19.0, 19.0, 18.0, 14.0, 13.0, 13.0, 5.0, 7.0, 6.0, 8.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1622905731201172e-05, -1.1198222637176514e-05, -1.0773539543151855e-05, -1.0348856449127197e-05, -9.924173355102539e-06, -9.499490261077881e-06, -9.074807167053223e-06, -8.650124073028564e-06, -8.225440979003906e-06, -7.800757884979248e-06, -7.37607479095459e-06, -6.951391696929932e-06, -6.5267086029052734e-06, -6.102025508880615e-06, -5.677342414855957e-06, -5.252659320831299e-06, -4.827976226806641e-06, -4.403293132781982e-06, -3.978610038757324e-06, -3.553926944732666e-06, -3.129243850708008e-06, -2.7045607566833496e-06, -2.2798776626586914e-06, -1.8551945686340332e-06, -1.430511474609375e-06, -1.0058283805847168e-06, -5.811452865600586e-07, -1.564621925354004e-07, 2.682209014892578e-07, 6.92903995513916e-07, 1.1175870895385742e-06, 1.5422701835632324e-06, 1.9669532775878906e-06, 2.391636371612549e-06, 2.816319465637207e-06, 3.2410025596618652e-06, 3.6656856536865234e-06, 4.090368747711182e-06, 4.51505184173584e-06, 4.939734935760498e-06, 5.364418029785156e-06, 5.7891011238098145e-06, 6.213784217834473e-06, 6.638467311859131e-06, 7.063150405883789e-06, 7.487833499908447e-06, 7.912516593933105e-06, 8.337199687957764e-06, 8.761882781982422e-06, 9.18656587600708e-06, 9.611248970031738e-06, 1.0035932064056396e-05, 1.0460615158081055e-05, 1.0885298252105713e-05, 1.1309981346130371e-05, 1.173466444015503e-05, 1.2159347534179688e-05, 1.2584030628204346e-05, 1.3008713722229004e-05, 1.3433396816253662e-05, 1.385807991027832e-05, 1.4282763004302979e-05, 1.4707446098327637e-05, 1.5132129192352295e-05, 1.5556812286376953e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 4.0, 6.0, 10.0, 7.0, 14.0, 12.0, 26.0, 32.0, 44.0, 74.0, 267.0, 1157.0, 9797.0, 192484.0, 814570.0, 26780.0, 2567.0, 424.0, 134.0, 47.0, 23.0, 20.0, 14.0, 7.0, 12.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0023365020751953125, -0.0022719502449035645, -0.0022073984146118164, -0.0021428465843200684, -0.0020782947540283203, -0.0020137429237365723, -0.0019491910934448242, -0.0018846392631530762, -0.0018200874328613281, -0.00175553560256958, -0.001690983772277832, -0.001626431941986084, -0.001561880111694336, -0.0014973282814025879, -0.0014327764511108398, -0.0013682246208190918, -0.0013036727905273438, -0.0012391209602355957, -0.0011745691299438477, -0.0011100172996520996, -0.0010454654693603516, -0.0009809136390686035, -0.0009163618087768555, -0.0008518099784851074, -0.0007872581481933594, -0.0007227063179016113, -0.0006581544876098633, -0.0005936026573181152, -0.0005290508270263672, -0.00046449899673461914, -0.0003999471664428711, -0.00033539533615112305, -0.000270843505859375, -0.00020629167556762695, -0.0001417398452758789, -7.718801498413086e-05, -1.2636184692382812e-05, 5.1915645599365234e-05, 0.00011646747589111328, 0.00018101930618286133, 0.0002455711364746094, 0.0003101229667663574, 0.00037467479705810547, 0.0004392266273498535, 0.0005037784576416016, 0.0005683302879333496, 0.0006328821182250977, 0.0006974339485168457, 0.0007619857788085938, 0.0008265376091003418, 0.0008910894393920898, 0.0009556412696838379, 0.001020193099975586, 0.001084744930267334, 0.001149296760559082, 0.00121384859085083, 0.0012784004211425781, 0.0013429522514343262, 0.0014075040817260742, 0.0014720559120178223, 0.0015366077423095703, 0.0016011595726013184, 0.0016657114028930664, 0.0017302632331848145, 0.0017948150634765625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 11.0, 9.0, 5.0, 7.0, 11.0, 18.0, 25.0, 17.0, 22.0, 22.0, 44.0, 29.0, 47.0, 64.0, 74.0, 63.0, 50.0, 74.0, 64.0, 47.0, 38.0, 27.0, 31.0, 36.0, 22.0, 24.0, 12.0, 19.0, 23.0, 10.0, 10.0, 10.0, 3.0, 9.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010877847671508789, -0.00010503362864255905, -0.00010128878057003021, -9.754393249750137e-05, -9.379908442497253e-05, -9.00542363524437e-05, -8.630938827991486e-05, -8.256454020738602e-05, -7.881969213485718e-05, -7.507484406232834e-05, -7.13299959897995e-05, -6.758514791727066e-05, -6.384029984474182e-05, -6.009545177221298e-05, -5.635060369968414e-05, -5.2605755627155304e-05, -4.8860907554626465e-05, -4.5116059482097626e-05, -4.137121140956879e-05, -3.762636333703995e-05, -3.388151526451111e-05, -3.013666719198227e-05, -2.639181911945343e-05, -2.264697104692459e-05, -1.8902122974395752e-05, -1.5157274901866913e-05, -1.1412426829338074e-05, -7.667578756809235e-06, -3.9227306842803955e-06, -1.778826117515564e-07, 3.5669654607772827e-06, 7.311813533306122e-06, 1.1056661605834961e-05, 1.48015096783638e-05, 1.854635775089264e-05, 2.2291205823421478e-05, 2.6036053895950317e-05, 2.9780901968479156e-05, 3.3525750041007996e-05, 3.7270598113536835e-05, 4.1015446186065674e-05, 4.476029425859451e-05, 4.850514233112335e-05, 5.224999040365219e-05, 5.599483847618103e-05, 5.973968654870987e-05, 6.348453462123871e-05, 6.722938269376755e-05, 7.097423076629639e-05, 7.471907883882523e-05, 7.846392691135406e-05, 8.22087749838829e-05, 8.595362305641174e-05, 8.969847112894058e-05, 9.344331920146942e-05, 9.718816727399826e-05, 0.0001009330153465271, 0.00010467786341905594, 0.00010842271149158478, 0.00011216755956411362, 0.00011591240763664246, 0.0001196572557091713, 0.00012340210378170013, 0.00012714695185422897, 0.0001308917999267578]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 10.0, 15.0, 20.0, 21.0, 30.0, 31.0, 55.0, 66.0, 67.0, 98.0, 90.0, 104.0, 75.0, 76.0, 60.0, 43.0, 35.0, 29.0, 14.0, 14.0, 6.0, 12.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023227859288454056, -0.022489765658974648, -0.02175167202949524, -0.02101358026266098, -0.020275486633181572, -0.019537393003702164, -0.018799301236867905, -0.018061207607388496, -0.017323113977909088, -0.01658502034842968, -0.01584692671895027, -0.015108834952116013, -0.014370741322636604, -0.013632647693157196, -0.012894554995000362, -0.012156462296843529, -0.01141836866736412, -0.010680275037884712, -0.009942182339727879, -0.009204089641571045, -0.008465996012091637, -0.007727902848273516, -0.006989809684455395, -0.006251716520637274, -0.005513623356819153, -0.004775530193001032, -0.004037437029182911, -0.00329934386536479, -0.002561250701546669, -0.001823157537728548, -0.001085064373910427, -0.00034697121009230614, 0.0003911219537258148, 0.0011292151175439358, 0.0018673082813620567, 0.0026054014451801777, 0.0033434946089982986, 0.00408158777281642, 0.0048196809366345406, 0.0055577741004526615, 0.0062958672642707825, 0.007033960428088903, 0.007772053591907024, 0.008510146290063858, 0.009248239919543266, 0.009986333549022675, 0.010724426247179508, 0.011462518945336342, 0.01220061257481575, 0.012938706204295158, 0.013676798902451992, 0.014414891600608826, 0.015152985230088234, 0.015891078859567642, 0.0166291706264019, 0.01736726425588131, 0.018105357885360718, 0.018843451514840126, 0.019581545144319534, 0.020319636911153793, 0.0210577305406332, 0.02179582417011261, 0.02253391593694687, 0.023272009566426277, 0.024010103195905685]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 6.0, 7.0, 5.0, 7.0, 12.0, 11.0, 12.0, 8.0, 17.0, 23.0, 24.0, 22.0, 35.0, 43.0, 48.0, 46.0, 47.0, 51.0, 36.0, 49.0, 46.0, 36.0, 40.0, 35.0, 33.0, 43.0, 44.0, 35.0, 31.0, 31.0, 22.0, 19.0, 21.0, 17.0, 11.0, 6.0, 12.0, 4.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013517429120838642, -0.013031098060309887, -0.012544766068458557, -0.012058435007929802, -0.011572103947401047, -0.011085772886872292, -0.010599440895020962, -0.010113109834492207, -0.009626777842640877, -0.009140446782112122, -0.008654114790260792, -0.008167783729732037, -0.007681452669203281, -0.007195121143013239, -0.006708789616823196, -0.006222458556294441, -0.005736127495765686, -0.0052497959695756435, -0.004763464909046888, -0.004277133382856846, -0.003790802089497447, -0.003304470796138048, -0.0028181392699480057, -0.002331807976588607, -0.001845476683229208, -0.0013591453898698092, -0.0008728139800950885, -0.0003864825703203678, 9.984872303903103e-05, 0.0005861800163984299, 0.0010725115425884724, 0.0015588428359478712, 0.0020451750606298447, 0.0025315063539892435, 0.0030178376473486423, 0.003504169173538685, 0.00399050023406744, 0.0044768317602574825, 0.004963163286447525, 0.00544949434697628, 0.005935825873166323, 0.006422157399356365, 0.00690848845988512, 0.007394819986075163, 0.007881151512265205, 0.00836748257279396, 0.008853813633322716, 0.009340145625174046, 0.0098264766857028, 0.010312807746231556, 0.010799139738082886, 0.011285470798611641, 0.011771801859140396, 0.012258132919669151, 0.012744464911520481, 0.013230795972049236, 0.013717127963900566, 0.014203459024429321, 0.014689791016280651, 0.015176122076809406, 0.015662454068660736, 0.01614878512918949, 0.016635116189718246, 0.017121447250247, 0.017607778310775757]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 12.0, 7.0, 11.0, 20.0, 26.0, 47.0, 47.0, 79.0, 122.0, 177.0, 246.0, 430.0, 744.0, 1034.0, 1617.0, 2685.0, 4087.0, 6828.0, 11556.0, 19391.0, 33636.0, 57735.0, 98205.0, 156984.0, 199597.0, 173784.0, 114496.0, 68115.0, 39146.0, 22801.0, 13575.0, 8158.0, 4960.0, 2933.0, 1917.0, 1200.0, 760.0, 515.0, 314.0, 180.0, 138.0, 75.0, 56.0, 39.0, 27.0, 20.0, 11.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 2.0, 4.0], "bins": [-0.03131103515625, -0.0303804874420166, -0.029449939727783203, -0.028519392013549805, -0.027588844299316406, -0.026658296585083008, -0.02572774887084961, -0.02479720115661621, -0.023866653442382812, -0.022936105728149414, -0.022005558013916016, -0.021075010299682617, -0.02014446258544922, -0.01921391487121582, -0.018283367156982422, -0.017352819442749023, -0.016422271728515625, -0.015491724014282227, -0.014561176300048828, -0.01363062858581543, -0.012700080871582031, -0.011769533157348633, -0.010838985443115234, -0.009908437728881836, -0.008977890014648438, -0.008047342300415039, -0.007116794586181641, -0.006186246871948242, -0.005255699157714844, -0.004325151443481445, -0.003394603729248047, -0.0024640560150146484, -0.00153350830078125, -0.0006029605865478516, 0.0003275871276855469, 0.0012581348419189453, 0.0021886825561523438, 0.003119230270385742, 0.004049777984619141, 0.004980325698852539, 0.0059108734130859375, 0.006841421127319336, 0.007771968841552734, 0.008702516555786133, 0.009633064270019531, 0.01056361198425293, 0.011494159698486328, 0.012424707412719727, 0.013355255126953125, 0.014285802841186523, 0.015216350555419922, 0.01614689826965332, 0.01707744598388672, 0.018007993698120117, 0.018938541412353516, 0.019869089126586914, 0.020799636840820312, 0.02173018455505371, 0.02266073226928711, 0.023591279983520508, 0.024521827697753906, 0.025452375411987305, 0.026382923126220703, 0.0273134708404541, 0.0282440185546875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 0.0, 7.0, 4.0, 13.0, 13.0, 11.0, 8.0, 15.0, 13.0, 32.0, 26.0, 53.0, 38.0, 65.0, 48.0, 44.0, 50.0, 42.0, 47.0, 53.0, 54.0, 52.0, 40.0, 43.0, 42.0, 34.0, 24.0, 24.0, 27.0, 19.0, 15.0, 11.0, 10.0, 12.0, 6.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01168060302734375, -0.011279463768005371, -0.010878324508666992, -0.010477185249328613, -0.010076045989990234, -0.009674906730651855, -0.009273767471313477, -0.008872628211975098, -0.008471488952636719, -0.00807034969329834, -0.007669210433959961, -0.007268071174621582, -0.006866931915283203, -0.006465792655944824, -0.006064653396606445, -0.005663514137268066, -0.0052623748779296875, -0.004861235618591309, -0.00446009635925293, -0.004058957099914551, -0.003657817840576172, -0.003256678581237793, -0.002855539321899414, -0.002454400062561035, -0.0020532608032226562, -0.0016521215438842773, -0.0012509822845458984, -0.0008498430252075195, -0.0004487037658691406, -4.756450653076172e-05, 0.0003535747528076172, 0.0007547140121459961, 0.001155853271484375, 0.001556992530822754, 0.001958131790161133, 0.0023592710494995117, 0.0027604103088378906, 0.0031615495681762695, 0.0035626888275146484, 0.003963828086853027, 0.004364967346191406, 0.004766106605529785, 0.005167245864868164, 0.005568385124206543, 0.005969524383544922, 0.006370663642883301, 0.00677180290222168, 0.007172942161560059, 0.0075740814208984375, 0.007975220680236816, 0.008376359939575195, 0.008777499198913574, 0.009178638458251953, 0.009579777717590332, 0.009980916976928711, 0.01038205623626709, 0.010783195495605469, 0.011184334754943848, 0.011585474014282227, 0.011986613273620605, 0.012387752532958984, 0.012788891792297363, 0.013190031051635742, 0.013591170310974121, 0.0139923095703125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 8.0, 10.0, 11.0, 25.0, 16.0, 24.0, 19.0, 27.0, 36.0, 28.0, 59.0, 100.0, 249.0, 1214.0, 7188.0, 47561.0, 327702.0, 543996.0, 102337.0, 14700.0, 2359.0, 455.0, 153.0, 54.0, 41.0, 22.0, 30.0, 16.0, 19.0, 19.0, 11.0, 12.0, 10.0, 7.0, 8.0, 4.0, 6.0, 2.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.077880859375, -0.07501697540283203, -0.07215309143066406, -0.0692892074584961, -0.06642532348632812, -0.06356143951416016, -0.06069755554199219, -0.05783367156982422, -0.05496978759765625, -0.05210590362548828, -0.04924201965332031, -0.046378135681152344, -0.043514251708984375, -0.040650367736816406, -0.03778648376464844, -0.03492259979248047, -0.0320587158203125, -0.02919483184814453, -0.026330947875976562, -0.023467063903808594, -0.020603179931640625, -0.017739295959472656, -0.014875411987304688, -0.012011528015136719, -0.00914764404296875, -0.006283760070800781, -0.0034198760986328125, -0.0005559921264648438, 0.002307891845703125, 0.005171775817871094, 0.008035659790039062, 0.010899543762207031, 0.013763427734375, 0.01662731170654297, 0.019491195678710938, 0.022355079650878906, 0.025218963623046875, 0.028082847595214844, 0.030946731567382812, 0.03381061553955078, 0.03667449951171875, 0.03953838348388672, 0.04240226745605469, 0.045266151428222656, 0.048130035400390625, 0.050993919372558594, 0.05385780334472656, 0.05672168731689453, 0.0595855712890625, 0.06244945526123047, 0.06531333923339844, 0.0681772232055664, 0.07104110717773438, 0.07390499114990234, 0.07676887512207031, 0.07963275909423828, 0.08249664306640625, 0.08536052703857422, 0.08822441101074219, 0.09108829498291016, 0.09395217895507812, 0.0968160629272461, 0.09967994689941406, 0.10254383087158203, 0.10540771484375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 8.0, 9.0, 16.0, 11.0, 12.0, 16.0, 21.0, 22.0, 27.0, 32.0, 36.0, 38.0, 42.0, 51.0, 44.0, 46.0, 41.0, 55.0, 39.0, 40.0, 46.0, 42.0, 33.0, 35.0, 37.0, 21.0, 25.0, 27.0, 20.0, 19.0, 13.0, 10.0, 12.0, 9.0, 6.0, 5.0, 4.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.010955810546875, -0.010643362998962402, -0.010330915451049805, -0.010018467903137207, -0.00970602035522461, -0.009393572807312012, -0.009081125259399414, -0.008768677711486816, -0.008456230163574219, -0.008143782615661621, -0.007831335067749023, -0.007518887519836426, -0.007206439971923828, -0.0068939924240112305, -0.006581544876098633, -0.006269097328186035, -0.0059566497802734375, -0.00564420223236084, -0.005331754684448242, -0.0050193071365356445, -0.004706859588623047, -0.004394412040710449, -0.0040819644927978516, -0.003769516944885254, -0.0034570693969726562, -0.0031446218490600586, -0.002832174301147461, -0.0025197267532348633, -0.0022072792053222656, -0.001894831657409668, -0.0015823841094970703, -0.0012699365615844727, -0.000957489013671875, -0.0006450414657592773, -0.0003325939178466797, -2.014636993408203e-05, 0.0002923011779785156, 0.0006047487258911133, 0.0009171962738037109, 0.0012296438217163086, 0.0015420913696289062, 0.001854538917541504, 0.0021669864654541016, 0.0024794340133666992, 0.002791881561279297, 0.0031043291091918945, 0.003416776657104492, 0.00372922420501709, 0.0040416717529296875, 0.004354119300842285, 0.004666566848754883, 0.0049790143966674805, 0.005291461944580078, 0.005603909492492676, 0.0059163570404052734, 0.006228804588317871, 0.006541252136230469, 0.006853699684143066, 0.007166147232055664, 0.007478594779968262, 0.007791042327880859, 0.008103489875793457, 0.008415937423706055, 0.008728384971618652, 0.00904083251953125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 10.0, 14.0, 31.0, 23.0, 49.0, 119.0, 189.0, 310.0, 553.0, 1026.0, 1713.0, 3552.0, 7521.0, 20139.0, 896188.0, 92059.0, 13382.0, 5586.0, 2782.0, 1479.0, 800.0, 414.0, 257.0, 163.0, 76.0, 45.0, 32.0, 9.0, 12.0, 9.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00817108154296875, -0.007905960083007812, -0.007640838623046875, -0.0073757171630859375, -0.007110595703125, -0.0068454742431640625, -0.006580352783203125, -0.0063152313232421875, -0.00605010986328125, -0.0057849884033203125, -0.005519866943359375, -0.0052547454833984375, -0.0049896240234375, -0.0047245025634765625, -0.004459381103515625, -0.0041942596435546875, -0.00392913818359375, -0.0036640167236328125, -0.003398895263671875, -0.0031337738037109375, -0.00286865234375, -0.0026035308837890625, -0.002338409423828125, -0.0020732879638671875, -0.00180816650390625, -0.0015430450439453125, -0.001277923583984375, -0.0010128021240234375, -0.0007476806640625, -0.0004825592041015625, -0.000217437744140625, 4.76837158203125e-05, 0.00031280517578125, 0.0005779266357421875, 0.000843048095703125, 0.0011081695556640625, 0.001373291015625, 0.0016384124755859375, 0.001903533935546875, 0.0021686553955078125, 0.00243377685546875, 0.0026988983154296875, 0.002964019775390625, 0.0032291412353515625, 0.0034942626953125, 0.0037593841552734375, 0.004024505615234375, 0.0042896270751953125, 0.00455474853515625, 0.0048198699951171875, 0.005084991455078125, 0.0053501129150390625, 0.005615234375, 0.0058803558349609375, 0.006145477294921875, 0.0064105987548828125, 0.00667572021484375, 0.0069408416748046875, 0.007205963134765625, 0.0074710845947265625, 0.0077362060546875, 0.008001327514648438, 0.008266448974609375, 0.008531570434570312, 0.00879669189453125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 3.0, 8.0, 7.0, 12.0, 8.0, 12.0, 22.0, 21.0, 12.0, 34.0, 40.0, 72.0, 80.0, 102.0, 100.0, 115.0, 75.0, 70.0, 42.0, 45.0, 24.0, 14.0, 24.0, 11.0, 6.0, 10.0, 3.0, 5.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.119510650634766e-06, -8.760951459407806e-06, -8.402392268180847e-06, -8.043833076953888e-06, -7.685273885726929e-06, -7.3267146944999695e-06, -6.96815550327301e-06, -6.609596312046051e-06, -6.251037120819092e-06, -5.8924779295921326e-06, -5.533918738365173e-06, -5.175359547138214e-06, -4.816800355911255e-06, -4.458241164684296e-06, -4.0996819734573364e-06, -3.741122782230377e-06, -3.382563591003418e-06, -3.0240043997764587e-06, -2.6654452085494995e-06, -2.3068860173225403e-06, -1.948326826095581e-06, -1.5897676348686218e-06, -1.2312084436416626e-06, -8.726492524147034e-07, -5.140900611877441e-07, -1.555308699607849e-07, 2.0302832126617432e-07, 5.615875124931335e-07, 9.201467037200928e-07, 1.278705894947052e-06, 1.6372650861740112e-06, 1.9958242774009705e-06, 2.3543834686279297e-06, 2.712942659854889e-06, 3.071501851081848e-06, 3.4300610423088074e-06, 3.7886202335357666e-06, 4.147179424762726e-06, 4.505738615989685e-06, 4.864297807216644e-06, 5.2228569984436035e-06, 5.581416189670563e-06, 5.939975380897522e-06, 6.298534572124481e-06, 6.6570937633514404e-06, 7.0156529545784e-06, 7.374212145805359e-06, 7.732771337032318e-06, 8.091330528259277e-06, 8.449889719486237e-06, 8.808448910713196e-06, 9.167008101940155e-06, 9.525567293167114e-06, 9.884126484394073e-06, 1.0242685675621033e-05, 1.0601244866847992e-05, 1.0959804058074951e-05, 1.131836324930191e-05, 1.167692244052887e-05, 1.2035481631755829e-05, 1.2394040822982788e-05, 1.2752600014209747e-05, 1.3111159205436707e-05, 1.3469718396663666e-05, 1.3828277587890625e-05]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 9.0, 24.0, 81.0, 264.0, 1070.0, 4767.0, 31365.0, 988124.0, 18471.0, 3252.0, 764.0, 213.0, 58.0, 24.0, 8.0, 3.0, 6.0, 5.0, 4.0, 5.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01319122314453125, -0.012726426124572754, -0.012261629104614258, -0.011796832084655762, -0.011332035064697266, -0.01086723804473877, -0.010402441024780273, -0.009937644004821777, -0.009472846984863281, -0.009008049964904785, -0.008543252944946289, -0.008078455924987793, -0.007613658905029297, -0.007148861885070801, -0.006684064865112305, -0.006219267845153809, -0.0057544708251953125, -0.005289673805236816, -0.00482487678527832, -0.004360079765319824, -0.003895282745361328, -0.003430485725402832, -0.002965688705444336, -0.00250089168548584, -0.0020360946655273438, -0.0015712976455688477, -0.0011065006256103516, -0.0006417036056518555, -0.00017690658569335938, 0.0002878904342651367, 0.0007526874542236328, 0.001217484474182129, 0.001682281494140625, 0.002147078514099121, 0.002611875534057617, 0.0030766725540161133, 0.0035414695739746094, 0.0040062665939331055, 0.0044710636138916016, 0.004935860633850098, 0.005400657653808594, 0.00586545467376709, 0.006330251693725586, 0.006795048713684082, 0.007259845733642578, 0.007724642753601074, 0.00818943977355957, 0.008654236793518066, 0.009119033813476562, 0.009583830833435059, 0.010048627853393555, 0.01051342487335205, 0.010978221893310547, 0.011443018913269043, 0.011907815933227539, 0.012372612953186035, 0.012837409973144531, 0.013302206993103027, 0.013767004013061523, 0.01423180103302002, 0.014696598052978516, 0.015161395072937012, 0.015626192092895508, 0.016090989112854004, 0.0165557861328125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 5.0, 3.0, 9.0, 7.0, 10.0, 12.0, 32.0, 91.0, 347.0, 285.0, 90.0, 29.0, 11.0, 7.0, 3.0, 7.0, 0.0, 7.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0013990402221679688, -0.0013590008020401, -0.0013189613819122314, -0.0012789219617843628, -0.0012388825416564941, -0.0011988431215286255, -0.0011588037014007568, -0.0011187642812728882, -0.0010787248611450195, -0.0010386854410171509, -0.0009986460208892822, -0.0009586066007614136, -0.0009185671806335449, -0.0008785277605056763, -0.0008384883403778076, -0.000798448920249939, -0.0007584095001220703, -0.0007183700799942017, -0.000678330659866333, -0.0006382912397384644, -0.0005982518196105957, -0.000558212399482727, -0.0005181729793548584, -0.00047813355922698975, -0.0004380941390991211, -0.00039805471897125244, -0.0003580152988433838, -0.00031797587871551514, -0.0002779364585876465, -0.00023789703845977783, -0.00019785761833190918, -0.00015781819820404053, -0.00011777877807617188, -7.773935794830322e-05, -3.769993782043457e-05, 2.339482307434082e-06, 4.2378902435302734e-05, 8.241832256317139e-05, 0.00012245774269104004, 0.0001624971628189087, 0.00020253658294677734, 0.000242576003074646, 0.00028261542320251465, 0.0003226548433303833, 0.00036269426345825195, 0.0004027336835861206, 0.00044277310371398926, 0.0004828125238418579, 0.0005228519439697266, 0.0005628913640975952, 0.0006029307842254639, 0.0006429702043533325, 0.0006830096244812012, 0.0007230490446090698, 0.0007630884647369385, 0.0008031278848648071, 0.0008431673049926758, 0.0008832067251205444, 0.0009232461452484131, 0.0009632855653762817, 0.0010033249855041504, 0.001043364405632019, 0.0010834038257598877, 0.0011234432458877563, 0.001163482666015625]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 11.0, 11.0, 11.0, 14.0, 26.0, 34.0, 39.0, 45.0, 69.0, 76.0, 108.0, 91.0, 100.0, 96.0, 67.0, 46.0, 43.0, 36.0, 30.0, 12.0, 10.0, 7.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.02553023025393486, -0.02488432079553604, -0.02423841319978237, -0.023592503741383553, -0.022946596145629883, -0.022300686687231064, -0.021654777228832245, -0.021008867770433426, -0.020362960174679756, -0.019717050716280937, -0.019071143120527267, -0.01842523366212845, -0.01777932420372963, -0.01713341660797596, -0.01648750714957714, -0.01584159955382347, -0.015195690095424652, -0.014549781568348408, -0.013903873041272163, -0.013257963582873344, -0.0126120550557971, -0.011966146528720856, -0.011320237070322037, -0.010674328543245792, -0.010028420016169548, -0.009382511489093304, -0.00873660296201706, -0.00809069350361824, -0.007444784976541996, -0.006798876449465752, -0.00615296745672822, -0.005507058463990688, -0.004861149936914444, -0.0042152414098382, -0.003569332417100668, -0.00292342365719378, -0.002277514897286892, -0.001631606137380004, -0.000985697377473116, -0.00033978838473558426, 0.0003061201423406601, 0.0009520289022475481, 0.0015979376621544361, 0.002243846422061324, 0.002889755181968212, 0.0035356639418751, 0.004181572701781988, 0.00482748169451952, 0.005473390221595764, 0.0061192987486720085, 0.00676520774140954, 0.007411116734147072, 0.008057025261223316, 0.00870293378829956, 0.00934884324669838, 0.009994751773774624, 0.010640660300850868, 0.011286568827927113, 0.011932477355003357, 0.012578386813402176, 0.01322429534047842, 0.013870203867554665, 0.014516113325953484, 0.015162021853029728, 0.015807930380105972]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 4.0, 5.0, 4.0, 5.0, 10.0, 6.0, 17.0, 11.0, 22.0, 21.0, 21.0, 24.0, 14.0, 35.0, 29.0, 34.0, 28.0, 41.0, 40.0, 33.0, 45.0, 41.0, 49.0, 40.0, 39.0, 59.0, 38.0, 26.0, 35.0, 34.0, 27.0, 27.0, 17.0, 13.0, 20.0, 12.0, 13.0, 12.0, 6.0, 5.0, 9.0, 7.0, 5.0, 8.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.012280215509235859, -0.011896738782525063, -0.011513262055814266, -0.01112978532910347, -0.010746309533715248, -0.010362832807004452, -0.009979356080293655, -0.009595879353582859, -0.009212402626872063, -0.008828925900161266, -0.00844544917345047, -0.008061972446739674, -0.0076784961856901646, -0.007295019458979368, -0.006911543197929859, -0.006528066471219063, -0.0061445897445082664, -0.00576111301779747, -0.005377636291086674, -0.004994160030037165, -0.004610683303326368, -0.004227206576615572, -0.0038437300827354193, -0.0034602535888552666, -0.00307677686214447, -0.002693300135433674, -0.002309823641553521, -0.0019263470312580466, -0.001542870420962572, -0.0011593938106670976, -0.000775917200371623, -0.00039244070649147034, -8.96397978067398e-06, 0.00037451263051480055, 0.0007579892408102751, 0.0011414658511057496, 0.0015249424614012241, 0.0019084190716966987, 0.002291895681992173, 0.002675372175872326, 0.0030588489025831223, 0.0034423256292939186, 0.0038258021231740713, 0.004209278617054224, 0.00459275534376502, 0.004976232070475817, 0.005359708331525326, 0.005743185058236122, 0.0061266617849469185, 0.006510138511657715, 0.006893615238368511, 0.00727709149941802, 0.007660568226128817, 0.008044044487178326, 0.008427521213889122, 0.008810997940599918, 0.009194474667310715, 0.009577951394021511, 0.009961428120732307, 0.010344904847443104, 0.0107283815741539, 0.011111857369542122, 0.011495334096252918, 0.011878810822963715, 0.012262287549674511]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 9.0, 3.0, 5.0, 8.0, 9.0, 7.0, 11.0, 19.0, 12.0, 15.0, 20.0, 44.0, 80.0, 127.0, 205.0, 370.0, 703.0, 1566.0, 3993.0, 12999.0, 83561.0, 3907674.0, 157419.0, 16920.0, 4835.0, 1787.0, 827.0, 436.0, 219.0, 117.0, 76.0, 38.0, 34.0, 20.0, 17.0, 12.0, 12.0, 15.0, 10.0, 8.0, 12.0, 5.0, 3.0, 7.0, 5.0, 0.0, 4.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.057830810546875, -0.05615854263305664, -0.05448627471923828, -0.05281400680541992, -0.05114173889160156, -0.0494694709777832, -0.047797203063964844, -0.046124935150146484, -0.044452667236328125, -0.042780399322509766, -0.041108131408691406, -0.03943586349487305, -0.03776359558105469, -0.03609132766723633, -0.03441905975341797, -0.03274679183959961, -0.03107452392578125, -0.02940225601196289, -0.02772998809814453, -0.026057720184326172, -0.024385452270507812, -0.022713184356689453, -0.021040916442871094, -0.019368648529052734, -0.017696380615234375, -0.016024112701416016, -0.014351844787597656, -0.012679576873779297, -0.011007308959960938, -0.009335041046142578, -0.007662773132324219, -0.005990505218505859, -0.0043182373046875, -0.0026459693908691406, -0.0009737014770507812, 0.0006985664367675781, 0.0023708343505859375, 0.004043102264404297, 0.005715370178222656, 0.007387638092041016, 0.009059906005859375, 0.010732173919677734, 0.012404441833496094, 0.014076709747314453, 0.015748977661132812, 0.017421245574951172, 0.01909351348876953, 0.02076578140258789, 0.02243804931640625, 0.02411031723022461, 0.02578258514404297, 0.027454853057861328, 0.029127120971679688, 0.030799388885498047, 0.032471656799316406, 0.034143924713134766, 0.035816192626953125, 0.037488460540771484, 0.039160728454589844, 0.0408329963684082, 0.04250526428222656, 0.04417753219604492, 0.04584980010986328, 0.04752206802368164, 0.0491943359375]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 6.0, 6.0, 13.0, 5.0, 11.0, 14.0, 19.0, 23.0, 29.0, 29.0, 33.0, 33.0, 40.0, 42.0, 32.0, 43.0, 40.0, 44.0, 39.0, 33.0, 45.0, 44.0, 46.0, 55.0, 39.0, 36.0, 27.0, 32.0, 32.0, 22.0, 12.0, 12.0, 9.0, 7.0, 5.0, 9.0, 5.0, 5.0, 5.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.01088714599609375, -0.010561347007751465, -0.01023554801940918, -0.009909749031066895, -0.00958395004272461, -0.009258151054382324, -0.008932352066040039, -0.008606553077697754, -0.008280754089355469, -0.007954955101013184, -0.0076291561126708984, -0.007303357124328613, -0.006977558135986328, -0.006651759147644043, -0.006325960159301758, -0.006000161170959473, -0.0056743621826171875, -0.005348563194274902, -0.005022764205932617, -0.004696965217590332, -0.004371166229248047, -0.004045367240905762, -0.0037195682525634766, -0.0033937692642211914, -0.0030679702758789062, -0.002742171287536621, -0.002416372299194336, -0.0020905733108520508, -0.0017647743225097656, -0.0014389753341674805, -0.0011131763458251953, -0.0007873773574829102, -0.000461578369140625, -0.00013577938079833984, 0.0001900196075439453, 0.0005158185958862305, 0.0008416175842285156, 0.0011674165725708008, 0.001493215560913086, 0.001819014549255371, 0.0021448135375976562, 0.0024706125259399414, 0.0027964115142822266, 0.0031222105026245117, 0.003448009490966797, 0.003773808479309082, 0.004099607467651367, 0.004425406455993652, 0.0047512054443359375, 0.005077004432678223, 0.005402803421020508, 0.005728602409362793, 0.006054401397705078, 0.006380200386047363, 0.0067059993743896484, 0.007031798362731934, 0.007357597351074219, 0.007683396339416504, 0.008009195327758789, 0.008334994316101074, 0.00866079330444336, 0.008986592292785645, 0.00931239128112793, 0.009638190269470215, 0.0099639892578125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 9.0, 5.0, 9.0, 10.0, 22.0, 36.0, 41.0, 86.0, 265.0, 994.0, 7056.0, 235354.0, 3928452.0, 19329.0, 1928.0, 403.0, 119.0, 61.0, 37.0, 14.0, 16.0, 4.0, 7.0, 7.0, 2.0, 1.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1439208984375, -0.1394500732421875, -0.134979248046875, -0.1305084228515625, -0.12603759765625, -0.1215667724609375, -0.117095947265625, -0.1126251220703125, -0.108154296875, -0.1036834716796875, -0.099212646484375, -0.0947418212890625, -0.09027099609375, -0.0858001708984375, -0.081329345703125, -0.0768585205078125, -0.0723876953125, -0.0679168701171875, -0.063446044921875, -0.0589752197265625, -0.05450439453125, -0.0500335693359375, -0.045562744140625, -0.0410919189453125, -0.03662109375, -0.0321502685546875, -0.027679443359375, -0.0232086181640625, -0.01873779296875, -0.0142669677734375, -0.009796142578125, -0.0053253173828125, -0.0008544921875, 0.0036163330078125, 0.008087158203125, 0.0125579833984375, 0.01702880859375, 0.0214996337890625, 0.025970458984375, 0.0304412841796875, 0.034912109375, 0.0393829345703125, 0.043853759765625, 0.0483245849609375, 0.05279541015625, 0.0572662353515625, 0.061737060546875, 0.0662078857421875, 0.0706787109375, 0.0751495361328125, 0.079620361328125, 0.0840911865234375, 0.08856201171875, 0.0930328369140625, 0.097503662109375, 0.1019744873046875, 0.1064453125, 0.1109161376953125, 0.115386962890625, 0.1198577880859375, 0.12432861328125, 0.1287994384765625, 0.133270263671875, 0.1377410888671875, 0.1422119140625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 4.0, 7.0, 12.0, 20.0, 25.0, 21.0, 36.0, 48.0, 56.0, 103.0, 173.0, 398.0, 803.0, 1075.0, 554.0, 250.0, 141.0, 90.0, 53.0, 47.0, 30.0, 19.0, 20.0, 14.0, 16.0, 14.0, 8.0, 3.0, 2.0, 5.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.007476806640625, -0.007237434387207031, -0.0069980621337890625, -0.006758689880371094, -0.006519317626953125, -0.006279945373535156, -0.0060405731201171875, -0.005801200866699219, -0.00556182861328125, -0.005322456359863281, -0.0050830841064453125, -0.004843711853027344, -0.004604339599609375, -0.004364967346191406, -0.0041255950927734375, -0.0038862228393554688, -0.0036468505859375, -0.0034074783325195312, -0.0031681060791015625, -0.0029287338256835938, -0.002689361572265625, -0.0024499893188476562, -0.0022106170654296875, -0.0019712448120117188, -0.00173187255859375, -0.0014925003051757812, -0.0012531280517578125, -0.0010137557983398438, -0.000774383544921875, -0.0005350112915039062, -0.0002956390380859375, -5.626678466796875e-05, 0.00018310546875, 0.00042247772216796875, 0.0006618499755859375, 0.0009012222290039062, 0.001140594482421875, 0.0013799667358398438, 0.0016193389892578125, 0.0018587112426757812, 0.00209808349609375, 0.0023374557495117188, 0.0025768280029296875, 0.0028162002563476562, 0.003055572509765625, 0.0032949447631835938, 0.0035343170166015625, 0.0037736892700195312, 0.0040130615234375, 0.004252433776855469, 0.0044918060302734375, 0.004731178283691406, 0.004970550537109375, 0.005209922790527344, 0.0054492950439453125, 0.005688667297363281, 0.00592803955078125, 0.006167411804199219, 0.0064067840576171875, 0.006646156311035156, 0.006885528564453125, 0.007124900817871094, 0.0073642730712890625, 0.007603645324707031, 0.007843017578125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 15.0, 26.0, 49.0, 80.0, 135.0, 171.0, 188.0, 139.0, 76.0, 54.0, 34.0, 21.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0270912554115057, -0.02601061575114727, -0.024929974228143692, -0.023849334567785263, -0.022768694907426834, -0.021688055247068405, -0.020607415586709976, -0.019526774063706398, -0.01844613440334797, -0.01736549474298954, -0.016284853219985962, -0.015204213559627533, -0.014123573899269104, -0.013042934238910675, -0.011962293647229671, -0.010881653055548668, -0.009801013395190239, -0.00872037373483181, -0.007639733143150806, -0.00655909301713109, -0.005478452891111374, -0.004397812765091658, -0.0033171726390719414, -0.002236532513052225, -0.0011558923870325089, -7.525226101279259e-05, 0.0010053878650069237, 0.00208602799102664, 0.003166668117046356, 0.0042473082430660725, 0.005327948369085789, 0.006408588495105505, 0.007489226758480072, 0.008569866418838501, 0.009650507010519505, 0.010731147602200508, 0.011811787262558937, 0.012892426922917366, 0.01397306751459837, 0.015053708106279373, 0.016134347766637802, 0.01721498742699623, 0.01829562708735466, 0.019376268610358238, 0.020456908270716667, 0.021537547931075096, 0.022618189454078674, 0.023698829114437103, 0.024779468774795532, 0.02586010843515396, 0.02694074809551239, 0.02802138961851597, 0.029102029278874397, 0.030182668939232826, 0.031263310462236404, 0.03234395012259483, 0.03342458978295326, 0.03450522944331169, 0.03558586910367012, 0.03666650876402855, 0.03774715214967728, 0.038827791810035706, 0.039908431470394135, 0.040989071130752563, 0.04206971079111099]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 10.0, 7.0, 13.0, 14.0, 12.0, 15.0, 11.0, 17.0, 26.0, 16.0, 19.0, 33.0, 38.0, 24.0, 34.0, 39.0, 45.0, 32.0, 34.0, 36.0, 38.0, 31.0, 29.0, 44.0, 37.0, 31.0, 30.0, 28.0, 29.0, 31.0, 32.0, 17.0, 18.0, 20.0, 16.0, 12.0, 9.0, 14.0, 13.0, 8.0, 6.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009933240711688995, -0.009593583643436432, -0.009253925643861294, -0.00891426857560873, -0.008574610576033592, -0.008234953507781029, -0.00789529550820589, -0.007555638439953327, -0.007215980440378189, -0.006876322906464338, -0.0065366653725504875, -0.006197007838636637, -0.005857350304722786, -0.005517692770808935, -0.005178035236895084, -0.004838378168642521, -0.00449872063472867, -0.004159063100814819, -0.0038194055669009686, -0.0034797480329871178, -0.003140090499073267, -0.002800432965159416, -0.002460775664076209, -0.0021211181301623583, -0.0017814605962485075, -0.0014418030623346567, -0.001102145528420806, -0.000762488110922277, -0.0004228305770084262, -8.31730430945754e-05, 0.00025648437440395355, 0.0005961419083178043, 0.0009357994422316551, 0.001275456976145506, 0.0016151145100593567, 0.0019547720439732075, 0.0022944295778870583, 0.002634087111800909, 0.002973744412884116, 0.003313401946797967, 0.0036530594807118177, 0.003992716781795025, 0.004332374315708876, 0.0046720318496227264, 0.005011689383536577, 0.005351346917450428, 0.005691004451364279, 0.00603066198527813, 0.00637031951919198, 0.006709977053105831, 0.007049634587019682, 0.007389292120933533, 0.0077289496548473835, 0.008068607188761234, 0.008408264257013798, 0.008747922256588936, 0.0090875793248415, 0.009427236393094063, 0.009766894392669201, 0.010106551460921764, 0.010446209460496902, 0.010785866528749466, 0.011125524528324604, 0.011465181596577168, 0.011804839596152306]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 17.0, 12.0, 21.0, 37.0, 53.0, 74.0, 77.0, 140.0, 193.0, 314.0, 455.0, 658.0, 1053.0, 1599.0, 2548.0, 3868.0, 6030.0, 10413.0, 17244.0, 29168.0, 51787.0, 96185.0, 201938.0, 302647.0, 147183.0, 73861.0, 40663.0, 23463.0, 13967.0, 8350.0, 5214.0, 3208.0, 2139.0, 1290.0, 885.0, 630.0, 345.0, 272.0, 143.0, 122.0, 94.0, 60.0, 36.0, 27.0, 27.0, 15.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.006511688232421875, -0.006316125392913818, -0.006120562553405762, -0.005924999713897705, -0.0057294368743896484, -0.005533874034881592, -0.005338311195373535, -0.0051427483558654785, -0.004947185516357422, -0.004751622676849365, -0.004556059837341309, -0.004360496997833252, -0.004164934158325195, -0.003969371318817139, -0.003773808479309082, -0.0035782456398010254, -0.0033826828002929688, -0.003187119960784912, -0.0029915571212768555, -0.002795994281768799, -0.002600431442260742, -0.0024048686027526855, -0.002209305763244629, -0.0020137429237365723, -0.0018181800842285156, -0.001622617244720459, -0.0014270544052124023, -0.0012314915657043457, -0.001035928726196289, -0.0008403658866882324, -0.0006448030471801758, -0.00044924020767211914, -0.0002536773681640625, -5.811452865600586e-05, 0.00013744831085205078, 0.0003330111503601074, 0.0005285739898681641, 0.0007241368293762207, 0.0009196996688842773, 0.001115262508392334, 0.0013108253479003906, 0.0015063881874084473, 0.001701951026916504, 0.0018975138664245605, 0.002093076705932617, 0.002288639545440674, 0.0024842023849487305, 0.002679765224456787, 0.0028753280639648438, 0.0030708909034729004, 0.003266453742980957, 0.0034620165824890137, 0.0036575794219970703, 0.003853142261505127, 0.004048705101013184, 0.00424426794052124, 0.004439830780029297, 0.0046353936195373535, 0.00483095645904541, 0.005026519298553467, 0.0052220821380615234, 0.00541764497756958, 0.005613207817077637, 0.005808770656585693, 0.00600433349609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 7.0, 4.0, 1.0, 11.0, 8.0, 11.0, 10.0, 15.0, 16.0, 13.0, 19.0, 26.0, 21.0, 28.0, 28.0, 35.0, 42.0, 37.0, 42.0, 36.0, 45.0, 38.0, 35.0, 41.0, 42.0, 29.0, 36.0, 31.0, 33.0, 30.0, 36.0, 23.0, 26.0, 21.0, 26.0, 16.0, 17.0, 11.0, 9.0, 12.0, 11.0, 5.0, 4.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01070404052734375, -0.010340213775634766, -0.009976387023925781, -0.009612560272216797, -0.009248733520507812, -0.008884906768798828, -0.008521080017089844, -0.00815725326538086, -0.007793426513671875, -0.007429599761962891, -0.007065773010253906, -0.006701946258544922, -0.0063381195068359375, -0.005974292755126953, -0.005610466003417969, -0.005246639251708984, -0.0048828125, -0.004518985748291016, -0.004155158996582031, -0.003791332244873047, -0.0034275054931640625, -0.003063678741455078, -0.0026998519897460938, -0.0023360252380371094, -0.001972198486328125, -0.0016083717346191406, -0.0012445449829101562, -0.0008807182312011719, -0.0005168914794921875, -0.00015306472778320312, 0.00021076202392578125, 0.0005745887756347656, 0.00093841552734375, 0.0013022422790527344, 0.0016660690307617188, 0.002029895782470703, 0.0023937225341796875, 0.002757549285888672, 0.0031213760375976562, 0.0034852027893066406, 0.003849029541015625, 0.004212856292724609, 0.004576683044433594, 0.004940509796142578, 0.0053043365478515625, 0.005668163299560547, 0.006031990051269531, 0.006395816802978516, 0.0067596435546875, 0.007123470306396484, 0.007487297058105469, 0.007851123809814453, 0.008214950561523438, 0.008578777313232422, 0.008942604064941406, 0.00930643081665039, 0.009670257568359375, 0.01003408432006836, 0.010397911071777344, 0.010761737823486328, 0.011125564575195312, 0.011489391326904297, 0.011853218078613281, 0.012217044830322266, 0.01258087158203125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 6.0, 5.0, 11.0, 11.0, 9.0, 15.0, 36.0, 51.0, 63.0, 87.0, 123.0, 161.0, 260.0, 328.0, 488.0, 710.0, 1009.0, 1486.0, 2041.0, 3136.0, 4601.0, 6948.0, 10629.0, 16650.0, 27488.0, 48376.0, 93047.0, 213072.0, 323002.0, 134607.0, 64714.0, 35546.0, 21028.0, 12943.0, 8332.0, 5581.0, 3713.0, 2560.0, 1693.0, 1218.0, 792.0, 605.0, 403.0, 284.0, 197.0, 139.0, 93.0, 89.0, 46.0, 44.0, 28.0, 27.0, 8.0, 6.0, 5.0, 4.0, 9.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.005588531494140625, -0.005409598350524902, -0.00523066520690918, -0.005051732063293457, -0.004872798919677734, -0.004693865776062012, -0.004514932632446289, -0.004335999488830566, -0.004157066345214844, -0.003978133201599121, -0.0037992000579833984, -0.0036202669143676758, -0.003441333770751953, -0.0032624006271362305, -0.003083467483520508, -0.002904534339904785, -0.0027256011962890625, -0.00254666805267334, -0.002367734909057617, -0.0021888017654418945, -0.002009868621826172, -0.0018309354782104492, -0.0016520023345947266, -0.001473069190979004, -0.0012941360473632812, -0.0011152029037475586, -0.0009362697601318359, -0.0007573366165161133, -0.0005784034729003906, -0.00039947032928466797, -0.0002205371856689453, -4.1604042053222656e-05, 0.0001373291015625, 0.00031626224517822266, 0.0004951953887939453, 0.000674128532409668, 0.0008530616760253906, 0.0010319948196411133, 0.001210927963256836, 0.0013898611068725586, 0.0015687942504882812, 0.001747727394104004, 0.0019266605377197266, 0.0021055936813354492, 0.002284526824951172, 0.0024634599685668945, 0.002642393112182617, 0.00282132625579834, 0.0030002593994140625, 0.003179192543029785, 0.003358125686645508, 0.0035370588302612305, 0.003715991973876953, 0.0038949251174926758, 0.0040738582611083984, 0.004252791404724121, 0.004431724548339844, 0.004610657691955566, 0.004789590835571289, 0.004968523979187012, 0.005147457122802734, 0.005326390266418457, 0.00550532341003418, 0.005684256553649902, 0.005863189697265625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 4.0, 2.0, 0.0, 4.0, 8.0, 9.0, 6.0, 10.0, 8.0, 10.0, 13.0, 18.0, 27.0, 24.0, 23.0, 30.0, 33.0, 38.0, 42.0, 36.0, 43.0, 52.0, 38.0, 34.0, 45.0, 46.0, 38.0, 23.0, 34.0, 37.0, 28.0, 33.0, 31.0, 25.0, 19.0, 22.0, 15.0, 12.0, 19.0, 11.0, 15.0, 7.0, 9.0, 4.0, 7.0, 5.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007617950439453125, -0.007378280162811279, -0.007138609886169434, -0.006898939609527588, -0.006659269332885742, -0.0064195990562438965, -0.006179928779602051, -0.005940258502960205, -0.005700588226318359, -0.005460917949676514, -0.005221247673034668, -0.004981577396392822, -0.0047419071197509766, -0.004502236843109131, -0.004262566566467285, -0.0040228962898254395, -0.0037832260131835938, -0.003543555736541748, -0.0033038854598999023, -0.0030642151832580566, -0.002824544906616211, -0.0025848746299743652, -0.0023452043533325195, -0.002105534076690674, -0.0018658638000488281, -0.0016261935234069824, -0.0013865232467651367, -0.001146852970123291, -0.0009071826934814453, -0.0006675124168395996, -0.0004278421401977539, -0.0001881718635559082, 5.14984130859375e-05, 0.0002911686897277832, 0.0005308389663696289, 0.0007705092430114746, 0.0010101795196533203, 0.001249849796295166, 0.0014895200729370117, 0.0017291903495788574, 0.001968860626220703, 0.002208530902862549, 0.0024482011795043945, 0.0026878714561462402, 0.002927541732788086, 0.0031672120094299316, 0.0034068822860717773, 0.003646552562713623, 0.0038862228393554688, 0.0041258931159973145, 0.00436556339263916, 0.004605233669281006, 0.0048449039459228516, 0.005084574222564697, 0.005324244499206543, 0.005563914775848389, 0.005803585052490234, 0.00604325532913208, 0.006282925605773926, 0.0065225958824157715, 0.006762266159057617, 0.007001936435699463, 0.007241606712341309, 0.007481276988983154, 0.007720947265625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 18.0, 12.0, 15.0, 18.0, 34.0, 44.0, 63.0, 121.0, 159.0, 250.0, 356.0, 554.0, 796.0, 1379.0, 2282.0, 4067.0, 7672.0, 15734.0, 35060.0, 93602.0, 493024.0, 269916.0, 68208.0, 27278.0, 12597.0, 6429.0, 3469.0, 2019.0, 1198.0, 726.0, 458.0, 305.0, 209.0, 148.0, 92.0, 60.0, 46.0, 41.0, 21.0, 20.0, 16.0, 6.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.00025844573974609375, -0.0002503320574760437, -0.00024221837520599365, -0.0002341046929359436, -0.00022599101066589355, -0.0002178773283958435, -0.00020976364612579346, -0.0002016499638557434, -0.00019353628158569336, -0.0001854225993156433, -0.00017730891704559326, -0.0001691952347755432, -0.00016108155250549316, -0.00015296787023544312, -0.00014485418796539307, -0.00013674050569534302, -0.00012862682342529297, -0.00012051314115524292, -0.00011239945888519287, -0.00010428577661514282, -9.617209434509277e-05, -8.805841207504272e-05, -7.994472980499268e-05, -7.183104753494263e-05, -6.371736526489258e-05, -5.560368299484253e-05, -4.749000072479248e-05, -3.937631845474243e-05, -3.126263618469238e-05, -2.3148953914642334e-05, -1.5035271644592285e-05, -6.921589374542236e-06, 1.1920928955078125e-06, 9.305775165557861e-06, 1.741945743560791e-05, 2.553313970565796e-05, 3.364682197570801e-05, 4.176050424575806e-05, 4.9874186515808105e-05, 5.7987868785858154e-05, 6.61015510559082e-05, 7.421523332595825e-05, 8.23289155960083e-05, 9.044259786605835e-05, 9.85562801361084e-05, 0.00010666996240615845, 0.0001147836446762085, 0.00012289732694625854, 0.0001310110092163086, 0.00013912469148635864, 0.0001472383737564087, 0.00015535205602645874, 0.0001634657382965088, 0.00017157942056655884, 0.0001796931028366089, 0.00018780678510665894, 0.00019592046737670898, 0.00020403414964675903, 0.00021214783191680908, 0.00022026151418685913, 0.00022837519645690918, 0.00023648887872695923, 0.0002446025609970093, 0.0002527162432670593, 0.0002608299255371094]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 8.0, 13.0, 10.0, 34.0, 34.0, 67.0, 61.0, 93.0, 91.0, 136.0, 113.0, 89.0, 69.0, 39.0, 43.0, 24.0, 23.0, 6.0, 13.0, 9.0, 3.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9669532775878906e-05, -1.904275268316269e-05, -1.8415972590446472e-05, -1.7789192497730255e-05, -1.7162412405014038e-05, -1.653563231229782e-05, -1.5908852219581604e-05, -1.5282072126865387e-05, -1.465529203414917e-05, -1.4028511941432953e-05, -1.3401731848716736e-05, -1.2774951756000519e-05, -1.2148171663284302e-05, -1.1521391570568085e-05, -1.0894611477851868e-05, -1.026783138513565e-05, -9.641051292419434e-06, -9.014271199703217e-06, -8.387491106987e-06, -7.760711014270782e-06, -7.1339309215545654e-06, -6.507150828838348e-06, -5.880370736122131e-06, -5.253590643405914e-06, -4.626810550689697e-06, -4.00003045797348e-06, -3.373250365257263e-06, -2.746470272541046e-06, -2.119690179824829e-06, -1.492910087108612e-06, -8.66129994392395e-07, -2.39349901676178e-07, 3.8743019104003906e-07, 1.014210283756256e-06, 1.6409903764724731e-06, 2.26777046918869e-06, 2.8945505619049072e-06, 3.5213306546211243e-06, 4.148110747337341e-06, 4.774890840053558e-06, 5.401670932769775e-06, 6.0284510254859924e-06, 6.6552311182022095e-06, 7.2820112109184265e-06, 7.908791303634644e-06, 8.53557139635086e-06, 9.162351489067078e-06, 9.789131581783295e-06, 1.0415911674499512e-05, 1.1042691767215729e-05, 1.1669471859931946e-05, 1.2296251952648163e-05, 1.292303204536438e-05, 1.3549812138080597e-05, 1.4176592230796814e-05, 1.4803372323513031e-05, 1.5430152416229248e-05, 1.6056932508945465e-05, 1.6683712601661682e-05, 1.73104926943779e-05, 1.7937272787094116e-05, 1.8564052879810333e-05, 1.919083297252655e-05, 1.9817613065242767e-05, 2.0444393157958984e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 10.0, 10.0, 10.0, 9.0, 24.0, 24.0, 37.0, 63.0, 100.0, 204.0, 565.0, 2604.0, 22620.0, 759194.0, 249687.0, 11001.0, 1534.0, 428.0, 163.0, 91.0, 39.0, 42.0, 13.0, 18.0, 18.0, 10.0, 5.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0011281967163085938, -0.0010958313941955566, -0.0010634660720825195, -0.0010311007499694824, -0.0009987354278564453, -0.0009663701057434082, -0.0009340047836303711, -0.000901639461517334, -0.0008692741394042969, -0.0008369088172912598, -0.0008045434951782227, -0.0007721781730651855, -0.0007398128509521484, -0.0007074475288391113, -0.0006750822067260742, -0.0006427168846130371, -0.0006103515625, -0.0005779862403869629, -0.0005456209182739258, -0.0005132555961608887, -0.00048089027404785156, -0.00044852495193481445, -0.00041615962982177734, -0.00038379430770874023, -0.0003514289855957031, -0.000319063663482666, -0.0002866983413696289, -0.0002543330192565918, -0.0002219676971435547, -0.00018960237503051758, -0.00015723705291748047, -0.00012487173080444336, -9.250640869140625e-05, -6.014108657836914e-05, -2.777576446533203e-05, 4.589557647705078e-06, 3.695487976074219e-05, 6.93202018737793e-05, 0.0001016855239868164, 0.00013405084609985352, 0.00016641616821289062, 0.00019878149032592773, 0.00023114681243896484, 0.00026351213455200195, 0.00029587745666503906, 0.00032824277877807617, 0.0003606081008911133, 0.0003929734230041504, 0.0004253387451171875, 0.0004577040672302246, 0.0004900693893432617, 0.0005224347114562988, 0.0005548000335693359, 0.000587165355682373, 0.0006195306777954102, 0.0006518959999084473, 0.0006842613220214844, 0.0007166266441345215, 0.0007489919662475586, 0.0007813572883605957, 0.0008137226104736328, 0.0008460879325866699, 0.000878453254699707, 0.0009108185768127441, 0.0009431838989257812]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 5.0, 9.0, 9.0, 6.0, 11.0, 8.0, 17.0, 21.0, 24.0, 27.0, 30.0, 34.0, 64.0, 79.0, 144.0, 124.0, 97.0, 54.0, 51.0, 39.0, 24.0, 20.0, 16.0, 25.0, 12.0, 8.0, 11.0, 5.0, 10.0, 5.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.854534149169922e-05, -6.646569818258286e-05, -6.438605487346649e-05, -6.230641156435013e-05, -6.0226768255233765e-05, -5.81471249461174e-05, -5.606748163700104e-05, -5.3987838327884674e-05, -5.190819501876831e-05, -4.982855170965195e-05, -4.7748908400535583e-05, -4.566926509141922e-05, -4.3589621782302856e-05, -4.150997847318649e-05, -3.943033516407013e-05, -3.7350691854953766e-05, -3.52710485458374e-05, -3.319140523672104e-05, -3.1111761927604675e-05, -2.9032118618488312e-05, -2.6952475309371948e-05, -2.4872832000255585e-05, -2.279318869113922e-05, -2.0713545382022858e-05, -1.8633902072906494e-05, -1.655425876379013e-05, -1.4474615454673767e-05, -1.2394972145557404e-05, -1.031532883644104e-05, -8.235685527324677e-06, -6.156042218208313e-06, -4.0763989090919495e-06, -1.996755599975586e-06, 8.288770914077759e-08, 2.162531018257141e-06, 4.242174327373505e-06, 6.321817636489868e-06, 8.401460945606232e-06, 1.0481104254722595e-05, 1.2560747563838959e-05, 1.4640390872955322e-05, 1.6720034182071686e-05, 1.879967749118805e-05, 2.0879320800304413e-05, 2.2958964109420776e-05, 2.503860741853714e-05, 2.7118250727653503e-05, 2.9197894036769867e-05, 3.127753734588623e-05, 3.3357180655002594e-05, 3.543682396411896e-05, 3.751646727323532e-05, 3.9596110582351685e-05, 4.167575389146805e-05, 4.375539720058441e-05, 4.5835040509700775e-05, 4.791468381881714e-05, 4.99943271279335e-05, 5.2073970437049866e-05, 5.415361374616623e-05, 5.623325705528259e-05, 5.8312900364398956e-05, 6.039254367351532e-05, 6.247218698263168e-05, 6.455183029174805e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 13.0, 9.0, 13.0, 20.0, 31.0, 32.0, 36.0, 51.0, 68.0, 66.0, 92.0, 92.0, 68.0, 94.0, 65.0, 47.0, 46.0, 35.0, 22.0, 20.0, 12.0, 20.0, 7.0, 15.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.016040945425629616, -0.015517537482082844, -0.014994129538536072, -0.0144707215949893, -0.013947313651442528, -0.01342390663921833, -0.012900498695671558, -0.012377090752124786, -0.011853682808578014, -0.011330274865031242, -0.01080686692148447, -0.010283458977937698, -0.009760051965713501, -0.009236643090844154, -0.008713236078619957, -0.008189828135073185, -0.007666420191526413, -0.007143012247979641, -0.006619604304432869, -0.006096196826547384, -0.005572788883000612, -0.00504938093945384, -0.0045259734615683556, -0.0040025655180215836, -0.0034791575744748116, -0.0029557496309280396, -0.002432341920211911, -0.001908934093080461, -0.0013855262659490108, -0.0008621183224022388, -0.0003387106116861105, 0.00018469709903001785, 0.0007081050425767899, 0.00123151286970824, 0.0017549206968396902, 0.0022783284075558186, 0.0028017363511025906, 0.0033251442946493626, 0.003848552005365491, 0.004371959716081619, 0.004895367659628391, 0.005418775603175163, 0.005942183546721935, 0.00646559102460742, 0.006988998968154192, 0.007512406911700964, 0.008035814389586449, 0.00855922233313322, 0.009082630276679993, 0.009606038220226765, 0.010129446163773537, 0.010652854107320309, 0.01117626205086708, 0.011699669063091278, 0.01222307700663805, 0.012746484950184822, 0.013269892893731594, 0.013793300837278366, 0.014316708780825138, 0.01484011672437191, 0.015363523736596107, 0.015886932611465454, 0.01641033962368965, 0.01693374663591385, 0.017457155510783195]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 6.0, 3.0, 0.0, 4.0, 0.0, 3.0, 5.0, 3.0, 9.0, 12.0, 10.0, 15.0, 9.0, 18.0, 14.0, 14.0, 22.0, 25.0, 17.0, 34.0, 36.0, 29.0, 41.0, 39.0, 41.0, 39.0, 30.0, 33.0, 37.0, 34.0, 28.0, 47.0, 41.0, 26.0, 32.0, 27.0, 30.0, 30.0, 25.0, 22.0, 20.0, 16.0, 11.0, 14.0, 11.0, 14.0, 7.0, 10.0, 6.0, 5.0, 2.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00948487501591444, -0.009158382192254066, -0.008831889368593693, -0.008505396544933319, -0.008178903721272945, -0.007852410897612572, -0.007525918073952198, -0.007199425250291824, -0.006872932426631451, -0.006546439602971077, -0.006219946779310703, -0.00589345395565033, -0.005566961131989956, -0.005240468308329582, -0.0049139754846692085, -0.004587482661008835, -0.0042609903030097485, -0.003934497479349375, -0.003608004655689001, -0.0032815118320286274, -0.0029550190083682537, -0.00262852618470788, -0.00230203359387815, -0.0019755407702177763, -0.0016490479465574026, -0.001322555122897029, -0.0009960622992366552, -0.0006695695919916034, -0.0003430767683312297, -1.6583944670856e-05, 0.00030990876257419586, 0.0006364015862345695, 0.0009628944098949432, 0.001289387233555317, 0.0016158800572156906, 0.0019423727644607425, 0.002268865704536438, 0.0025953585281968117, 0.0029218511190265417, 0.0032483439426869154, 0.003574836766347289, 0.0039013295900076628, 0.004227822180837393, 0.0045543150044977665, 0.00488080782815814, 0.005207300651818514, 0.0055337934754788876, 0.005860286299139261, 0.006186779122799635, 0.006513271946460009, 0.006839764770120382, 0.007166257593780756, 0.00749275041744113, 0.007819242775440216, 0.00814573559910059, 0.008472228422760963, 0.008798721246421337, 0.00912521407008171, 0.009451706893742085, 0.009778199717402458, 0.010104692541062832, 0.010431185364723206, 0.01075767818838358, 0.011084171012043953, 0.011410663835704327]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 6.0, 13.0, 8.0, 17.0, 20.0, 18.0, 21.0, 44.0, 60.0, 104.0, 256.0, 670.0, 2008.0, 6108.0, 19575.0, 68050.0, 234947.0, 434145.0, 200766.0, 56733.0, 16790.0, 5285.0, 1758.0, 618.0, 235.0, 99.0, 56.0, 25.0, 23.0, 17.0, 17.0, 12.0, 13.0, 13.0, 5.0, 5.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.07086181640625, -0.0689687728881836, -0.06707572937011719, -0.06518268585205078, -0.06328964233398438, -0.06139659881591797, -0.05950355529785156, -0.057610511779785156, -0.05571746826171875, -0.053824424743652344, -0.05193138122558594, -0.05003833770751953, -0.048145294189453125, -0.04625225067138672, -0.04435920715332031, -0.042466163635253906, -0.0405731201171875, -0.038680076599121094, -0.03678703308105469, -0.03489398956298828, -0.033000946044921875, -0.03110790252685547, -0.029214859008789062, -0.027321815490722656, -0.02542877197265625, -0.023535728454589844, -0.021642684936523438, -0.01974964141845703, -0.017856597900390625, -0.01596355438232422, -0.014070510864257812, -0.012177467346191406, -0.010284423828125, -0.008391380310058594, -0.0064983367919921875, -0.004605293273925781, -0.002712249755859375, -0.0008192062377929688, 0.0010738372802734375, 0.0029668807983398438, 0.00485992431640625, 0.006752967834472656, 0.008646011352539062, 0.010539054870605469, 0.012432098388671875, 0.014325141906738281, 0.016218185424804688, 0.018111228942871094, 0.0200042724609375, 0.021897315979003906, 0.023790359497070312, 0.02568340301513672, 0.027576446533203125, 0.02946949005126953, 0.03136253356933594, 0.033255577087402344, 0.03514862060546875, 0.037041664123535156, 0.03893470764160156, 0.04082775115966797, 0.042720794677734375, 0.04461383819580078, 0.04650688171386719, 0.048399925231933594, 0.05029296875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 3.0, 5.0, 10.0, 11.0, 8.0, 20.0, 22.0, 20.0, 28.0, 34.0, 44.0, 48.0, 49.0, 59.0, 60.0, 58.0, 66.0, 43.0, 73.0, 49.0, 40.0, 52.0, 32.0, 42.0, 25.0, 25.0, 22.0, 18.0, 13.0, 5.0, 9.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01399993896484375, -0.013604402542114258, -0.013208866119384766, -0.012813329696655273, -0.012417793273925781, -0.012022256851196289, -0.011626720428466797, -0.011231184005737305, -0.010835647583007812, -0.01044011116027832, -0.010044574737548828, -0.009649038314819336, -0.009253501892089844, -0.008857965469360352, -0.00846242904663086, -0.008066892623901367, -0.007671356201171875, -0.007275819778442383, -0.006880283355712891, -0.0064847469329833984, -0.006089210510253906, -0.005693674087524414, -0.005298137664794922, -0.00490260124206543, -0.0045070648193359375, -0.004111528396606445, -0.003715991973876953, -0.003320455551147461, -0.0029249191284179688, -0.0025293827056884766, -0.0021338462829589844, -0.0017383098602294922, -0.0013427734375, -0.0009472370147705078, -0.0005517005920410156, -0.00015616416931152344, 0.00023937225341796875, 0.0006349086761474609, 0.0010304450988769531, 0.0014259815216064453, 0.0018215179443359375, 0.0022170543670654297, 0.002612590789794922, 0.003008127212524414, 0.0034036636352539062, 0.0037992000579833984, 0.004194736480712891, 0.004590272903442383, 0.004985809326171875, 0.005381345748901367, 0.005776882171630859, 0.0061724185943603516, 0.006567955017089844, 0.006963491439819336, 0.007359027862548828, 0.00775456428527832, 0.008150100708007812, 0.008545637130737305, 0.008941173553466797, 0.009336709976196289, 0.009732246398925781, 0.010127782821655273, 0.010523319244384766, 0.010918855667114258, 0.01131439208984375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 4.0, 6.0, 10.0, 18.0, 11.0, 16.0, 23.0, 22.0, 31.0, 36.0, 47.0, 57.0, 82.0, 162.0, 394.0, 1211.0, 5408.0, 32101.0, 228860.0, 596760.0, 155940.0, 21754.0, 3848.0, 930.0, 315.0, 133.0, 67.0, 67.0, 40.0, 25.0, 22.0, 20.0, 23.0, 19.0, 20.0, 12.0, 13.0, 6.0, 5.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0], "bins": [-0.0921630859375, -0.08955955505371094, -0.08695602416992188, -0.08435249328613281, -0.08174896240234375, -0.07914543151855469, -0.07654190063476562, -0.07393836975097656, -0.0713348388671875, -0.06873130798339844, -0.06612777709960938, -0.06352424621582031, -0.06092071533203125, -0.05831718444824219, -0.055713653564453125, -0.05311012268066406, -0.050506591796875, -0.04790306091308594, -0.045299530029296875, -0.04269599914550781, -0.04009246826171875, -0.03748893737792969, -0.034885406494140625, -0.03228187561035156, -0.0296783447265625, -0.027074813842773438, -0.024471282958984375, -0.021867752075195312, -0.01926422119140625, -0.016660690307617188, -0.014057159423828125, -0.011453628540039062, -0.00885009765625, -0.0062465667724609375, -0.003643035888671875, -0.0010395050048828125, 0.00156402587890625, 0.0041675567626953125, 0.006771087646484375, 0.009374618530273438, 0.0119781494140625, 0.014581680297851562, 0.017185211181640625, 0.019788742065429688, 0.02239227294921875, 0.024995803833007812, 0.027599334716796875, 0.030202865600585938, 0.032806396484375, 0.03540992736816406, 0.038013458251953125, 0.04061698913574219, 0.04322052001953125, 0.04582405090332031, 0.048427581787109375, 0.05103111267089844, 0.0536346435546875, 0.05623817443847656, 0.058841705322265625, 0.06144523620605469, 0.06404876708984375, 0.06665229797363281, 0.06925582885742188, 0.07185935974121094, 0.074462890625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 5.0, 7.0, 12.0, 15.0, 8.0, 23.0, 24.0, 23.0, 28.0, 22.0, 28.0, 39.0, 46.0, 35.0, 31.0, 36.0, 43.0, 43.0, 36.0, 38.0, 47.0, 52.0, 43.0, 38.0, 40.0, 27.0, 30.0, 28.0, 28.0, 24.0, 15.0, 18.0, 18.0, 12.0, 9.0, 4.0, 6.0, 2.0, 2.0, 5.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00818634033203125, -0.007897019386291504, -0.007607698440551758, -0.007318377494812012, -0.007029056549072266, -0.0067397356033325195, -0.0064504146575927734, -0.006161093711853027, -0.005871772766113281, -0.005582451820373535, -0.005293130874633789, -0.005003809928894043, -0.004714488983154297, -0.004425168037414551, -0.004135847091674805, -0.0038465261459350586, -0.0035572052001953125, -0.0032678842544555664, -0.0029785633087158203, -0.0026892423629760742, -0.002399921417236328, -0.002110600471496582, -0.001821279525756836, -0.0015319585800170898, -0.0012426376342773438, -0.0009533166885375977, -0.0006639957427978516, -0.00037467479705810547, -8.535385131835938e-05, 0.00020396709442138672, 0.0004932880401611328, 0.0007826089859008789, 0.001071929931640625, 0.001361250877380371, 0.0016505718231201172, 0.0019398927688598633, 0.0022292137145996094, 0.0025185346603393555, 0.0028078556060791016, 0.0030971765518188477, 0.0033864974975585938, 0.00367581844329834, 0.003965139389038086, 0.004254460334777832, 0.004543781280517578, 0.004833102226257324, 0.00512242317199707, 0.005411744117736816, 0.0057010650634765625, 0.005990386009216309, 0.006279706954956055, 0.006569027900695801, 0.006858348846435547, 0.007147669792175293, 0.007436990737915039, 0.007726311683654785, 0.008015632629394531, 0.008304953575134277, 0.008594274520874023, 0.00888359546661377, 0.009172916412353516, 0.009462237358093262, 0.009751558303833008, 0.010040879249572754, 0.0103302001953125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 2.0, 6.0, 14.0, 24.0, 26.0, 38.0, 45.0, 69.0, 143.0, 244.0, 533.0, 984.0, 2251.0, 5170.0, 15134.0, 67638.0, 739577.0, 176923.0, 25912.0, 7896.0, 3073.0, 1386.0, 660.0, 335.0, 185.0, 83.0, 58.0, 43.0, 34.0, 20.0, 7.0, 8.0, 9.0, 7.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0027446746826171875, -0.00266990065574646, -0.0025951266288757324, -0.002520352602005005, -0.0024455785751342773, -0.00237080454826355, -0.0022960305213928223, -0.0022212564945220947, -0.002146482467651367, -0.0020717084407806396, -0.001996934413909912, -0.0019221603870391846, -0.001847386360168457, -0.0017726123332977295, -0.001697838306427002, -0.0016230642795562744, -0.0015482902526855469, -0.0014735162258148193, -0.0013987421989440918, -0.0013239681720733643, -0.0012491941452026367, -0.0011744201183319092, -0.0010996460914611816, -0.001024872064590454, -0.0009500980377197266, -0.000875324010848999, -0.0008005499839782715, -0.0007257759571075439, -0.0006510019302368164, -0.0005762279033660889, -0.0005014538764953613, -0.0004266798496246338, -0.00035190582275390625, -0.0002771317958831787, -0.00020235776901245117, -0.00012758374214172363, -5.2809715270996094e-05, 2.1964311599731445e-05, 9.673833847045898e-05, 0.00017151236534118652, 0.00024628639221191406, 0.0003210604190826416, 0.00039583444595336914, 0.0004706084728240967, 0.0005453824996948242, 0.0006201565265655518, 0.0006949305534362793, 0.0007697045803070068, 0.0008444786071777344, 0.0009192526340484619, 0.0009940266609191895, 0.001068800687789917, 0.0011435747146606445, 0.001218348741531372, 0.0012931227684020996, 0.0013678967952728271, 0.0014426708221435547, 0.0015174448490142822, 0.0015922188758850098, 0.0016669929027557373, 0.0017417669296264648, 0.0018165409564971924, 0.00189131498336792, 0.0019660890102386475, 0.002040863037109375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 5.0, 9.0, 5.0, 5.0, 12.0, 15.0, 23.0, 24.0, 34.0, 43.0, 58.0, 61.0, 81.0, 94.0, 88.0, 84.0, 67.0, 61.0, 49.0, 39.0, 32.0, 16.0, 18.0, 21.0, 9.0, 9.0, 5.0, 6.0, 2.0, 7.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.033348083496094e-06, -6.73346221446991e-06, -6.433576345443726e-06, -6.1336904764175415e-06, -5.833804607391357e-06, -5.533918738365173e-06, -5.234032869338989e-06, -4.934147000312805e-06, -4.634261131286621e-06, -4.334375262260437e-06, -4.034489393234253e-06, -3.734603524208069e-06, -3.4347176551818848e-06, -3.1348317861557007e-06, -2.8349459171295166e-06, -2.5350600481033325e-06, -2.2351741790771484e-06, -1.9352883100509644e-06, -1.6354024410247803e-06, -1.3355165719985962e-06, -1.0356307029724121e-06, -7.35744833946228e-07, -4.3585896492004395e-07, -1.3597309589385986e-07, 1.6391277313232422e-07, 4.637986421585083e-07, 7.636845111846924e-07, 1.0635703802108765e-06, 1.3634562492370605e-06, 1.6633421182632446e-06, 1.9632279872894287e-06, 2.263113856315613e-06, 2.562999725341797e-06, 2.862885594367981e-06, 3.162771463394165e-06, 3.462657332420349e-06, 3.762543201446533e-06, 4.062429070472717e-06, 4.362314939498901e-06, 4.6622008085250854e-06, 4.9620866775512695e-06, 5.261972546577454e-06, 5.561858415603638e-06, 5.861744284629822e-06, 6.161630153656006e-06, 6.46151602268219e-06, 6.761401891708374e-06, 7.061287760734558e-06, 7.361173629760742e-06, 7.661059498786926e-06, 7.96094536781311e-06, 8.260831236839294e-06, 8.560717105865479e-06, 8.860602974891663e-06, 9.160488843917847e-06, 9.46037471294403e-06, 9.760260581970215e-06, 1.0060146450996399e-05, 1.0360032320022583e-05, 1.0659918189048767e-05, 1.0959804058074951e-05, 1.1259689927101135e-05, 1.155957579612732e-05, 1.1859461665153503e-05, 1.2159347534179688e-05]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 6.0, 2.0, 2.0, 6.0, 2.0, 8.0, 20.0, 15.0, 20.0, 46.0, 104.0, 339.0, 1124.0, 5267.0, 47691.0, 940197.0, 46746.0, 5267.0, 1110.0, 321.0, 121.0, 50.0, 19.0, 16.0, 12.0, 11.0, 11.0, 3.0, 3.0, 4.0, 3.0, 1.0, 9.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0046539306640625, -0.0045149922370910645, -0.004376053810119629, -0.004237115383148193, -0.004098176956176758, -0.003959238529205322, -0.0038203001022338867, -0.003681361675262451, -0.0035424232482910156, -0.00340348482131958, -0.0032645463943481445, -0.003125607967376709, -0.0029866695404052734, -0.002847731113433838, -0.0027087926864624023, -0.002569854259490967, -0.0024309158325195312, -0.0022919774055480957, -0.00215303897857666, -0.0020141005516052246, -0.001875162124633789, -0.0017362236976623535, -0.001597285270690918, -0.0014583468437194824, -0.0013194084167480469, -0.0011804699897766113, -0.0010415315628051758, -0.0009025931358337402, -0.0007636547088623047, -0.0006247162818908691, -0.0004857778549194336, -0.00034683942794799805, -0.0002079010009765625, -6.896257400512695e-05, 6.99758529663086e-05, 0.00020891427993774414, 0.0003478527069091797, 0.00048679113388061523, 0.0006257295608520508, 0.0007646679878234863, 0.0009036064147949219, 0.0010425448417663574, 0.001181483268737793, 0.0013204216957092285, 0.001459360122680664, 0.0015982985496520996, 0.0017372369766235352, 0.0018761754035949707, 0.0020151138305664062, 0.002154052257537842, 0.0022929906845092773, 0.002431929111480713, 0.0025708675384521484, 0.002709805965423584, 0.0028487443923950195, 0.002987682819366455, 0.0031266212463378906, 0.003265559673309326, 0.0034044981002807617, 0.0035434365272521973, 0.003682374954223633, 0.0038213133811950684, 0.003960251808166504, 0.0040991902351379395, 0.004238128662109375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 2.0, 6.0, 2.0, 3.0, 12.0, 11.0, 10.0, 10.0, 14.0, 27.0, 20.0, 51.0, 81.0, 99.0, 116.0, 120.0, 105.0, 92.0, 74.0, 35.0, 23.0, 22.0, 10.0, 13.0, 10.0, 7.0, 2.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003685951232910156, -0.00035641714930534363, -0.00034423917531967163, -0.00033206120133399963, -0.00031988322734832764, -0.00030770525336265564, -0.00029552727937698364, -0.00028334930539131165, -0.00027117133140563965, -0.00025899335741996765, -0.00024681538343429565, -0.00023463740944862366, -0.00022245943546295166, -0.00021028146147727966, -0.00019810348749160767, -0.00018592551350593567, -0.00017374753952026367, -0.00016156956553459167, -0.00014939159154891968, -0.00013721361756324768, -0.00012503564357757568, -0.00011285766959190369, -0.00010067969560623169, -8.850172162055969e-05, -7.63237476348877e-05, -6.41457736492157e-05, -5.19677996635437e-05, -3.9789825677871704e-05, -2.7611851692199707e-05, -1.543387770652771e-05, -3.255903720855713e-06, 8.922070264816284e-06, 2.110004425048828e-05, 3.327801823616028e-05, 4.5455992221832275e-05, 5.763396620750427e-05, 6.981194019317627e-05, 8.198991417884827e-05, 9.416788816452026e-05, 0.00010634586215019226, 0.00011852383613586426, 0.00013070181012153625, 0.00014287978410720825, 0.00015505775809288025, 0.00016723573207855225, 0.00017941370606422424, 0.00019159168004989624, 0.00020376965403556824, 0.00021594762802124023, 0.00022812560200691223, 0.00024030357599258423, 0.0002524815499782562, 0.0002646595239639282, 0.0002768374979496002, 0.0002890154719352722, 0.0003011934459209442, 0.0003133714199066162, 0.0003255493938922882, 0.0003377273678779602, 0.0003499053418636322, 0.0003620833158493042, 0.0003742612898349762, 0.0003864392638206482, 0.0003986172378063202, 0.0004107952117919922]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 13.0, 26.0, 48.0, 132.0, 213.0, 252.0, 162.0, 81.0, 42.0, 19.0, 10.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035227105021476746, -0.03364362195134163, -0.03206014260649681, -0.030476661399006844, -0.028893180191516876, -0.02730969712138176, -0.02572621777653694, -0.024142734706401825, -0.022559255361557007, -0.02097577415406704, -0.019392292946577072, -0.017808811739087105, -0.016225330531597137, -0.014641848392784595, -0.013058367185294628, -0.01147488597780466, -0.009891403838992119, -0.008307922631502151, -0.006724441424012184, -0.0051409597508609295, -0.003557478543370962, -0.0019739968702197075, -0.00039051566272974014, 0.0011929655447602272, 0.0027764467522501945, 0.004359927959740162, 0.005943409167230129, 0.007526890840381384, 0.009110372513532639, 0.010693853721022606, 0.012277334928512573, 0.01386081613600254, 0.015444297343492508, 0.017027778550982475, 0.018611259758472443, 0.02019474096596241, 0.021778222173452377, 0.023361705243587494, 0.024945184588432312, 0.02652866765856743, 0.028112147003412247, 0.029695628210902214, 0.03127910941839218, 0.0328625924885273, 0.034446071833372116, 0.03602955490350723, 0.03761303424835205, 0.03919651731848717, 0.040780000388622284, 0.0423634834587574, 0.04394696280360222, 0.045530445873737335, 0.04711392521858215, 0.04869740828871727, 0.05028088763356209, 0.051864370703697205, 0.05344785004854202, 0.05503133311867714, 0.05661481246352196, 0.058198295533657074, 0.05978177487850189, 0.06136525794863701, 0.06294874101877213, 0.06453222036361694, 0.06611569970846176]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 7.0, 5.0, 11.0, 12.0, 17.0, 19.0, 14.0, 22.0, 18.0, 36.0, 30.0, 23.0, 26.0, 40.0, 48.0, 40.0, 51.0, 52.0, 53.0, 38.0, 48.0, 50.0, 34.0, 33.0, 26.0, 36.0, 28.0, 19.0, 23.0, 22.0, 16.0, 15.0, 17.0, 14.0, 10.0, 8.0, 10.0, 4.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.012291666120290756, -0.0119145717471838, -0.011537477374076843, -0.011160383000969887, -0.01078328862786293, -0.010406194254755974, -0.010029099881649017, -0.00965200550854206, -0.009274911135435104, -0.008897816762328148, -0.008520722389221191, -0.008143628016114235, -0.0077665336430072784, -0.007389439269900322, -0.007012345362454653, -0.006635250989347696, -0.006258157081902027, -0.005881062708795071, -0.005503968335688114, -0.005126873962581158, -0.004749779589474201, -0.004372685216367245, -0.0039955913089215755, -0.003618496935814619, -0.0032414025627076626, -0.002864308189600706, -0.0024872138164937496, -0.002110119676217437, -0.0017330253031104803, -0.0013559309300035238, -0.000978836789727211, -0.0006017424166202545, -0.00022464897483587265, 0.00015244534006342292, 0.0005295396549627185, 0.0009066339116543531, 0.0012837282847613096, 0.001660822657868266, 0.002037916798144579, 0.0024150111712515354, 0.002792105544358492, 0.0031691999174654484, 0.003546294290572405, 0.003923388198018074, 0.0043004825711250305, 0.004677576944231987, 0.0050546713173389435, 0.0054317656904459, 0.0058088600635528564, 0.006185954436659813, 0.006563048809766769, 0.006940143182873726, 0.007317237555980682, 0.007694331929087639, 0.008071426302194595, 0.008448520675301552, 0.008825615048408508, 0.009202709421515465, 0.009579803794622421, 0.009956898167729378, 0.010333992540836334, 0.01071108691394329, 0.011088181287050247, 0.011465275660157204, 0.011842369101941586]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 10.0, 7.0, 11.0, 10.0, 17.0, 23.0, 31.0, 53.0, 55.0, 92.0, 131.0, 188.0, 287.0, 447.0, 761.0, 1520.0, 3217.0, 8095.0, 27771.0, 456620.0, 3564701.0, 101680.0, 17093.0, 5853.0, 2425.0, 1302.0, 668.0, 376.0, 272.0, 150.0, 120.0, 85.0, 62.0, 35.0, 35.0, 22.0, 17.0, 11.0, 9.0, 8.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0391845703125, -0.0379328727722168, -0.036681175231933594, -0.03542947769165039, -0.03417778015136719, -0.032926082611083984, -0.03167438507080078, -0.030422687530517578, -0.029170989990234375, -0.027919292449951172, -0.02666759490966797, -0.025415897369384766, -0.024164199829101562, -0.02291250228881836, -0.021660804748535156, -0.020409107208251953, -0.01915740966796875, -0.017905712127685547, -0.016654014587402344, -0.01540231704711914, -0.014150619506835938, -0.012898921966552734, -0.011647224426269531, -0.010395526885986328, -0.009143829345703125, -0.007892131805419922, -0.006640434265136719, -0.005388736724853516, -0.0041370391845703125, -0.0028853416442871094, -0.0016336441040039062, -0.0003819465637207031, 0.0008697509765625, 0.002121448516845703, 0.0033731460571289062, 0.004624843597412109, 0.0058765411376953125, 0.007128238677978516, 0.008379936218261719, 0.009631633758544922, 0.010883331298828125, 0.012135028839111328, 0.013386726379394531, 0.014638423919677734, 0.015890121459960938, 0.01714181900024414, 0.018393516540527344, 0.019645214080810547, 0.02089691162109375, 0.022148609161376953, 0.023400306701660156, 0.02465200424194336, 0.025903701782226562, 0.027155399322509766, 0.02840709686279297, 0.029658794403076172, 0.030910491943359375, 0.03216218948364258, 0.03341388702392578, 0.034665584564208984, 0.03591728210449219, 0.03716897964477539, 0.038420677185058594, 0.0396723747253418, 0.040924072265625]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 5.0, 7.0, 5.0, 9.0, 13.0, 11.0, 13.0, 14.0, 18.0, 20.0, 29.0, 26.0, 34.0, 20.0, 38.0, 45.0, 34.0, 45.0, 55.0, 45.0, 58.0, 51.0, 45.0, 47.0, 45.0, 33.0, 35.0, 29.0, 24.0, 18.0, 19.0, 19.0, 23.0, 12.0, 17.0, 7.0, 6.0, 9.0, 9.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01116943359375, -0.010840654373168945, -0.01051187515258789, -0.010183095932006836, -0.009854316711425781, -0.009525537490844727, -0.009196758270263672, -0.008867979049682617, -0.008539199829101562, -0.008210420608520508, -0.007881641387939453, -0.0075528621673583984, -0.007224082946777344, -0.006895303726196289, -0.006566524505615234, -0.00623774528503418, -0.005908966064453125, -0.00558018684387207, -0.005251407623291016, -0.004922628402709961, -0.004593849182128906, -0.0042650699615478516, -0.003936290740966797, -0.003607511520385742, -0.0032787322998046875, -0.002949953079223633, -0.002621173858642578, -0.0022923946380615234, -0.0019636154174804688, -0.001634836196899414, -0.0013060569763183594, -0.0009772777557373047, -0.00064849853515625, -0.0003197193145751953, 9.059906005859375e-06, 0.00033783912658691406, 0.0006666183471679688, 0.0009953975677490234, 0.0013241767883300781, 0.0016529560089111328, 0.0019817352294921875, 0.002310514450073242, 0.002639293670654297, 0.0029680728912353516, 0.0032968521118164062, 0.003625631332397461, 0.003954410552978516, 0.00428318977355957, 0.004611968994140625, 0.00494074821472168, 0.005269527435302734, 0.005598306655883789, 0.005927085876464844, 0.0062558650970458984, 0.006584644317626953, 0.006913423538208008, 0.0072422027587890625, 0.007570981979370117, 0.007899761199951172, 0.008228540420532227, 0.008557319641113281, 0.008886098861694336, 0.00921487808227539, 0.009543657302856445, 0.0098724365234375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 20.0, 16.0, 41.0, 72.0, 229.0, 1159.0, 11568.0, 4118531.0, 59186.0, 2663.0, 451.0, 149.0, 61.0, 36.0, 26.0, 21.0, 8.0, 6.0, 5.0, 5.0, 4.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19775390625, -0.19086456298828125, -0.1839752197265625, -0.17708587646484375, -0.170196533203125, -0.16330718994140625, -0.1564178466796875, -0.14952850341796875, -0.14263916015625, -0.13574981689453125, -0.1288604736328125, -0.12197113037109375, -0.115081787109375, -0.10819244384765625, -0.1013031005859375, -0.09441375732421875, -0.0875244140625, -0.08063507080078125, -0.0737457275390625, -0.06685638427734375, -0.059967041015625, -0.05307769775390625, -0.0461883544921875, -0.03929901123046875, -0.03240966796875, -0.02552032470703125, -0.0186309814453125, -0.01174163818359375, -0.004852294921875, 0.00203704833984375, 0.0089263916015625, 0.01581573486328125, 0.022705078125, 0.02959442138671875, 0.0364837646484375, 0.04337310791015625, 0.050262451171875, 0.05715179443359375, 0.0640411376953125, 0.07093048095703125, 0.07781982421875, 0.08470916748046875, 0.0915985107421875, 0.09848785400390625, 0.105377197265625, 0.11226654052734375, 0.1191558837890625, 0.12604522705078125, 0.1329345703125, 0.13982391357421875, 0.1467132568359375, 0.15360260009765625, 0.160491943359375, 0.16738128662109375, 0.1742706298828125, 0.18115997314453125, 0.18804931640625, 0.19493865966796875, 0.2018280029296875, 0.20871734619140625, 0.215606689453125, 0.22249603271484375, 0.2293853759765625, 0.23627471923828125, 0.2431640625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 3.0, 4.0, 2.0, 6.0, 13.0, 14.0, 27.0, 30.0, 47.0, 56.0, 122.0, 245.0, 715.0, 1571.0, 721.0, 261.0, 87.0, 46.0, 26.0, 28.0, 15.0, 11.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01194000244140625, -0.011547684669494629, -0.011155366897583008, -0.010763049125671387, -0.010370731353759766, -0.009978413581848145, -0.009586095809936523, -0.009193778038024902, -0.008801460266113281, -0.00840914249420166, -0.008016824722290039, -0.007624506950378418, -0.007232189178466797, -0.006839871406555176, -0.006447553634643555, -0.006055235862731934, -0.0056629180908203125, -0.005270600318908691, -0.00487828254699707, -0.004485964775085449, -0.004093647003173828, -0.003701329231262207, -0.003309011459350586, -0.002916693687438965, -0.0025243759155273438, -0.0021320581436157227, -0.0017397403717041016, -0.0013474225997924805, -0.0009551048278808594, -0.0005627870559692383, -0.0001704692840576172, 0.0002218484878540039, 0.000614166259765625, 0.001006484031677246, 0.0013988018035888672, 0.0017911195755004883, 0.0021834373474121094, 0.0025757551193237305, 0.0029680728912353516, 0.0033603906631469727, 0.0037527084350585938, 0.004145026206970215, 0.004537343978881836, 0.004929661750793457, 0.005321979522705078, 0.005714297294616699, 0.00610661506652832, 0.006498932838439941, 0.0068912506103515625, 0.007283568382263184, 0.007675886154174805, 0.008068203926086426, 0.008460521697998047, 0.008852839469909668, 0.009245157241821289, 0.00963747501373291, 0.010029792785644531, 0.010422110557556152, 0.010814428329467773, 0.011206746101379395, 0.011599063873291016, 0.011991381645202637, 0.012383699417114258, 0.012776017189025879, 0.0131683349609375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 6.0, 7.0, 11.0, 15.0, 26.0, 30.0, 28.0, 48.0, 68.0, 111.0, 128.0, 112.0, 118.0, 85.0, 66.0, 41.0, 23.0, 19.0, 23.0, 11.0, 2.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017119349911808968, -0.016514858230948448, -0.01591036655008793, -0.01530587486922741, -0.01470138318836689, -0.01409689150750637, -0.013492399826645851, -0.012887908145785332, -0.012283416464924812, -0.011678924784064293, -0.011074433103203773, -0.010469941422343254, -0.009865449741482735, -0.009260958060622215, -0.008656466379761696, -0.008051974698901176, -0.007447483018040657, -0.006842991337180138, -0.006238499656319618, -0.005634007975459099, -0.005029516294598579, -0.00442502461373806, -0.0038205329328775406, -0.003216041252017021, -0.0026115495711565018, -0.0020070578902959824, -0.001402566209435463, -0.0007980745285749435, -0.00019358284771442413, 0.0004109088331460953, 0.0010154005140066147, 0.001619892194867134, 0.0022243857383728027, 0.002828877419233322, 0.0034333691000938416, 0.004037860780954361, 0.00464235246181488, 0.0052468441426754, 0.005851335823535919, 0.006455827504396439, 0.007060319185256958, 0.007664810866117477, 0.008269302546977997, 0.008873794227838516, 0.009478285908699036, 0.010082777589559555, 0.010687269270420074, 0.011291760951280594, 0.011896252632141113, 0.012500744313001633, 0.013105235993862152, 0.013709727674722672, 0.014314219355583191, 0.01491871103644371, 0.01552320271730423, 0.01612769439816475, 0.01673218607902527, 0.017336677759885788, 0.017941169440746307, 0.018545661121606827, 0.019150152802467346, 0.019754644483327866, 0.020359136164188385, 0.020963627845048904, 0.021568119525909424]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 7.0, 2.0, 4.0, 7.0, 6.0, 12.0, 13.0, 13.0, 13.0, 14.0, 27.0, 29.0, 30.0, 30.0, 32.0, 36.0, 36.0, 42.0, 34.0, 42.0, 42.0, 46.0, 41.0, 32.0, 45.0, 41.0, 37.0, 40.0, 42.0, 30.0, 28.0, 17.0, 32.0, 10.0, 18.0, 15.0, 10.0, 9.0, 13.0, 5.0, 5.0, 3.0, 7.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.011803703382611275, -0.01145873498171568, -0.011113766580820084, -0.010768799111247063, -0.010423830710351467, -0.010078862309455872, -0.009733893908560276, -0.00938892550766468, -0.009043957106769085, -0.00869898870587349, -0.008354020304977894, -0.008009051904082298, -0.00766408396884799, -0.007319116033613682, -0.006974147632718086, -0.006629179231822491, -0.0062842112965881824, -0.005939242895692587, -0.005594274960458279, -0.005249306559562683, -0.0049043381586670876, -0.004559369757771492, -0.004214401822537184, -0.003869433421641588, -0.0035244652535766363, -0.0031794970855116844, -0.002834528684616089, -0.002489560516551137, -0.002144592348486185, -0.0017996239475905895, -0.0014546557795256376, -0.001109687378630042, -0.0007647192105650902, -0.0004197509551886469, -7.478269981220365e-05, 0.00027018552646040916, 0.0006151538109406829, 0.0009601220954209566, 0.0013050902634859085, 0.001650058664381504, 0.001995026832446456, 0.002339995000511408, 0.0026849634014070034, 0.0030299315694719553, 0.003374899737536907, 0.0037198681384325027, 0.004064836539328098, 0.004409804940223694, 0.004754772875458002, 0.005099741276353598, 0.005444709211587906, 0.0057896776124835014, 0.006134646013379097, 0.0064796144142746925, 0.006824582349509001, 0.007169550750404596, 0.007514518685638905, 0.0078594870865345, 0.008204455487430096, 0.008549423888325691, 0.008894391357898712, 0.009239359758794308, 0.009584328159689903, 0.009929296560585499, 0.010274264961481094]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 6.0, 4.0, 7.0, 4.0, 8.0, 17.0, 26.0, 22.0, 44.0, 57.0, 102.0, 128.0, 222.0, 359.0, 517.0, 858.0, 1456.0, 2287.0, 3949.0, 6630.0, 11493.0, 19795.0, 35924.0, 71284.0, 165006.0, 368421.0, 189426.0, 79370.0, 39349.0, 21326.0, 12380.0, 7225.0, 4361.0, 2457.0, 1472.0, 927.0, 562.0, 363.0, 224.0, 179.0, 98.0, 78.0, 40.0, 36.0, 21.0, 18.0, 11.0, 7.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00616455078125, -0.005948781967163086, -0.005733013153076172, -0.005517244338989258, -0.005301475524902344, -0.00508570671081543, -0.004869937896728516, -0.0046541690826416016, -0.0044384002685546875, -0.0042226314544677734, -0.004006862640380859, -0.0037910938262939453, -0.0035753250122070312, -0.003359556198120117, -0.003143787384033203, -0.002928018569946289, -0.002712249755859375, -0.002496480941772461, -0.002280712127685547, -0.002064943313598633, -0.0018491744995117188, -0.0016334056854248047, -0.0014176368713378906, -0.0012018680572509766, -0.0009860992431640625, -0.0007703304290771484, -0.0005545616149902344, -0.0003387928009033203, -0.00012302398681640625, 9.274482727050781e-05, 0.0003085136413574219, 0.0005242824554443359, 0.00074005126953125, 0.0009558200836181641, 0.0011715888977050781, 0.0013873577117919922, 0.0016031265258789062, 0.0018188953399658203, 0.0020346641540527344, 0.0022504329681396484, 0.0024662017822265625, 0.0026819705963134766, 0.0028977394104003906, 0.0031135082244873047, 0.0033292770385742188, 0.003545045852661133, 0.003760814666748047, 0.003976583480834961, 0.004192352294921875, 0.004408121109008789, 0.004623889923095703, 0.004839658737182617, 0.005055427551269531, 0.005271196365356445, 0.005486965179443359, 0.0057027339935302734, 0.0059185028076171875, 0.0061342716217041016, 0.006350040435791016, 0.00656580924987793, 0.006781578063964844, 0.006997346878051758, 0.007213115692138672, 0.007428884506225586, 0.0076446533203125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 3.0, 6.0, 5.0, 5.0, 13.0, 13.0, 11.0, 23.0, 21.0, 21.0, 25.0, 23.0, 48.0, 36.0, 37.0, 50.0, 46.0, 41.0, 53.0, 59.0, 38.0, 51.0, 53.0, 49.0, 40.0, 46.0, 35.0, 22.0, 19.0, 18.0, 25.0, 11.0, 13.0, 10.0, 10.0, 8.0, 5.0, 5.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.014129638671875, -0.013747096061706543, -0.013364553451538086, -0.012982010841369629, -0.012599468231201172, -0.012216925621032715, -0.011834383010864258, -0.0114518404006958, -0.011069297790527344, -0.010686755180358887, -0.01030421257019043, -0.009921669960021973, -0.009539127349853516, -0.009156584739685059, -0.008774042129516602, -0.008391499519348145, -0.008008956909179688, -0.0076264142990112305, -0.0072438716888427734, -0.006861329078674316, -0.006478786468505859, -0.006096243858337402, -0.005713701248168945, -0.005331158638000488, -0.004948616027832031, -0.004566073417663574, -0.004183530807495117, -0.00380098819732666, -0.003418445587158203, -0.003035902976989746, -0.002653360366821289, -0.002270817756652832, -0.001888275146484375, -0.001505732536315918, -0.001123189926147461, -0.0007406473159790039, -0.0003581047058105469, 2.4437904357910156e-05, 0.0004069805145263672, 0.0007895231246948242, 0.0011720657348632812, 0.0015546083450317383, 0.0019371509552001953, 0.0023196935653686523, 0.0027022361755371094, 0.0030847787857055664, 0.0034673213958740234, 0.0038498640060424805, 0.0042324066162109375, 0.0046149492263793945, 0.0049974918365478516, 0.005380034446716309, 0.005762577056884766, 0.006145119667053223, 0.00652766227722168, 0.006910204887390137, 0.007292747497558594, 0.007675290107727051, 0.008057832717895508, 0.008440375328063965, 0.008822917938232422, 0.009205460548400879, 0.009588003158569336, 0.009970545768737793, 0.01035308837890625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 7.0, 8.0, 10.0, 19.0, 27.0, 27.0, 70.0, 88.0, 122.0, 191.0, 243.0, 366.0, 542.0, 884.0, 1238.0, 1947.0, 2994.0, 4464.0, 6979.0, 11119.0, 17757.0, 29592.0, 53181.0, 107074.0, 280491.0, 286936.0, 108869.0, 53635.0, 29976.0, 17916.0, 11121.0, 7062.0, 4622.0, 3096.0, 1952.0, 1276.0, 863.0, 572.0, 399.0, 255.0, 182.0, 116.0, 84.0, 60.0, 44.0, 30.0, 10.0, 13.0, 11.0, 6.0, 2.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005382537841796875, -0.0052089691162109375, -0.005035400390625, -0.0048618316650390625, -0.004688262939453125, -0.0045146942138671875, -0.00434112548828125, -0.0041675567626953125, -0.003993988037109375, -0.0038204193115234375, -0.0036468505859375, -0.0034732818603515625, -0.003299713134765625, -0.0031261444091796875, -0.00295257568359375, -0.0027790069580078125, -0.002605438232421875, -0.0024318695068359375, -0.00225830078125, -0.0020847320556640625, -0.001911163330078125, -0.0017375946044921875, -0.00156402587890625, -0.0013904571533203125, -0.001216888427734375, -0.0010433197021484375, -0.0008697509765625, -0.0006961822509765625, -0.000522613525390625, -0.0003490447998046875, -0.00017547607421875, -1.9073486328125e-06, 0.000171661376953125, 0.0003452301025390625, 0.000518798828125, 0.0006923675537109375, 0.000865936279296875, 0.0010395050048828125, 0.00121307373046875, 0.0013866424560546875, 0.001560211181640625, 0.0017337799072265625, 0.0019073486328125, 0.0020809173583984375, 0.002254486083984375, 0.0024280548095703125, 0.00260162353515625, 0.0027751922607421875, 0.002948760986328125, 0.0031223297119140625, 0.0032958984375, 0.0034694671630859375, 0.003643035888671875, 0.0038166046142578125, 0.00399017333984375, 0.0041637420654296875, 0.004337310791015625, 0.0045108795166015625, 0.0046844482421875, 0.0048580169677734375, 0.005031585693359375, 0.0052051544189453125, 0.00537872314453125, 0.0055522918701171875, 0.005725860595703125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 2.0, 6.0, 8.0, 9.0, 7.0, 8.0, 13.0, 15.0, 9.0, 24.0, 17.0, 27.0, 33.0, 36.0, 25.0, 28.0, 32.0, 37.0, 38.0, 36.0, 35.0, 44.0, 31.0, 39.0, 39.0, 34.0, 47.0, 45.0, 29.0, 32.0, 33.0, 26.0, 27.0, 20.0, 10.0, 13.0, 16.0, 14.0, 11.0, 9.0, 8.0, 7.0, 7.0, 3.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006427764892578125, -0.006225287914276123, -0.006022810935974121, -0.005820333957672119, -0.005617856979370117, -0.005415380001068115, -0.005212903022766113, -0.005010426044464111, -0.004807949066162109, -0.004605472087860107, -0.0044029951095581055, -0.0042005181312561035, -0.0039980411529541016, -0.0037955641746520996, -0.0035930871963500977, -0.0033906102180480957, -0.0031881332397460938, -0.002985656261444092, -0.00278317928314209, -0.002580702304840088, -0.002378225326538086, -0.002175748348236084, -0.001973271369934082, -0.00177079439163208, -0.0015683174133300781, -0.0013658404350280762, -0.0011633634567260742, -0.0009608864784240723, -0.0007584095001220703, -0.0005559325218200684, -0.0003534555435180664, -0.00015097856521606445, 5.14984130859375e-05, 0.00025397539138793945, 0.0004564523696899414, 0.0006589293479919434, 0.0008614063262939453, 0.0010638833045959473, 0.0012663602828979492, 0.0014688372611999512, 0.0016713142395019531, 0.001873791217803955, 0.002076268196105957, 0.002278745174407959, 0.002481222152709961, 0.002683699131011963, 0.002886176109313965, 0.003088653087615967, 0.0032911300659179688, 0.0034936070442199707, 0.0036960840225219727, 0.0038985610008239746, 0.0041010379791259766, 0.0043035149574279785, 0.0045059919357299805, 0.004708468914031982, 0.004910945892333984, 0.005113422870635986, 0.005315899848937988, 0.00551837682723999, 0.005720853805541992, 0.005923330783843994, 0.006125807762145996, 0.006328284740447998, 0.00653076171875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 5.0, 5.0, 11.0, 28.0, 25.0, 49.0, 56.0, 95.0, 134.0, 189.0, 255.0, 386.0, 590.0, 931.0, 1444.0, 2307.0, 3665.0, 6148.0, 10445.0, 18924.0, 36351.0, 78687.0, 247703.0, 434889.0, 104963.0, 45392.0, 23207.0, 12673.0, 7228.0, 4349.0, 2570.0, 1629.0, 1060.0, 682.0, 443.0, 351.0, 225.0, 140.0, 79.0, 69.0, 43.0, 32.0, 29.0, 18.0, 13.0, 11.0, 3.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00020015239715576172, -0.00019372813403606415, -0.00018730387091636658, -0.000180879607796669, -0.00017445534467697144, -0.00016803108155727386, -0.0001616068184375763, -0.00015518255531787872, -0.00014875829219818115, -0.00014233402907848358, -0.000135909765958786, -0.00012948550283908844, -0.00012306123971939087, -0.0001166369765996933, -0.00011021271347999573, -0.00010378845036029816, -9.736418724060059e-05, -9.093992412090302e-05, -8.451566100120544e-05, -7.809139788150787e-05, -7.16671347618103e-05, -6.524287164211273e-05, -5.881860852241516e-05, -5.239434540271759e-05, -4.597008228302002e-05, -3.954581916332245e-05, -3.312155604362488e-05, -2.6697292923927307e-05, -2.0273029804229736e-05, -1.3848766684532166e-05, -7.424503564834595e-06, -1.000240445137024e-06, 5.424022674560547e-06, 1.1848285794258118e-05, 1.827254891395569e-05, 2.469681203365326e-05, 3.112107515335083e-05, 3.75453382730484e-05, 4.396960139274597e-05, 5.039386451244354e-05, 5.681812763214111e-05, 6.324239075183868e-05, 6.966665387153625e-05, 7.609091699123383e-05, 8.25151801109314e-05, 8.893944323062897e-05, 9.536370635032654e-05, 0.00010178796947002411, 0.00010821223258972168, 0.00011463649570941925, 0.00012106075882911682, 0.0001274850219488144, 0.00013390928506851196, 0.00014033354818820953, 0.0001467578113079071, 0.00015318207442760468, 0.00015960633754730225, 0.00016603060066699982, 0.0001724548637866974, 0.00017887912690639496, 0.00018530339002609253, 0.0001917276531457901, 0.00019815191626548767, 0.00020457617938518524, 0.0002110004425048828]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 7.0, 2.0, 4.0, 10.0, 16.0, 18.0, 32.0, 47.0, 61.0, 67.0, 83.0, 104.0, 127.0, 94.0, 75.0, 63.0, 58.0, 34.0, 30.0, 19.0, 16.0, 13.0, 9.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8715858459472656e-05, -1.811794936656952e-05, -1.7520040273666382e-05, -1.6922131180763245e-05, -1.6324222087860107e-05, -1.572631299495697e-05, -1.5128403902053833e-05, -1.4530494809150696e-05, -1.3932585716247559e-05, -1.3334676623344421e-05, -1.2736767530441284e-05, -1.2138858437538147e-05, -1.154094934463501e-05, -1.0943040251731873e-05, -1.0345131158828735e-05, -9.747222065925598e-06, -9.149312973022461e-06, -8.551403880119324e-06, -7.953494787216187e-06, -7.355585694313049e-06, -6.757676601409912e-06, -6.159767508506775e-06, -5.561858415603638e-06, -4.9639493227005005e-06, -4.366040229797363e-06, -3.768131136894226e-06, -3.170222043991089e-06, -2.5723129510879517e-06, -1.9744038581848145e-06, -1.3764947652816772e-06, -7.7858567237854e-07, -1.8067657947540283e-07, 4.172325134277344e-07, 1.0151416063308716e-06, 1.6130506992340088e-06, 2.210959792137146e-06, 2.808868885040283e-06, 3.4067779779434204e-06, 4.004687070846558e-06, 4.602596163749695e-06, 5.200505256652832e-06, 5.798414349555969e-06, 6.3963234424591064e-06, 6.994232535362244e-06, 7.592141628265381e-06, 8.190050721168518e-06, 8.787959814071655e-06, 9.385868906974792e-06, 9.98377799987793e-06, 1.0581687092781067e-05, 1.1179596185684204e-05, 1.1777505278587341e-05, 1.2375414371490479e-05, 1.2973323464393616e-05, 1.3571232557296753e-05, 1.416914165019989e-05, 1.4767050743103027e-05, 1.5364959836006165e-05, 1.5962868928909302e-05, 1.656077802181244e-05, 1.7158687114715576e-05, 1.7756596207618713e-05, 1.835450530052185e-05, 1.8952414393424988e-05, 1.9550323486328125e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 10.0, 15.0, 12.0, 19.0, 33.0, 45.0, 80.0, 253.0, 1943.0, 51078.0, 976066.0, 17512.0, 1067.0, 179.0, 70.0, 43.0, 27.0, 14.0, 16.0, 9.0, 6.0, 6.0, 7.0, 7.0, 5.0, 1.0, 1.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00141143798828125, -0.0013649612665176392, -0.0013184845447540283, -0.0012720078229904175, -0.0012255311012268066, -0.0011790543794631958, -0.001132577657699585, -0.0010861009359359741, -0.0010396242141723633, -0.0009931474924087524, -0.0009466707706451416, -0.0009001940488815308, -0.0008537173271179199, -0.0008072406053543091, -0.0007607638835906982, -0.0007142871618270874, -0.0006678104400634766, -0.0006213337182998657, -0.0005748569965362549, -0.000528380274772644, -0.0004819035530090332, -0.00043542683124542236, -0.0003889501094818115, -0.0003424733877182007, -0.00029599666595458984, -0.000249519944190979, -0.00020304322242736816, -0.00015656650066375732, -0.00011008977890014648, -6.361305713653564e-05, -1.7136335372924805e-05, 2.9340386390686035e-05, 7.581710815429688e-05, 0.00012229382991790771, 0.00016877055168151855, 0.0002152472734451294, 0.00026172399520874023, 0.0003082007169723511, 0.0003546774387359619, 0.00040115416049957275, 0.0004476308822631836, 0.0004941076040267944, 0.0005405843257904053, 0.0005870610475540161, 0.000633537769317627, 0.0006800144910812378, 0.0007264912128448486, 0.0007729679346084595, 0.0008194446563720703, 0.0008659213781356812, 0.000912398099899292, 0.0009588748216629028, 0.0010053515434265137, 0.0010518282651901245, 0.0010983049869537354, 0.0011447817087173462, 0.001191258430480957, 0.0012377351522445679, 0.0012842118740081787, 0.0013306885957717896, 0.0013771653175354004, 0.0014236420392990112, 0.001470118761062622, 0.001516595482826233, 0.0015630722045898438]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 7.0, 4.0, 6.0, 9.0, 5.0, 17.0, 17.0, 24.0, 29.0, 49.0, 59.0, 67.0, 105.0, 127.0, 104.0, 82.0, 70.0, 46.0, 44.0, 32.0, 25.0, 15.0, 6.0, 10.0, 11.0, 7.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.891654968261719e-05, -7.658172398805618e-05, -7.424689829349518e-05, -7.191207259893417e-05, -6.957724690437317e-05, -6.724242120981216e-05, -6.490759551525116e-05, -6.257276982069016e-05, -6.023794412612915e-05, -5.7903118431568146e-05, -5.556829273700714e-05, -5.3233467042446136e-05, -5.089864134788513e-05, -4.856381565332413e-05, -4.622898995876312e-05, -4.389416426420212e-05, -4.155933856964111e-05, -3.922451287508011e-05, -3.6889687180519104e-05, -3.45548614859581e-05, -3.2220035791397095e-05, -2.988521009683609e-05, -2.7550384402275085e-05, -2.521555870771408e-05, -2.2880733013153076e-05, -2.054590731859207e-05, -1.8211081624031067e-05, -1.5876255929470062e-05, -1.3541430234909058e-05, -1.1206604540348053e-05, -8.871778845787048e-06, -6.536953151226044e-06, -4.202127456665039e-06, -1.8673017621040344e-06, 4.675239324569702e-07, 2.802349627017975e-06, 5.1371753215789795e-06, 7.472001016139984e-06, 9.806826710700989e-06, 1.2141652405261993e-05, 1.4476478099822998e-05, 1.6811303794384003e-05, 1.9146129488945007e-05, 2.1480955183506012e-05, 2.3815780878067017e-05, 2.615060657262802e-05, 2.8485432267189026e-05, 3.082025796175003e-05, 3.3155083656311035e-05, 3.548990935087204e-05, 3.7824735045433044e-05, 4.015956073999405e-05, 4.2494386434555054e-05, 4.482921212911606e-05, 4.716403782367706e-05, 4.949886351823807e-05, 5.183368921279907e-05, 5.416851490736008e-05, 5.650334060192108e-05, 5.8838166296482086e-05, 6.117299199104309e-05, 6.35078176856041e-05, 6.58426433801651e-05, 6.81774690747261e-05, 7.051229476928711e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 19.0, 20.0, 26.0, 32.0, 35.0, 51.0, 86.0, 77.0, 111.0, 120.0, 82.0, 76.0, 62.0, 50.0, 32.0, 18.0, 16.0, 20.0, 14.0, 4.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01985890045762062, -0.019323380663990974, -0.018787862733006477, -0.01825234293937683, -0.017716823145747185, -0.017181305214762688, -0.01664578542113304, -0.016110265627503395, -0.015574747696518898, -0.015039228834211826, -0.01450370904058218, -0.013968190178275108, -0.013432671315968037, -0.012897152453660965, -0.012361632660031319, -0.011826113797724247, -0.0112905940040946, -0.010755075141787529, -0.010219555348157883, -0.009684036485850811, -0.00914851762354374, -0.008612997829914093, -0.008077478967607021, -0.00754196010529995, -0.007006440777331591, -0.006470921449363232, -0.00593540258705616, -0.005399883259087801, -0.004864363931119442, -0.00432884506881237, -0.0037933257408440113, -0.003257806645706296, -0.0027222884818911552, -0.00218676938675344, -0.0016512501752004027, -0.0011157309636473656, -0.0005802118685096502, -4.469277337193489e-05, 0.0004908265545964241, 0.0010263456497341394, 0.0015618647448718548, 0.00209738384000957, 0.0026329029351472855, 0.0031684222631156445, 0.00370394135825336, 0.004239460453391075, 0.004774979781359434, 0.005310499109327793, 0.005846017971634865, 0.006381537299603224, 0.0069170561619102955, 0.0074525754898786545, 0.007988094352185726, 0.008523613214492798, 0.009059133008122444, 0.009594651870429516, 0.010130170732736588, 0.01066568959504366, 0.011201209388673306, 0.011736728250980377, 0.012272247113287449, 0.01280776597559452, 0.013343285769224167, 0.013878804631531239, 0.014414324425160885]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 3.0, 5.0, 8.0, 6.0, 10.0, 9.0, 18.0, 12.0, 20.0, 32.0, 28.0, 34.0, 29.0, 40.0, 43.0, 50.0, 35.0, 39.0, 51.0, 47.0, 52.0, 40.0, 41.0, 47.0, 54.0, 39.0, 36.0, 28.0, 20.0, 23.0, 22.0, 18.0, 10.0, 13.0, 12.0, 8.0, 4.0, 5.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.012911301106214523, -0.012563847005367279, -0.012216392904520035, -0.01186893880367279, -0.011521485634148121, -0.011174031533300877, -0.010826577432453632, -0.010479123331606388, -0.010131670162081718, -0.009784216061234474, -0.00943676196038723, -0.009089307859539986, -0.008741854690015316, -0.008394400589168072, -0.008046946488320827, -0.007699492387473583, -0.007352038286626339, -0.007004584185779095, -0.006657130550593138, -0.0063096764497458935, -0.0059622228145599365, -0.005614768713712692, -0.005267314612865448, -0.004919860512018204, -0.004572406876832247, -0.0042249527759850025, -0.0038774991407990456, -0.0035300450399518013, -0.0031825911719352007, -0.0028351373039186, -0.002487683203071356, -0.002140229335054755, -0.0017927763983607292, -0.0014453225303441286, -0.0010978685459122062, -0.0007504145614802837, -0.00040296069346368313, -5.550682544708252e-05, 0.00029194727540016174, 0.0006394011434167624, 0.000986855011433363, 0.0013343088794499636, 0.001681762863881886, 0.0020292168483138084, 0.002376670716330409, 0.0027241245843470097, 0.003071578685194254, 0.0034190325532108545, 0.003766486421227455, 0.004113940522074699, 0.004461394157260656, 0.004808848258107901, 0.005156301893293858, 0.005503755994141102, 0.005851210094988346, 0.00619866419583559, 0.006546117831021547, 0.006893571931868792, 0.0072410255670547485, 0.007588479667901993, 0.007935933768749237, 0.008283387869596481, 0.008630841970443726, 0.008978295139968395, 0.00932574924081564]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 5.0, 8.0, 5.0, 2.0, 13.0, 8.0, 14.0, 14.0, 17.0, 11.0, 22.0, 23.0, 33.0, 44.0, 57.0, 167.0, 653.0, 3102.0, 15947.0, 91777.0, 486667.0, 372958.0, 62701.0, 11214.0, 2174.0, 480.0, 146.0, 63.0, 33.0, 26.0, 24.0, 19.0, 27.0, 23.0, 15.0, 16.0, 14.0, 7.0, 5.0, 10.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0633544921875, -0.06099891662597656, -0.058643341064453125, -0.05628776550292969, -0.05393218994140625, -0.05157661437988281, -0.049221038818359375, -0.04686546325683594, -0.0445098876953125, -0.04215431213378906, -0.039798736572265625, -0.03744316101074219, -0.03508758544921875, -0.03273200988769531, -0.030376434326171875, -0.028020858764648438, -0.025665283203125, -0.023309707641601562, -0.020954132080078125, -0.018598556518554688, -0.01624298095703125, -0.013887405395507812, -0.011531829833984375, -0.009176254272460938, -0.0068206787109375, -0.0044651031494140625, -0.002109527587890625, 0.0002460479736328125, 0.00260162353515625, 0.0049571990966796875, 0.007312774658203125, 0.009668350219726562, 0.01202392578125, 0.014379501342773438, 0.016735076904296875, 0.019090652465820312, 0.02144622802734375, 0.023801803588867188, 0.026157379150390625, 0.028512954711914062, 0.0308685302734375, 0.03322410583496094, 0.035579681396484375, 0.03793525695800781, 0.04029083251953125, 0.04264640808105469, 0.045001983642578125, 0.04735755920410156, 0.049713134765625, 0.05206871032714844, 0.054424285888671875, 0.05677986145019531, 0.05913543701171875, 0.06149101257324219, 0.06384658813476562, 0.06620216369628906, 0.0685577392578125, 0.07091331481933594, 0.07326889038085938, 0.07562446594238281, 0.07798004150390625, 0.08033561706542969, 0.08269119262695312, 0.08504676818847656, 0.08740234375]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 11.0, 18.0, 30.0, 46.0, 54.0, 72.0, 90.0, 108.0, 91.0, 107.0, 79.0, 88.0, 62.0, 56.0, 40.0, 23.0, 9.0, 9.0, 6.0, 3.0, 2.0, 3.0], "bins": [-0.038726806640625, -0.03796374797821045, -0.0372006893157959, -0.03643763065338135, -0.0356745719909668, -0.034911513328552246, -0.034148454666137695, -0.033385396003723145, -0.032622337341308594, -0.03185927867889404, -0.031096220016479492, -0.03033316135406494, -0.02957010269165039, -0.02880704402923584, -0.02804398536682129, -0.02728092670440674, -0.026517868041992188, -0.025754809379577637, -0.024991750717163086, -0.024228692054748535, -0.023465633392333984, -0.022702574729919434, -0.021939516067504883, -0.021176457405090332, -0.02041339874267578, -0.01965034008026123, -0.01888728141784668, -0.01812422275543213, -0.017361164093017578, -0.016598105430603027, -0.015835046768188477, -0.015071988105773926, -0.014308929443359375, -0.013545870780944824, -0.012782812118530273, -0.012019753456115723, -0.011256694793701172, -0.010493636131286621, -0.00973057746887207, -0.00896751880645752, -0.008204460144042969, -0.007441401481628418, -0.006678342819213867, -0.005915284156799316, -0.005152225494384766, -0.004389166831970215, -0.003626108169555664, -0.0028630495071411133, -0.0020999908447265625, -0.0013369321823120117, -0.0005738735198974609, 0.00018918514251708984, 0.0009522438049316406, 0.0017153024673461914, 0.002478361129760742, 0.003241419792175293, 0.004004478454589844, 0.0047675371170043945, 0.005530595779418945, 0.006293654441833496, 0.007056713104248047, 0.007819771766662598, 0.008582830429077148, 0.0093458890914917, 0.01010894775390625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 7.0, 11.0, 11.0, 10.0, 13.0, 12.0, 21.0, 33.0, 41.0, 49.0, 122.0, 337.0, 1330.0, 7354.0, 58130.0, 573634.0, 367709.0, 33535.0, 4660.0, 925.0, 262.0, 81.0, 55.0, 37.0, 39.0, 33.0, 21.0, 15.0, 12.0, 3.0, 6.0, 7.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10516357421875, -0.10196495056152344, -0.09876632690429688, -0.09556770324707031, -0.09236907958984375, -0.08917045593261719, -0.08597183227539062, -0.08277320861816406, -0.0795745849609375, -0.07637596130371094, -0.07317733764648438, -0.06997871398925781, -0.06678009033203125, -0.06358146667480469, -0.060382843017578125, -0.05718421936035156, -0.053985595703125, -0.05078697204589844, -0.047588348388671875, -0.04438972473144531, -0.04119110107421875, -0.03799247741699219, -0.034793853759765625, -0.03159523010253906, -0.0283966064453125, -0.025197982788085938, -0.021999359130859375, -0.018800735473632812, -0.01560211181640625, -0.012403488159179688, -0.009204864501953125, -0.0060062408447265625, -0.0028076171875, 0.0003910064697265625, 0.003589630126953125, 0.0067882537841796875, 0.00998687744140625, 0.013185501098632812, 0.016384124755859375, 0.019582748413085938, 0.0227813720703125, 0.025979995727539062, 0.029178619384765625, 0.03237724304199219, 0.03557586669921875, 0.03877449035644531, 0.041973114013671875, 0.04517173767089844, 0.048370361328125, 0.05156898498535156, 0.054767608642578125, 0.05796623229980469, 0.06116485595703125, 0.06436347961425781, 0.06756210327148438, 0.07076072692871094, 0.0739593505859375, 0.07715797424316406, 0.08035659790039062, 0.08355522155761719, 0.08675384521484375, 0.08995246887207031, 0.09315109252929688, 0.09634971618652344, 0.09954833984375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 5.0, 9.0, 14.0, 8.0, 23.0, 30.0, 26.0, 31.0, 43.0, 37.0, 41.0, 49.0, 39.0, 46.0, 58.0, 49.0, 50.0, 49.0, 46.0, 53.0, 56.0, 45.0, 34.0, 26.0, 27.0, 19.0, 12.0, 13.0, 7.0, 10.0, 6.0, 5.0, 8.0, 2.0, 7.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01045989990234375, -0.01012885570526123, -0.009797811508178711, -0.009466767311096191, -0.009135723114013672, -0.008804678916931152, -0.008473634719848633, -0.008142590522766113, -0.007811546325683594, -0.007480502128601074, -0.007149457931518555, -0.006818413734436035, -0.006487369537353516, -0.006156325340270996, -0.0058252811431884766, -0.005494236946105957, -0.0051631927490234375, -0.004832148551940918, -0.0045011043548583984, -0.004170060157775879, -0.0038390159606933594, -0.00350797176361084, -0.0031769275665283203, -0.0028458833694458008, -0.0025148391723632812, -0.0021837949752807617, -0.0018527507781982422, -0.0015217065811157227, -0.0011906623840332031, -0.0008596181869506836, -0.0005285739898681641, -0.00019752979278564453, 0.000133514404296875, 0.00046455860137939453, 0.0007956027984619141, 0.0011266469955444336, 0.0014576911926269531, 0.0017887353897094727, 0.002119779586791992, 0.0024508237838745117, 0.0027818679809570312, 0.0031129121780395508, 0.0034439563751220703, 0.00377500057220459, 0.004106044769287109, 0.004437088966369629, 0.0047681331634521484, 0.005099177360534668, 0.0054302215576171875, 0.005761265754699707, 0.0060923099517822266, 0.006423354148864746, 0.006754398345947266, 0.007085442543029785, 0.007416486740112305, 0.007747530937194824, 0.008078575134277344, 0.008409619331359863, 0.008740663528442383, 0.009071707725524902, 0.009402751922607422, 0.009733796119689941, 0.010064840316772461, 0.01039588451385498, 0.0107269287109375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 5.0, 5.0, 9.0, 18.0, 18.0, 19.0, 35.0, 60.0, 57.0, 92.0, 100.0, 138.0, 211.0, 304.0, 420.0, 595.0, 884.0, 1376.0, 2138.0, 3723.0, 6722.0, 15114.0, 95541.0, 863399.0, 33234.0, 10632.0, 5282.0, 2916.0, 1791.0, 1128.0, 760.0, 502.0, 364.0, 261.0, 206.0, 129.0, 87.0, 74.0, 55.0, 35.0, 28.0, 19.0, 23.0, 14.0, 9.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00339508056640625, -0.0032899677753448486, -0.0031848549842834473, -0.003079742193222046, -0.0029746294021606445, -0.002869516611099243, -0.002764403820037842, -0.0026592910289764404, -0.002554178237915039, -0.0024490654468536377, -0.0023439526557922363, -0.002238839864730835, -0.0021337270736694336, -0.0020286142826080322, -0.0019235014915466309, -0.0018183887004852295, -0.0017132759094238281, -0.0016081631183624268, -0.0015030503273010254, -0.001397937536239624, -0.0012928247451782227, -0.0011877119541168213, -0.00108259916305542, -0.0009774863719940186, -0.0008723735809326172, -0.0007672607898712158, -0.0006621479988098145, -0.0005570352077484131, -0.0004519224166870117, -0.00034680962562561035, -0.00024169683456420898, -0.00013658404350280762, -3.147125244140625e-05, 7.364153861999512e-05, 0.00017875432968139648, 0.00028386712074279785, 0.0003889799118041992, 0.0004940927028656006, 0.000599205493927002, 0.0007043182849884033, 0.0008094310760498047, 0.0009145438671112061, 0.0010196566581726074, 0.0011247694492340088, 0.0012298822402954102, 0.0013349950313568115, 0.0014401078224182129, 0.0015452206134796143, 0.0016503334045410156, 0.001755446195602417, 0.0018605589866638184, 0.0019656717777252197, 0.002070784568786621, 0.0021758973598480225, 0.002281010150909424, 0.002386122941970825, 0.0024912357330322266, 0.002596348524093628, 0.0027014613151550293, 0.0028065741062164307, 0.002911686897277832, 0.0030167996883392334, 0.0031219124794006348, 0.003227025270462036, 0.0033321380615234375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 10.0, 10.0, 17.0, 17.0, 31.0, 18.0, 46.0, 87.0, 82.0, 89.0, 106.0, 121.0, 102.0, 63.0, 59.0, 41.0, 22.0, 16.0, 15.0, 18.0, 4.0, 3.0, 2.0, 10.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0967254638671875e-05, -1.0620802640914917e-05, -1.0274350643157959e-05, -9.927898645401001e-06, -9.581446647644043e-06, -9.234994649887085e-06, -8.888542652130127e-06, -8.542090654373169e-06, -8.195638656616211e-06, -7.849186658859253e-06, -7.502734661102295e-06, -7.156282663345337e-06, -6.809830665588379e-06, -6.463378667831421e-06, -6.116926670074463e-06, -5.770474672317505e-06, -5.424022674560547e-06, -5.077570676803589e-06, -4.731118679046631e-06, -4.384666681289673e-06, -4.038214683532715e-06, -3.691762685775757e-06, -3.345310688018799e-06, -2.998858690261841e-06, -2.652406692504883e-06, -2.305954694747925e-06, -1.959502696990967e-06, -1.6130506992340088e-06, -1.2665987014770508e-06, -9.201467037200928e-07, -5.736947059631348e-07, -2.2724270820617676e-07, 1.1920928955078125e-07, 4.6566128730773926e-07, 8.121132850646973e-07, 1.1585652828216553e-06, 1.5050172805786133e-06, 1.8514692783355713e-06, 2.1979212760925293e-06, 2.5443732738494873e-06, 2.8908252716064453e-06, 3.2372772693634033e-06, 3.5837292671203613e-06, 3.930181264877319e-06, 4.276633262634277e-06, 4.623085260391235e-06, 4.969537258148193e-06, 5.315989255905151e-06, 5.662441253662109e-06, 6.008893251419067e-06, 6.355345249176025e-06, 6.701797246932983e-06, 7.048249244689941e-06, 7.394701242446899e-06, 7.741153240203857e-06, 8.087605237960815e-06, 8.434057235717773e-06, 8.780509233474731e-06, 9.12696123123169e-06, 9.473413228988647e-06, 9.819865226745605e-06, 1.0166317224502563e-05, 1.0512769222259521e-05, 1.085922122001648e-05, 1.1205673217773438e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 15.0, 85.0, 302.0, 1780.0, 14682.0, 1009425.0, 19472.0, 2206.0, 389.0, 90.0, 35.0, 4.0, 3.0, 5.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0150299072265625, -0.014618754386901855, -0.014207601547241211, -0.013796448707580566, -0.013385295867919922, -0.012974143028259277, -0.012562990188598633, -0.012151837348937988, -0.011740684509277344, -0.0113295316696167, -0.010918378829956055, -0.01050722599029541, -0.010096073150634766, -0.009684920310974121, -0.009273767471313477, -0.008862614631652832, -0.008451461791992188, -0.008040308952331543, -0.0076291561126708984, -0.007218003273010254, -0.006806850433349609, -0.006395697593688965, -0.00598454475402832, -0.005573391914367676, -0.005162239074707031, -0.004751086235046387, -0.004339933395385742, -0.003928780555725098, -0.003517627716064453, -0.0031064748764038086, -0.002695322036743164, -0.0022841691970825195, -0.001873016357421875, -0.0014618635177612305, -0.001050710678100586, -0.0006395578384399414, -0.00022840499877929688, 0.00018274784088134766, 0.0005939006805419922, 0.0010050535202026367, 0.0014162063598632812, 0.0018273591995239258, 0.0022385120391845703, 0.002649664878845215, 0.0030608177185058594, 0.003471970558166504, 0.0038831233978271484, 0.004294276237487793, 0.0047054290771484375, 0.005116581916809082, 0.0055277347564697266, 0.005938887596130371, 0.006350040435791016, 0.00676119327545166, 0.007172346115112305, 0.007583498954772949, 0.007994651794433594, 0.008405804634094238, 0.008816957473754883, 0.009228110313415527, 0.009639263153076172, 0.010050415992736816, 0.010461568832397461, 0.010872721672058105, 0.01128387451171875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 4.0, 3.0, 2.0, 9.0, 15.0, 23.0, 49.0, 203.0, 373.0, 174.0, 53.0, 20.0, 13.0, 5.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009860992431640625, -0.000950157642364502, -0.0009142160415649414, -0.0008782744407653809, -0.0008423328399658203, -0.0008063912391662598, -0.0007704496383666992, -0.0007345080375671387, -0.0006985664367675781, -0.0006626248359680176, -0.000626683235168457, -0.0005907416343688965, -0.0005548000335693359, -0.0005188584327697754, -0.00048291683197021484, -0.0004469752311706543, -0.00041103363037109375, -0.0003750920295715332, -0.00033915042877197266, -0.0003032088279724121, -0.00026726722717285156, -0.00023132562637329102, -0.00019538402557373047, -0.00015944242477416992, -0.00012350082397460938, -8.755922317504883e-05, -5.161762237548828e-05, -1.5676021575927734e-05, 2.0265579223632812e-05, 5.620718002319336e-05, 9.21487808227539e-05, 0.00012809038162231445, 0.000164031982421875, 0.00019997358322143555, 0.0002359151840209961, 0.00027185678482055664, 0.0003077983856201172, 0.00034373998641967773, 0.0003796815872192383, 0.00041562318801879883, 0.0004515647888183594, 0.0004875063896179199, 0.0005234479904174805, 0.000559389591217041, 0.0005953311920166016, 0.0006312727928161621, 0.0006672143936157227, 0.0007031559944152832, 0.0007390975952148438, 0.0007750391960144043, 0.0008109807968139648, 0.0008469223976135254, 0.0008828639984130859, 0.0009188055992126465, 0.000954747200012207, 0.0009906888008117676, 0.0010266304016113281, 0.0010625720024108887, 0.0010985136032104492, 0.0011344552040100098, 0.0011703968048095703, 0.0012063384056091309, 0.0012422800064086914, 0.001278221607208252, 0.0013141632080078125]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 7.0, 9.0, 14.0, 18.0, 32.0, 43.0, 47.0, 79.0, 102.0, 126.0, 139.0, 113.0, 92.0, 67.0, 34.0, 33.0, 15.0, 13.0, 8.0, 6.0, 1.0, 7.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0104088569059968, -0.009762255474925041, -0.009115654975175858, -0.008469054475426674, -0.007822453044354916, -0.007175852078944445, -0.006529251113533974, -0.005882650148123503, -0.005236049182713032, -0.004589448217302561, -0.00394284725189209, -0.003296246286481619, -0.002649645321071148, -0.002003044355660677, -0.001356443390250206, -0.000709842424839735, -6.324145942926407e-05, 0.0005833595059812069, 0.0012299604713916779, 0.0018765614368021488, 0.0025231624022126198, 0.0031697633676230907, 0.0038163643330335617, 0.004462965298444033, 0.005109566263854504, 0.005756167229264975, 0.0064027681946754456, 0.0070493691600859165, 0.0076959701254963875, 0.008342571556568146, 0.00898917205631733, 0.009635772556066513, 0.010282374918460846, 0.01092897541821003, 0.011575576849281788, 0.012222178280353546, 0.01286877878010273, 0.013515379279851913, 0.014161980710923672, 0.01480858214199543, 0.015455182641744614, 0.016101783141493797, 0.01674838364124298, 0.017394986003637314, 0.018041586503386497, 0.01868818700313568, 0.019334789365530014, 0.019981389865279198, 0.02062799036502838, 0.021274590864777565, 0.02192119136452675, 0.02256779372692108, 0.023214394226670265, 0.02386099472641945, 0.024507597088813782, 0.025154197588562965, 0.02580079808831215, 0.026447398588061333, 0.027093999087810516, 0.02774060145020485, 0.028387201949954033, 0.029033802449703217, 0.02968040481209755, 0.030327005311846733, 0.030973605811595917]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 11.0, 13.0, 24.0, 19.0, 37.0, 36.0, 61.0, 75.0, 74.0, 73.0, 87.0, 97.0, 84.0, 78.0, 66.0, 45.0, 41.0, 21.0, 31.0, 20.0, 7.0, 6.0, 3.0, 1.0], "bins": [-0.03486692160367966, -0.0341830775141716, -0.033499233424663544, -0.03281538933515549, -0.03213154524564743, -0.03144770488142967, -0.030763860791921616, -0.03008001670241356, -0.029396172612905502, -0.028712328523397446, -0.02802848443388939, -0.02734464220702648, -0.026660798117518425, -0.02597695402801037, -0.02529311180114746, -0.024609267711639404, -0.023925423622131348, -0.02324157953262329, -0.022557735443115234, -0.021873893216252327, -0.02119004912674427, -0.020506205037236214, -0.019822362810373306, -0.01913851872086525, -0.018454674631357193, -0.017770830541849136, -0.01708698645234108, -0.016403144225478172, -0.015719300135970116, -0.015035456046462059, -0.014351612888276577, -0.013667769730091095, -0.012983927503228188, -0.012300083413720131, -0.011616240255534649, -0.010932397097349167, -0.01024855300784111, -0.009564708918333054, -0.008880865760147572, -0.00819702260196209, -0.007513178512454033, -0.0068293348886072636, -0.006145491264760494, -0.005461647640913725, -0.004777804017066956, -0.004093960393220186, -0.003410116769373417, -0.0027262731455266476, -0.0020424295216798782, -0.001358585897833109, -0.0006747422739863396, 9.101349860429764e-06, 0.0006929449737071991, 0.0013767885975539684, 0.0020606322214007378, 0.002744475845247507, 0.0034283194690942764, 0.004112163092941046, 0.004796006716787815, 0.005479850340634584, 0.006163693964481354, 0.006847537588328123, 0.007531381212174892, 0.008215224370360374, 0.008899068459868431]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 9.0, 17.0, 15.0, 17.0, 38.0, 54.0, 85.0, 101.0, 156.0, 258.0, 462.0, 1094.0, 3532.0, 33184.0, 3410256.0, 730777.0, 10074.0, 2460.0, 734.0, 348.0, 209.0, 143.0, 87.0, 68.0, 45.0, 26.0, 19.0, 7.0, 5.0, 8.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.05767822265625, -0.05639004707336426, -0.055101871490478516, -0.05381369590759277, -0.05252552032470703, -0.05123734474182129, -0.04994916915893555, -0.048660993576049805, -0.04737281799316406, -0.04608464241027832, -0.04479646682739258, -0.043508291244506836, -0.042220115661621094, -0.04093194007873535, -0.03964376449584961, -0.03835558891296387, -0.037067413330078125, -0.03577923774719238, -0.03449106216430664, -0.0332028865814209, -0.031914710998535156, -0.030626535415649414, -0.029338359832763672, -0.02805018424987793, -0.026762008666992188, -0.025473833084106445, -0.024185657501220703, -0.02289748191833496, -0.02160930633544922, -0.020321130752563477, -0.019032955169677734, -0.017744779586791992, -0.01645660400390625, -0.015168428421020508, -0.013880252838134766, -0.012592077255249023, -0.011303901672363281, -0.010015726089477539, -0.008727550506591797, -0.007439374923706055, -0.0061511993408203125, -0.00486302375793457, -0.003574848175048828, -0.002286672592163086, -0.0009984970092773438, 0.00028967857360839844, 0.0015778541564941406, 0.002866029739379883, 0.004154205322265625, 0.005442380905151367, 0.006730556488037109, 0.008018732070922852, 0.009306907653808594, 0.010595083236694336, 0.011883258819580078, 0.01317143440246582, 0.014459609985351562, 0.015747785568237305, 0.017035961151123047, 0.01832413673400879, 0.01961231231689453, 0.020900487899780273, 0.022188663482666016, 0.023476839065551758, 0.0247650146484375]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 12.0, 15.0, 15.0, 11.0, 16.0, 32.0, 27.0, 44.0, 37.0, 66.0, 64.0, 60.0, 62.0, 63.0, 59.0, 75.0, 55.0, 52.0, 50.0, 37.0, 36.0, 28.0, 20.0, 12.0, 22.0, 13.0, 9.0, 6.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0217437744140625, -0.02125370502471924, -0.020763635635375977, -0.020273566246032715, -0.019783496856689453, -0.01929342746734619, -0.01880335807800293, -0.018313288688659668, -0.017823219299316406, -0.017333149909973145, -0.016843080520629883, -0.01635301113128662, -0.01586294174194336, -0.015372872352600098, -0.014882802963256836, -0.014392733573913574, -0.013902664184570312, -0.01341259479522705, -0.012922525405883789, -0.012432456016540527, -0.011942386627197266, -0.011452317237854004, -0.010962247848510742, -0.01047217845916748, -0.009982109069824219, -0.009492039680480957, -0.009001970291137695, -0.008511900901794434, -0.008021831512451172, -0.00753176212310791, -0.0070416927337646484, -0.006551623344421387, -0.006061553955078125, -0.005571484565734863, -0.0050814151763916016, -0.00459134578704834, -0.004101276397705078, -0.0036112070083618164, -0.0031211376190185547, -0.002631068229675293, -0.0021409988403320312, -0.0016509294509887695, -0.0011608600616455078, -0.0006707906723022461, -0.00018072128295898438, 0.00030934810638427734, 0.0007994174957275391, 0.0012894868850708008, 0.0017795562744140625, 0.0022696256637573242, 0.002759695053100586, 0.0032497644424438477, 0.0037398338317871094, 0.004229903221130371, 0.004719972610473633, 0.0052100419998168945, 0.005700111389160156, 0.006190180778503418, 0.00668025016784668, 0.007170319557189941, 0.007660388946533203, 0.008150458335876465, 0.008640527725219727, 0.009130597114562988, 0.00962066650390625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 8.0, 12.0, 12.0, 28.0, 35.0, 67.0, 138.0, 433.0, 3399.0, 4162132.0, 26649.0, 899.0, 212.0, 94.0, 38.0, 38.0, 23.0, 22.0, 9.0, 8.0, 6.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.274658203125, -0.2679119110107422, -0.2611656188964844, -0.25441932678222656, -0.24767303466796875, -0.24092674255371094, -0.23418045043945312, -0.2274341583251953, -0.2206878662109375, -0.2139415740966797, -0.20719528198242188, -0.20044898986816406, -0.19370269775390625, -0.18695640563964844, -0.18021011352539062, -0.1734638214111328, -0.166717529296875, -0.1599712371826172, -0.15322494506835938, -0.14647865295410156, -0.13973236083984375, -0.13298606872558594, -0.12623977661132812, -0.11949348449707031, -0.1127471923828125, -0.10600090026855469, -0.09925460815429688, -0.09250831604003906, -0.08576202392578125, -0.07901573181152344, -0.07226943969726562, -0.06552314758300781, -0.05877685546875, -0.05203056335449219, -0.045284271240234375, -0.03853797912597656, -0.03179168701171875, -0.025045394897460938, -0.018299102783203125, -0.011552810668945312, -0.0048065185546875, 0.0019397735595703125, 0.008686065673828125, 0.015432357788085938, 0.02217864990234375, 0.028924942016601562, 0.035671234130859375, 0.04241752624511719, 0.049163818359375, 0.05591011047363281, 0.06265640258789062, 0.06940269470214844, 0.07614898681640625, 0.08289527893066406, 0.08964157104492188, 0.09638786315917969, 0.1031341552734375, 0.10988044738769531, 0.11662673950195312, 0.12337303161621094, 0.13011932373046875, 0.13686561584472656, 0.14361190795898438, 0.1503582000732422, 0.1571044921875]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 8.0, 5.0, 8.0, 7.0, 11.0, 22.0, 28.0, 44.0, 51.0, 145.0, 287.0, 657.0, 1084.0, 880.0, 431.0, 179.0, 78.0, 56.0, 29.0, 20.0, 17.0, 6.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006816864013671875, -0.006541788578033447, -0.0062667131423950195, -0.005991637706756592, -0.005716562271118164, -0.005441486835479736, -0.005166411399841309, -0.004891335964202881, -0.004616260528564453, -0.004341185092926025, -0.004066109657287598, -0.00379103422164917, -0.003515958786010742, -0.0032408833503723145, -0.0029658079147338867, -0.002690732479095459, -0.0024156570434570312, -0.0021405816078186035, -0.0018655061721801758, -0.001590430736541748, -0.0013153553009033203, -0.0010402798652648926, -0.0007652044296264648, -0.0004901289939880371, -0.00021505355834960938, 6.002187728881836e-05, 0.0003350973129272461, 0.0006101727485656738, 0.0008852481842041016, 0.0011603236198425293, 0.001435399055480957, 0.0017104744911193848, 0.0019855499267578125, 0.0022606253623962402, 0.002535700798034668, 0.0028107762336730957, 0.0030858516693115234, 0.003360927104949951, 0.003636002540588379, 0.003911077976226807, 0.004186153411865234, 0.004461228847503662, 0.00473630428314209, 0.005011379718780518, 0.005286455154418945, 0.005561530590057373, 0.005836606025695801, 0.0061116814613342285, 0.006386756896972656, 0.006661832332611084, 0.006936907768249512, 0.0072119832038879395, 0.007487058639526367, 0.007762134075164795, 0.008037209510803223, 0.00831228494644165, 0.008587360382080078, 0.008862435817718506, 0.009137511253356934, 0.009412586688995361, 0.009687662124633789, 0.009962737560272217, 0.010237812995910645, 0.010512888431549072, 0.0107879638671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 6.0, 22.0, 47.0, 97.0, 202.0, 277.0, 197.0, 95.0, 33.0, 19.0, 11.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011120890267193317, -0.009938569739460945, -0.008756248280405998, -0.007573927287012339, -0.006391606293618679, -0.0052092853002250195, -0.00402696430683136, -0.0028446437790989876, -0.0016623223200440407, -0.0004800013266503811, 0.0007023196667432785, 0.001884640660136938, 0.0030669616535305977, 0.004249282646924257, 0.005431603640317917, 0.006613924168050289, 0.007796245627105236, 0.008978566154837608, 0.010160887613892555, 0.011343209072947502, 0.012525529600679874, 0.013707850128412247, 0.014890171587467194, 0.01607249304652214, 0.017254814505577087, 0.018437135964632034, 0.01961945742368698, 0.02080177702009678, 0.021984098479151726, 0.023166419938206673, 0.02434873953461647, 0.025531060993671417, 0.026713378727436066, 0.027895700186491013, 0.02907802164554596, 0.030260341241955757, 0.03144266456365585, 0.0326249822974205, 0.03380730375647545, 0.034989625215530396, 0.03617194667458534, 0.03735426813364029, 0.038536589592695236, 0.03971891105175018, 0.04090122878551483, 0.04208355024456978, 0.043265871703624725, 0.04444819316267967, 0.04563051462173462, 0.046812836080789566, 0.04799515753984451, 0.04917747899889946, 0.05035980045795441, 0.051542118191719055, 0.052724439650774, 0.05390676110982895, 0.055089082568883896, 0.05627140402793884, 0.05745372548699379, 0.05863604694604874, 0.059818364679813385, 0.06100068613886833, 0.06218300759792328, 0.06336532533168793, 0.06454765051603317]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 9.0, 9.0, 14.0, 11.0, 16.0, 14.0, 19.0, 19.0, 27.0, 25.0, 40.0, 29.0, 33.0, 40.0, 38.0, 50.0, 37.0, 47.0, 38.0, 37.0, 36.0, 27.0, 38.0, 47.0, 40.0, 34.0, 34.0, 27.0, 26.0, 25.0, 18.0, 15.0, 20.0, 7.0, 8.0, 4.0, 10.0, 5.0, 5.0, 4.0, 6.0, 1.0, 3.0], "bins": [-0.013951079919934273, -0.013594147749245167, -0.013237214647233486, -0.01288028247654438, -0.0125233493745327, -0.012166417203843594, -0.011809484101831913, -0.011452551931142807, -0.011095618829131126, -0.01073868665844202, -0.01038175355643034, -0.010024821385741234, -0.009667888283729553, -0.009310956113040447, -0.008954023011028767, -0.00859709084033966, -0.00824015773832798, -0.007883225567638874, -0.0075262924656271935, -0.0071693598292768, -0.006812427192926407, -0.0064554945565760136, -0.00609856192022562, -0.005741629749536514, -0.005384697578847408, -0.005027764942497015, -0.004670832306146622, -0.004313899669796228, -0.003956967033445835, -0.003600034397095442, -0.003243101993575692, -0.002886169357225299, -0.002529236488044262, -0.0021723038516938686, -0.0018153712153434753, -0.0014584386954084039, -0.0011015060590580106, -0.0007445734227076173, -0.0003876409027725458, -3.070826642215252e-05, 0.0003262243699282408, 0.0006831570062786341, 0.0010400896426290274, 0.0013970221625640988, 0.0017539547989144921, 0.0021108873188495636, 0.002467819955199957, 0.00282475259155035, 0.0031816852279007435, 0.0035386178642511368, 0.00389555050060153, 0.004252483136951923, 0.004609415773302317, 0.00496634840965271, 0.005323280580341816, 0.0056802136823534966, 0.0060371458530426025, 0.006394078489392996, 0.006751011125743389, 0.007107943762093782, 0.007464876398444176, 0.007821808569133282, 0.008178741671144962, 0.008535673841834068, 0.008892606943845749]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 5.0, 12.0, 8.0, 10.0, 18.0, 26.0, 50.0, 78.0, 108.0, 156.0, 332.0, 599.0, 1091.0, 1884.0, 3508.0, 6202.0, 11348.0, 21729.0, 43893.0, 98835.0, 278768.0, 349254.0, 123218.0, 52849.0, 25414.0, 12972.0, 7227.0, 3920.0, 2172.0, 1242.0, 656.0, 402.0, 211.0, 131.0, 70.0, 41.0, 36.0, 19.0, 18.0, 7.0, 9.0, 5.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00698089599609375, -0.006776273250579834, -0.006571650505065918, -0.006367027759552002, -0.006162405014038086, -0.00595778226852417, -0.005753159523010254, -0.005548536777496338, -0.005343914031982422, -0.005139291286468506, -0.00493466854095459, -0.004730045795440674, -0.004525423049926758, -0.004320800304412842, -0.004116177558898926, -0.00391155481338501, -0.0037069320678710938, -0.0035023093223571777, -0.0032976865768432617, -0.0030930638313293457, -0.0028884410858154297, -0.0026838183403015137, -0.0024791955947875977, -0.0022745728492736816, -0.0020699501037597656, -0.0018653273582458496, -0.0016607046127319336, -0.0014560818672180176, -0.0012514591217041016, -0.0010468363761901855, -0.0008422136306762695, -0.0006375908851623535, -0.0004329681396484375, -0.00022834539413452148, -2.372264862060547e-05, 0.00018090009689331055, 0.00038552284240722656, 0.0005901455879211426, 0.0007947683334350586, 0.0009993910789489746, 0.0012040138244628906, 0.0014086365699768066, 0.0016132593154907227, 0.0018178820610046387, 0.0020225048065185547, 0.0022271275520324707, 0.0024317502975463867, 0.0026363730430603027, 0.0028409957885742188, 0.0030456185340881348, 0.0032502412796020508, 0.003454864025115967, 0.003659486770629883, 0.003864109516143799, 0.004068732261657715, 0.004273355007171631, 0.004477977752685547, 0.004682600498199463, 0.004887223243713379, 0.005091845989227295, 0.005296468734741211, 0.005501091480255127, 0.005705714225769043, 0.005910336971282959, 0.006114959716796875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 8.0, 6.0, 11.0, 10.0, 16.0, 14.0, 25.0, 28.0, 27.0, 31.0, 28.0, 40.0, 43.0, 48.0, 50.0, 49.0, 54.0, 43.0, 45.0, 56.0, 39.0, 52.0, 37.0, 42.0, 34.0, 35.0, 28.0, 21.0, 18.0, 17.0, 8.0, 12.0, 13.0, 9.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0129852294921875, -0.012645840644836426, -0.012306451797485352, -0.011967062950134277, -0.011627674102783203, -0.011288285255432129, -0.010948896408081055, -0.01060950756072998, -0.010270118713378906, -0.009930729866027832, -0.009591341018676758, -0.009251952171325684, -0.00891256332397461, -0.008573174476623535, -0.008233785629272461, -0.007894396781921387, -0.0075550079345703125, -0.007215619087219238, -0.006876230239868164, -0.00653684139251709, -0.006197452545166016, -0.005858063697814941, -0.005518674850463867, -0.005179286003112793, -0.004839897155761719, -0.0045005083084106445, -0.00416111946105957, -0.003821730613708496, -0.003482341766357422, -0.0031429529190063477, -0.0028035640716552734, -0.0024641752243041992, -0.002124786376953125, -0.0017853975296020508, -0.0014460086822509766, -0.0011066198348999023, -0.0007672309875488281, -0.0004278421401977539, -8.845329284667969e-05, 0.00025093555450439453, 0.0005903244018554688, 0.000929713249206543, 0.0012691020965576172, 0.0016084909439086914, 0.0019478797912597656, 0.00228726863861084, 0.002626657485961914, 0.0029660463333129883, 0.0033054351806640625, 0.0036448240280151367, 0.003984212875366211, 0.004323601722717285, 0.004662990570068359, 0.005002379417419434, 0.005341768264770508, 0.005681157112121582, 0.006020545959472656, 0.0063599348068237305, 0.006699323654174805, 0.007038712501525879, 0.007378101348876953, 0.007717490196228027, 0.008056879043579102, 0.008396267890930176, 0.00873565673828125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 14.0, 17.0, 17.0, 42.0, 50.0, 69.0, 98.0, 135.0, 180.0, 320.0, 435.0, 670.0, 903.0, 1407.0, 2092.0, 3140.0, 4821.0, 7546.0, 11858.0, 19204.0, 31788.0, 56628.0, 115674.0, 315010.0, 251068.0, 98060.0, 50260.0, 28617.0, 17433.0, 10717.0, 6860.0, 4600.0, 2844.0, 1916.0, 1312.0, 890.0, 603.0, 392.0, 264.0, 186.0, 130.0, 102.0, 52.0, 45.0, 24.0, 29.0, 15.0, 3.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.004734039306640625, -0.004590153694152832, -0.004446268081665039, -0.004302382469177246, -0.004158496856689453, -0.00401461124420166, -0.003870725631713867, -0.0037268400192260742, -0.0035829544067382812, -0.0034390687942504883, -0.0032951831817626953, -0.0031512975692749023, -0.0030074119567871094, -0.0028635263442993164, -0.0027196407318115234, -0.0025757551193237305, -0.0024318695068359375, -0.0022879838943481445, -0.0021440982818603516, -0.0020002126693725586, -0.0018563270568847656, -0.0017124414443969727, -0.0015685558319091797, -0.0014246702194213867, -0.0012807846069335938, -0.0011368989944458008, -0.0009930133819580078, -0.0008491277694702148, -0.0007052421569824219, -0.0005613565444946289, -0.00041747093200683594, -0.00027358531951904297, -0.00012969970703125, 1.4185905456542969e-05, 0.00015807151794433594, 0.0003019571304321289, 0.0004458427429199219, 0.0005897283554077148, 0.0007336139678955078, 0.0008774995803833008, 0.0010213851928710938, 0.0011652708053588867, 0.0013091564178466797, 0.0014530420303344727, 0.0015969276428222656, 0.0017408132553100586, 0.0018846988677978516, 0.0020285844802856445, 0.0021724700927734375, 0.0023163557052612305, 0.0024602413177490234, 0.0026041269302368164, 0.0027480125427246094, 0.0028918981552124023, 0.0030357837677001953, 0.0031796693801879883, 0.0033235549926757812, 0.0034674406051635742, 0.003611326217651367, 0.00375521183013916, 0.003899097442626953, 0.004042983055114746, 0.004186868667602539, 0.004330754280090332, 0.004474639892578125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 4.0, 12.0, 9.0, 7.0, 9.0, 18.0, 18.0, 13.0, 26.0, 26.0, 25.0, 27.0, 30.0, 31.0, 39.0, 37.0, 39.0, 37.0, 35.0, 39.0, 43.0, 46.0, 29.0, 43.0, 43.0, 39.0, 33.0, 24.0, 29.0, 22.0, 25.0, 15.0, 16.0, 15.0, 21.0, 12.0, 15.0, 10.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00551605224609375, -0.005340456962585449, -0.0051648616790771484, -0.004989266395568848, -0.004813671112060547, -0.004638075828552246, -0.004462480545043945, -0.0042868852615356445, -0.004111289978027344, -0.003935694694519043, -0.003760099411010742, -0.0035845041275024414, -0.0034089088439941406, -0.00323331356048584, -0.003057718276977539, -0.0028821229934692383, -0.0027065277099609375, -0.0025309324264526367, -0.002355337142944336, -0.002179741859436035, -0.0020041465759277344, -0.0018285512924194336, -0.0016529560089111328, -0.001477360725402832, -0.0013017654418945312, -0.0011261701583862305, -0.0009505748748779297, -0.0007749795913696289, -0.0005993843078613281, -0.00042378902435302734, -0.00024819374084472656, -7.259845733642578e-05, 0.000102996826171875, 0.0002785921096801758, 0.00045418739318847656, 0.0006297826766967773, 0.0008053779602050781, 0.000980973243713379, 0.0011565685272216797, 0.0013321638107299805, 0.0015077590942382812, 0.001683354377746582, 0.0018589496612548828, 0.0020345449447631836, 0.0022101402282714844, 0.002385735511779785, 0.002561330795288086, 0.0027369260787963867, 0.0029125213623046875, 0.0030881166458129883, 0.003263711929321289, 0.00343930721282959, 0.0036149024963378906, 0.0037904977798461914, 0.003966093063354492, 0.004141688346862793, 0.004317283630371094, 0.0044928789138793945, 0.004668474197387695, 0.004844069480895996, 0.005019664764404297, 0.005195260047912598, 0.0053708553314208984, 0.005546450614929199, 0.0057220458984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 6.0, 8.0, 9.0, 15.0, 29.0, 42.0, 69.0, 88.0, 107.0, 192.0, 322.0, 506.0, 813.0, 1386.0, 2479.0, 4605.0, 9084.0, 20114.0, 51921.0, 203204.0, 598990.0, 94981.0, 31718.0, 13287.0, 6521.0, 3341.0, 1848.0, 1092.0, 628.0, 383.0, 259.0, 165.0, 114.0, 69.0, 46.0, 26.0, 25.0, 18.0, 12.0, 13.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002465248107910156, -0.000238882377743721, -0.0002312399446964264, -0.00022359751164913177, -0.00021595507860183716, -0.00020831264555454254, -0.00020067021250724792, -0.0001930277794599533, -0.0001853853464126587, -0.00017774291336536407, -0.00017010048031806946, -0.00016245804727077484, -0.00015481561422348022, -0.0001471731811761856, -0.000139530748128891, -0.00013188831508159637, -0.00012424588203430176, -0.00011660344898700714, -0.00010896101593971252, -0.00010131858289241791, -9.367614984512329e-05, -8.603371679782867e-05, -7.839128375053406e-05, -7.074885070323944e-05, -6.310641765594482e-05, -5.546398460865021e-05, -4.782155156135559e-05, -4.0179118514060974e-05, -3.253668546676636e-05, -2.489425241947174e-05, -1.7251819372177124e-05, -9.609386324882507e-06, -1.9669532775878906e-06, 5.675479769706726e-06, 1.3317912817001343e-05, 2.096034586429596e-05, 2.8602778911590576e-05, 3.624521195888519e-05, 4.388764500617981e-05, 5.1530078053474426e-05, 5.917251110076904e-05, 6.681494414806366e-05, 7.445737719535828e-05, 8.209981024265289e-05, 8.974224328994751e-05, 9.738467633724213e-05, 0.00010502710938453674, 0.00011266954243183136, 0.00012031197547912598, 0.0001279544085264206, 0.0001355968415737152, 0.00014323927462100983, 0.00015088170766830444, 0.00015852414071559906, 0.00016616657376289368, 0.0001738090068101883, 0.0001814514398574829, 0.00018909387290477753, 0.00019673630595207214, 0.00020437873899936676, 0.00021202117204666138, 0.000219663605093956, 0.0002273060381412506, 0.00023494847118854523, 0.00024259090423583984]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 5.0, 4.0, 5.0, 2.0, 5.0, 6.0, 14.0, 7.0, 11.0, 19.0, 14.0, 23.0, 40.0, 48.0, 47.0, 54.0, 79.0, 60.0, 67.0, 70.0, 65.0, 62.0, 41.0, 44.0, 37.0, 28.0, 25.0, 14.0, 12.0, 20.0, 16.0, 6.0, 11.0, 6.0, 2.0, 4.0, 4.0, 3.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.239776611328125e-05, -1.2001022696495056e-05, -1.1604279279708862e-05, -1.1207535862922668e-05, -1.0810792446136475e-05, -1.041404902935028e-05, -1.0017305612564087e-05, -9.620562195777893e-06, -9.2238187789917e-06, -8.827075362205505e-06, -8.430331945419312e-06, -8.033588528633118e-06, -7.636845111846924e-06, -7.24010169506073e-06, -6.843358278274536e-06, -6.446614861488342e-06, -6.0498714447021484e-06, -5.653128027915955e-06, -5.256384611129761e-06, -4.859641194343567e-06, -4.462897777557373e-06, -4.066154360771179e-06, -3.6694109439849854e-06, -3.2726675271987915e-06, -2.8759241104125977e-06, -2.479180693626404e-06, -2.08243727684021e-06, -1.6856938600540161e-06, -1.2889504432678223e-06, -8.922070264816284e-07, -4.954636096954346e-07, -9.872019290924072e-08, 2.980232238769531e-07, 6.94766640663147e-07, 1.0915100574493408e-06, 1.4882534742355347e-06, 1.8849968910217285e-06, 2.2817403078079224e-06, 2.678483724594116e-06, 3.07522714138031e-06, 3.471970558166504e-06, 3.868713974952698e-06, 4.265457391738892e-06, 4.6622008085250854e-06, 5.058944225311279e-06, 5.455687642097473e-06, 5.852431058883667e-06, 6.249174475669861e-06, 6.645917892456055e-06, 7.0426613092422485e-06, 7.439404726028442e-06, 7.836148142814636e-06, 8.23289155960083e-06, 8.629634976387024e-06, 9.026378393173218e-06, 9.423121809959412e-06, 9.819865226745605e-06, 1.02166086435318e-05, 1.0613352060317993e-05, 1.1010095477104187e-05, 1.1406838893890381e-05, 1.1803582310676575e-05, 1.2200325727462769e-05, 1.2597069144248962e-05, 1.2993812561035156e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 1.0, 11.0, 17.0, 17.0, 28.0, 36.0, 69.0, 207.0, 1028.0, 17600.0, 1005358.0, 22575.0, 1174.0, 221.0, 63.0, 37.0, 20.0, 22.0, 15.0, 10.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0014677047729492188, -0.001422584056854248, -0.0013774633407592773, -0.0013323426246643066, -0.001287221908569336, -0.0012421011924743652, -0.0011969804763793945, -0.0011518597602844238, -0.0011067390441894531, -0.0010616183280944824, -0.0010164976119995117, -0.000971376895904541, -0.0009262561798095703, -0.0008811354637145996, -0.0008360147476196289, -0.0007908940315246582, -0.0007457733154296875, -0.0007006525993347168, -0.0006555318832397461, -0.0006104111671447754, -0.0005652904510498047, -0.000520169734954834, -0.0004750490188598633, -0.0004299283027648926, -0.0003848075866699219, -0.00033968687057495117, -0.00029456615447998047, -0.00024944543838500977, -0.00020432472229003906, -0.00015920400619506836, -0.00011408329010009766, -6.896257400512695e-05, -2.384185791015625e-05, 2.1278858184814453e-05, 6.639957427978516e-05, 0.00011152029037475586, 0.00015664100646972656, 0.00020176172256469727, 0.00024688243865966797, 0.00029200315475463867, 0.0003371238708496094, 0.0003822445869445801, 0.0004273653030395508, 0.0004724860191345215, 0.0005176067352294922, 0.0005627274513244629, 0.0006078481674194336, 0.0006529688835144043, 0.000698089599609375, 0.0007432103157043457, 0.0007883310317993164, 0.0008334517478942871, 0.0008785724639892578, 0.0009236931800842285, 0.0009688138961791992, 0.00101393461227417, 0.0010590553283691406, 0.0011041760444641113, 0.001149296760559082, 0.0011944174766540527, 0.0012395381927490234, 0.0012846589088439941, 0.0013297796249389648, 0.0013749003410339355, 0.0014200210571289062]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 8.0, 5.0, 9.0, 18.0, 12.0, 39.0, 29.0, 50.0, 71.0, 72.0, 135.0, 133.0, 102.0, 81.0, 59.0, 51.0, 27.0, 19.0, 18.0, 19.0, 7.0, 8.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5299530029296875e-05, -4.379637539386749e-05, -4.229322075843811e-05, -4.079006612300873e-05, -3.9286911487579346e-05, -3.778375685214996e-05, -3.628060221672058e-05, -3.47774475812912e-05, -3.3274292945861816e-05, -3.1771138310432434e-05, -3.0267983675003052e-05, -2.876482903957367e-05, -2.7261674404144287e-05, -2.5758519768714905e-05, -2.4255365133285522e-05, -2.275221049785614e-05, -2.1249055862426758e-05, -1.9745901226997375e-05, -1.8242746591567993e-05, -1.673959195613861e-05, -1.5236437320709229e-05, -1.3733282685279846e-05, -1.2230128049850464e-05, -1.0726973414421082e-05, -9.2238187789917e-06, -7.720664143562317e-06, -6.2175095081329346e-06, -4.714354872703552e-06, -3.21120023727417e-06, -1.7080456018447876e-06, -2.0489096641540527e-07, 1.298263669013977e-06, 2.8014183044433594e-06, 4.304572939872742e-06, 5.807727575302124e-06, 7.310882210731506e-06, 8.814036846160889e-06, 1.0317191481590271e-05, 1.1820346117019653e-05, 1.3323500752449036e-05, 1.4826655387878418e-05, 1.63298100233078e-05, 1.7832964658737183e-05, 1.9336119294166565e-05, 2.0839273929595947e-05, 2.234242856502533e-05, 2.3845583200454712e-05, 2.5348737835884094e-05, 2.6851892471313477e-05, 2.835504710674286e-05, 2.985820174217224e-05, 3.1361356377601624e-05, 3.2864511013031006e-05, 3.436766564846039e-05, 3.587082028388977e-05, 3.737397491931915e-05, 3.8877129554748535e-05, 4.038028419017792e-05, 4.18834388256073e-05, 4.338659346103668e-05, 4.4889748096466064e-05, 4.639290273189545e-05, 4.789605736732483e-05, 4.939921200275421e-05, 5.0902366638183594e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 1.0, 5.0, 5.0, 4.0, 10.0, 8.0, 14.0, 19.0, 18.0, 27.0, 24.0, 38.0, 32.0, 51.0, 57.0, 81.0, 76.0, 77.0, 67.0, 71.0, 53.0, 51.0, 50.0, 33.0, 27.0, 21.0, 20.0, 13.0, 5.0, 8.0, 8.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.010797964408993721, -0.010474925860762596, -0.010151887312531471, -0.009828848764300346, -0.009505810216069221, -0.009182771667838097, -0.008859733119606972, -0.008536694571375847, -0.008213656023144722, -0.007890617474913597, -0.007567578926682472, -0.007244540378451347, -0.0069215018302202225, -0.006598463281989098, -0.00627542519941926, -0.005952386651188135, -0.005629348568618298, -0.005306310020387173, -0.004983271472156048, -0.004660232923924923, -0.004337194375693798, -0.004014155827462673, -0.0036911177448928356, -0.0033680791966617107, -0.003045040648430586, -0.002722002100199461, -0.002398963551968336, -0.002075925236567855, -0.00175288668833673, -0.0014298481401056051, -0.001106809708289802, -0.000783771276473999, -0.00046073272824287415, -0.00013769423821941018, 0.00018534425180405378, 0.0005083827418275177, 0.0008314212318509817, 0.0011544597800821066, 0.0014774982118979096, 0.0018005366437137127, 0.0021235751919448376, 0.0024466137401759624, 0.0027696522884070873, 0.0030926906038075686, 0.0034157291520386934, 0.0037387677002698183, 0.0040618060156702995, 0.004384844563901424, 0.004707883112132549, 0.005030921660363674, 0.005353960208594799, 0.005676998756825924, 0.006000037305057049, 0.006323075853288174, 0.006646113935858011, 0.006969152484089136, 0.007292191032320261, 0.007615229580551386, 0.007938267663121223, 0.008261306211352348, 0.008584344759583473, 0.008907383307814598, 0.009230421856045723, 0.009553460404276848, 0.009876498952507973]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 6.0, 5.0, 5.0, 9.0, 15.0, 11.0, 14.0, 12.0, 23.0, 19.0, 21.0, 25.0, 35.0, 25.0, 46.0, 39.0, 42.0, 41.0, 54.0, 50.0, 42.0, 36.0, 40.0, 37.0, 38.0, 45.0, 40.0, 37.0, 25.0, 32.0, 32.0, 19.0, 20.0, 17.0, 12.0, 6.0, 9.0, 7.0, 8.0, 5.0, 2.0, 3.0, 3.0, 3.0], "bins": [-0.011580615304410458, -0.011293569579720497, -0.011006522923707962, -0.010719476267695427, -0.010432430543005466, -0.010145384818315506, -0.009858338162302971, -0.009571291506290436, -0.009284245781600475, -0.008997200056910515, -0.00871015340089798, -0.008423106744885445, -0.008136061020195484, -0.007849015295505524, -0.007561968639492989, -0.007274922449141741, -0.006987876258790493, -0.006700830068439245, -0.0064137838780879974, -0.00612673768773675, -0.005839691497385502, -0.005552645307034254, -0.005265599116683006, -0.0049785529263317585, -0.004691506735980511, -0.004404460545629263, -0.004117414355278015, -0.0038303681649267673, -0.0035433219745755196, -0.0032562757842242718, -0.002969229593873024, -0.002682183403521776, -0.002395136281847954, -0.002108090091496706, -0.0018210439011454582, -0.0015339977107942104, -0.0012469515204429626, -0.0009599053300917149, -0.0006728591397404671, -0.0003858129493892193, -9.87667590379715e-05, 0.0001882794313132763, 0.0004753256216645241, 0.0007623718120157719, 0.0010494180023670197, 0.0013364641927182674, 0.0016235103830695152, 0.001910556573420763, 0.002197602763772011, 0.0024846489541232586, 0.0027716951444745064, 0.003058741334825754, 0.003345787525177002, 0.0036328337155282497, 0.0039198799058794975, 0.004206926096230745, 0.004493972286581993, 0.004781018476933241, 0.005068064667284489, 0.0053551108576357365, 0.005642157047986984, 0.005929203238338232, 0.00621624942868948, 0.006503295619040728, 0.006790341809391975]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 9.0, 11.0, 8.0, 11.0, 14.0, 18.0, 15.0, 18.0, 21.0, 21.0, 31.0, 39.0, 49.0, 142.0, 395.0, 1695.0, 7670.0, 38568.0, 209094.0, 560260.0, 186966.0, 34374.0, 6828.0, 1510.0, 386.0, 113.0, 54.0, 33.0, 32.0, 20.0, 21.0, 15.0, 13.0, 13.0, 16.0, 17.0, 7.0, 11.0, 5.0, 7.0, 7.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.05841064453125, -0.056554317474365234, -0.05469799041748047, -0.0528416633605957, -0.05098533630371094, -0.04912900924682617, -0.047272682189941406, -0.04541635513305664, -0.043560028076171875, -0.04170370101928711, -0.039847373962402344, -0.03799104690551758, -0.03613471984863281, -0.03427839279174805, -0.03242206573486328, -0.030565738677978516, -0.02870941162109375, -0.026853084564208984, -0.02499675750732422, -0.023140430450439453, -0.021284103393554688, -0.019427776336669922, -0.017571449279785156, -0.01571512222290039, -0.013858795166015625, -0.01200246810913086, -0.010146141052246094, -0.008289813995361328, -0.0064334869384765625, -0.004577159881591797, -0.0027208328247070312, -0.0008645057678222656, 0.0009918212890625, 0.0028481483459472656, 0.004704475402832031, 0.006560802459716797, 0.008417129516601562, 0.010273456573486328, 0.012129783630371094, 0.01398611068725586, 0.015842437744140625, 0.01769876480102539, 0.019555091857910156, 0.021411418914794922, 0.023267745971679688, 0.025124073028564453, 0.02698040008544922, 0.028836727142333984, 0.03069305419921875, 0.032549381256103516, 0.03440570831298828, 0.03626203536987305, 0.03811836242675781, 0.03997468948364258, 0.041831016540527344, 0.04368734359741211, 0.045543670654296875, 0.04739999771118164, 0.049256324768066406, 0.05111265182495117, 0.05296897888183594, 0.0548253059387207, 0.05668163299560547, 0.058537960052490234, 0.060394287109375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 8.0, 11.0, 15.0, 32.0, 34.0, 45.0, 60.0, 71.0, 81.0, 91.0, 88.0, 81.0, 75.0, 101.0, 60.0, 53.0, 30.0, 24.0, 20.0, 19.0, 6.0, 4.0, 4.0, 1.0], "bins": [-0.03192138671875, -0.031290411949157715, -0.03065943717956543, -0.030028462409973145, -0.02939748764038086, -0.028766512870788574, -0.02813553810119629, -0.027504563331604004, -0.02687358856201172, -0.026242613792419434, -0.02561163902282715, -0.024980664253234863, -0.024349689483642578, -0.023718714714050293, -0.023087739944458008, -0.022456765174865723, -0.021825790405273438, -0.021194815635681152, -0.020563840866088867, -0.019932866096496582, -0.019301891326904297, -0.01867091655731201, -0.018039941787719727, -0.01740896701812744, -0.016777992248535156, -0.01614701747894287, -0.015516042709350586, -0.0148850679397583, -0.014254093170166016, -0.01362311840057373, -0.012992143630981445, -0.01236116886138916, -0.011730194091796875, -0.01109921932220459, -0.010468244552612305, -0.00983726978302002, -0.009206295013427734, -0.00857532024383545, -0.007944345474243164, -0.007313370704650879, -0.006682395935058594, -0.006051421165466309, -0.0054204463958740234, -0.004789471626281738, -0.004158496856689453, -0.003527522087097168, -0.002896547317504883, -0.0022655725479125977, -0.0016345977783203125, -0.0010036230087280273, -0.0003726482391357422, 0.00025832653045654297, 0.0008893013000488281, 0.0015202760696411133, 0.0021512508392333984, 0.0027822256088256836, 0.0034132003784179688, 0.004044175148010254, 0.004675149917602539, 0.005306124687194824, 0.005937099456787109, 0.0065680742263793945, 0.00719904899597168, 0.007830023765563965, 0.00846099853515625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 11.0, 9.0, 14.0, 15.0, 22.0, 22.0, 17.0, 27.0, 24.0, 31.0, 35.0, 34.0, 64.0, 238.0, 1691.0, 15897.0, 178065.0, 709702.0, 129259.0, 11553.0, 1311.0, 185.0, 51.0, 38.0, 27.0, 33.0, 25.0, 24.0, 18.0, 18.0, 11.0, 12.0, 12.0, 10.0, 11.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08197021484375, -0.07944297790527344, -0.07691574096679688, -0.07438850402832031, -0.07186126708984375, -0.06933403015136719, -0.06680679321289062, -0.06427955627441406, -0.0617523193359375, -0.05922508239746094, -0.056697845458984375, -0.05417060852050781, -0.05164337158203125, -0.04911613464355469, -0.046588897705078125, -0.04406166076660156, -0.041534423828125, -0.03900718688964844, -0.036479949951171875, -0.03395271301269531, -0.03142547607421875, -0.028898239135742188, -0.026371002197265625, -0.023843765258789062, -0.0213165283203125, -0.018789291381835938, -0.016262054443359375, -0.013734817504882812, -0.01120758056640625, -0.008680343627929688, -0.006153106689453125, -0.0036258697509765625, -0.0010986328125, 0.0014286041259765625, 0.003955841064453125, 0.0064830780029296875, 0.00901031494140625, 0.011537551879882812, 0.014064788818359375, 0.016592025756835938, 0.0191192626953125, 0.021646499633789062, 0.024173736572265625, 0.026700973510742188, 0.02922821044921875, 0.03175544738769531, 0.034282684326171875, 0.03680992126464844, 0.039337158203125, 0.04186439514160156, 0.044391632080078125, 0.04691886901855469, 0.04944610595703125, 0.05197334289550781, 0.054500579833984375, 0.05702781677246094, 0.0595550537109375, 0.06208229064941406, 0.06460952758789062, 0.06713676452636719, 0.06966400146484375, 0.07219123840332031, 0.07471847534179688, 0.07724571228027344, 0.07977294921875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 9.0, 6.0, 9.0, 4.0, 9.0, 12.0, 11.0, 22.0, 21.0, 23.0, 21.0, 38.0, 31.0, 32.0, 43.0, 45.0, 50.0, 49.0, 44.0, 41.0, 50.0, 45.0, 45.0, 48.0, 35.0, 31.0, 33.0, 32.0, 27.0, 23.0, 20.0, 17.0, 17.0, 8.0, 13.0, 11.0, 8.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00760650634765625, -0.007355213165283203, -0.007103919982910156, -0.006852626800537109, -0.0066013336181640625, -0.006350040435791016, -0.006098747253417969, -0.005847454071044922, -0.005596160888671875, -0.005344867706298828, -0.005093574523925781, -0.004842281341552734, -0.0045909881591796875, -0.004339694976806641, -0.004088401794433594, -0.003837108612060547, -0.0035858154296875, -0.003334522247314453, -0.0030832290649414062, -0.0028319358825683594, -0.0025806427001953125, -0.0023293495178222656, -0.0020780563354492188, -0.0018267631530761719, -0.001575469970703125, -0.0013241767883300781, -0.0010728836059570312, -0.0008215904235839844, -0.0005702972412109375, -0.0003190040588378906, -6.771087646484375e-05, 0.00018358230590820312, 0.00043487548828125, 0.0006861686706542969, 0.0009374618530273438, 0.0011887550354003906, 0.0014400482177734375, 0.0016913414001464844, 0.0019426345825195312, 0.002193927764892578, 0.002445220947265625, 0.002696514129638672, 0.0029478073120117188, 0.0031991004943847656, 0.0034503936767578125, 0.0037016868591308594, 0.003952980041503906, 0.004204273223876953, 0.00445556640625, 0.004706859588623047, 0.004958152770996094, 0.005209445953369141, 0.0054607391357421875, 0.005712032318115234, 0.005963325500488281, 0.006214618682861328, 0.006465911865234375, 0.006717205047607422, 0.006968498229980469, 0.007219791412353516, 0.0074710845947265625, 0.007722377777099609, 0.007973670959472656, 0.008224964141845703, 0.00847625732421875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 5.0, 3.0, 8.0, 11.0, 20.0, 18.0, 20.0, 27.0, 41.0, 45.0, 72.0, 104.0, 107.0, 150.0, 201.0, 325.0, 609.0, 1011.0, 1865.0, 3882.0, 9347.0, 31691.0, 821913.0, 143905.0, 19702.0, 6626.0, 2989.0, 1475.0, 830.0, 451.0, 301.0, 229.0, 134.0, 104.0, 62.0, 62.0, 43.0, 46.0, 20.0, 16.0, 15.0, 19.0, 14.0, 8.0, 5.0, 5.0, 6.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.005756378173828125, -0.005586206912994385, -0.0054160356521606445, -0.005245864391326904, -0.005075693130493164, -0.004905521869659424, -0.004735350608825684, -0.004565179347991943, -0.004395008087158203, -0.004224836826324463, -0.004054665565490723, -0.0038844943046569824, -0.003714323043823242, -0.003544151782989502, -0.0033739805221557617, -0.0032038092613220215, -0.0030336380004882812, -0.002863466739654541, -0.0026932954788208008, -0.0025231242179870605, -0.0023529529571533203, -0.00218278169631958, -0.00201261043548584, -0.0018424391746520996, -0.0016722679138183594, -0.0015020966529846191, -0.001331925392150879, -0.0011617541313171387, -0.0009915828704833984, -0.0008214116096496582, -0.000651240348815918, -0.00048106908798217773, -0.0003108978271484375, -0.00014072656631469727, 2.944469451904297e-05, 0.0001996159553527832, 0.00036978721618652344, 0.0005399584770202637, 0.0007101297378540039, 0.0008803009986877441, 0.0010504722595214844, 0.0012206435203552246, 0.0013908147811889648, 0.001560986042022705, 0.0017311573028564453, 0.0019013285636901855, 0.0020714998245239258, 0.002241671085357666, 0.0024118423461914062, 0.0025820136070251465, 0.0027521848678588867, 0.002922356128692627, 0.003092527389526367, 0.0032626986503601074, 0.0034328699111938477, 0.003603041172027588, 0.003773212432861328, 0.003943383693695068, 0.004113554954528809, 0.004283726215362549, 0.004453897476196289, 0.004624068737030029, 0.0047942399978637695, 0.00496441125869751, 0.00513458251953125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 12.0, 12.0, 17.0, 28.0, 29.0, 40.0, 47.0, 64.0, 102.0, 95.0, 89.0, 95.0, 73.0, 83.0, 40.0, 36.0, 30.0, 30.0, 13.0, 8.0, 11.0, 9.0, 7.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.450580596923828e-06, -7.199123501777649e-06, -6.94766640663147e-06, -6.6962093114852905e-06, -6.444752216339111e-06, -6.193295121192932e-06, -5.941838026046753e-06, -5.690380930900574e-06, -5.4389238357543945e-06, -5.187466740608215e-06, -4.936009645462036e-06, -4.684552550315857e-06, -4.433095455169678e-06, -4.1816383600234985e-06, -3.930181264877319e-06, -3.67872416973114e-06, -3.427267074584961e-06, -3.1758099794387817e-06, -2.9243528842926025e-06, -2.6728957891464233e-06, -2.421438694000244e-06, -2.169981598854065e-06, -1.9185245037078857e-06, -1.6670674085617065e-06, -1.4156103134155273e-06, -1.1641532182693481e-06, -9.126961231231689e-07, -6.612390279769897e-07, -4.0978193283081055e-07, -1.5832483768463135e-07, 9.313225746154785e-08, 3.4458935260772705e-07, 5.960464477539062e-07, 8.475035429000854e-07, 1.0989606380462646e-06, 1.3504177331924438e-06, 1.601874828338623e-06, 1.8533319234848022e-06, 2.1047890186309814e-06, 2.3562461137771606e-06, 2.60770320892334e-06, 2.859160304069519e-06, 3.1106173992156982e-06, 3.3620744943618774e-06, 3.6135315895080566e-06, 3.864988684654236e-06, 4.116445779800415e-06, 4.367902874946594e-06, 4.6193599700927734e-06, 4.870817065238953e-06, 5.122274160385132e-06, 5.373731255531311e-06, 5.62518835067749e-06, 5.8766454458236694e-06, 6.128102540969849e-06, 6.379559636116028e-06, 6.631016731262207e-06, 6.882473826408386e-06, 7.1339309215545654e-06, 7.385388016700745e-06, 7.636845111846924e-06, 7.888302206993103e-06, 8.139759302139282e-06, 8.391216397285461e-06, 8.64267349243164e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 6.0, 10.0, 14.0, 15.0, 72.0, 484.0, 3511.0, 47978.0, 982347.0, 12421.0, 1368.0, 218.0, 30.0, 11.0, 6.0, 9.0, 7.0, 3.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016754150390625, -0.01621842384338379, -0.015682697296142578, -0.015146970748901367, -0.014611244201660156, -0.014075517654418945, -0.013539791107177734, -0.013004064559936523, -0.012468338012695312, -0.011932611465454102, -0.01139688491821289, -0.01086115837097168, -0.010325431823730469, -0.009789705276489258, -0.009253978729248047, -0.008718252182006836, -0.008182525634765625, -0.007646799087524414, -0.007111072540283203, -0.006575345993041992, -0.006039619445800781, -0.00550389289855957, -0.004968166351318359, -0.0044324398040771484, -0.0038967132568359375, -0.0033609867095947266, -0.0028252601623535156, -0.0022895336151123047, -0.0017538070678710938, -0.0012180805206298828, -0.0006823539733886719, -0.00014662742614746094, 0.00038909912109375, 0.0009248256683349609, 0.0014605522155761719, 0.001996278762817383, 0.0025320053100585938, 0.0030677318572998047, 0.0036034584045410156, 0.0041391849517822266, 0.0046749114990234375, 0.0052106380462646484, 0.005746364593505859, 0.00628209114074707, 0.006817817687988281, 0.007353544235229492, 0.007889270782470703, 0.008424997329711914, 0.008960723876953125, 0.009496450424194336, 0.010032176971435547, 0.010567903518676758, 0.011103630065917969, 0.01163935661315918, 0.01217508316040039, 0.012710809707641602, 0.013246536254882812, 0.013782262802124023, 0.014317989349365234, 0.014853715896606445, 0.015389442443847656, 0.015925168991088867, 0.016460895538330078, 0.01699662208557129, 0.0175323486328125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 9.0, 11.0, 4.0, 8.0, 10.0, 26.0, 33.0, 106.0, 397.0, 211.0, 52.0, 31.0, 18.0, 12.0, 14.0, 7.0, 7.0, 8.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015087127685546875, -0.001462593674659729, -0.0014164745807647705, -0.001370355486869812, -0.0013242363929748535, -0.001278117299079895, -0.0012319982051849365, -0.001185879111289978, -0.0011397600173950195, -0.001093640923500061, -0.0010475218296051025, -0.001001402735710144, -0.0009552836418151855, -0.000909164547920227, -0.0008630454540252686, -0.0008169263601303101, -0.0007708072662353516, -0.0007246881723403931, -0.0006785690784454346, -0.0006324499845504761, -0.0005863308906555176, -0.0005402117967605591, -0.0004940927028656006, -0.0004479736089706421, -0.0004018545150756836, -0.0003557354211807251, -0.0003096163272857666, -0.0002634972333908081, -0.0002173781394958496, -0.0001712590456008911, -0.00012513995170593262, -7.902085781097412e-05, -3.2901763916015625e-05, 1.3217329978942871e-05, 5.933642387390137e-05, 0.00010545551776885986, 0.00015157461166381836, 0.00019769370555877686, 0.00024381279945373535, 0.00028993189334869385, 0.00033605098724365234, 0.00038217008113861084, 0.00042828917503356934, 0.00047440826892852783, 0.0005205273628234863, 0.0005666464567184448, 0.0006127655506134033, 0.0006588846445083618, 0.0007050037384033203, 0.0007511228322982788, 0.0007972419261932373, 0.0008433610200881958, 0.0008894801139831543, 0.0009355992078781128, 0.0009817183017730713, 0.0010278373956680298, 0.0010739564895629883, 0.0011200755834579468, 0.0011661946773529053, 0.0012123137712478638, 0.0012584328651428223, 0.0013045519590377808, 0.0013506710529327393, 0.0013967901468276978, 0.0014429092407226562]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 14.0, 21.0, 29.0, 44.0, 76.0, 88.0, 124.0, 165.0, 146.0, 108.0, 65.0, 44.0, 37.0, 14.0, 9.0, 4.0, 6.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025207070633769035, -0.024584876373410225, -0.023962680250406265, -0.023340485990047455, -0.022718291729688644, -0.022096097469329834, -0.021473901346325874, -0.020851707085967064, -0.020229510962963104, -0.019607316702604294, -0.018985120579600334, -0.018362926319241524, -0.017740732058882713, -0.017118535935878754, -0.016496341675519943, -0.015874147415161133, -0.015251953154802322, -0.014629757963120937, -0.014007563702762127, -0.013385368511080742, -0.012763174250721931, -0.012140979059040546, -0.011518783867359161, -0.010896589607000351, -0.010274394415318966, -0.009652199223637581, -0.00903000496327877, -0.008407809771597385, -0.007785615045577288, -0.00716342031955719, -0.006541225127875805, -0.005919030401855707, -0.005296834744513035, -0.004674640018492937, -0.004052445292472839, -0.0034302501007914543, -0.0028080553747713566, -0.002185860648751259, -0.0015636656899005175, -0.0009414707310497761, -0.00031927600502967834, 0.0003029188374057412, 0.0009251136798411608, 0.0015473085222765803, 0.002169503364712, 0.0027916980907320976, 0.003413893049582839, 0.00403608800843358, 0.004658282734453678, 0.005280477460473776, 0.005902672186493874, 0.006524867378175259, 0.007147062104195356, 0.007769256830215454, 0.00839145202189684, 0.009013647213578224, 0.009635841473937035, 0.01025803666561842, 0.01088023092597723, 0.011502426117658615, 0.012124620378017426, 0.01274681556969881, 0.013369010761380196, 0.013991205021739006, 0.014613400213420391]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 5.0, 2.0, 12.0, 15.0, 13.0, 20.0, 37.0, 47.0, 50.0, 72.0, 61.0, 66.0, 84.0, 71.0, 99.0, 58.0, 65.0, 46.0, 50.0, 38.0, 40.0, 21.0, 16.0, 6.0, 7.0, 6.0, 3.0, 5.0], "bins": [-0.026590803638100624, -0.02605682797729969, -0.025522852316498756, -0.024988876655697823, -0.02445490099489689, -0.023920925334095955, -0.02338694967329502, -0.022852975875139236, -0.022319000214338303, -0.02178502455353737, -0.021251048892736435, -0.0207170732319355, -0.020183097571134567, -0.019649121910333633, -0.0191151462495327, -0.018581170588731766, -0.018047194927930832, -0.017513219267129898, -0.016979243606328964, -0.01644526794552803, -0.015911292284727097, -0.015377316623926163, -0.014843341894447803, -0.01430936623364687, -0.013775390572845936, -0.013241414912045002, -0.012707439251244068, -0.012173463590443134, -0.011639488860964775, -0.011105513200163841, -0.010571537539362907, -0.010037561878561974, -0.009503587149083614, -0.00896961148828268, -0.008435635827481747, -0.007901660166680813, -0.007367684971541166, -0.0068337093107402325, -0.006299734115600586, -0.005765758454799652, -0.005231782793998718, -0.004697807133197784, -0.004163831472396851, -0.003629856277257204, -0.0030958806164562702, -0.0025619049556553364, -0.002027929527685046, -0.001493954099714756, -0.0009599784389138222, -0.00042600289452821016, 0.00010797264985740185, 0.0006419481942430139, 0.0011759237386286259, 0.0017098993994295597, 0.00224387482739985, 0.00277785025537014, 0.003311825916171074, 0.0038458015769720078, 0.004379777237772942, 0.004913752432912588, 0.005447728093713522, 0.005981703754514456, 0.006515678949654102, 0.007049654610455036, 0.00758363027125597]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 11.0, 20.0, 20.0, 43.0, 65.0, 96.0, 162.0, 315.0, 619.0, 1330.0, 4356.0, 297729.0, 3841006.0, 43147.0, 2982.0, 1178.0, 525.0, 282.0, 158.0, 95.0, 62.0, 23.0, 24.0, 13.0, 4.0, 4.0, 6.0, 3.0, 2.0, 1.0], "bins": [-0.04449462890625, -0.043534278869628906, -0.04257392883300781, -0.04161357879638672, -0.040653228759765625, -0.03969287872314453, -0.03873252868652344, -0.037772178649902344, -0.03681182861328125, -0.035851478576660156, -0.03489112854003906, -0.03393077850341797, -0.032970428466796875, -0.03201007843017578, -0.031049728393554688, -0.030089378356933594, -0.0291290283203125, -0.028168678283691406, -0.027208328247070312, -0.02624797821044922, -0.025287628173828125, -0.02432727813720703, -0.023366928100585938, -0.022406578063964844, -0.02144622802734375, -0.020485877990722656, -0.019525527954101562, -0.01856517791748047, -0.017604827880859375, -0.01664447784423828, -0.015684127807617188, -0.014723777770996094, -0.013763427734375, -0.012803077697753906, -0.011842727661132812, -0.010882377624511719, -0.009922027587890625, -0.008961677551269531, -0.008001327514648438, -0.007040977478027344, -0.00608062744140625, -0.005120277404785156, -0.0041599273681640625, -0.0031995773315429688, -0.002239227294921875, -0.0012788772583007812, -0.0003185272216796875, 0.0006418228149414062, 0.0016021728515625, 0.0025625228881835938, 0.0035228729248046875, 0.004483222961425781, 0.005443572998046875, 0.006403923034667969, 0.0073642730712890625, 0.008324623107910156, 0.00928497314453125, 0.010245323181152344, 0.011205673217773438, 0.012166023254394531, 0.013126373291015625, 0.014086723327636719, 0.015047073364257812, 0.016007423400878906, 0.0169677734375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 13.0, 4.0, 13.0, 14.0, 18.0, 23.0, 38.0, 37.0, 35.0, 55.0, 43.0, 51.0, 56.0, 65.0, 50.0, 64.0, 63.0, 47.0, 52.0, 45.0, 46.0, 24.0, 30.0, 27.0, 21.0, 17.0, 12.0, 9.0, 14.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01529693603515625, -0.014876246452331543, -0.014455556869506836, -0.014034867286682129, -0.013614177703857422, -0.013193488121032715, -0.012772798538208008, -0.0123521089553833, -0.011931419372558594, -0.011510729789733887, -0.01109004020690918, -0.010669350624084473, -0.010248661041259766, -0.009827971458435059, -0.009407281875610352, -0.008986592292785645, -0.008565902709960938, -0.00814521312713623, -0.0077245235443115234, -0.007303833961486816, -0.006883144378662109, -0.006462454795837402, -0.006041765213012695, -0.005621075630187988, -0.005200386047363281, -0.004779696464538574, -0.004359006881713867, -0.00393831729888916, -0.003517627716064453, -0.003096938133239746, -0.002676248550415039, -0.002255558967590332, -0.001834869384765625, -0.001414179801940918, -0.000993490219116211, -0.0005728006362915039, -0.00015211105346679688, 0.00026857852935791016, 0.0006892681121826172, 0.0011099576950073242, 0.0015306472778320312, 0.0019513368606567383, 0.0023720264434814453, 0.0027927160263061523, 0.0032134056091308594, 0.0036340951919555664, 0.0040547847747802734, 0.0044754743576049805, 0.0048961639404296875, 0.0053168535232543945, 0.0057375431060791016, 0.006158232688903809, 0.006578922271728516, 0.006999611854553223, 0.00742030143737793, 0.007840991020202637, 0.008261680603027344, 0.00868237018585205, 0.009103059768676758, 0.009523749351501465, 0.009944438934326172, 0.010365128517150879, 0.010785818099975586, 0.011206507682800293, 0.011627197265625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 5.0, 6.0, 7.0, 11.0, 10.0, 7.0, 11.0, 14.0, 20.0, 33.0, 44.0, 68.0, 160.0, 381.0, 1230.0, 9446.0, 4139499.0, 39709.0, 2372.0, 626.0, 275.0, 159.0, 83.0, 31.0, 30.0, 13.0, 8.0, 10.0, 1.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07965087890625, -0.07713699340820312, -0.07462310791015625, -0.07210922241210938, -0.0695953369140625, -0.06708145141601562, -0.06456756591796875, -0.062053680419921875, -0.059539794921875, -0.057025909423828125, -0.05451202392578125, -0.051998138427734375, -0.0494842529296875, -0.046970367431640625, -0.04445648193359375, -0.041942596435546875, -0.0394287109375, -0.036914825439453125, -0.03440093994140625, -0.031887054443359375, -0.0293731689453125, -0.026859283447265625, -0.02434539794921875, -0.021831512451171875, -0.019317626953125, -0.016803741455078125, -0.01428985595703125, -0.011775970458984375, -0.0092620849609375, -0.006748199462890625, -0.00423431396484375, -0.001720428466796875, 0.00079345703125, 0.003307342529296875, 0.00582122802734375, 0.008335113525390625, 0.0108489990234375, 0.013362884521484375, 0.01587677001953125, 0.018390655517578125, 0.020904541015625, 0.023418426513671875, 0.02593231201171875, 0.028446197509765625, 0.0309600830078125, 0.033473968505859375, 0.03598785400390625, 0.038501739501953125, 0.041015625, 0.043529510498046875, 0.04604339599609375, 0.048557281494140625, 0.0510711669921875, 0.053585052490234375, 0.05609893798828125, 0.058612823486328125, 0.061126708984375, 0.06364059448242188, 0.06615447998046875, 0.06866836547851562, 0.0711822509765625, 0.07369613647460938, 0.07621002197265625, 0.07872390747070312, 0.08123779296875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 10.0, 12.0, 17.0, 43.0, 95.0, 237.0, 443.0, 756.0, 1003.0, 691.0, 379.0, 166.0, 66.0, 42.0, 28.0, 21.0, 13.0, 11.0, 4.0, 6.0, 4.0, 3.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004302978515625, -0.004152476787567139, -0.004001975059509277, -0.003851473331451416, -0.0037009716033935547, -0.0035504698753356934, -0.003399968147277832, -0.0032494664192199707, -0.0030989646911621094, -0.002948462963104248, -0.0027979612350463867, -0.0026474595069885254, -0.002496957778930664, -0.0023464560508728027, -0.0021959543228149414, -0.00204545259475708, -0.0018949508666992188, -0.0017444491386413574, -0.001593947410583496, -0.0014434456825256348, -0.0012929439544677734, -0.0011424422264099121, -0.0009919404983520508, -0.0008414387702941895, -0.0006909370422363281, -0.0005404353141784668, -0.00038993358612060547, -0.00023943185806274414, -8.893013000488281e-05, 6.157159805297852e-05, 0.00021207332611083984, 0.00036257505416870117, 0.0005130767822265625, 0.0006635785102844238, 0.0008140802383422852, 0.0009645819664001465, 0.0011150836944580078, 0.0012655854225158691, 0.0014160871505737305, 0.0015665888786315918, 0.0017170906066894531, 0.0018675923347473145, 0.0020180940628051758, 0.002168595790863037, 0.0023190975189208984, 0.0024695992469787598, 0.002620100975036621, 0.0027706027030944824, 0.0029211044311523438, 0.003071606159210205, 0.0032221078872680664, 0.0033726096153259277, 0.003523111343383789, 0.0036736130714416504, 0.0038241147994995117, 0.003974616527557373, 0.004125118255615234, 0.004275619983673096, 0.004426121711730957, 0.004576623439788818, 0.00472712516784668, 0.004877626895904541, 0.005028128623962402, 0.005178630352020264, 0.005329132080078125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 10.0, 23.0, 25.0, 41.0, 74.0, 120.0, 160.0, 156.0, 120.0, 100.0, 54.0, 40.0, 33.0, 13.0, 12.0, 7.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.026307469233870506, -0.025735270231962204, -0.02516307309269905, -0.02459087409079075, -0.024018675088882446, -0.023446477949619293, -0.02287427894771099, -0.02230207994580269, -0.021729882806539536, -0.021157683804631233, -0.02058548666536808, -0.020013287663459778, -0.019441088661551476, -0.018868891522288322, -0.01829669252038002, -0.017724495381116867, -0.017152294516563416, -0.016580095514655113, -0.01600789837539196, -0.015435699373483658, -0.01486350130289793, -0.014291303232312202, -0.0137191042304039, -0.013146906159818172, -0.012574708089232445, -0.012002510018646717, -0.011430311016738415, -0.010858112946152687, -0.01028591487556696, -0.009713716804981232, -0.00914151780307293, -0.008569319732487202, -0.0079971207305789, -0.007424922194331884, -0.006852724123746157, -0.006280525587499142, -0.005708327516913414, -0.005136128980666399, -0.004563930444419384, -0.003991732373833656, -0.0034195338375866413, -0.00284733553417027, -0.0022751372307538986, -0.0017029386945068836, -0.0011307403910905123, -0.0005585420876741409, 1.365644857287407e-05, 0.0005858545191586018, 0.0011580530554056168, 0.001730251358821988, 0.0023024496622383595, 0.0028746481984853745, 0.003446846501901746, 0.004019044805318117, 0.004591243341565132, 0.00516344141215086, 0.005735639948397875, 0.00630783848464489, 0.0068800365552306175, 0.0074522350914776325, 0.008024433627724648, 0.008596631698310375, 0.009168829768896103, 0.009741028770804405, 0.010313226841390133]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 2.0, 4.0, 13.0, 10.0, 15.0, 19.0, 24.0, 20.0, 20.0, 29.0, 20.0, 34.0, 36.0, 47.0, 39.0, 45.0, 43.0, 47.0, 49.0, 43.0, 46.0, 42.0, 37.0, 36.0, 32.0, 38.0, 24.0, 31.0, 24.0, 28.0, 27.0, 14.0, 9.0, 10.0, 11.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.01139611005783081, -0.011077133007347584, -0.010758155025541782, -0.010439177975058556, -0.010120200924575329, -0.009801223874092102, -0.0094822458922863, -0.009163268841803074, -0.008844291791319847, -0.00852531474083662, -0.008206336759030819, -0.007887359708547592, -0.007568382658064365, -0.007249405141919851, -0.006930427625775337, -0.0066114505752921104, -0.006292472593486309, -0.005973495077341795, -0.005654518026858568, -0.005335540510714054, -0.005016563460230827, -0.004697585944086313, -0.004378608427941799, -0.004059631377458572, -0.0037406538613140583, -0.003421676578000188, -0.0031026992946863174, -0.0027837217785418034, -0.002464744495227933, -0.0021457672119140625, -0.0018267898121848702, -0.001507812412455678, -0.001188834197819233, -0.0008698568562977016, -0.0005508795147761703, -0.0002319021732546389, 8.707516826689243e-05, 0.00040605245158076286, 0.0007250298513099551, 0.0010440072510391474, 0.0013629845343530178, 0.0016819618176668882, 0.0020009391009807587, 0.0023199166171252728, 0.002638893900439143, 0.0029578711837530136, 0.0032768486998975277, 0.003595825983211398, 0.0039148032665252686, 0.004233780782669783, 0.004552757833153009, 0.0048717353492975235, 0.00519071239978075, 0.005509689915925264, 0.0058286674320697784, 0.006147644482553005, 0.006466621998697519, 0.006785599514842033, 0.00710457656532526, 0.007423554081469774, 0.007742531597614288, 0.008061508648097515, 0.008380485698580742, 0.008699463680386543, 0.00901844073086977]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 3.0, 7.0, 6.0, 10.0, 20.0, 24.0, 43.0, 63.0, 89.0, 112.0, 187.0, 326.0, 579.0, 1029.0, 1757.0, 3436.0, 6612.0, 12730.0, 25241.0, 53235.0, 127418.0, 352758.0, 275294.0, 100223.0, 43547.0, 21059.0, 10605.0, 5435.0, 2901.0, 1576.0, 871.0, 499.0, 306.0, 209.0, 126.0, 74.0, 49.0, 30.0, 26.0, 12.0, 7.0, 5.0, 9.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00487518310546875, -0.004706323146820068, -0.004537463188171387, -0.004368603229522705, -0.0041997432708740234, -0.004030883312225342, -0.00386202335357666, -0.0036931633949279785, -0.003524303436279297, -0.0033554434776306152, -0.0031865835189819336, -0.003017723560333252, -0.0028488636016845703, -0.0026800036430358887, -0.002511143684387207, -0.0023422837257385254, -0.0021734237670898438, -0.002004563808441162, -0.0018357038497924805, -0.0016668438911437988, -0.0014979839324951172, -0.0013291239738464355, -0.001160264015197754, -0.0009914040565490723, -0.0008225440979003906, -0.000653684139251709, -0.00048482418060302734, -0.0003159642219543457, -0.00014710426330566406, 2.1755695343017578e-05, 0.00019061565399169922, 0.00035947561264038086, 0.0005283355712890625, 0.0006971955299377441, 0.0008660554885864258, 0.0010349154472351074, 0.001203775405883789, 0.0013726353645324707, 0.0015414953231811523, 0.001710355281829834, 0.0018792152404785156, 0.0020480751991271973, 0.002216935157775879, 0.0023857951164245605, 0.002554655075073242, 0.002723515033721924, 0.0028923749923706055, 0.003061234951019287, 0.0032300949096679688, 0.0033989548683166504, 0.003567814826965332, 0.0037366747856140137, 0.0039055347442626953, 0.004074394702911377, 0.004243254661560059, 0.00441211462020874, 0.004580974578857422, 0.0047498345375061035, 0.004918694496154785, 0.005087554454803467, 0.0052564144134521484, 0.00542527437210083, 0.005594134330749512, 0.005762994289398193, 0.005931854248046875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 8.0, 4.0, 7.0, 17.0, 22.0, 17.0, 23.0, 31.0, 33.0, 32.0, 33.0, 52.0, 52.0, 41.0, 46.0, 48.0, 45.0, 65.0, 67.0, 43.0, 44.0, 39.0, 35.0, 34.0, 23.0, 25.0, 30.0, 18.0, 16.0, 10.0, 10.0, 9.0, 7.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01009368896484375, -0.009807348251342773, -0.009521007537841797, -0.00923466682434082, -0.008948326110839844, -0.008661985397338867, -0.00837564468383789, -0.008089303970336914, -0.0078029632568359375, -0.007516622543334961, -0.007230281829833984, -0.006943941116333008, -0.006657600402832031, -0.006371259689331055, -0.006084918975830078, -0.0057985782623291016, -0.005512237548828125, -0.0052258968353271484, -0.004939556121826172, -0.004653215408325195, -0.004366874694824219, -0.004080533981323242, -0.0037941932678222656, -0.003507852554321289, -0.0032215118408203125, -0.002935171127319336, -0.0026488304138183594, -0.002362489700317383, -0.0020761489868164062, -0.0017898082733154297, -0.0015034675598144531, -0.0012171268463134766, -0.0009307861328125, -0.0006444454193115234, -0.0003581047058105469, -7.176399230957031e-05, 0.00021457672119140625, 0.0005009174346923828, 0.0007872581481933594, 0.001073598861694336, 0.0013599395751953125, 0.001646280288696289, 0.0019326210021972656, 0.002218961715698242, 0.0025053024291992188, 0.0027916431427001953, 0.003077983856201172, 0.0033643245697021484, 0.003650665283203125, 0.0039370059967041016, 0.004223346710205078, 0.004509687423706055, 0.004796028137207031, 0.005082368850708008, 0.005368709564208984, 0.005655050277709961, 0.0059413909912109375, 0.006227731704711914, 0.006514072418212891, 0.006800413131713867, 0.007086753845214844, 0.00737309455871582, 0.007659435272216797, 0.007945775985717773, 0.00823211669921875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 11.0, 14.0, 30.0, 35.0, 49.0, 48.0, 75.0, 124.0, 195.0, 271.0, 389.0, 567.0, 840.0, 1201.0, 1794.0, 2678.0, 4136.0, 6237.0, 9491.0, 14978.0, 24140.0, 41370.0, 75816.0, 165421.0, 349106.0, 165671.0, 75377.0, 41099.0, 24263.0, 15058.0, 9361.0, 6175.0, 4045.0, 2730.0, 1799.0, 1282.0, 832.0, 551.0, 405.0, 274.0, 198.0, 121.0, 99.0, 64.0, 38.0, 42.0, 20.0, 11.0, 10.0, 2.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.003536224365234375, -0.0034274160861968994, -0.003318607807159424, -0.0032097995281219482, -0.0031009912490844727, -0.002992182970046997, -0.0028833746910095215, -0.002774566411972046, -0.0026657581329345703, -0.0025569498538970947, -0.002448141574859619, -0.0023393332958221436, -0.002230525016784668, -0.0021217167377471924, -0.002012908458709717, -0.0019041001796722412, -0.0017952919006347656, -0.00168648362159729, -0.0015776753425598145, -0.0014688670635223389, -0.0013600587844848633, -0.0012512505054473877, -0.0011424422264099121, -0.0010336339473724365, -0.0009248256683349609, -0.0008160173892974854, -0.0007072091102600098, -0.0005984008312225342, -0.0004895925521850586, -0.000380784273147583, -0.0002719759941101074, -0.00016316771507263184, -5.435943603515625e-05, 5.4448843002319336e-05, 0.00016325712203979492, 0.0002720654010772705, 0.0003808736801147461, 0.0004896819591522217, 0.0005984902381896973, 0.0007072985172271729, 0.0008161067962646484, 0.000924915075302124, 0.0010337233543395996, 0.0011425316333770752, 0.0012513399124145508, 0.0013601481914520264, 0.001468956470489502, 0.0015777647495269775, 0.0016865730285644531, 0.0017953813076019287, 0.0019041895866394043, 0.00201299786567688, 0.0021218061447143555, 0.002230614423751831, 0.0023394227027893066, 0.0024482309818267822, 0.002557039260864258, 0.0026658475399017334, 0.002774655818939209, 0.0028834640979766846, 0.00299227237701416, 0.0031010806560516357, 0.0032098889350891113, 0.003318697214126587, 0.0034275054931640625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 6.0, 9.0, 10.0, 14.0, 10.0, 10.0, 18.0, 20.0, 19.0, 25.0, 28.0, 30.0, 30.0, 35.0, 30.0, 43.0, 35.0, 45.0, 38.0, 33.0, 33.0, 46.0, 34.0, 37.0, 32.0, 32.0, 28.0, 31.0, 27.0, 26.0, 20.0, 15.0, 25.0, 15.0, 19.0, 16.0, 9.0, 9.0, 13.0, 5.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0040130615234375, -0.0038785338401794434, -0.0037440061569213867, -0.00360947847366333, -0.0034749507904052734, -0.003340423107147217, -0.00320589542388916, -0.0030713677406311035, -0.002936840057373047, -0.0028023123741149902, -0.0026677846908569336, -0.002533257007598877, -0.0023987293243408203, -0.0022642016410827637, -0.002129673957824707, -0.0019951462745666504, -0.0018606185913085938, -0.0017260909080505371, -0.0015915632247924805, -0.0014570355415344238, -0.0013225078582763672, -0.0011879801750183105, -0.001053452491760254, -0.0009189248085021973, -0.0007843971252441406, -0.000649869441986084, -0.0005153417587280273, -0.0003808140754699707, -0.00024628639221191406, -0.00011175870895385742, 2.276897430419922e-05, 0.00015729665756225586, 0.0002918243408203125, 0.00042635202407836914, 0.0005608797073364258, 0.0006954073905944824, 0.0008299350738525391, 0.0009644627571105957, 0.0010989904403686523, 0.001233518123626709, 0.0013680458068847656, 0.0015025734901428223, 0.001637101173400879, 0.0017716288566589355, 0.0019061565399169922, 0.002040684223175049, 0.0021752119064331055, 0.002309739589691162, 0.0024442672729492188, 0.0025787949562072754, 0.002713322639465332, 0.0028478503227233887, 0.0029823780059814453, 0.003116905689239502, 0.0032514333724975586, 0.0033859610557556152, 0.003520488739013672, 0.0036550164222717285, 0.003789544105529785, 0.003924071788787842, 0.0040585994720458984, 0.004193127155303955, 0.004327654838562012, 0.004462182521820068, 0.004596710205078125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 7.0, 14.0, 15.0, 14.0, 38.0, 31.0, 36.0, 80.0, 106.0, 187.0, 274.0, 399.0, 668.0, 1139.0, 1937.0, 3421.0, 6482.0, 12950.0, 28263.0, 74710.0, 437892.0, 355225.0, 70581.0, 27411.0, 12392.0, 6200.0, 3386.0, 1836.0, 1034.0, 625.0, 387.0, 249.0, 148.0, 130.0, 76.0, 64.0, 40.0, 36.0, 25.0, 13.0, 10.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002117156982421875, -0.0002048797905445099, -0.00019804388284683228, -0.00019120797514915466, -0.00018437206745147705, -0.00017753615975379944, -0.00017070025205612183, -0.00016386434435844421, -0.0001570284366607666, -0.000150192528963089, -0.00014335662126541138, -0.00013652071356773376, -0.00012968480587005615, -0.00012284889817237854, -0.00011601299047470093, -0.00010917708277702332, -0.0001023411750793457, -9.550526738166809e-05, -8.866935968399048e-05, -8.183345198631287e-05, -7.499754428863525e-05, -6.816163659095764e-05, -6.132572889328003e-05, -5.448982119560242e-05, -4.7653913497924805e-05, -4.081800580024719e-05, -3.398209810256958e-05, -2.7146190404891968e-05, -2.0310282707214355e-05, -1.3474375009536743e-05, -6.638467311859131e-06, 1.9744038581848145e-07, 7.033348083496094e-06, 1.3869255781173706e-05, 2.070516347885132e-05, 2.754107117652893e-05, 3.437697887420654e-05, 4.1212886571884155e-05, 4.804879426956177e-05, 5.488470196723938e-05, 6.172060966491699e-05, 6.85565173625946e-05, 7.539242506027222e-05, 8.222833275794983e-05, 8.906424045562744e-05, 9.590014815330505e-05, 0.00010273605585098267, 0.00010957196354866028, 0.00011640787124633789, 0.0001232437789440155, 0.00013007968664169312, 0.00013691559433937073, 0.00014375150203704834, 0.00015058740973472595, 0.00015742331743240356, 0.00016425922513008118, 0.0001710951328277588, 0.0001779310405254364, 0.00018476694822311401, 0.00019160285592079163, 0.00019843876361846924, 0.00020527467131614685, 0.00021211057901382446, 0.00021894648671150208, 0.0002257823944091797]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 9.0, 9.0, 2.0, 5.0, 10.0, 9.0, 15.0, 13.0, 17.0, 30.0, 44.0, 45.0, 46.0, 54.0, 48.0, 64.0, 66.0, 64.0, 73.0, 47.0, 66.0, 50.0, 47.0, 34.0, 31.0, 18.0, 19.0, 18.0, 5.0, 7.0, 4.0, 7.0, 3.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.2099742889404297e-05, -1.1753290891647339e-05, -1.1406838893890381e-05, -1.1060386896133423e-05, -1.0713934898376465e-05, -1.0367482900619507e-05, -1.0021030902862549e-05, -9.67457890510559e-06, -9.328126907348633e-06, -8.981674909591675e-06, -8.635222911834717e-06, -8.288770914077759e-06, -7.9423189163208e-06, -7.595866918563843e-06, -7.249414920806885e-06, -6.902962923049927e-06, -6.556510925292969e-06, -6.210058927536011e-06, -5.863606929779053e-06, -5.517154932022095e-06, -5.170702934265137e-06, -4.824250936508179e-06, -4.477798938751221e-06, -4.131346940994263e-06, -3.7848949432373047e-06, -3.4384429454803467e-06, -3.0919909477233887e-06, -2.7455389499664307e-06, -2.3990869522094727e-06, -2.0526349544525146e-06, -1.7061829566955566e-06, -1.3597309589385986e-06, -1.0132789611816406e-06, -6.668269634246826e-07, -3.203749656677246e-07, 2.60770320892334e-08, 3.725290298461914e-07, 7.189810276031494e-07, 1.0654330253601074e-06, 1.4118850231170654e-06, 1.7583370208740234e-06, 2.1047890186309814e-06, 2.4512410163879395e-06, 2.7976930141448975e-06, 3.1441450119018555e-06, 3.4905970096588135e-06, 3.8370490074157715e-06, 4.1835010051727295e-06, 4.5299530029296875e-06, 4.8764050006866455e-06, 5.2228569984436035e-06, 5.5693089962005615e-06, 5.9157609939575195e-06, 6.2622129917144775e-06, 6.6086649894714355e-06, 6.9551169872283936e-06, 7.3015689849853516e-06, 7.64802098274231e-06, 7.994472980499268e-06, 8.340924978256226e-06, 8.687376976013184e-06, 9.033828973770142e-06, 9.3802809715271e-06, 9.726732969284058e-06, 1.0073184967041016e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 5.0, 10.0, 8.0, 9.0, 7.0, 21.0, 17.0, 26.0, 31.0, 43.0, 45.0, 93.0, 1379.0, 793385.0, 252304.0, 822.0, 72.0, 51.0, 40.0, 27.0, 28.0, 30.0, 14.0, 9.0, 17.0, 7.0, 11.0, 8.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0014476776123046875, -0.001397654414176941, -0.0013476312160491943, -0.0012976080179214478, -0.0012475848197937012, -0.0011975616216659546, -0.001147538423538208, -0.0010975152254104614, -0.0010474920272827148, -0.0009974688291549683, -0.0009474456310272217, -0.0008974224328994751, -0.0008473992347717285, -0.0007973760366439819, -0.0007473528385162354, -0.0006973296403884888, -0.0006473064422607422, -0.0005972832441329956, -0.000547260046005249, -0.0004972368478775024, -0.00044721364974975586, -0.0003971904516220093, -0.0003471672534942627, -0.0002971440553665161, -0.00024712085723876953, -0.00019709765911102295, -0.00014707446098327637, -9.705126285552979e-05, -4.70280647277832e-05, 2.995133399963379e-06, 5.301833152770996e-05, 0.00010304152965545654, 0.00015306472778320312, 0.0002030879259109497, 0.0002531111240386963, 0.00030313432216644287, 0.00035315752029418945, 0.00040318071842193604, 0.0004532039165496826, 0.0005032271146774292, 0.0005532503128051758, 0.0006032735109329224, 0.0006532967090606689, 0.0007033199071884155, 0.0007533431053161621, 0.0008033663034439087, 0.0008533895015716553, 0.0009034126996994019, 0.0009534358978271484, 0.001003459095954895, 0.0010534822940826416, 0.0011035054922103882, 0.0011535286903381348, 0.0012035518884658813, 0.001253575086593628, 0.0013035982847213745, 0.001353621482849121, 0.0014036446809768677, 0.0014536678791046143, 0.0015036910772323608, 0.0015537142753601074, 0.001603737473487854, 0.0016537606716156006, 0.0017037838697433472, 0.0017538070678710938]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 4.0, 5.0, 5.0, 8.0, 9.0, 12.0, 21.0, 11.0, 16.0, 24.0, 22.0, 30.0, 39.0, 52.0, 73.0, 93.0, 135.0, 95.0, 68.0, 52.0, 43.0, 29.0, 21.0, 12.0, 17.0, 17.0, 12.0, 12.0, 7.0, 10.0, 9.0, 3.0, 10.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.786252975463867e-05, -4.6479515731334686e-05, -4.50965017080307e-05, -4.3713487684726715e-05, -4.233047366142273e-05, -4.0947459638118744e-05, -3.956444561481476e-05, -3.818143159151077e-05, -3.679841756820679e-05, -3.54154035449028e-05, -3.4032389521598816e-05, -3.264937549829483e-05, -3.1266361474990845e-05, -2.988334745168686e-05, -2.8500333428382874e-05, -2.7117319405078888e-05, -2.5734305381774902e-05, -2.4351291358470917e-05, -2.296827733516693e-05, -2.1585263311862946e-05, -2.020224928855896e-05, -1.8819235265254974e-05, -1.743622124195099e-05, -1.6053207218647003e-05, -1.4670193195343018e-05, -1.3287179172039032e-05, -1.1904165148735046e-05, -1.052115112543106e-05, -9.138137102127075e-06, -7.75512307882309e-06, -6.372109055519104e-06, -4.989095032215118e-06, -3.606081008911133e-06, -2.2230669856071472e-06, -8.400529623031616e-07, 5.42961061000824e-07, 1.9259750843048096e-06, 3.308989107608795e-06, 4.692003130912781e-06, 6.075017154216766e-06, 7.458031177520752e-06, 8.841045200824738e-06, 1.0224059224128723e-05, 1.1607073247432709e-05, 1.2990087270736694e-05, 1.437310129404068e-05, 1.5756115317344666e-05, 1.713912934064865e-05, 1.8522143363952637e-05, 1.9905157387256622e-05, 2.1288171410560608e-05, 2.2671185433864594e-05, 2.405419945716858e-05, 2.5437213480472565e-05, 2.682022750377655e-05, 2.8203241527080536e-05, 2.958625555038452e-05, 3.096926957368851e-05, 3.235228359699249e-05, 3.373529762029648e-05, 3.5118311643600464e-05, 3.650132566690445e-05, 3.7884339690208435e-05, 3.926735371351242e-05, 4.0650367736816406e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 10.0, 12.0, 29.0, 38.0, 107.0, 184.0, 246.0, 176.0, 99.0, 65.0, 24.0, 17.0, 5.0, 3.0, 2.0], "bins": [-0.04766763746738434, -0.046808306127786636, -0.04594897851347923, -0.04508964717388153, -0.04423031955957413, -0.043370988219976425, -0.04251165688037872, -0.04165232926607132, -0.04079299792647362, -0.039933666586875916, -0.03907433897256851, -0.03821500763297081, -0.03735567629337311, -0.036496348679065704, -0.035637017339468, -0.0347776897251606, -0.0339183583855629, -0.033059027045965195, -0.03219969943165779, -0.03134036809206009, -0.030481038615107536, -0.029621709138154984, -0.02876237779855728, -0.02790304832160473, -0.027043718844652176, -0.026184389367699623, -0.02532505989074707, -0.02446572855114937, -0.023606399074196815, -0.022747069597244263, -0.02188773825764656, -0.021028408780694008, -0.020169077441096306, -0.019309747964143753, -0.01845041662454605, -0.017591087147593498, -0.016731757670640945, -0.015872428193688393, -0.015013097785413265, -0.014153767377138138, -0.013294437900185585, -0.012435108423233032, -0.011575778014957905, -0.010716447606682777, -0.009857118129730225, -0.008997788652777672, -0.008138458244502544, -0.007279128301888704, -0.0064197988249361515, -0.005560468882322311, -0.004701138939708471, -0.003841808997094631, -0.002982479054480791, -0.002123149111866951, -0.0012638191692531109, -0.0004044892266392708, 0.0004548407159745693, 0.0013141706585884094, 0.0021735006012022495, 0.0030328305438160896, 0.0038921604864299297, 0.00475149042904377, 0.00561082037165761, 0.00647015031427145, 0.00732948025688529]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 5.0, 4.0, 15.0, 24.0, 25.0, 21.0, 25.0, 24.0, 31.0, 38.0, 42.0, 50.0, 43.0, 52.0, 50.0, 51.0, 63.0, 57.0, 35.0, 37.0, 43.0, 37.0, 26.0, 36.0, 31.0, 32.0, 18.0, 21.0, 14.0, 10.0, 7.0, 3.0, 7.0, 7.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.010161985643208027, -0.009899301454424858, -0.00963661726564169, -0.00937393307685852, -0.009111247956752777, -0.008848563767969608, -0.00858587957918644, -0.00832319539040327, -0.008060511201620102, -0.007797827012836933, -0.007535142824053764, -0.007272458169609308, -0.0070097739808261395, -0.006747089792042971, -0.0064844051375985146, -0.006221720948815346, -0.005959036760032177, -0.005696352571249008, -0.005433668382465839, -0.005170983728021383, -0.0049082995392382145, -0.004645615350455046, -0.00438293069601059, -0.004120246507227421, -0.003857562318444252, -0.0035948781296610832, -0.0033321937080472708, -0.0030695092864334583, -0.0028068250976502895, -0.0025441409088671207, -0.0022814564872533083, -0.002018772065639496, -0.0017560883425176144, -0.0014934040373191237, -0.0012307197321206331, -0.0009680354269221425, -0.0007053511217236519, -0.00044266681652516127, -0.00017998251132667065, 8.270179387181997e-05, 0.0003453860990703106, 0.0006080704042688012, 0.0008707547094672918, 0.0011334390146657825, 0.001396123319864273, 0.0016588076250627637, 0.0019214919302612543, 0.0021841763518750668, 0.0024468605406582355, 0.0027095447294414043, 0.002972229151055217, 0.0032349135726690292, 0.003497597761452198, 0.003760281950235367, 0.004022966139018536, 0.004285650793462992, 0.0045483349822461605, 0.004811019171029329, 0.005073703825473785, 0.005336388014256954, 0.005599072203040123, 0.005861756391823292, 0.006124440580606461, 0.006387125235050917, 0.0066498094238340855]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 7.0, 4.0, 8.0, 5.0, 7.0, 11.0, 11.0, 12.0, 19.0, 27.0, 25.0, 38.0, 52.0, 76.0, 193.0, 622.0, 2342.0, 11358.0, 62123.0, 352931.0, 494060.0, 101935.0, 17643.0, 3536.0, 902.0, 250.0, 107.0, 45.0, 38.0, 24.0, 27.0, 25.0, 19.0, 12.0, 14.0, 21.0, 13.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056671142578125, -0.054907798767089844, -0.05314445495605469, -0.05138111114501953, -0.049617767333984375, -0.04785442352294922, -0.04609107971191406, -0.044327735900878906, -0.04256439208984375, -0.040801048278808594, -0.03903770446777344, -0.03727436065673828, -0.035511016845703125, -0.03374767303466797, -0.03198432922363281, -0.030220985412597656, -0.0284576416015625, -0.026694297790527344, -0.024930953979492188, -0.02316761016845703, -0.021404266357421875, -0.01964092254638672, -0.017877578735351562, -0.016114234924316406, -0.01435089111328125, -0.012587547302246094, -0.010824203491210938, -0.009060859680175781, -0.007297515869140625, -0.005534172058105469, -0.0037708282470703125, -0.0020074844360351562, -0.000244140625, 0.0015192031860351562, 0.0032825469970703125, 0.005045890808105469, 0.006809234619140625, 0.008572578430175781, 0.010335922241210938, 0.012099266052246094, 0.01386260986328125, 0.015625953674316406, 0.017389297485351562, 0.01915264129638672, 0.020915985107421875, 0.02267932891845703, 0.024442672729492188, 0.026206016540527344, 0.0279693603515625, 0.029732704162597656, 0.03149604797363281, 0.03325939178466797, 0.035022735595703125, 0.03678607940673828, 0.03854942321777344, 0.040312767028808594, 0.04207611083984375, 0.043839454650878906, 0.04560279846191406, 0.04736614227294922, 0.049129486083984375, 0.05089282989501953, 0.05265617370605469, 0.054419517517089844, 0.056182861328125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 9.0, 14.0, 26.0, 39.0, 39.0, 53.0, 49.0, 63.0, 79.0, 80.0, 90.0, 81.0, 61.0, 74.0, 47.0, 42.0, 50.0, 30.0, 18.0, 17.0, 9.0, 2.0, 8.0, 5.0, 3.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0174407958984375, -0.01699817180633545, -0.0165555477142334, -0.016112923622131348, -0.015670299530029297, -0.015227675437927246, -0.014785051345825195, -0.014342427253723145, -0.013899803161621094, -0.013457179069519043, -0.013014554977416992, -0.012571930885314941, -0.01212930679321289, -0.01168668270111084, -0.011244058609008789, -0.010801434516906738, -0.010358810424804688, -0.009916186332702637, -0.009473562240600586, -0.009030938148498535, -0.008588314056396484, -0.008145689964294434, -0.007703065872192383, -0.007260441780090332, -0.006817817687988281, -0.0063751935958862305, -0.00593256950378418, -0.005489945411682129, -0.005047321319580078, -0.004604697227478027, -0.0041620731353759766, -0.0037194490432739258, -0.003276824951171875, -0.0028342008590698242, -0.0023915767669677734, -0.0019489526748657227, -0.0015063285827636719, -0.001063704490661621, -0.0006210803985595703, -0.00017845630645751953, 0.00026416778564453125, 0.000706791877746582, 0.0011494159698486328, 0.0015920400619506836, 0.0020346641540527344, 0.002477288246154785, 0.002919912338256836, 0.0033625364303588867, 0.0038051605224609375, 0.004247784614562988, 0.004690408706665039, 0.00513303279876709, 0.005575656890869141, 0.006018280982971191, 0.006460905075073242, 0.006903529167175293, 0.007346153259277344, 0.0077887773513793945, 0.008231401443481445, 0.008674025535583496, 0.009116649627685547, 0.009559273719787598, 0.010001897811889648, 0.0104445219039917, 0.01088714599609375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 7.0, 3.0, 3.0, 6.0, 5.0, 13.0, 13.0, 8.0, 11.0, 16.0, 24.0, 18.0, 21.0, 34.0, 30.0, 57.0, 116.0, 420.0, 1703.0, 7532.0, 35360.0, 170241.0, 507315.0, 256166.0, 54369.0, 11543.0, 2499.0, 553.0, 188.0, 60.0, 34.0, 27.0, 26.0, 19.0, 21.0, 9.0, 18.0, 13.0, 11.0, 10.0, 7.0, 4.0, 7.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04608154296875, -0.04471158981323242, -0.043341636657714844, -0.041971683502197266, -0.04060173034667969, -0.03923177719116211, -0.03786182403564453, -0.03649187088012695, -0.035121917724609375, -0.0337519645690918, -0.03238201141357422, -0.03101205825805664, -0.029642105102539062, -0.028272151947021484, -0.026902198791503906, -0.025532245635986328, -0.02416229248046875, -0.022792339324951172, -0.021422386169433594, -0.020052433013916016, -0.018682479858398438, -0.01731252670288086, -0.01594257354736328, -0.014572620391845703, -0.013202667236328125, -0.011832714080810547, -0.010462760925292969, -0.00909280776977539, -0.0077228546142578125, -0.006352901458740234, -0.004982948303222656, -0.003612995147705078, -0.0022430419921875, -0.0008730888366699219, 0.0004968643188476562, 0.0018668174743652344, 0.0032367706298828125, 0.004606723785400391, 0.005976676940917969, 0.007346630096435547, 0.008716583251953125, 0.010086536407470703, 0.011456489562988281, 0.01282644271850586, 0.014196395874023438, 0.015566349029541016, 0.016936302185058594, 0.018306255340576172, 0.01967620849609375, 0.021046161651611328, 0.022416114807128906, 0.023786067962646484, 0.025156021118164062, 0.02652597427368164, 0.02789592742919922, 0.029265880584716797, 0.030635833740234375, 0.03200578689575195, 0.03337574005126953, 0.03474569320678711, 0.03611564636230469, 0.037485599517822266, 0.038855552673339844, 0.04022550582885742, 0.041595458984375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 2.0, 5.0, 5.0, 15.0, 10.0, 12.0, 20.0, 10.0, 15.0, 23.0, 24.0, 30.0, 30.0, 25.0, 31.0, 36.0, 38.0, 40.0, 42.0, 38.0, 29.0, 29.0, 43.0, 42.0, 43.0, 36.0, 38.0, 33.0, 25.0, 33.0, 27.0, 23.0, 20.0, 11.0, 16.0, 13.0, 15.0, 8.0, 10.0, 7.0, 10.0, 7.0, 6.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00576019287109375, -0.005568146705627441, -0.005376100540161133, -0.005184054374694824, -0.004992008209228516, -0.004799962043762207, -0.0046079158782958984, -0.00441586971282959, -0.004223823547363281, -0.004031777381896973, -0.003839731216430664, -0.0036476850509643555, -0.003455638885498047, -0.0032635927200317383, -0.0030715465545654297, -0.002879500389099121, -0.0026874542236328125, -0.002495408058166504, -0.0023033618927001953, -0.0021113157272338867, -0.0019192695617675781, -0.0017272233963012695, -0.001535177230834961, -0.0013431310653686523, -0.0011510848999023438, -0.0009590387344360352, -0.0007669925689697266, -0.000574946403503418, -0.0003829002380371094, -0.00019085407257080078, 1.1920928955078125e-06, 0.0001932382583618164, 0.000385284423828125, 0.0005773305892944336, 0.0007693767547607422, 0.0009614229202270508, 0.0011534690856933594, 0.001345515251159668, 0.0015375614166259766, 0.0017296075820922852, 0.0019216537475585938, 0.0021136999130249023, 0.002305746078491211, 0.0024977922439575195, 0.002689838409423828, 0.0028818845748901367, 0.0030739307403564453, 0.003265976905822754, 0.0034580230712890625, 0.003650069236755371, 0.0038421154022216797, 0.004034161567687988, 0.004226207733154297, 0.0044182538986206055, 0.004610300064086914, 0.004802346229553223, 0.004994392395019531, 0.00518643856048584, 0.0053784847259521484, 0.005570530891418457, 0.005762577056884766, 0.005954623222351074, 0.006146669387817383, 0.006338715553283691, 0.00653076171875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 4.0, 14.0, 22.0, 31.0, 40.0, 54.0, 82.0, 134.0, 210.0, 318.0, 505.0, 863.0, 1486.0, 2711.0, 5699.0, 14243.0, 46912.0, 825410.0, 108211.0, 24221.0, 8690.0, 3909.0, 1884.0, 1134.0, 607.0, 417.0, 260.0, 160.0, 104.0, 73.0, 38.0, 41.0, 26.0, 11.0, 6.0, 13.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006134033203125, -0.005904674530029297, -0.005675315856933594, -0.005445957183837891, -0.0052165985107421875, -0.004987239837646484, -0.004757881164550781, -0.004528522491455078, -0.004299163818359375, -0.004069805145263672, -0.0038404464721679688, -0.0036110877990722656, -0.0033817291259765625, -0.0031523704528808594, -0.0029230117797851562, -0.002693653106689453, -0.00246429443359375, -0.002234935760498047, -0.0020055770874023438, -0.0017762184143066406, -0.0015468597412109375, -0.0013175010681152344, -0.0010881423950195312, -0.0008587837219238281, -0.000629425048828125, -0.0004000663757324219, -0.00017070770263671875, 5.8650970458984375e-05, 0.0002880096435546875, 0.0005173683166503906, 0.0007467269897460938, 0.0009760856628417969, 0.0012054443359375, 0.0014348030090332031, 0.0016641616821289062, 0.0018935203552246094, 0.0021228790283203125, 0.0023522377014160156, 0.0025815963745117188, 0.002810955047607422, 0.003040313720703125, 0.003269672393798828, 0.0034990310668945312, 0.0037283897399902344, 0.0039577484130859375, 0.004187107086181641, 0.004416465759277344, 0.004645824432373047, 0.00487518310546875, 0.005104541778564453, 0.005333900451660156, 0.005563259124755859, 0.0057926177978515625, 0.006021976470947266, 0.006251335144042969, 0.006480693817138672, 0.006710052490234375, 0.006939411163330078, 0.007168769836425781, 0.007398128509521484, 0.0076274871826171875, 0.00785684585571289, 0.008086204528808594, 0.008315563201904297, 0.008544921875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 7.0, 5.0, 4.0, 9.0, 4.0, 17.0, 18.0, 33.0, 38.0, 50.0, 81.0, 119.0, 142.0, 139.0, 99.0, 80.0, 48.0, 35.0, 26.0, 8.0, 13.0, 9.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.715557098388672e-06, -9.417533874511719e-06, -9.119510650634766e-06, -8.821487426757812e-06, -8.52346420288086e-06, -8.225440979003906e-06, -7.927417755126953e-06, -7.62939453125e-06, -7.331371307373047e-06, -7.033348083496094e-06, -6.735324859619141e-06, -6.4373016357421875e-06, -6.139278411865234e-06, -5.841255187988281e-06, -5.543231964111328e-06, -5.245208740234375e-06, -4.947185516357422e-06, -4.649162292480469e-06, -4.351139068603516e-06, -4.0531158447265625e-06, -3.7550926208496094e-06, -3.4570693969726562e-06, -3.159046173095703e-06, -2.86102294921875e-06, -2.562999725341797e-06, -2.2649765014648438e-06, -1.9669532775878906e-06, -1.6689300537109375e-06, -1.3709068298339844e-06, -1.0728836059570312e-06, -7.748603820800781e-07, -4.76837158203125e-07, -1.7881393432617188e-07, 1.1920928955078125e-07, 4.172325134277344e-07, 7.152557373046875e-07, 1.0132789611816406e-06, 1.3113021850585938e-06, 1.6093254089355469e-06, 1.9073486328125e-06, 2.205371856689453e-06, 2.5033950805664062e-06, 2.8014183044433594e-06, 3.0994415283203125e-06, 3.3974647521972656e-06, 3.6954879760742188e-06, 3.993511199951172e-06, 4.291534423828125e-06, 4.589557647705078e-06, 4.887580871582031e-06, 5.185604095458984e-06, 5.4836273193359375e-06, 5.781650543212891e-06, 6.079673767089844e-06, 6.377696990966797e-06, 6.67572021484375e-06, 6.973743438720703e-06, 7.271766662597656e-06, 7.569789886474609e-06, 7.867813110351562e-06, 8.165836334228516e-06, 8.463859558105469e-06, 8.761882781982422e-06, 9.059906005859375e-06, 9.357929229736328e-06]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 7.0, 2.0, 3.0, 5.0, 5.0, 11.0, 12.0, 19.0, 42.0, 71.0, 164.0, 298.0, 700.0, 1773.0, 5664.0, 21120.0, 182025.0, 799818.0, 26371.0, 6760.0, 2160.0, 813.0, 352.0, 177.0, 78.0, 33.0, 19.0, 10.0, 5.0, 5.0, 8.0, 0.0, 4.0, 2.0, 4.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00843048095703125, -0.008130192756652832, -0.007829904556274414, -0.007529616355895996, -0.007229328155517578, -0.00692903995513916, -0.006628751754760742, -0.006328463554382324, -0.006028175354003906, -0.005727887153625488, -0.00542759895324707, -0.005127310752868652, -0.004827022552490234, -0.004526734352111816, -0.0042264461517333984, -0.0039261579513549805, -0.0036258697509765625, -0.0033255815505981445, -0.0030252933502197266, -0.0027250051498413086, -0.0024247169494628906, -0.0021244287490844727, -0.0018241405487060547, -0.0015238523483276367, -0.0012235641479492188, -0.0009232759475708008, -0.0006229877471923828, -0.00032269954681396484, -2.2411346435546875e-05, 0.0002778768539428711, 0.0005781650543212891, 0.000878453254699707, 0.001178741455078125, 0.001479029655456543, 0.001779317855834961, 0.002079606056213379, 0.002379894256591797, 0.002680182456970215, 0.002980470657348633, 0.0032807588577270508, 0.0035810470581054688, 0.0038813352584838867, 0.004181623458862305, 0.004481911659240723, 0.004782199859619141, 0.005082488059997559, 0.0053827762603759766, 0.0056830644607543945, 0.0059833526611328125, 0.0062836408615112305, 0.0065839290618896484, 0.006884217262268066, 0.007184505462646484, 0.007484793663024902, 0.00778508186340332, 0.008085370063781738, 0.008385658264160156, 0.008685946464538574, 0.008986234664916992, 0.00928652286529541, 0.009586811065673828, 0.009887099266052246, 0.010187387466430664, 0.010487675666809082, 0.0107879638671875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 5.0, 4.0, 9.0, 8.0, 6.0, 5.0, 5.0, 9.0, 9.0, 11.0, 13.0, 12.0, 15.0, 20.0, 32.0, 50.0, 312.0, 245.0, 52.0, 29.0, 26.0, 14.0, 16.0, 11.0, 12.0, 11.0, 12.0, 10.0, 3.0, 5.0, 1.0, 5.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.001407623291015625, -0.0013705044984817505, -0.001333385705947876, -0.0012962669134140015, -0.001259148120880127, -0.0012220293283462524, -0.001184910535812378, -0.0011477917432785034, -0.001110672950744629, -0.0010735541582107544, -0.0010364353656768799, -0.0009993165731430054, -0.0009621977806091309, -0.0009250789880752563, -0.0008879601955413818, -0.0008508414030075073, -0.0008137226104736328, -0.0007766038179397583, -0.0007394850254058838, -0.0007023662328720093, -0.0006652474403381348, -0.0006281286478042603, -0.0005910098552703857, -0.0005538910627365112, -0.0005167722702026367, -0.0004796534776687622, -0.0004425346851348877, -0.0004054158926010132, -0.00036829710006713867, -0.00033117830753326416, -0.00029405951499938965, -0.00025694072246551514, -0.00021982192993164062, -0.0001827031373977661, -0.0001455843448638916, -0.00010846555233001709, -7.134675979614258e-05, -3.4227967262268066e-05, 2.8908252716064453e-06, 4.000961780548096e-05, 7.712841033935547e-05, 0.00011424720287322998, 0.0001513659954071045, 0.000188484787940979, 0.00022560358047485352, 0.00026272237300872803, 0.00029984116554260254, 0.00033695995807647705, 0.00037407875061035156, 0.0004111975431442261, 0.0004483163356781006, 0.0004854351282119751, 0.0005225539207458496, 0.0005596727132797241, 0.0005967915058135986, 0.0006339102983474731, 0.0006710290908813477, 0.0007081478834152222, 0.0007452666759490967, 0.0007823854684829712, 0.0008195042610168457, 0.0008566230535507202, 0.0008937418460845947, 0.0009308606386184692, 0.0009679794311523438]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 27.0, 190.0, 654.0, 138.0, 12.0], "bins": [-0.18498356640338898, -0.18196925520896912, -0.17895495891571045, -0.1759406477212906, -0.17292635142803192, -0.16991204023361206, -0.1668977439403534, -0.16388343274593353, -0.16086912155151367, -0.1578548103570938, -0.15484051406383514, -0.15182620286941528, -0.14881190657615662, -0.14579759538173676, -0.1427832841873169, -0.13976898789405823, -0.13675469160079956, -0.1337403804063797, -0.13072608411312103, -0.12771177291870117, -0.12469746917486191, -0.12168316543102264, -0.11866886168718338, -0.11565455794334412, -0.11264024674892426, -0.10962594300508499, -0.10661163926124573, -0.10359732806682587, -0.1005830243229866, -0.09756872057914734, -0.09455441683530807, -0.09154011309146881, -0.08852580189704895, -0.08551149815320969, -0.08249719440937042, -0.07948288321495056, -0.0764685794711113, -0.07345427572727203, -0.07043997198343277, -0.0674256682395935, -0.06441135704517365, -0.06139705330133438, -0.05838274583220482, -0.055368442088365555, -0.05235413461923599, -0.04933983087539673, -0.046325527131557465, -0.0433112233877182, -0.04029691591858864, -0.037282612174749374, -0.03426830470561981, -0.03125400096178055, -0.028239695355296135, -0.025225389748811722, -0.022211086004972458, -0.019196780398488045, -0.01618247479200363, -0.013168169185519218, -0.01015386451035738, -0.007139559835195541, -0.004125254228711128, -0.001110948622226715, 0.0019033551216125488, 0.004917660728096962, 0.0079319654032588]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 9.0, 17.0, 25.0, 25.0, 30.0, 33.0, 47.0, 67.0, 65.0, 57.0, 75.0, 89.0, 75.0, 70.0, 76.0, 60.0, 40.0, 40.0, 31.0, 28.0, 16.0, 6.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017644450068473816, -0.01719694957137108, -0.01674944907426834, -0.016301946714520454, -0.015854446217417717, -0.01540694572031498, -0.014959445223212242, -0.014511944726109505, -0.014064443297684193, -0.013616942800581455, -0.013169441372156143, -0.012721940875053406, -0.012274440377950668, -0.011826938949525356, -0.011379438452422619, -0.010931937023997307, -0.01048443652689457, -0.010036936029791832, -0.00958943460136652, -0.009141934104263783, -0.00869443267583847, -0.008246932178735733, -0.007799431681632996, -0.007351930718868971, -0.006904429756104946, -0.006456928793340921, -0.006009427830576897, -0.005561927333474159, -0.0051144263707101345, -0.00466692540794611, -0.004219424910843372, -0.0037719239480793476, -0.0033244220539927483, -0.0028769210912287235, -0.0024294203612953424, -0.0019819196313619614, -0.0015344186685979366, -0.001086917705833912, -0.0006394169759005308, -0.00019191624596714973, 0.000255584716796875, 0.0007030855631455779, 0.0011505864094942808, 0.0015980872558429837, 0.0020455881021916866, 0.0024930890649557114, 0.0029405897948890924, 0.0033880905248224735, 0.0038355914875864983, 0.004283092450350523, 0.004730593413114548, 0.005178093910217285, 0.00562559487298131, 0.006073095835745335, 0.006520596332848072, 0.006968097295612097, 0.0074155982583761215, 0.007863098755478859, 0.008310600183904171, 0.008758100681006908, 0.00920560210943222, 0.009653102606534958, 0.010100603103637695, 0.010548103600740433, 0.010995605029165745]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 8.0, 4.0, 5.0, 10.0, 8.0, 17.0, 24.0, 44.0, 58.0, 81.0, 141.0, 218.0, 386.0, 629.0, 1183.0, 2311.0, 5005.0, 11800.0, 36519.0, 2843278.0, 1238309.0, 33002.0, 11311.0, 4892.0, 2418.0, 1211.0, 629.0, 324.0, 195.0, 109.0, 62.0, 32.0, 21.0, 16.0, 13.0, 9.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0294036865234375, -0.028667688369750977, -0.027931690216064453, -0.02719569206237793, -0.026459693908691406, -0.025723695755004883, -0.02498769760131836, -0.024251699447631836, -0.023515701293945312, -0.02277970314025879, -0.022043704986572266, -0.021307706832885742, -0.02057170867919922, -0.019835710525512695, -0.019099712371826172, -0.01836371421813965, -0.017627716064453125, -0.0168917179107666, -0.016155719757080078, -0.015419721603393555, -0.014683723449707031, -0.013947725296020508, -0.013211727142333984, -0.012475728988647461, -0.011739730834960938, -0.011003732681274414, -0.01026773452758789, -0.009531736373901367, -0.008795738220214844, -0.00805974006652832, -0.007323741912841797, -0.0065877437591552734, -0.00585174560546875, -0.0051157474517822266, -0.004379749298095703, -0.0036437511444091797, -0.0029077529907226562, -0.002171754837036133, -0.0014357566833496094, -0.0006997585296630859, 3.62396240234375e-05, 0.0007722377777099609, 0.0015082359313964844, 0.002244234085083008, 0.0029802322387695312, 0.0037162303924560547, 0.004452228546142578, 0.0051882266998291016, 0.005924224853515625, 0.0066602230072021484, 0.007396221160888672, 0.008132219314575195, 0.008868217468261719, 0.009604215621948242, 0.010340213775634766, 0.011076211929321289, 0.011812210083007812, 0.012548208236694336, 0.01328420639038086, 0.014020204544067383, 0.014756202697753906, 0.01549220085144043, 0.016228199005126953, 0.016964197158813477, 0.0177001953125]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 6.0, 3.0, 6.0, 9.0, 11.0, 14.0, 18.0, 7.0, 26.0, 21.0, 28.0, 28.0, 26.0, 34.0, 43.0, 30.0, 50.0, 46.0, 49.0, 31.0, 50.0, 50.0, 47.0, 45.0, 49.0, 38.0, 30.0, 34.0, 27.0, 26.0, 16.0, 19.0, 24.0, 5.0, 10.0, 12.0, 2.0, 10.0, 6.0, 4.0, 10.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0066070556640625, -0.0063860416412353516, -0.006165027618408203, -0.005944013595581055, -0.005722999572753906, -0.005501985549926758, -0.005280971527099609, -0.005059957504272461, -0.0048389434814453125, -0.004617929458618164, -0.004396915435791016, -0.004175901412963867, -0.003954887390136719, -0.0037338733673095703, -0.003512859344482422, -0.0032918453216552734, -0.003070831298828125, -0.0028498172760009766, -0.002628803253173828, -0.0024077892303466797, -0.0021867752075195312, -0.001965761184692383, -0.0017447471618652344, -0.001523733139038086, -0.0013027191162109375, -0.001081705093383789, -0.0008606910705566406, -0.0006396770477294922, -0.00041866302490234375, -0.0001976490020751953, 2.3365020751953125e-05, 0.00024437904357910156, 0.00046539306640625, 0.0006864070892333984, 0.0009074211120605469, 0.0011284351348876953, 0.0013494491577148438, 0.0015704631805419922, 0.0017914772033691406, 0.002012491226196289, 0.0022335052490234375, 0.002454519271850586, 0.0026755332946777344, 0.002896547317504883, 0.0031175613403320312, 0.0033385753631591797, 0.003559589385986328, 0.0037806034088134766, 0.004001617431640625, 0.0042226314544677734, 0.004443645477294922, 0.00466465950012207, 0.004885673522949219, 0.005106687545776367, 0.005327701568603516, 0.005548715591430664, 0.0057697296142578125, 0.005990743637084961, 0.006211757659912109, 0.006432771682739258, 0.006653785705566406, 0.006874799728393555, 0.007095813751220703, 0.0073168277740478516, 0.007537841796875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 6.0, 7.0, 12.0, 17.0, 37.0, 73.0, 183.0, 979.0, 9555.0, 3997762.0, 180356.0, 4518.0, 563.0, 129.0, 47.0, 15.0, 12.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0399169921875, -0.037400245666503906, -0.03488349914550781, -0.03236675262451172, -0.029850006103515625, -0.02733325958251953, -0.024816513061523438, -0.022299766540527344, -0.01978302001953125, -0.017266273498535156, -0.014749526977539062, -0.012232780456542969, -0.009716033935546875, -0.007199287414550781, -0.0046825408935546875, -0.0021657943725585938, 0.0003509521484375, 0.0028676986694335938, 0.0053844451904296875, 0.007901191711425781, 0.010417938232421875, 0.012934684753417969, 0.015451431274414062, 0.017968177795410156, 0.02048492431640625, 0.023001670837402344, 0.025518417358398438, 0.02803516387939453, 0.030551910400390625, 0.03306865692138672, 0.03558540344238281, 0.038102149963378906, 0.040618896484375, 0.043135643005371094, 0.04565238952636719, 0.04816913604736328, 0.050685882568359375, 0.05320262908935547, 0.05571937561035156, 0.058236122131347656, 0.06075286865234375, 0.06326961517333984, 0.06578636169433594, 0.06830310821533203, 0.07081985473632812, 0.07333660125732422, 0.07585334777832031, 0.0783700942993164, 0.0808868408203125, 0.0834035873413086, 0.08592033386230469, 0.08843708038330078, 0.09095382690429688, 0.09347057342529297, 0.09598731994628906, 0.09850406646728516, 0.10102081298828125, 0.10353755950927734, 0.10605430603027344, 0.10857105255126953, 0.11108779907226562, 0.11360454559326172, 0.11612129211425781, 0.1186380386352539, 0.12115478515625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 3.0, 9.0, 16.0, 14.0, 18.0, 32.0, 51.0, 125.0, 389.0, 1448.0, 1258.0, 384.0, 126.0, 47.0, 43.0, 27.0, 22.0, 10.0, 10.0, 12.0, 7.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006702423095703125, -0.006546467542648315, -0.006390511989593506, -0.006234556436538696, -0.006078600883483887, -0.005922645330429077, -0.005766689777374268, -0.005610734224319458, -0.0054547786712646484, -0.005298823118209839, -0.005142867565155029, -0.00498691201210022, -0.00483095645904541, -0.004675000905990601, -0.004519045352935791, -0.0043630897998809814, -0.004207134246826172, -0.004051178693771362, -0.0038952231407165527, -0.003739267587661743, -0.0035833120346069336, -0.003427356481552124, -0.0032714009284973145, -0.003115445375442505, -0.0029594898223876953, -0.0028035342693328857, -0.002647578716278076, -0.0024916231632232666, -0.002335667610168457, -0.0021797120571136475, -0.002023756504058838, -0.0018678009510040283, -0.0017118453979492188, -0.0015558898448944092, -0.0013999342918395996, -0.00124397873878479, -0.0010880231857299805, -0.0009320676326751709, -0.0007761120796203613, -0.0006201565265655518, -0.0004642009735107422, -0.0003082454204559326, -0.00015228986740112305, 3.6656856536865234e-06, 0.0001596212387084961, 0.00031557679176330566, 0.00047153234481811523, 0.0006274878978729248, 0.0007834434509277344, 0.0009393990039825439, 0.0010953545570373535, 0.001251310110092163, 0.0014072656631469727, 0.0015632212162017822, 0.0017191767692565918, 0.0018751323223114014, 0.002031087875366211, 0.0021870434284210205, 0.00234299898147583, 0.0024989545345306396, 0.0026549100875854492, 0.002810865640640259, 0.0029668211936950684, 0.003122776746749878, 0.0032787322998046875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 25.0, 139.0, 445.0, 318.0, 71.0, 19.0], "bins": [-0.09747523814439774, -0.0958714708685875, -0.09426771104335785, -0.09266394376754761, -0.09106017649173737, -0.08945640921592712, -0.08785264194011688, -0.08624888211488724, -0.084645114839077, -0.08304134756326675, -0.08143758773803711, -0.07983382046222687, -0.07823005318641663, -0.07662628591060638, -0.07502251863479614, -0.0734187588095665, -0.07181499153375626, -0.07021122425794601, -0.06860746443271637, -0.06700369715690613, -0.06539992988109589, -0.06379616260528564, -0.0621923990547657, -0.06058863550424576, -0.058984868228435516, -0.057381100952625275, -0.05577733740210533, -0.05417357385158539, -0.052569806575775146, -0.050966039299964905, -0.04936227574944496, -0.04775851219892502, -0.046154748648405075, -0.04455098509788513, -0.04294721782207489, -0.04134345054626465, -0.039739686995744705, -0.03813592344522476, -0.03653215616941452, -0.03492838889360428, -0.033324625343084335, -0.03172086179256439, -0.03011709451675415, -0.028513329103589058, -0.026909563690423965, -0.025305798277258873, -0.02370203286409378, -0.022098267450928688, -0.020494502037763596, -0.018890736624598503, -0.01728697121143341, -0.015683205798268318, -0.014079440385103226, -0.012475674971938133, -0.01087190955877304, -0.009268144145607948, -0.007664377801120281, -0.006060612387955189, -0.004456846974790096, -0.002853081561625004, -0.0012493161484599113, 0.0003544492647051811, 0.0019582146778702736, 0.003561980091035366, 0.0051657455042004585]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 6.0, 5.0, 12.0, 12.0, 6.0, 14.0, 12.0, 17.0, 19.0, 28.0, 22.0, 28.0, 29.0, 29.0, 39.0, 38.0, 34.0, 32.0, 44.0, 49.0, 39.0, 38.0, 32.0, 42.0, 40.0, 40.0, 41.0, 39.0, 27.0, 26.0, 31.0, 23.0, 21.0, 12.0, 13.0, 9.0, 10.0, 9.0, 8.0, 5.0, 9.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.006525201257318258, -0.0063241696916520596, -0.006123138125985861, -0.005922106560319662, -0.005721074528992176, -0.005520042963325977, -0.005319011397659779, -0.00511797983199358, -0.004916948266327381, -0.004715916700661182, -0.004514885134994984, -0.004313853569328785, -0.004112822003662586, -0.0039117904379963875, -0.0037107584066689014, -0.0035097268410027027, -0.003308695275336504, -0.0031076637096703053, -0.0029066321440041065, -0.002705600345507264, -0.0025045687798410654, -0.0023035372141748667, -0.0021025054156780243, -0.0019014738500118256, -0.0017004422843456268, -0.001499410718679428, -0.0012983790365979075, -0.001097347354516387, -0.0008963157888501883, -0.0006952842231839895, -0.000494252541102469, -0.0002932208590209484, -9.218975901603699e-05, 0.00010884186485782266, 0.0003098734887316823, 0.0005109051126055419, 0.0007119367364794016, 0.0009129683021456003, 0.0011139999842271209, 0.0013150316663086414, 0.0015160632319748402, 0.001717094797641039, 0.0019181264797225595, 0.00211915816180408, 0.0023201897274702787, 0.0025212212931364775, 0.00272225309163332, 0.0029232846572995186, 0.0031243162229657173, 0.003325347788631916, 0.0035263793542981148, 0.003727411152794957, 0.003928442485630512, 0.004129474051296711, 0.004330506082624197, 0.004531537648290396, 0.0047325692139565945, 0.004933600779622793, 0.005134632345288992, 0.005335663910955191, 0.005536695942282677, 0.005737727507948875, 0.005938759073615074, 0.006139790639281273, 0.006340822204947472]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 13.0, 12.0, 27.0, 35.0, 54.0, 90.0, 164.0, 225.0, 304.0, 454.0, 735.0, 1014.0, 1456.0, 2150.0, 3121.0, 4497.0, 6600.0, 9767.0, 14421.0, 22022.0, 34005.0, 55034.0, 96712.0, 182314.0, 244529.0, 150568.0, 81354.0, 47483.0, 29853.0, 19265.0, 12779.0, 8718.0, 6066.0, 3939.0, 2771.0, 1877.0, 1315.0, 931.0, 642.0, 437.0, 267.0, 174.0, 141.0, 84.0, 52.0, 32.0, 16.0, 17.0, 13.0, 8.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.002471923828125, -0.0023978054523468018, -0.0023236870765686035, -0.0022495687007904053, -0.002175450325012207, -0.002101331949234009, -0.0020272135734558105, -0.0019530951976776123, -0.001878976821899414, -0.0018048584461212158, -0.0017307400703430176, -0.0016566216945648193, -0.001582503318786621, -0.0015083849430084229, -0.0014342665672302246, -0.0013601481914520264, -0.0012860298156738281, -0.0012119114398956299, -0.0011377930641174316, -0.0010636746883392334, -0.0009895563125610352, -0.0009154379367828369, -0.0008413195610046387, -0.0007672011852264404, -0.0006930828094482422, -0.0006189644336700439, -0.0005448460578918457, -0.00047072768211364746, -0.0003966093063354492, -0.000322490930557251, -0.00024837255477905273, -0.0001742541790008545, -0.00010013580322265625, -2.6017427444458008e-05, 4.8100948333740234e-05, 0.00012221932411193848, 0.00019633769989013672, 0.00027045607566833496, 0.0003445744514465332, 0.00041869282722473145, 0.0004928112030029297, 0.0005669295787811279, 0.0006410479545593262, 0.0007151663303375244, 0.0007892847061157227, 0.0008634030818939209, 0.0009375214576721191, 0.0010116398334503174, 0.0010857582092285156, 0.0011598765850067139, 0.0012339949607849121, 0.0013081133365631104, 0.0013822317123413086, 0.0014563500881195068, 0.001530468463897705, 0.0016045868396759033, 0.0016787052154541016, 0.0017528235912322998, 0.001826941967010498, 0.0019010603427886963, 0.0019751787185668945, 0.0020492970943450928, 0.002123415470123291, 0.0021975338459014893, 0.0022716522216796875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 5.0, 5.0, 9.0, 5.0, 8.0, 13.0, 14.0, 17.0, 19.0, 21.0, 24.0, 32.0, 28.0, 26.0, 29.0, 33.0, 34.0, 37.0, 42.0, 34.0, 45.0, 44.0, 35.0, 36.0, 47.0, 46.0, 29.0, 47.0, 26.0, 40.0, 22.0, 18.0, 21.0, 14.0, 22.0, 12.0, 9.0, 8.0, 8.0, 11.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005443572998046875, -0.005273759365081787, -0.005103945732116699, -0.004934132099151611, -0.0047643184661865234, -0.0045945048332214355, -0.004424691200256348, -0.00425487756729126, -0.004085063934326172, -0.003915250301361084, -0.003745436668395996, -0.003575623035430908, -0.0034058094024658203, -0.0032359957695007324, -0.0030661821365356445, -0.0028963685035705566, -0.0027265548706054688, -0.002556741237640381, -0.002386927604675293, -0.002217113971710205, -0.002047300338745117, -0.0018774867057800293, -0.0017076730728149414, -0.0015378594398498535, -0.0013680458068847656, -0.0011982321739196777, -0.0010284185409545898, -0.000858604907989502, -0.0006887912750244141, -0.0005189776420593262, -0.0003491640090942383, -0.0001793503761291504, -9.5367431640625e-06, 0.0001602768898010254, 0.0003300905227661133, 0.0004999041557312012, 0.0006697177886962891, 0.000839531421661377, 0.0010093450546264648, 0.0011791586875915527, 0.0013489723205566406, 0.0015187859535217285, 0.0016885995864868164, 0.0018584132194519043, 0.002028226852416992, 0.00219804048538208, 0.002367854118347168, 0.002537667751312256, 0.0027074813842773438, 0.0028772950172424316, 0.0030471086502075195, 0.0032169222831726074, 0.0033867359161376953, 0.003556549549102783, 0.003726363182067871, 0.003896176815032959, 0.004065990447998047, 0.004235804080963135, 0.004405617713928223, 0.0045754313468933105, 0.0047452449798583984, 0.004915058612823486, 0.005084872245788574, 0.005254685878753662, 0.00542449951171875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 11.0, 14.0, 10.0, 19.0, 32.0, 47.0, 71.0, 95.0, 133.0, 201.0, 258.0, 444.0, 612.0, 902.0, 1383.0, 1963.0, 2984.0, 4642.0, 6969.0, 10978.0, 17154.0, 27860.0, 47319.0, 87897.0, 190488.0, 319609.0, 147471.0, 72120.0, 40109.0, 23857.0, 14673.0, 9639.0, 6325.0, 4088.0, 2714.0, 1756.0, 1165.0, 813.0, 522.0, 373.0, 254.0, 185.0, 107.0, 99.0, 58.0, 39.0, 29.0, 24.0, 15.0, 12.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.00257110595703125, -0.0024916231632232666, -0.002412140369415283, -0.0023326575756073, -0.0022531747817993164, -0.002173691987991333, -0.0020942091941833496, -0.002014726400375366, -0.0019352436065673828, -0.0018557608127593994, -0.001776278018951416, -0.0016967952251434326, -0.0016173124313354492, -0.0015378296375274658, -0.0014583468437194824, -0.001378864049911499, -0.0012993812561035156, -0.0012198984622955322, -0.0011404156684875488, -0.0010609328746795654, -0.000981450080871582, -0.0009019672870635986, -0.0008224844932556152, -0.0007430016994476318, -0.0006635189056396484, -0.000584036111831665, -0.0005045533180236816, -0.00042507052421569824, -0.00034558773040771484, -0.00026610493659973145, -0.00018662214279174805, -0.00010713934898376465, -2.765655517578125e-05, 5.182623863220215e-05, 0.00013130903244018555, 0.00021079182624816895, 0.00029027462005615234, 0.00036975741386413574, 0.00044924020767211914, 0.0005287230014801025, 0.0006082057952880859, 0.0006876885890960693, 0.0007671713829040527, 0.0008466541767120361, 0.0009261369705200195, 0.001005619764328003, 0.0010851025581359863, 0.0011645853519439697, 0.0012440681457519531, 0.0013235509395599365, 0.00140303373336792, 0.0014825165271759033, 0.0015619993209838867, 0.0016414821147918701, 0.0017209649085998535, 0.001800447702407837, 0.0018799304962158203, 0.0019594132900238037, 0.002038896083831787, 0.0021183788776397705, 0.002197861671447754, 0.0022773444652557373, 0.0023568272590637207, 0.002436310052871704, 0.0025157928466796875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 5.0, 6.0, 12.0, 16.0, 11.0, 12.0, 18.0, 13.0, 20.0, 24.0, 26.0, 20.0, 33.0, 28.0, 37.0, 31.0, 50.0, 38.0, 49.0, 38.0, 39.0, 48.0, 39.0, 37.0, 32.0, 36.0, 37.0, 34.0, 33.0, 31.0, 22.0, 32.0, 13.0, 15.0, 15.0, 9.0, 9.0, 11.0, 10.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032634735107421875, -0.0031522810459136963, -0.003041088581085205, -0.002929896116256714, -0.0028187036514282227, -0.0027075111865997314, -0.0025963187217712402, -0.002485126256942749, -0.002373933792114258, -0.0022627413272857666, -0.0021515488624572754, -0.002040356397628784, -0.001929163932800293, -0.0018179714679718018, -0.0017067790031433105, -0.0015955865383148193, -0.0014843940734863281, -0.001373201608657837, -0.0012620091438293457, -0.0011508166790008545, -0.0010396242141723633, -0.0009284317493438721, -0.0008172392845153809, -0.0007060468196868896, -0.0005948543548583984, -0.0004836618900299072, -0.000372469425201416, -0.0002612769603729248, -0.0001500844955444336, -3.889203071594238e-05, 7.230043411254883e-05, 0.00018349289894104004, 0.00029468536376953125, 0.00040587782859802246, 0.0005170702934265137, 0.0006282627582550049, 0.0007394552230834961, 0.0008506476879119873, 0.0009618401527404785, 0.0010730326175689697, 0.001184225082397461, 0.0012954175472259521, 0.0014066100120544434, 0.0015178024768829346, 0.0016289949417114258, 0.001740187406539917, 0.0018513798713684082, 0.0019625723361968994, 0.0020737648010253906, 0.002184957265853882, 0.002296149730682373, 0.0024073421955108643, 0.0025185346603393555, 0.0026297271251678467, 0.002740919589996338, 0.002852112054824829, 0.0029633045196533203, 0.0030744969844818115, 0.0031856894493103027, 0.003296881914138794, 0.003408074378967285, 0.0035192668437957764, 0.0036304593086242676, 0.003741651773452759, 0.00385284423828125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 7.0, 8.0, 6.0, 15.0, 17.0, 22.0, 28.0, 44.0, 65.0, 88.0, 106.0, 168.0, 287.0, 384.0, 570.0, 944.0, 1427.0, 2374.0, 3893.0, 6741.0, 12596.0, 23782.0, 50689.0, 126939.0, 504070.0, 185508.0, 63375.0, 29402.0, 14845.0, 8098.0, 4650.0, 2780.0, 1653.0, 1026.0, 673.0, 411.0, 284.0, 170.0, 118.0, 74.0, 80.0, 46.0, 12.0, 28.0, 24.0, 13.0, 7.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001252889633178711, -0.00012145098298788071, -0.00011761300265789032, -0.00011377502232789993, -0.00010993704199790955, -0.00010609906166791916, -0.00010226108133792877, -9.842310100793839e-05, -9.4585120677948e-05, -9.074714034795761e-05, -8.690916001796722e-05, -8.307117968797684e-05, -7.923319935798645e-05, -7.539521902799606e-05, -7.155723869800568e-05, -6.771925836801529e-05, -6.38812780380249e-05, -6.0043297708034515e-05, -5.620531737804413e-05, -5.236733704805374e-05, -4.8529356718063354e-05, -4.469137638807297e-05, -4.085339605808258e-05, -3.7015415728092194e-05, -3.317743539810181e-05, -2.933945506811142e-05, -2.5501474738121033e-05, -2.1663494408130646e-05, -1.782551407814026e-05, -1.3987533748149872e-05, -1.0149553418159485e-05, -6.311573088169098e-06, -2.473592758178711e-06, 1.364387571811676e-06, 5.202367901802063e-06, 9.04034823179245e-06, 1.2878328561782837e-05, 1.6716308891773224e-05, 2.055428922176361e-05, 2.4392269551753998e-05, 2.8230249881744385e-05, 3.206823021173477e-05, 3.590621054172516e-05, 3.9744190871715546e-05, 4.358217120170593e-05, 4.742015153169632e-05, 5.1258131861686707e-05, 5.5096112191677094e-05, 5.893409252166748e-05, 6.277207285165787e-05, 6.661005318164825e-05, 7.044803351163864e-05, 7.428601384162903e-05, 7.812399417161942e-05, 8.19619745016098e-05, 8.579995483160019e-05, 8.963793516159058e-05, 9.347591549158096e-05, 9.731389582157135e-05, 0.00010115187615156174, 0.00010498985648155212, 0.00010882783681154251, 0.0001126658171415329, 0.00011650379747152328, 0.00012034177780151367]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 2.0, 2.0, 4.0, 6.0, 14.0, 10.0, 11.0, 17.0, 26.0, 32.0, 41.0, 75.0, 86.0, 121.0, 101.0, 100.0, 78.0, 81.0, 62.0, 39.0, 23.0, 15.0, 10.0, 7.0, 7.0, 8.0, 2.0, 6.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4483928680419922e-05, -1.3974495232105255e-05, -1.3465061783790588e-05, -1.2955628335475922e-05, -1.2446194887161255e-05, -1.1936761438846588e-05, -1.1427327990531921e-05, -1.0917894542217255e-05, -1.0408461093902588e-05, -9.899027645587921e-06, -9.389594197273254e-06, -8.880160748958588e-06, -8.370727300643921e-06, -7.861293852329254e-06, -7.351860404014587e-06, -6.842426955699921e-06, -6.332993507385254e-06, -5.823560059070587e-06, -5.31412661075592e-06, -4.804693162441254e-06, -4.295259714126587e-06, -3.78582626581192e-06, -3.2763928174972534e-06, -2.7669593691825867e-06, -2.25752592086792e-06, -1.7480924725532532e-06, -1.2386590242385864e-06, -7.292255759239197e-07, -2.1979212760925293e-07, 2.896413207054138e-07, 7.990747690200806e-07, 1.3085082173347473e-06, 1.817941665649414e-06, 2.327375113964081e-06, 2.8368085622787476e-06, 3.3462420105934143e-06, 3.855675458908081e-06, 4.365108907222748e-06, 4.8745423555374146e-06, 5.383975803852081e-06, 5.893409252166748e-06, 6.402842700481415e-06, 6.9122761487960815e-06, 7.421709597110748e-06, 7.931143045425415e-06, 8.440576493740082e-06, 8.950009942054749e-06, 9.459443390369415e-06, 9.968876838684082e-06, 1.0478310286998749e-05, 1.0987743735313416e-05, 1.1497177183628082e-05, 1.2006610631942749e-05, 1.2516044080257416e-05, 1.3025477528572083e-05, 1.353491097688675e-05, 1.4044344425201416e-05, 1.4553777873516083e-05, 1.506321132183075e-05, 1.5572644770145416e-05, 1.6082078218460083e-05, 1.659151166677475e-05, 1.7100945115089417e-05, 1.7610378563404083e-05, 1.811981201171875e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 11.0, 4.0, 10.0, 18.0, 21.0, 22.0, 53.0, 58.0, 93.0, 216.0, 1763.0, 240967.0, 801603.0, 3122.0, 252.0, 90.0, 67.0, 51.0, 35.0, 34.0, 17.0, 7.0, 9.0, 8.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001049041748046875, -0.00101529061794281, -0.0009815394878387451, -0.0009477883577346802, -0.0009140372276306152, -0.0008802860975265503, -0.0008465349674224854, -0.0008127838373184204, -0.0007790327072143555, -0.0007452815771102905, -0.0007115304470062256, -0.0006777793169021606, -0.0006440281867980957, -0.0006102770566940308, -0.0005765259265899658, -0.0005427747964859009, -0.0005090236663818359, -0.000475272536277771, -0.00044152140617370605, -0.0004077702760696411, -0.00037401914596557617, -0.00034026801586151123, -0.0003065168857574463, -0.00027276575565338135, -0.0002390146255493164, -0.00020526349544525146, -0.00017151236534118652, -0.00013776123523712158, -0.00010401010513305664, -7.02589750289917e-05, -3.650784492492676e-05, -2.7567148208618164e-06, 3.0994415283203125e-05, 6.474554538726807e-05, 9.849667549133301e-05, 0.00013224780559539795, 0.0001659989356994629, 0.00019975006580352783, 0.00023350119590759277, 0.0002672523260116577, 0.00030100345611572266, 0.0003347545862197876, 0.00036850571632385254, 0.0004022568464279175, 0.0004360079765319824, 0.00046975910663604736, 0.0005035102367401123, 0.0005372613668441772, 0.0005710124969482422, 0.0006047636270523071, 0.0006385147571563721, 0.000672265887260437, 0.000706017017364502, 0.0007397681474685669, 0.0007735192775726318, 0.0008072704076766968, 0.0008410215377807617, 0.0008747726678848267, 0.0009085237979888916, 0.0009422749280929565, 0.0009760260581970215, 0.0010097771883010864, 0.0010435283184051514, 0.0010772794485092163, 0.0011110305786132812]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 1.0, 4.0, 5.0, 6.0, 6.0, 7.0, 10.0, 15.0, 17.0, 18.0, 25.0, 27.0, 32.0, 56.0, 57.0, 70.0, 95.0, 96.0, 74.0, 58.0, 77.0, 41.0, 34.0, 26.0, 27.0, 25.0, 19.0, 12.0, 13.0, 9.0, 12.0, 2.0, 4.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.7060508728027344e-05, -2.625584602355957e-05, -2.5451183319091797e-05, -2.4646520614624023e-05, -2.384185791015625e-05, -2.3037195205688477e-05, -2.2232532501220703e-05, -2.142786979675293e-05, -2.0623207092285156e-05, -1.9818544387817383e-05, -1.901388168334961e-05, -1.8209218978881836e-05, -1.7404556274414062e-05, -1.659989356994629e-05, -1.5795230865478516e-05, -1.4990568161010742e-05, -1.4185905456542969e-05, -1.3381242752075195e-05, -1.2576580047607422e-05, -1.1771917343139648e-05, -1.0967254638671875e-05, -1.0162591934204102e-05, -9.357929229736328e-06, -8.553266525268555e-06, -7.748603820800781e-06, -6.943941116333008e-06, -6.139278411865234e-06, -5.334615707397461e-06, -4.5299530029296875e-06, -3.725290298461914e-06, -2.9206275939941406e-06, -2.115964889526367e-06, -1.3113021850585938e-06, -5.066394805908203e-07, 2.980232238769531e-07, 1.1026859283447266e-06, 1.9073486328125e-06, 2.7120113372802734e-06, 3.516674041748047e-06, 4.32133674621582e-06, 5.125999450683594e-06, 5.930662155151367e-06, 6.735324859619141e-06, 7.539987564086914e-06, 8.344650268554688e-06, 9.149312973022461e-06, 9.953975677490234e-06, 1.0758638381958008e-05, 1.1563301086425781e-05, 1.2367963790893555e-05, 1.3172626495361328e-05, 1.3977289199829102e-05, 1.4781951904296875e-05, 1.558661460876465e-05, 1.6391277313232422e-05, 1.7195940017700195e-05, 1.800060272216797e-05, 1.8805265426635742e-05, 1.9609928131103516e-05, 2.041459083557129e-05, 2.1219253540039062e-05, 2.2023916244506836e-05, 2.282857894897461e-05, 2.3633241653442383e-05, 2.4437904357910156e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 9.0, 13.0, 38.0, 60.0, 99.0, 135.0, 162.0, 160.0, 120.0, 92.0, 51.0, 24.0, 15.0, 13.0, 6.0, 5.0, 1.0, 2.0], "bins": [-0.027524862438440323, -0.027002884075045586, -0.02648090571165085, -0.02595892734825611, -0.025436948984861374, -0.024914972484111786, -0.0243929922580719, -0.02387101575732231, -0.023349037393927574, -0.022827059030532837, -0.0223050806671381, -0.021783102303743362, -0.021261123940348625, -0.020739145576953888, -0.0202171690762043, -0.019695190712809563, -0.019173212349414825, -0.018651233986020088, -0.01812925562262535, -0.017607277259230614, -0.017085298895835876, -0.01656332239508629, -0.016041342169046402, -0.01551936473697424, -0.014997385442256927, -0.01447540707886219, -0.013953428715467453, -0.013431450352072716, -0.012909472920000553, -0.012387494556605816, -0.011865516193211079, -0.011343537829816341, -0.01082155853509903, -0.010299580171704292, -0.009777601808309555, -0.009255623444914818, -0.008733646012842655, -0.008211667649447918, -0.007689689286053181, -0.0071677109226584435, -0.006645733490586281, -0.006123755127191544, -0.005601777229458094, -0.005079798866063356, -0.0045578209683299065, -0.004035842604935169, -0.003513864241540432, -0.0029918861109763384, -0.002469907980412245, -0.0019479298498481512, -0.0014259516028687358, -0.0009039733558893204, -0.0003819952253252268, 0.0001399829052388668, 0.000661961268633604, 0.0011839393991976976, 0.0017059175297617912, 0.002227895660325885, 0.0027498737908899784, 0.0032718521542847157, 0.0037938302848488092, 0.004315808415412903, 0.00483778677880764, 0.005359765142202377, 0.005881743039935827]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 6.0, 7.0, 7.0, 16.0, 10.0, 15.0, 7.0, 22.0, 21.0, 19.0, 34.0, 25.0, 21.0, 24.0, 38.0, 43.0, 36.0, 34.0, 51.0, 43.0, 43.0, 26.0, 38.0, 44.0, 41.0, 43.0, 31.0, 27.0, 30.0, 28.0, 20.0, 24.0, 19.0, 23.0, 19.0, 8.0, 7.0, 16.0, 5.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.005077775102108717, -0.004920319654047489, -0.004762864671647549, -0.004605409223586321, -0.004447953775525093, -0.004290498793125153, -0.004133043345063925, -0.003975587897002697, -0.0038181329146027565, -0.0036606776993721724, -0.003503222484141588, -0.0033457670360803604, -0.0031883118208497763, -0.003030856605619192, -0.0028734011575579643, -0.00271594594232738, -0.002558490727096796, -0.002401035511866212, -0.0022435802966356277, -0.0020861248485744, -0.0019286696333438158, -0.0017712144181132317, -0.0016137590864673257, -0.0014563037548214197, -0.0012988485395908356, -0.0011413933243602514, -0.0009839379927143455, -0.0008264827192761004, -0.0006690274458378553, -0.0005115721723996103, -0.0003541168989613652, -0.00019666156731545925, -3.920635208487511e-05, 0.00011824892135336995, 0.000275704194791615, 0.00043315946822986007, 0.0005906147416681051, 0.0007480700151063502, 0.0009055252885445952, 0.0010629806201905012, 0.0012204358354210854, 0.0013778910506516695, 0.0015353463822975755, 0.0016928017139434814, 0.0018502569291740656, 0.0020077121444046497, 0.0021651675924658775, 0.0023226228076964617, 0.002480078022927046, 0.00263753323815763, 0.002794988453388214, 0.002952443901449442, 0.003109899116680026, 0.00326735433191061, 0.003424809779971838, 0.003582264995202422, 0.0037397202104330063, 0.0038971754256635904, 0.004054630640894175, 0.004212086088955402, 0.004369541071355343, 0.004526996519416571, 0.0046844519674777985, 0.004841906949877739, 0.004999362397938967]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 4.0, 10.0, 8.0, 10.0, 18.0, 23.0, 37.0, 57.0, 67.0, 112.0, 203.0, 246.0, 356.0, 562.0, 916.0, 1434.0, 2213.0, 3455.0, 5643.0, 8919.0, 14407.0, 23964.0, 39716.0, 64904.0, 102126.0, 149606.0, 178355.0, 157534.0, 110748.0, 70877.0, 43311.0, 26358.0, 15957.0, 9790.0, 5999.0, 3716.0, 2389.0, 1572.0, 990.0, 635.0, 417.0, 306.0, 198.0, 119.0, 76.0, 49.0, 49.0, 32.0, 21.0, 16.0, 10.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0118255615234375, -0.011425971984863281, -0.011026382446289062, -0.010626792907714844, -0.010227203369140625, -0.009827613830566406, -0.009428024291992188, -0.009028434753417969, -0.00862884521484375, -0.008229255676269531, -0.007829666137695312, -0.007430076599121094, -0.007030487060546875, -0.006630897521972656, -0.0062313079833984375, -0.005831718444824219, -0.00543212890625, -0.005032539367675781, -0.0046329498291015625, -0.004233360290527344, -0.003833770751953125, -0.0034341812133789062, -0.0030345916748046875, -0.0026350021362304688, -0.00223541259765625, -0.0018358230590820312, -0.0014362335205078125, -0.0010366439819335938, -0.000637054443359375, -0.00023746490478515625, 0.0001621246337890625, 0.0005617141723632812, 0.0009613037109375, 0.0013608932495117188, 0.0017604827880859375, 0.0021600723266601562, 0.002559661865234375, 0.0029592514038085938, 0.0033588409423828125, 0.0037584304809570312, 0.00415802001953125, 0.004557609558105469, 0.0049571990966796875, 0.005356788635253906, 0.005756378173828125, 0.006155967712402344, 0.0065555572509765625, 0.006955146789550781, 0.007354736328125, 0.007754325866699219, 0.008153915405273438, 0.008553504943847656, 0.008953094482421875, 0.009352684020996094, 0.009752273559570312, 0.010151863098144531, 0.01055145263671875, 0.010951042175292969, 0.011350631713867188, 0.011750221252441406, 0.012149810791015625, 0.012549400329589844, 0.012948989868164062, 0.013348579406738281, 0.0137481689453125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 10.0, 14.0, 8.0, 11.0, 11.0, 24.0, 28.0, 24.0, 42.0, 30.0, 38.0, 38.0, 61.0, 30.0, 60.0, 56.0, 60.0, 52.0, 35.0, 50.0, 48.0, 41.0, 46.0, 32.0, 26.0, 21.0, 27.0, 25.0, 14.0, 13.0, 3.0, 4.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005207061767578125, -0.00499957799911499, -0.0047920942306518555, -0.004584610462188721, -0.004377126693725586, -0.004169642925262451, -0.003962159156799316, -0.0037546753883361816, -0.003547191619873047, -0.003339707851409912, -0.0031322240829467773, -0.0029247403144836426, -0.002717256546020508, -0.002509772777557373, -0.0023022890090942383, -0.0020948052406311035, -0.0018873214721679688, -0.001679837703704834, -0.0014723539352416992, -0.0012648701667785645, -0.0010573863983154297, -0.0008499026298522949, -0.0006424188613891602, -0.0004349350929260254, -0.00022745132446289062, -1.996755599975586e-05, 0.0001875162124633789, 0.00039499998092651367, 0.0006024837493896484, 0.0008099675178527832, 0.001017451286315918, 0.0012249350547790527, 0.0014324188232421875, 0.0016399025917053223, 0.001847386360168457, 0.002054870128631592, 0.0022623538970947266, 0.0024698376655578613, 0.002677321434020996, 0.002884805202484131, 0.0030922889709472656, 0.0032997727394104004, 0.003507256507873535, 0.00371474027633667, 0.003922224044799805, 0.0041297078132629395, 0.004337191581726074, 0.004544675350189209, 0.004752159118652344, 0.0049596428871154785, 0.005167126655578613, 0.005374610424041748, 0.005582094192504883, 0.005789577960968018, 0.005997061729431152, 0.006204545497894287, 0.006412029266357422, 0.006619513034820557, 0.006826996803283691, 0.007034480571746826, 0.007241964340209961, 0.007449448108673096, 0.0076569318771362305, 0.007864415645599365, 0.0080718994140625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 8.0, 4.0, 7.0, 11.0, 6.0, 8.0, 17.0, 12.0, 19.0, 18.0, 19.0, 23.0, 36.0, 81.0, 212.0, 631.0, 2237.0, 7926.0, 28688.0, 101753.0, 310567.0, 384551.0, 151833.0, 43115.0, 11956.0, 3325.0, 918.0, 252.0, 92.0, 59.0, 37.0, 27.0, 19.0, 8.0, 12.0, 22.0, 10.0, 4.0, 7.0, 3.0, 7.0, 9.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0261077880859375, -0.02529597282409668, -0.02448415756225586, -0.02367234230041504, -0.02286052703857422, -0.0220487117767334, -0.021236896514892578, -0.020425081253051758, -0.019613265991210938, -0.018801450729370117, -0.017989635467529297, -0.017177820205688477, -0.016366004943847656, -0.015554189682006836, -0.014742374420166016, -0.013930559158325195, -0.013118743896484375, -0.012306928634643555, -0.011495113372802734, -0.010683298110961914, -0.009871482849121094, -0.009059667587280273, -0.008247852325439453, -0.007436037063598633, -0.0066242218017578125, -0.005812406539916992, -0.005000591278076172, -0.0041887760162353516, -0.0033769607543945312, -0.002565145492553711, -0.0017533302307128906, -0.0009415149688720703, -0.00012969970703125, 0.0006821155548095703, 0.0014939308166503906, 0.002305746078491211, 0.0031175613403320312, 0.0039293766021728516, 0.004741191864013672, 0.005553007125854492, 0.0063648223876953125, 0.007176637649536133, 0.007988452911376953, 0.008800268173217773, 0.009612083435058594, 0.010423898696899414, 0.011235713958740234, 0.012047529220581055, 0.012859344482421875, 0.013671159744262695, 0.014482975006103516, 0.015294790267944336, 0.016106605529785156, 0.016918420791625977, 0.017730236053466797, 0.018542051315307617, 0.019353866577148438, 0.020165681838989258, 0.020977497100830078, 0.0217893123626709, 0.02260112762451172, 0.02341294288635254, 0.02422475814819336, 0.02503657341003418, 0.025848388671875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 6.0, 3.0, 6.0, 7.0, 10.0, 10.0, 10.0, 9.0, 12.0, 18.0, 20.0, 18.0, 26.0, 37.0, 33.0, 34.0, 26.0, 38.0, 34.0, 33.0, 46.0, 48.0, 32.0, 52.0, 46.0, 38.0, 39.0, 37.0, 28.0, 22.0, 40.0, 20.0, 26.0, 15.0, 22.0, 10.0, 11.0, 16.0, 13.0, 9.0, 11.0, 8.0, 8.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.004192352294921875, -0.004058241844177246, -0.003924131393432617, -0.0037900209426879883, -0.0036559104919433594, -0.0035218000411987305, -0.0033876895904541016, -0.0032535791397094727, -0.0031194686889648438, -0.002985358238220215, -0.002851247787475586, -0.002717137336730957, -0.002583026885986328, -0.0024489164352416992, -0.0023148059844970703, -0.0021806955337524414, -0.0020465850830078125, -0.0019124746322631836, -0.0017783641815185547, -0.0016442537307739258, -0.0015101432800292969, -0.001376032829284668, -0.001241922378540039, -0.0011078119277954102, -0.0009737014770507812, -0.0008395910263061523, -0.0007054805755615234, -0.0005713701248168945, -0.0004372596740722656, -0.0003031492233276367, -0.0001690387725830078, -3.4928321838378906e-05, 9.918212890625e-05, 0.0002332925796508789, 0.0003674030303955078, 0.0005015134811401367, 0.0006356239318847656, 0.0007697343826293945, 0.0009038448333740234, 0.0010379552841186523, 0.0011720657348632812, 0.0013061761856079102, 0.001440286636352539, 0.001574397087097168, 0.0017085075378417969, 0.0018426179885864258, 0.0019767284393310547, 0.0021108388900756836, 0.0022449493408203125, 0.0023790597915649414, 0.0025131702423095703, 0.0026472806930541992, 0.002781391143798828, 0.002915501594543457, 0.003049612045288086, 0.003183722496032715, 0.0033178329467773438, 0.0034519433975219727, 0.0035860538482666016, 0.0037201642990112305, 0.0038542747497558594, 0.003988385200500488, 0.004122495651245117, 0.004256606101989746, 0.004390716552734375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 3.0, 8.0, 10.0, 15.0, 10.0, 11.0, 30.0, 36.0, 41.0, 62.0, 86.0, 118.0, 169.0, 296.0, 444.0, 703.0, 1157.0, 2136.0, 3910.0, 8404.0, 27045.0, 898602.0, 79324.0, 13543.0, 5568.0, 2753.0, 1519.0, 851.0, 562.0, 370.0, 212.0, 184.0, 104.0, 84.0, 48.0, 33.0, 26.0, 17.0, 20.0, 11.0, 4.0, 7.0, 8.0, 1.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0077056884765625, -0.007454991340637207, -0.007204294204711914, -0.006953597068786621, -0.006702899932861328, -0.006452202796936035, -0.006201505661010742, -0.005950808525085449, -0.005700111389160156, -0.005449414253234863, -0.00519871711730957, -0.004948019981384277, -0.004697322845458984, -0.004446625709533691, -0.0041959285736083984, -0.0039452314376831055, -0.0036945343017578125, -0.0034438371658325195, -0.0031931400299072266, -0.0029424428939819336, -0.0026917457580566406, -0.0024410486221313477, -0.0021903514862060547, -0.0019396543502807617, -0.0016889572143554688, -0.0014382600784301758, -0.0011875629425048828, -0.0009368658065795898, -0.0006861686706542969, -0.0004354715347290039, -0.00018477439880371094, 6.592273712158203e-05, 0.000316619873046875, 0.000567317008972168, 0.0008180141448974609, 0.001068711280822754, 0.0013194084167480469, 0.0015701055526733398, 0.0018208026885986328, 0.0020714998245239258, 0.0023221969604492188, 0.0025728940963745117, 0.0028235912322998047, 0.0030742883682250977, 0.0033249855041503906, 0.0035756826400756836, 0.0038263797760009766, 0.0040770769119262695, 0.0043277740478515625, 0.0045784711837768555, 0.0048291683197021484, 0.005079865455627441, 0.005330562591552734, 0.005581259727478027, 0.00583195686340332, 0.006082653999328613, 0.006333351135253906, 0.006584048271179199, 0.006834745407104492, 0.007085442543029785, 0.007336139678955078, 0.007586836814880371, 0.007837533950805664, 0.008088231086730957, 0.00833892822265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 6.0, 5.0, 9.0, 20.0, 13.0, 26.0, 32.0, 56.0, 94.0, 100.0, 146.0, 142.0, 106.0, 77.0, 49.0, 31.0, 25.0, 21.0, 5.0, 8.0, 4.0, 0.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2814998626708984e-05, -1.244712620973587e-05, -1.2079253792762756e-05, -1.1711381375789642e-05, -1.1343508958816528e-05, -1.0975636541843414e-05, -1.06077641248703e-05, -1.0239891707897186e-05, -9.872019290924072e-06, -9.504146873950958e-06, -9.136274456977844e-06, -8.76840204000473e-06, -8.400529623031616e-06, -8.032657206058502e-06, -7.664784789085388e-06, -7.296912372112274e-06, -6.92903995513916e-06, -6.561167538166046e-06, -6.193295121192932e-06, -5.825422704219818e-06, -5.457550287246704e-06, -5.08967787027359e-06, -4.721805453300476e-06, -4.353933036327362e-06, -3.986060619354248e-06, -3.618188202381134e-06, -3.25031578540802e-06, -2.882443368434906e-06, -2.514570951461792e-06, -2.146698534488678e-06, -1.778826117515564e-06, -1.41095370054245e-06, -1.043081283569336e-06, -6.752088665962219e-07, -3.073364496231079e-07, 6.05359673500061e-08, 4.284083843231201e-07, 7.962808012962341e-07, 1.1641532182693481e-06, 1.5320256352424622e-06, 1.8998980522155762e-06, 2.26777046918869e-06, 2.635642886161804e-06, 3.0035153031349182e-06, 3.3713877201080322e-06, 3.7392601370811462e-06, 4.10713255405426e-06, 4.475004971027374e-06, 4.842877388000488e-06, 5.210749804973602e-06, 5.578622221946716e-06, 5.94649463891983e-06, 6.314367055892944e-06, 6.682239472866058e-06, 7.050111889839172e-06, 7.417984306812286e-06, 7.7858567237854e-06, 8.153729140758514e-06, 8.521601557731628e-06, 8.889473974704742e-06, 9.257346391677856e-06, 9.62521880865097e-06, 9.993091225624084e-06, 1.0360963642597198e-05, 1.0728836059570312e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 16.0, 25.0, 45.0, 94.0, 205.0, 434.0, 1015.0, 2913.0, 14080.0, 1006907.0, 17667.0, 3138.0, 1140.0, 456.0, 225.0, 106.0, 40.0, 21.0, 10.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019866943359375, -0.019237041473388672, -0.018607139587402344, -0.017977237701416016, -0.017347335815429688, -0.01671743392944336, -0.01608753204345703, -0.015457630157470703, -0.014827728271484375, -0.014197826385498047, -0.013567924499511719, -0.01293802261352539, -0.012308120727539062, -0.011678218841552734, -0.011048316955566406, -0.010418415069580078, -0.00978851318359375, -0.009158611297607422, -0.008528709411621094, -0.007898807525634766, -0.0072689056396484375, -0.006639003753662109, -0.006009101867675781, -0.005379199981689453, -0.004749298095703125, -0.004119396209716797, -0.0034894943237304688, -0.0028595924377441406, -0.0022296905517578125, -0.0015997886657714844, -0.0009698867797851562, -0.0003399848937988281, 0.0002899169921875, 0.0009198188781738281, 0.0015497207641601562, 0.0021796226501464844, 0.0028095245361328125, 0.0034394264221191406, 0.004069328308105469, 0.004699230194091797, 0.005329132080078125, 0.005959033966064453, 0.006588935852050781, 0.007218837738037109, 0.007848739624023438, 0.008478641510009766, 0.009108543395996094, 0.009738445281982422, 0.01036834716796875, 0.010998249053955078, 0.011628150939941406, 0.012258052825927734, 0.012887954711914062, 0.01351785659790039, 0.014147758483886719, 0.014777660369873047, 0.015407562255859375, 0.016037464141845703, 0.01666736602783203, 0.01729726791381836, 0.017927169799804688, 0.018557071685791016, 0.019186973571777344, 0.019816875457763672, 0.02044677734375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 2.0, 5.0, 7.0, 8.0, 26.0, 24.0, 146.0, 596.0, 100.0, 43.0, 18.0, 10.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00334930419921875, -0.0032458901405334473, -0.0031424760818481445, -0.003039062023162842, -0.002935647964477539, -0.0028322339057922363, -0.0027288198471069336, -0.002625405788421631, -0.002521991729736328, -0.0024185776710510254, -0.0023151636123657227, -0.00221174955368042, -0.002108335494995117, -0.0020049214363098145, -0.0019015073776245117, -0.001798093318939209, -0.0016946792602539062, -0.0015912652015686035, -0.0014878511428833008, -0.001384437084197998, -0.0012810230255126953, -0.0011776089668273926, -0.0010741949081420898, -0.0009707808494567871, -0.0008673667907714844, -0.0007639527320861816, -0.0006605386734008789, -0.0005571246147155762, -0.00045371055603027344, -0.0003502964973449707, -0.00024688243865966797, -0.00014346837997436523, -4.00543212890625e-05, 6.335973739624023e-05, 0.00016677379608154297, 0.0002701878547668457, 0.00037360191345214844, 0.00047701597213745117, 0.0005804300308227539, 0.0006838440895080566, 0.0007872581481933594, 0.0008906722068786621, 0.0009940862655639648, 0.0010975003242492676, 0.0012009143829345703, 0.001304328441619873, 0.0014077425003051758, 0.0015111565589904785, 0.0016145706176757812, 0.001717984676361084, 0.0018213987350463867, 0.0019248127937316895, 0.002028226852416992, 0.002131640911102295, 0.0022350549697875977, 0.0023384690284729004, 0.002441883087158203, 0.002545297145843506, 0.0026487112045288086, 0.0027521252632141113, 0.002855539321899414, 0.002958953380584717, 0.0030623674392700195, 0.0031657814979553223, 0.003269195556640625]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 24.0, 282.0, 615.0, 90.0, 8.0], "bins": [-0.1465194970369339, -0.14412765204906464, -0.14173580706119537, -0.1393439620733261, -0.13695211708545685, -0.13456027209758759, -0.13216842710971832, -0.12977656722068787, -0.1273847222328186, -0.12499287724494934, -0.12260103225708008, -0.12020918726921082, -0.11781734228134155, -0.1154254898428917, -0.11303364485502243, -0.11064179986715317, -0.1082499623298645, -0.10585811734199524, -0.10346627235412598, -0.10107442736625671, -0.09868258237838745, -0.09629072993993759, -0.09389888495206833, -0.09150703996419907, -0.0891151949763298, -0.08672334998846054, -0.08433150500059128, -0.08193966001272202, -0.07954780757427216, -0.0771559625864029, -0.07476411759853363, -0.07237227261066437, -0.0699804276227951, -0.06758858263492584, -0.06519673764705658, -0.06280489265918732, -0.060413043946027756, -0.05802119895815849, -0.05562935024499893, -0.05323750525712967, -0.050845663994550705, -0.04845381900668144, -0.04606197029352188, -0.04367012530565262, -0.041278280317783356, -0.03888643532991409, -0.03649459034204483, -0.03410274162888527, -0.031710896641016006, -0.029319051653146744, -0.026927204802632332, -0.02453535795211792, -0.022143512964248657, -0.019751667976379395, -0.017359821125864983, -0.01496797427535057, -0.012576129287481308, -0.01018428336828947, -0.007792437449097633, -0.005400591529905796, -0.0030087456107139587, -0.0006168996915221214, 0.0017749462276697159, 0.004166793078184128, 0.006558638531714678]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 12.0, 11.0, 19.0, 14.0, 15.0, 18.0, 26.0, 30.0, 36.0, 36.0, 29.0, 29.0, 39.0, 23.0, 39.0, 39.0, 42.0, 55.0, 43.0, 44.0, 29.0, 38.0, 47.0, 44.0, 36.0, 35.0, 23.0, 24.0, 19.0, 24.0, 20.0, 9.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005150225479155779, -0.004961082246154547, -0.004771939013153315, -0.004582795314490795, -0.004393652081489563, -0.004204508848488331, -0.004015365615487099, -0.0038262223824858665, -0.0036370789166539907, -0.0034479356836527586, -0.003258792217820883, -0.0030696489848196507, -0.0028805057518184185, -0.0026913622859865427, -0.0025022190529853106, -0.0023130755871534348, -0.0021239323541522026, -0.0019347890047356486, -0.0017456456553190947, -0.0015565024223178625, -0.0013673590729013085, -0.0011782157234847546, -0.0009890724904835224, -0.0007999291410669684, -0.0006107857916504145, -0.00042164247133769095, -0.00023249915102496743, -4.335585981607437e-05, 0.0001457874896004796, 0.0003349308390170336, 0.0005240740720182657, 0.0007132174214348197, 0.0009023603051900864, 0.0010915036546066403, 0.0012806470040231943, 0.0014697902370244265, 0.0016589335864409804, 0.0018480769358575344, 0.0020372201688587666, 0.0022263634018599987, 0.0024155068676918745, 0.0026046501006931067, 0.0027937935665249825, 0.0029829367995262146, 0.0031720800325274467, 0.0033612234983593225, 0.0035503667313605547, 0.0037395101971924305, 0.003928653430193663, 0.004117796663194895, 0.004306939896196127, 0.004496083594858646, 0.0046852268278598785, 0.004874370060861111, 0.005063513293862343, 0.005252656526863575, 0.005441799759864807, 0.005630942992866039, 0.005820086225867271, 0.006009229458868504, 0.006198373157531023, 0.006387516390532255, 0.006576659623533487, 0.0067658028565347195, 0.006954946555197239]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 8.0, 17.0, 19.0, 29.0, 43.0, 54.0, 80.0, 115.0, 161.0, 215.0, 281.0, 426.0, 593.0, 829.0, 1263.0, 1844.0, 2736.0, 4174.0, 6499.0, 10181.0, 16761.0, 29409.0, 61689.0, 220097.0, 2531061.0, 1059544.0, 136388.0, 45313.0, 23646.0, 14200.0, 8683.0, 5608.0, 3768.0, 2472.0, 1763.0, 1189.0, 880.0, 605.0, 417.0, 342.0, 226.0, 159.0, 112.0, 101.0, 72.0, 53.0, 47.0, 29.0, 26.0, 16.0, 16.0, 14.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.0067291259765625, -0.006511032581329346, -0.006292939186096191, -0.006074845790863037, -0.005856752395629883, -0.0056386590003967285, -0.005420565605163574, -0.00520247220993042, -0.004984378814697266, -0.004766285419464111, -0.004548192024230957, -0.004330098628997803, -0.0041120052337646484, -0.003893911838531494, -0.00367581844329834, -0.0034577250480651855, -0.0032396316528320312, -0.003021538257598877, -0.0028034448623657227, -0.0025853514671325684, -0.002367258071899414, -0.0021491646766662598, -0.0019310712814331055, -0.0017129778861999512, -0.0014948844909667969, -0.0012767910957336426, -0.0010586977005004883, -0.000840604305267334, -0.0006225109100341797, -0.0004044175148010254, -0.0001863241195678711, 3.17692756652832e-05, 0.0002498626708984375, 0.0004679560661315918, 0.0006860494613647461, 0.0009041428565979004, 0.0011222362518310547, 0.001340329647064209, 0.0015584230422973633, 0.0017765164375305176, 0.001994609832763672, 0.002212703227996826, 0.0024307966232299805, 0.0026488900184631348, 0.002866983413696289, 0.0030850768089294434, 0.0033031702041625977, 0.003521263599395752, 0.0037393569946289062, 0.0039574503898620605, 0.004175543785095215, 0.004393637180328369, 0.0046117305755615234, 0.004829823970794678, 0.005047917366027832, 0.005266010761260986, 0.005484104156494141, 0.005702197551727295, 0.005920290946960449, 0.0061383843421936035, 0.006356477737426758, 0.006574571132659912, 0.006792664527893066, 0.007010757923126221, 0.007228851318359375]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [5.0, 3.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 8.0, 13.0, 5.0, 5.0, 8.0, 15.0, 11.0, 14.0, 17.0, 17.0, 24.0, 27.0, 34.0, 28.0, 36.0, 40.0, 25.0, 38.0, 33.0, 31.0, 39.0, 44.0, 36.0, 42.0, 44.0, 27.0, 49.0, 36.0, 38.0, 26.0, 25.0, 26.0, 18.0, 23.0, 18.0, 14.0, 12.0, 7.0, 8.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0038394927978515625, -0.00370749831199646, -0.0035755038261413574, -0.003443509340286255, -0.0033115148544311523, -0.00317952036857605, -0.0030475258827209473, -0.0029155313968658447, -0.002783536911010742, -0.0026515424251556396, -0.002519547939300537, -0.0023875534534454346, -0.002255558967590332, -0.0021235644817352295, -0.001991569995880127, -0.0018595755100250244, -0.0017275810241699219, -0.0015955865383148193, -0.0014635920524597168, -0.0013315975666046143, -0.0011996030807495117, -0.0010676085948944092, -0.0009356141090393066, -0.0008036196231842041, -0.0006716251373291016, -0.000539630651473999, -0.0004076361656188965, -0.00027564167976379395, -0.0001436471939086914, -1.1652708053588867e-05, 0.00012034177780151367, 0.0002523362636566162, 0.00038433074951171875, 0.0005163252353668213, 0.0006483197212219238, 0.0007803142070770264, 0.0009123086929321289, 0.0010443031787872314, 0.001176297664642334, 0.0013082921504974365, 0.001440286636352539, 0.0015722811222076416, 0.0017042756080627441, 0.0018362700939178467, 0.0019682645797729492, 0.0021002590656280518, 0.0022322535514831543, 0.002364248037338257, 0.0024962425231933594, 0.002628237009048462, 0.0027602314949035645, 0.002892225980758667, 0.0030242204666137695, 0.003156214952468872, 0.0032882094383239746, 0.003420203924179077, 0.0035521984100341797, 0.0036841928958892822, 0.0038161873817443848, 0.003948181867599487, 0.00408017635345459, 0.004212170839309692, 0.004344165325164795, 0.0044761598110198975, 0.004608154296875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 3.0, 5.0, 5.0, 8.0, 10.0, 18.0, 22.0, 60.0, 149.0, 626.0, 9472.0, 4118819.0, 63332.0, 1381.0, 221.0, 65.0, 23.0, 20.0, 18.0, 8.0, 5.0, 2.0, 2.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06146240234375, -0.059243202209472656, -0.05702400207519531, -0.05480480194091797, -0.052585601806640625, -0.05036640167236328, -0.04814720153808594, -0.045928001403808594, -0.04370880126953125, -0.041489601135253906, -0.03927040100097656, -0.03705120086669922, -0.034832000732421875, -0.03261280059814453, -0.030393600463867188, -0.028174400329589844, -0.0259552001953125, -0.023736000061035156, -0.021516799926757812, -0.01929759979248047, -0.017078399658203125, -0.014859199523925781, -0.012639999389648438, -0.010420799255371094, -0.00820159912109375, -0.005982398986816406, -0.0037631988525390625, -0.0015439987182617188, 0.000675201416015625, 0.0028944015502929688, 0.0051136016845703125, 0.007332801818847656, 0.009552001953125, 0.011771202087402344, 0.013990402221679688, 0.01620960235595703, 0.018428802490234375, 0.02064800262451172, 0.022867202758789062, 0.025086402893066406, 0.02730560302734375, 0.029524803161621094, 0.03174400329589844, 0.03396320343017578, 0.036182403564453125, 0.03840160369873047, 0.04062080383300781, 0.042840003967285156, 0.0450592041015625, 0.047278404235839844, 0.04949760437011719, 0.05171680450439453, 0.053936004638671875, 0.05615520477294922, 0.05837440490722656, 0.060593605041503906, 0.06281280517578125, 0.0650320053100586, 0.06725120544433594, 0.06947040557861328, 0.07168960571289062, 0.07390880584716797, 0.07612800598144531, 0.07834720611572266, 0.08056640625]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 4.0, 8.0, 10.0, 11.0, 16.0, 47.0, 64.0, 127.0, 241.0, 592.0, 1595.0, 756.0, 284.0, 121.0, 73.0, 31.0, 35.0, 24.0, 13.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034618377685546875, -0.003336399793624878, -0.0032109618186950684, -0.003085523843765259, -0.0029600858688354492, -0.0028346478939056396, -0.00270920991897583, -0.0025837719440460205, -0.002458333969116211, -0.0023328959941864014, -0.002207458019256592, -0.0020820200443267822, -0.0019565820693969727, -0.001831144094467163, -0.0017057061195373535, -0.001580268144607544, -0.0014548301696777344, -0.0013293921947479248, -0.0012039542198181152, -0.0010785162448883057, -0.0009530782699584961, -0.0008276402950286865, -0.000702202320098877, -0.0005767643451690674, -0.0004513263702392578, -0.00032588839530944824, -0.00020045042037963867, -7.50124454498291e-05, 5.042552947998047e-05, 0.00017586350440979004, 0.0003013014793395996, 0.0004267394542694092, 0.0005521774291992188, 0.0006776154041290283, 0.0008030533790588379, 0.0009284913539886475, 0.001053929328918457, 0.0011793673038482666, 0.0013048052787780762, 0.0014302432537078857, 0.0015556812286376953, 0.0016811192035675049, 0.0018065571784973145, 0.001931995153427124, 0.0020574331283569336, 0.002182871103286743, 0.0023083090782165527, 0.0024337470531463623, 0.002559185028076172, 0.0026846230030059814, 0.002810060977935791, 0.0029354989528656006, 0.00306093692779541, 0.0031863749027252197, 0.0033118128776550293, 0.003437250852584839, 0.0035626888275146484, 0.003688126802444458, 0.0038135647773742676, 0.003939002752304077, 0.004064440727233887, 0.004189878702163696, 0.004315316677093506, 0.004440754652023315, 0.004566192626953125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 23.0, 49.0, 120.0, 238.0, 304.0, 158.0, 61.0, 40.0, 11.0, 6.0, 0.0, 0.0, 2.0], "bins": [-0.03771545737981796, -0.03703078627586365, -0.03634611889719963, -0.035661447793245316, -0.0349767804145813, -0.034292109310626984, -0.03360743820667267, -0.03292277082800865, -0.03223809972405434, -0.03155342862010002, -0.030868761241436005, -0.03018409013748169, -0.029499420896172523, -0.028814751654863358, -0.02813008241355419, -0.027445413172245026, -0.02676074579358101, -0.026076076552271843, -0.025391407310962677, -0.024706736207008362, -0.024022066965699196, -0.02333739772439003, -0.022652728483080864, -0.021968059241771698, -0.021283388137817383, -0.020598718896508217, -0.01991404965519905, -0.019229378551244736, -0.01854470930993557, -0.017860040068626404, -0.017175370827317238, -0.016490701586008072, -0.015806032344698906, -0.01512136310338974, -0.014436692930758, -0.013752023689448833, -0.013067354448139668, -0.012382684275507927, -0.011698015034198761, -0.011013345792889595, -0.010328676551580429, -0.009644007310271263, -0.008959337137639523, -0.008274667896330357, -0.007589998655021191, -0.006905328948050737, -0.006220659241080284, -0.005535989999771118, -0.004851319827139378, -0.004166650120168924, -0.0034819808788597584, -0.002797311171889305, -0.0021126416977494955, -0.001427972223609686, -0.0007433025166392326, -5.863327533006668e-05, 0.0006260364316403866, 0.0013107059057801962, 0.001995375379920006, 0.002680045086890459, 0.0033647145610302687, 0.004049384035170078, 0.0047340537421405315, 0.0054187229834496975, 0.006103392690420151]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 11.0, 5.0, 3.0, 5.0, 10.0, 6.0, 13.0, 7.0, 8.0, 14.0, 16.0, 15.0, 36.0, 27.0, 22.0, 19.0, 28.0, 34.0, 27.0, 38.0, 41.0, 56.0, 25.0, 33.0, 44.0, 37.0, 41.0, 42.0, 35.0, 34.0, 40.0, 23.0, 26.0, 32.0, 22.0, 18.0, 19.0, 19.0, 12.0, 11.0, 11.0, 7.0, 8.0, 8.0, 6.0, 7.0, 3.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003692765487357974, -0.003551504574716091, -0.003410243894904852, -0.003268982982262969, -0.0031277223024517298, -0.002986461389809847, -0.0028452007099986076, -0.0027039397973567247, -0.002562678884714842, -0.002421417972072959, -0.0022801572922617197, -0.002138896379619837, -0.0019976356998085976, -0.0018563747871667147, -0.0017151139909401536, -0.0015738531947135925, -0.0014325925149023533, -0.0012913317186757922, -0.0011500709224492311, -0.0010088100098073483, -0.0008675492717884481, -0.000726288475561887, -0.000585027621127665, -0.000443766824901104, -0.0003025060286745429, -0.0001612452178960666, -1.9984407117590308e-05, 0.00012127641821280122, 0.0002625372144393623, 0.00040379801066592336, 0.0005450588651001453, 0.0006863196613267064, 0.0008275802247226238, 0.0009688410209491849, 0.001110101817175746, 0.0012513627298176289, 0.001392623409628868, 0.001533884322270751, 0.001675145118497312, 0.0018164059147238731, 0.0019576665945351124, 0.0020989275071769953, 0.0022401881869882345, 0.0023814490996301174, 0.0025227097794413567, 0.0026639706920832396, 0.0028052316047251225, 0.0029464922845363617, 0.0030877531971782446, 0.0032290141098201275, 0.0033702747896313667, 0.0035115357022732496, 0.003652796382084489, 0.0037940572947263718, 0.003935317974537611, 0.00407657865434885, 0.004217839799821377, 0.004359100479632616, 0.004500361625105143, 0.004641622304916382, 0.004782882984727621, 0.00492414366453886, 0.005065404810011387, 0.005206665489822626, 0.005347926169633865]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 13.0, 7.0, 13.0, 18.0, 40.0, 49.0, 72.0, 110.0, 182.0, 175.0, 305.0, 381.0, 540.0, 853.0, 1152.0, 1670.0, 2402.0, 3624.0, 5315.0, 7902.0, 12103.0, 18506.0, 29154.0, 46855.0, 76511.0, 126448.0, 212308.0, 195575.0, 115564.0, 69802.0, 42965.0, 26745.0, 17208.0, 11023.0, 7316.0, 4857.0, 3327.0, 2253.0, 1525.0, 1095.0, 731.0, 573.0, 371.0, 269.0, 192.0, 120.0, 97.0, 63.0, 54.0, 46.0, 29.0, 9.0, 11.0, 14.0, 4.0, 2.0, 4.0, 7.0], "bins": [-0.0015211105346679688, -0.0014748871326446533, -0.0014286637306213379, -0.0013824403285980225, -0.001336216926574707, -0.0012899935245513916, -0.0012437701225280762, -0.0011975467205047607, -0.0011513233184814453, -0.0011050999164581299, -0.0010588765144348145, -0.001012653112411499, -0.0009664297103881836, -0.0009202063083648682, -0.0008739829063415527, -0.0008277595043182373, -0.0007815361022949219, -0.0007353127002716064, -0.000689089298248291, -0.0006428658962249756, -0.0005966424942016602, -0.0005504190921783447, -0.0005041956901550293, -0.00045797228813171387, -0.00041174888610839844, -0.000365525484085083, -0.0003193020820617676, -0.00027307868003845215, -0.00022685527801513672, -0.0001806318759918213, -0.00013440847396850586, -8.818507194519043e-05, -4.1961669921875e-05, 4.26173210144043e-06, 5.048513412475586e-05, 9.670853614807129e-05, 0.00014293193817138672, 0.00018915534019470215, 0.00023537874221801758, 0.000281602144241333, 0.00032782554626464844, 0.00037404894828796387, 0.0004202723503112793, 0.0004664957523345947, 0.0005127191543579102, 0.0005589425563812256, 0.000605165958404541, 0.0006513893604278564, 0.0006976127624511719, 0.0007438361644744873, 0.0007900595664978027, 0.0008362829685211182, 0.0008825063705444336, 0.000928729772567749, 0.0009749531745910645, 0.0010211765766143799, 0.0010673999786376953, 0.0011136233806610107, 0.0011598467826843262, 0.0012060701847076416, 0.001252293586730957, 0.0012985169887542725, 0.0013447403907775879, 0.0013909637928009033, 0.0014371871948242188]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 3.0, 7.0, 7.0, 10.0, 11.0, 9.0, 8.0, 12.0, 16.0, 18.0, 15.0, 25.0, 21.0, 25.0, 17.0, 30.0, 32.0, 28.0, 33.0, 36.0, 40.0, 30.0, 30.0, 33.0, 45.0, 40.0, 38.0, 46.0, 36.0, 29.0, 34.0, 32.0, 23.0, 28.0, 18.0, 18.0, 18.0, 17.0, 10.0, 16.0, 15.0, 8.0, 2.0, 4.0, 8.0, 4.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003612518310546875, -0.003490447998046875, -0.003368377685546875, -0.003246307373046875, -0.003124237060546875, -0.003002166748046875, -0.002880096435546875, -0.002758026123046875, -0.002635955810546875, -0.002513885498046875, -0.002391815185546875, -0.002269744873046875, -0.002147674560546875, -0.002025604248046875, -0.001903533935546875, -0.001781463623046875, -0.001659393310546875, -0.001537322998046875, -0.001415252685546875, -0.001293182373046875, -0.001171112060546875, -0.001049041748046875, -0.000926971435546875, -0.000804901123046875, -0.000682830810546875, -0.000560760498046875, -0.000438690185546875, -0.000316619873046875, -0.000194549560546875, -7.2479248046875e-05, 4.9591064453125e-05, 0.000171661376953125, 0.000293731689453125, 0.000415802001953125, 0.000537872314453125, 0.000659942626953125, 0.000782012939453125, 0.000904083251953125, 0.001026153564453125, 0.001148223876953125, 0.001270294189453125, 0.001392364501953125, 0.001514434814453125, 0.001636505126953125, 0.001758575439453125, 0.001880645751953125, 0.002002716064453125, 0.002124786376953125, 0.002246856689453125, 0.002368927001953125, 0.002490997314453125, 0.002613067626953125, 0.002735137939453125, 0.002857208251953125, 0.002979278564453125, 0.003101348876953125, 0.003223419189453125, 0.003345489501953125, 0.003467559814453125, 0.003589630126953125, 0.003711700439453125, 0.003833770751953125, 0.003955841064453125, 0.004077911376953125, 0.004199981689453125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 12.0, 7.0, 7.0, 12.0, 19.0, 26.0, 43.0, 57.0, 73.0, 138.0, 180.0, 255.0, 409.0, 551.0, 903.0, 1381.0, 2087.0, 3396.0, 5162.0, 8213.0, 13361.0, 21531.0, 36747.0, 65527.0, 132796.0, 313390.0, 218096.0, 97518.0, 50625.0, 28942.0, 17253.0, 10759.0, 6879.0, 4324.0, 2705.0, 1764.0, 1129.0, 761.0, 477.0, 333.0, 215.0, 138.0, 125.0, 79.0, 39.0, 35.0, 30.0, 11.0, 17.0, 8.0, 7.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0018224716186523438, -0.001766890287399292, -0.0017113089561462402, -0.0016557276248931885, -0.0016001462936401367, -0.001544564962387085, -0.0014889836311340332, -0.0014334022998809814, -0.0013778209686279297, -0.001322239637374878, -0.0012666583061218262, -0.0012110769748687744, -0.0011554956436157227, -0.001099914312362671, -0.0010443329811096191, -0.0009887516498565674, -0.0009331703186035156, -0.0008775889873504639, -0.0008220076560974121, -0.0007664263248443604, -0.0007108449935913086, -0.0006552636623382568, -0.0005996823310852051, -0.0005441009998321533, -0.0004885196685791016, -0.0004329383373260498, -0.00037735700607299805, -0.0003217756748199463, -0.00026619434356689453, -0.00021061301231384277, -0.00015503168106079102, -9.945034980773926e-05, -4.38690185546875e-05, 1.1712312698364258e-05, 6.729364395141602e-05, 0.00012287497520446777, 0.00017845630645751953, 0.0002340376377105713, 0.00028961896896362305, 0.0003452003002166748, 0.00040078163146972656, 0.0004563629627227783, 0.0005119442939758301, 0.0005675256252288818, 0.0006231069564819336, 0.0006786882877349854, 0.0007342696189880371, 0.0007898509502410889, 0.0008454322814941406, 0.0009010136127471924, 0.0009565949440002441, 0.001012176275253296, 0.0010677576065063477, 0.0011233389377593994, 0.0011789202690124512, 0.001234501600265503, 0.0012900829315185547, 0.0013456642627716064, 0.0014012455940246582, 0.00145682692527771, 0.0015124082565307617, 0.0015679895877838135, 0.0016235709190368652, 0.001679152250289917, 0.0017347335815429688]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 9.0, 13.0, 14.0, 11.0, 13.0, 14.0, 19.0, 20.0, 24.0, 27.0, 36.0, 26.0, 29.0, 42.0, 39.0, 49.0, 50.0, 39.0, 52.0, 54.0, 39.0, 40.0, 31.0, 31.0, 33.0, 27.0, 25.0, 24.0, 21.0, 14.0, 20.0, 21.0, 22.0, 18.0, 6.0, 6.0, 3.0, 8.0, 3.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0029449462890625, -0.00285494327545166, -0.0027649402618408203, -0.0026749372482299805, -0.0025849342346191406, -0.0024949312210083008, -0.002404928207397461, -0.002314925193786621, -0.0022249221801757812, -0.0021349191665649414, -0.0020449161529541016, -0.0019549131393432617, -0.0018649101257324219, -0.001774907112121582, -0.0016849040985107422, -0.0015949010848999023, -0.0015048980712890625, -0.0014148950576782227, -0.0013248920440673828, -0.001234889030456543, -0.0011448860168457031, -0.0010548830032348633, -0.0009648799896240234, -0.0008748769760131836, -0.0007848739624023438, -0.0006948709487915039, -0.0006048679351806641, -0.0005148649215698242, -0.0004248619079589844, -0.00033485889434814453, -0.0002448558807373047, -0.00015485286712646484, -6.4849853515625e-05, 2.5153160095214844e-05, 0.00011515617370605469, 0.00020515918731689453, 0.0002951622009277344, 0.0003851652145385742, 0.00047516822814941406, 0.0005651712417602539, 0.0006551742553710938, 0.0007451772689819336, 0.0008351802825927734, 0.0009251832962036133, 0.0010151863098144531, 0.001105189323425293, 0.0011951923370361328, 0.0012851953506469727, 0.0013751983642578125, 0.0014652013778686523, 0.0015552043914794922, 0.001645207405090332, 0.0017352104187011719, 0.0018252134323120117, 0.0019152164459228516, 0.0020052194595336914, 0.0020952224731445312, 0.002185225486755371, 0.002275228500366211, 0.0023652315139770508, 0.0024552345275878906, 0.0025452375411987305, 0.0026352405548095703, 0.00272524356842041, 0.00281524658203125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 10.0, 9.0, 17.0, 26.0, 37.0, 60.0, 90.0, 128.0, 197.0, 292.0, 473.0, 741.0, 1479.0, 2376.0, 4573.0, 9331.0, 20163.0, 52012.0, 180927.0, 584591.0, 119022.0, 39624.0, 16275.0, 7235.0, 3746.0, 1966.0, 1205.0, 710.0, 425.0, 268.0, 168.0, 126.0, 77.0, 51.0, 34.0, 24.0, 17.0, 18.0, 11.0, 7.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.1552734375e-05, -8.853711187839508e-05, -8.552148938179016e-05, -8.250586688518524e-05, -7.949024438858032e-05, -7.64746218919754e-05, -7.345899939537048e-05, -7.044337689876556e-05, -6.742775440216064e-05, -6.441213190555573e-05, -6.13965094089508e-05, -5.8380886912345886e-05, -5.536526441574097e-05, -5.234964191913605e-05, -4.933401942253113e-05, -4.631839692592621e-05, -4.330277442932129e-05, -4.028715193271637e-05, -3.727152943611145e-05, -3.425590693950653e-05, -3.124028444290161e-05, -2.8224661946296692e-05, -2.5209039449691772e-05, -2.2193416953086853e-05, -1.9177794456481934e-05, -1.6162171959877014e-05, -1.3146549463272095e-05, -1.0130926966667175e-05, -7.115304470062256e-06, -4.0996819734573364e-06, -1.084059476852417e-06, 1.9315630197525024e-06, 4.947185516357422e-06, 7.962808012962341e-06, 1.097843050956726e-05, 1.399405300617218e-05, 1.70096755027771e-05, 2.002529799938202e-05, 2.304092049598694e-05, 2.6056542992591858e-05, 2.9072165489196777e-05, 3.20877879858017e-05, 3.5103410482406616e-05, 3.8119032979011536e-05, 4.1134655475616455e-05, 4.4150277972221375e-05, 4.7165900468826294e-05, 5.018152296543121e-05, 5.319714546203613e-05, 5.621276795864105e-05, 5.922839045524597e-05, 6.224401295185089e-05, 6.525963544845581e-05, 6.827525794506073e-05, 7.129088044166565e-05, 7.430650293827057e-05, 7.732212543487549e-05, 8.033774793148041e-05, 8.335337042808533e-05, 8.636899292469025e-05, 8.938461542129517e-05, 9.240023791790009e-05, 9.5415860414505e-05, 9.843148291110992e-05, 0.00010144710540771484]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 8.0, 8.0, 9.0, 14.0, 17.0, 24.0, 19.0, 36.0, 35.0, 55.0, 46.0, 65.0, 76.0, 76.0, 51.0, 87.0, 70.0, 52.0, 43.0, 51.0, 23.0, 34.0, 22.0, 14.0, 14.0, 13.0, 5.0, 6.0, 0.0, 2.0, 3.0, 7.0, 3.0, 6.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.4007091522216797e-05, -1.360476016998291e-05, -1.3202428817749023e-05, -1.2800097465515137e-05, -1.239776611328125e-05, -1.1995434761047363e-05, -1.1593103408813477e-05, -1.119077205657959e-05, -1.0788440704345703e-05, -1.0386109352111816e-05, -9.98377799987793e-06, -9.581446647644043e-06, -9.179115295410156e-06, -8.77678394317627e-06, -8.374452590942383e-06, -7.972121238708496e-06, -7.569789886474609e-06, -7.167458534240723e-06, -6.765127182006836e-06, -6.362795829772949e-06, -5.9604644775390625e-06, -5.558133125305176e-06, -5.155801773071289e-06, -4.753470420837402e-06, -4.351139068603516e-06, -3.948807716369629e-06, -3.546476364135742e-06, -3.1441450119018555e-06, -2.7418136596679688e-06, -2.339482307434082e-06, -1.9371509552001953e-06, -1.5348196029663086e-06, -1.1324882507324219e-06, -7.301568984985352e-07, -3.2782554626464844e-07, 7.450580596923828e-08, 4.76837158203125e-07, 8.791685104370117e-07, 1.2814998626708984e-06, 1.6838312149047852e-06, 2.086162567138672e-06, 2.4884939193725586e-06, 2.8908252716064453e-06, 3.293156623840332e-06, 3.6954879760742188e-06, 4.0978193283081055e-06, 4.500150680541992e-06, 4.902482032775879e-06, 5.304813385009766e-06, 5.707144737243652e-06, 6.109476089477539e-06, 6.511807441711426e-06, 6.9141387939453125e-06, 7.316470146179199e-06, 7.718801498413086e-06, 8.121132850646973e-06, 8.52346420288086e-06, 8.925795555114746e-06, 9.328126907348633e-06, 9.73045825958252e-06, 1.0132789611816406e-05, 1.0535120964050293e-05, 1.093745231628418e-05, 1.1339783668518066e-05, 1.1742115020751953e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 3.0, 7.0, 11.0, 8.0, 15.0, 17.0, 25.0, 42.0, 50.0, 90.0, 182.0, 736.0, 6699.0, 136770.0, 870372.0, 30494.0, 2280.0, 367.0, 119.0, 59.0, 36.0, 22.0, 16.0, 23.0, 24.0, 10.0, 10.0, 10.0, 7.0, 10.0, 2.0, 5.0, 3.0, 1.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003268718719482422, -0.00031443312764167786, -0.0003019943833351135, -0.0002895556390285492, -0.00027711689472198486, -0.00026467815041542053, -0.0002522394061088562, -0.00023980066180229187, -0.00022736191749572754, -0.0002149231731891632, -0.00020248442888259888, -0.00019004568457603455, -0.00017760694026947021, -0.00016516819596290588, -0.00015272945165634155, -0.00014029070734977722, -0.0001278519630432129, -0.00011541321873664856, -0.00010297447443008423, -9.05357301235199e-05, -7.809698581695557e-05, -6.565824151039124e-05, -5.3219497203826904e-05, -4.078075289726257e-05, -2.8342008590698242e-05, -1.590326428413391e-05, -3.46451997756958e-06, 8.974224328994751e-06, 2.1412968635559082e-05, 3.385171294212341e-05, 4.6290457248687744e-05, 5.8729201555252075e-05, 7.11679458618164e-05, 8.360669016838074e-05, 9.604543447494507e-05, 0.0001084841787815094, 0.00012092292308807373, 0.00013336166739463806, 0.0001458004117012024, 0.00015823915600776672, 0.00017067790031433105, 0.00018311664462089539, 0.00019555538892745972, 0.00020799413323402405, 0.00022043287754058838, 0.0002328716218471527, 0.00024531036615371704, 0.00025774911046028137, 0.0002701878547668457, 0.00028262659907341003, 0.00029506534337997437, 0.0003075040876865387, 0.00031994283199310303, 0.00033238157629966736, 0.0003448203206062317, 0.000357259064912796, 0.00036969780921936035, 0.0003821365535259247, 0.000394575297832489, 0.00040701404213905334, 0.0004194527864456177, 0.000431891530752182, 0.00044433027505874634, 0.00045676901936531067, 0.000469207763671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 11.0, 23.0, 16.0, 26.0, 25.0, 44.0, 64.0, 49.0, 55.0, 102.0, 88.0, 103.0, 87.0, 67.0, 43.0, 30.0, 29.0, 33.0, 21.0, 9.0, 11.0, 8.0, 12.0, 6.0, 4.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1517276763916016e-05, -2.0734965801239014e-05, -1.9952654838562012e-05, -1.917034387588501e-05, -1.8388032913208008e-05, -1.7605721950531006e-05, -1.6823410987854004e-05, -1.6041100025177002e-05, -1.52587890625e-05, -1.4476478099822998e-05, -1.3694167137145996e-05, -1.2911856174468994e-05, -1.2129545211791992e-05, -1.134723424911499e-05, -1.0564923286437988e-05, -9.782612323760986e-06, -9.000301361083984e-06, -8.217990398406982e-06, -7.4356794357299805e-06, -6.6533684730529785e-06, -5.8710575103759766e-06, -5.088746547698975e-06, -4.306435585021973e-06, -3.5241246223449707e-06, -2.7418136596679688e-06, -1.959502696990967e-06, -1.1771917343139648e-06, -3.948807716369629e-07, 3.8743019104003906e-07, 1.169741153717041e-06, 1.952052116394043e-06, 2.734363079071045e-06, 3.516674041748047e-06, 4.298985004425049e-06, 5.081295967102051e-06, 5.863606929779053e-06, 6.645917892456055e-06, 7.428228855133057e-06, 8.210539817810059e-06, 8.99285078048706e-06, 9.775161743164062e-06, 1.0557472705841064e-05, 1.1339783668518066e-05, 1.2122094631195068e-05, 1.290440559387207e-05, 1.3686716556549072e-05, 1.4469027519226074e-05, 1.5251338481903076e-05, 1.6033649444580078e-05, 1.681596040725708e-05, 1.7598271369934082e-05, 1.8380582332611084e-05, 1.9162893295288086e-05, 1.9945204257965088e-05, 2.072751522064209e-05, 2.1509826183319092e-05, 2.2292137145996094e-05, 2.3074448108673096e-05, 2.3856759071350098e-05, 2.46390700340271e-05, 2.54213809967041e-05, 2.6203691959381104e-05, 2.6986002922058105e-05, 2.7768313884735107e-05, 2.855062484741211e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 9.0, 2.0, 11.0, 15.0, 27.0, 38.0, 62.0, 89.0, 128.0, 141.0, 164.0, 114.0, 77.0, 51.0, 31.0, 24.0, 15.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01658397726714611, -0.016228437423706055, -0.015872897580266, -0.015517356805503368, -0.015161816030740738, -0.014806276187300682, -0.014450735412538052, -0.014095195569097996, -0.013739654794335365, -0.01338411495089531, -0.013028574176132679, -0.012673034332692623, -0.012317493557929993, -0.011961953714489937, -0.011606412939727306, -0.01125087309628725, -0.01089533232152462, -0.010539792478084564, -0.010184251703321934, -0.009828711859881878, -0.009473171085119247, -0.009117631241679192, -0.008762090466916561, -0.008406550623476505, -0.00805101078003645, -0.007695470470935106, -0.007339930161833763, -0.00698438985273242, -0.006628849543631077, -0.006273309234529734, -0.0059177689254283905, -0.005562229081988335, -0.005206688307225704, -0.004851147998124361, -0.004495607689023018, -0.004140067379921675, -0.0037845270708203316, -0.0034289867617189884, -0.003073446685448289, -0.0027179063763469458, -0.0023623660672456026, -0.0020068257581442595, -0.0016512854490429163, -0.001295745256356895, -0.0009402049472555518, -0.0005846646381542087, -0.00022912444546818733, 0.00012641586363315582, 0.000481956172734499, 0.0008374964818358421, 0.0011930367909371853, 0.0015485769836232066, 0.0019041172927245498, 0.0022596577182412148, 0.0026151977945119143, 0.0029707381036132574, 0.0033262784127146006, 0.0036818187218159437, 0.004037358798086643, 0.004392899107187986, 0.0047484394162893295, 0.005103979725390673, 0.005459520034492016, 0.005815060343593359, 0.006170600652694702]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 8.0, 4.0, 8.0, 4.0, 8.0, 11.0, 8.0, 9.0, 10.0, 15.0, 21.0, 23.0, 24.0, 25.0, 26.0, 29.0, 29.0, 34.0, 25.0, 41.0, 48.0, 35.0, 47.0, 31.0, 42.0, 34.0, 44.0, 47.0, 42.0, 39.0, 32.0, 25.0, 28.0, 25.0, 23.0, 13.0, 20.0, 14.0, 8.0, 9.0, 8.0, 10.0, 8.0, 5.0, 8.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003193438984453678, -0.003068499034270644, -0.0029435590840876102, -0.0028186189010739326, -0.0026936789508908987, -0.0025687390007078648, -0.002443799050524831, -0.002318859100341797, -0.0021939189173281193, -0.0020689789671450853, -0.0019440389005467296, -0.0018190989503636956, -0.0016941588837653399, -0.001569218933582306, -0.001444278983399272, -0.001319339033216238, -0.001194399083033204, -0.0010694591328501701, -0.0009445190662518144, -0.0008195791160687804, -0.0006946391076780856, -0.0005696990992873907, -0.00044475914910435677, -0.0003198191407136619, -0.00019487913232296705, -6.993913848418742e-05, 5.5000855354592204e-05, 0.0001799408346414566, 0.00030488084303215146, 0.0004298208514228463, 0.0005547608016058803, 0.0006797008099965751, 0.00080464081838727, 0.0009295808267779648, 0.0010545208351686597, 0.0011794607853516936, 0.0013044008519500494, 0.0014293408021330833, 0.0015542807523161173, 0.0016792207024991512, 0.001804160769097507, 0.001929100719280541, 0.0020540407858788967, 0.0021789807360619307, 0.0023039206862449646, 0.002428860869258642, 0.0025538005866110325, 0.00267874076962471, 0.002803680719807744, 0.002928620669990778, 0.003053560620173812, 0.003178500570356846, 0.0033034407533705235, 0.0034283807035535574, 0.0035533206537365913, 0.0036782606039196253, 0.0038032005541026592, 0.003928140737116337, 0.004053080454468727, 0.004178020637482405, 0.004302960354834795, 0.004427900537848473, 0.004552840255200863, 0.0046777804382145405, 0.004802720621228218]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 8.0, 7.0, 10.0, 14.0, 32.0, 39.0, 73.0, 117.0, 199.0, 530.0, 1298.0, 4126.0, 15245.0, 64685.0, 278882.0, 478297.0, 156504.0, 35633.0, 8698.0, 2529.0, 862.0, 363.0, 162.0, 85.0, 51.0, 30.0, 24.0, 16.0, 14.0, 10.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031982421875, -0.031021833419799805, -0.03006124496459961, -0.029100656509399414, -0.02814006805419922, -0.027179479598999023, -0.026218891143798828, -0.025258302688598633, -0.024297714233398438, -0.023337125778198242, -0.022376537322998047, -0.02141594886779785, -0.020455360412597656, -0.01949477195739746, -0.018534183502197266, -0.01757359504699707, -0.016613006591796875, -0.01565241813659668, -0.014691829681396484, -0.013731241226196289, -0.012770652770996094, -0.011810064315795898, -0.010849475860595703, -0.009888887405395508, -0.008928298950195312, -0.007967710494995117, -0.007007122039794922, -0.0060465335845947266, -0.005085945129394531, -0.004125356674194336, -0.0031647682189941406, -0.0022041797637939453, -0.00124359130859375, -0.0002830028533935547, 0.0006775856018066406, 0.001638174057006836, 0.0025987625122070312, 0.0035593509674072266, 0.004519939422607422, 0.005480527877807617, 0.0064411163330078125, 0.007401704788208008, 0.008362293243408203, 0.009322881698608398, 0.010283470153808594, 0.011244058609008789, 0.012204647064208984, 0.01316523551940918, 0.014125823974609375, 0.01508641242980957, 0.016047000885009766, 0.01700758934020996, 0.017968177795410156, 0.01892876625061035, 0.019889354705810547, 0.020849943161010742, 0.021810531616210938, 0.022771120071411133, 0.023731708526611328, 0.024692296981811523, 0.02565288543701172, 0.026613473892211914, 0.02757406234741211, 0.028534650802612305, 0.0294952392578125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 8.0, 8.0, 11.0, 19.0, 25.0, 30.0, 41.0, 58.0, 65.0, 84.0, 94.0, 80.0, 68.0, 84.0, 61.0, 68.0, 68.0, 37.0, 22.0, 33.0, 13.0, 9.0, 10.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00513458251953125, -0.004889488220214844, -0.0046443939208984375, -0.004399299621582031, -0.004154205322265625, -0.003909111022949219, -0.0036640167236328125, -0.0034189224243164062, -0.003173828125, -0.0029287338256835938, -0.0026836395263671875, -0.0024385452270507812, -0.002193450927734375, -0.0019483566284179688, -0.0017032623291015625, -0.0014581680297851562, -0.00121307373046875, -0.0009679794311523438, -0.0007228851318359375, -0.00047779083251953125, -0.000232696533203125, 1.239776611328125e-05, 0.0002574920654296875, 0.0005025863647460938, 0.0007476806640625, 0.0009927749633789062, 0.0012378692626953125, 0.0014829635620117188, 0.001728057861328125, 0.0019731521606445312, 0.0022182464599609375, 0.0024633407592773438, 0.00270843505859375, 0.0029535293579101562, 0.0031986236572265625, 0.0034437179565429688, 0.003688812255859375, 0.003933906555175781, 0.0041790008544921875, 0.004424095153808594, 0.004669189453125, 0.004914283752441406, 0.0051593780517578125, 0.005404472351074219, 0.005649566650390625, 0.005894660949707031, 0.0061397552490234375, 0.006384849548339844, 0.00662994384765625, 0.006875038146972656, 0.0071201324462890625, 0.007365226745605469, 0.007610321044921875, 0.007855415344238281, 0.008100509643554688, 0.008345603942871094, 0.0085906982421875, 0.008835792541503906, 0.009080886840820312, 0.009325981140136719, 0.009571075439453125, 0.009816169738769531, 0.010061264038085938, 0.010306358337402344, 0.01055145263671875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 3.0, 7.0, 9.0, 14.0, 17.0, 19.0, 32.0, 53.0, 75.0, 160.0, 212.0, 379.0, 599.0, 1054.0, 1875.0, 3246.0, 6099.0, 11877.0, 23859.0, 50429.0, 107791.0, 213638.0, 281418.0, 177767.0, 86372.0, 40590.0, 19629.0, 9793.0, 4996.0, 2708.0, 1515.0, 879.0, 527.0, 343.0, 195.0, 125.0, 77.0, 50.0, 36.0, 27.0, 17.0, 9.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.01354217529296875, -0.013136148452758789, -0.012730121612548828, -0.012324094772338867, -0.011918067932128906, -0.011512041091918945, -0.011106014251708984, -0.010699987411499023, -0.010293960571289062, -0.009887933731079102, -0.00948190689086914, -0.00907588005065918, -0.008669853210449219, -0.008263826370239258, -0.007857799530029297, -0.007451772689819336, -0.007045745849609375, -0.006639719009399414, -0.006233692169189453, -0.005827665328979492, -0.005421638488769531, -0.00501561164855957, -0.004609584808349609, -0.0042035579681396484, -0.0037975311279296875, -0.0033915042877197266, -0.0029854774475097656, -0.0025794506072998047, -0.0021734237670898438, -0.0017673969268798828, -0.0013613700866699219, -0.0009553432464599609, -0.00054931640625, -0.00014328956604003906, 0.0002627372741699219, 0.0006687641143798828, 0.0010747909545898438, 0.0014808177947998047, 0.0018868446350097656, 0.0022928714752197266, 0.0026988983154296875, 0.0031049251556396484, 0.0035109519958496094, 0.00391697883605957, 0.004323005676269531, 0.004729032516479492, 0.005135059356689453, 0.005541086196899414, 0.005947113037109375, 0.006353139877319336, 0.006759166717529297, 0.007165193557739258, 0.007571220397949219, 0.00797724723815918, 0.00838327407836914, 0.008789300918579102, 0.009195327758789062, 0.009601354598999023, 0.010007381439208984, 0.010413408279418945, 0.010819435119628906, 0.011225461959838867, 0.011631488800048828, 0.012037515640258789, 0.01244354248046875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 9.0, 11.0, 5.0, 4.0, 19.0, 10.0, 22.0, 29.0, 23.0, 25.0, 30.0, 32.0, 34.0, 31.0, 50.0, 53.0, 56.0, 47.0, 48.0, 48.0, 51.0, 39.0, 46.0, 41.0, 38.0, 36.0, 28.0, 22.0, 24.0, 14.0, 19.0, 10.0, 8.0, 14.0, 7.0, 10.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.005451202392578125, -0.005307555198669434, -0.005163908004760742, -0.005020260810852051, -0.004876613616943359, -0.004732966423034668, -0.0045893192291259766, -0.004445672035217285, -0.004302024841308594, -0.004158377647399902, -0.004014730453491211, -0.0038710832595825195, -0.003727436065673828, -0.0035837888717651367, -0.0034401416778564453, -0.003296494483947754, -0.0031528472900390625, -0.003009200096130371, -0.0028655529022216797, -0.0027219057083129883, -0.002578258514404297, -0.0024346113204956055, -0.002290964126586914, -0.0021473169326782227, -0.0020036697387695312, -0.0018600225448608398, -0.0017163753509521484, -0.001572728157043457, -0.0014290809631347656, -0.0012854337692260742, -0.0011417865753173828, -0.0009981393814086914, -0.0008544921875, -0.0007108449935913086, -0.0005671977996826172, -0.0004235506057739258, -0.0002799034118652344, -0.00013625621795654297, 7.3909759521484375e-06, 0.00015103816986083984, 0.00029468536376953125, 0.00043833255767822266, 0.0005819797515869141, 0.0007256269454956055, 0.0008692741394042969, 0.0010129213333129883, 0.0011565685272216797, 0.001300215721130371, 0.0014438629150390625, 0.001587510108947754, 0.0017311573028564453, 0.0018748044967651367, 0.002018451690673828, 0.0021620988845825195, 0.002305746078491211, 0.0024493932723999023, 0.0025930404663085938, 0.002736687660217285, 0.0028803348541259766, 0.003023982048034668, 0.0031676292419433594, 0.0033112764358520508, 0.003454923629760742, 0.0035985708236694336, 0.003742218017578125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 3.0, 3.0, 6.0, 7.0, 7.0, 16.0, 21.0, 15.0, 29.0, 46.0, 52.0, 80.0, 128.0, 155.0, 232.0, 379.0, 600.0, 1082.0, 2031.0, 4089.0, 9568.0, 25280.0, 94632.0, 775910.0, 91337.0, 24588.0, 9469.0, 4034.0, 2011.0, 1012.0, 595.0, 358.0, 227.0, 168.0, 96.0, 73.0, 60.0, 41.0, 31.0, 25.0, 24.0, 11.0, 11.0, 6.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007427215576171875, -0.0071836113929748535, -0.006940007209777832, -0.0066964030265808105, -0.006452798843383789, -0.006209194660186768, -0.005965590476989746, -0.005721986293792725, -0.005478382110595703, -0.005234777927398682, -0.00499117374420166, -0.004747569561004639, -0.004503965377807617, -0.004260361194610596, -0.004016757011413574, -0.0037731528282165527, -0.0035295486450195312, -0.0032859444618225098, -0.0030423402786254883, -0.002798736095428467, -0.0025551319122314453, -0.002311527729034424, -0.0020679235458374023, -0.0018243193626403809, -0.0015807151794433594, -0.0013371109962463379, -0.0010935068130493164, -0.0008499026298522949, -0.0006062984466552734, -0.00036269426345825195, -0.00011909008026123047, 0.00012451410293579102, 0.0003681182861328125, 0.000611722469329834, 0.0008553266525268555, 0.001098930835723877, 0.0013425350189208984, 0.00158613920211792, 0.0018297433853149414, 0.002073347568511963, 0.0023169517517089844, 0.002560555934906006, 0.0028041601181030273, 0.003047764301300049, 0.0032913684844970703, 0.003534972667694092, 0.0037785768508911133, 0.004022181034088135, 0.004265785217285156, 0.004509389400482178, 0.004752993583679199, 0.004996597766876221, 0.005240201950073242, 0.005483806133270264, 0.005727410316467285, 0.005971014499664307, 0.006214618682861328, 0.00645822286605835, 0.006701827049255371, 0.006945431232452393, 0.007189035415649414, 0.0074326395988464355, 0.007676243782043457, 0.007919847965240479, 0.0081634521484375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 6.0, 13.0, 12.0, 8.0, 15.0, 27.0, 35.0, 55.0, 88.0, 99.0, 139.0, 110.0, 108.0, 57.0, 66.0, 30.0, 29.0, 29.0, 20.0, 8.0, 6.0, 4.0, 4.0, 4.0, 8.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2755393981933594e-05, -1.2367963790893555e-05, -1.1980533599853516e-05, -1.1593103408813477e-05, -1.1205673217773438e-05, -1.0818243026733398e-05, -1.043081283569336e-05, -1.004338264465332e-05, -9.655952453613281e-06, -9.268522262573242e-06, -8.881092071533203e-06, -8.493661880493164e-06, -8.106231689453125e-06, -7.718801498413086e-06, -7.331371307373047e-06, -6.943941116333008e-06, -6.556510925292969e-06, -6.16908073425293e-06, -5.781650543212891e-06, -5.3942203521728516e-06, -5.0067901611328125e-06, -4.6193599700927734e-06, -4.231929779052734e-06, -3.844499588012695e-06, -3.4570693969726562e-06, -3.069639205932617e-06, -2.682209014892578e-06, -2.294778823852539e-06, -1.9073486328125e-06, -1.519918441772461e-06, -1.1324882507324219e-06, -7.450580596923828e-07, -3.5762786865234375e-07, 2.9802322387695312e-08, 4.172325134277344e-07, 8.046627044677734e-07, 1.1920928955078125e-06, 1.5795230865478516e-06, 1.9669532775878906e-06, 2.3543834686279297e-06, 2.7418136596679688e-06, 3.129243850708008e-06, 3.516674041748047e-06, 3.904104232788086e-06, 4.291534423828125e-06, 4.678964614868164e-06, 5.066394805908203e-06, 5.453824996948242e-06, 5.841255187988281e-06, 6.22868537902832e-06, 6.616115570068359e-06, 7.0035457611083984e-06, 7.3909759521484375e-06, 7.778406143188477e-06, 8.165836334228516e-06, 8.553266525268555e-06, 8.940696716308594e-06, 9.328126907348633e-06, 9.715557098388672e-06, 1.0102987289428711e-05, 1.049041748046875e-05, 1.0877847671508789e-05, 1.1265277862548828e-05, 1.1652708053588867e-05, 1.2040138244628906e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 9.0, 15.0, 26.0, 58.0, 77.0, 129.0, 235.0, 465.0, 933.0, 2350.0, 5999.0, 18457.0, 84124.0, 835044.0, 73988.0, 16805.0, 5758.0, 2170.0, 919.0, 437.0, 215.0, 132.0, 79.0, 49.0, 31.0, 10.0, 16.0, 4.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00848388671875, -0.008205413818359375, -0.00792694091796875, -0.007648468017578125, -0.0073699951171875, -0.007091522216796875, -0.00681304931640625, -0.006534576416015625, -0.006256103515625, -0.005977630615234375, -0.00569915771484375, -0.005420684814453125, -0.0051422119140625, -0.004863739013671875, -0.00458526611328125, -0.004306793212890625, -0.0040283203125, -0.003749847412109375, -0.00347137451171875, -0.003192901611328125, -0.0029144287109375, -0.002635955810546875, -0.00235748291015625, -0.002079010009765625, -0.001800537109375, -0.001522064208984375, -0.00124359130859375, -0.000965118408203125, -0.0006866455078125, -0.000408172607421875, -0.00012969970703125, 0.000148773193359375, 0.00042724609375, 0.000705718994140625, 0.00098419189453125, 0.001262664794921875, 0.0015411376953125, 0.001819610595703125, 0.00209808349609375, 0.002376556396484375, 0.002655029296875, 0.002933502197265625, 0.00321197509765625, 0.003490447998046875, 0.0037689208984375, 0.004047393798828125, 0.00432586669921875, 0.004604339599609375, 0.0048828125, 0.005161285400390625, 0.00543975830078125, 0.005718231201171875, 0.0059967041015625, 0.006275177001953125, 0.00655364990234375, 0.006832122802734375, 0.007110595703125, 0.007389068603515625, 0.00766754150390625, 0.007946014404296875, 0.0082244873046875, 0.008502960205078125, 0.00878143310546875, 0.009059906005859375, 0.00933837890625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 10.0, 10.0, 6.0, 11.0, 14.0, 23.0, 33.0, 44.0, 44.0, 117.0, 350.0, 116.0, 60.0, 37.0, 22.0, 19.0, 17.0, 11.0, 17.0, 11.0, 8.0, 5.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002185821533203125, -0.0021141767501831055, -0.002042531967163086, -0.0019708871841430664, -0.0018992424011230469, -0.0018275976181030273, -0.0017559528350830078, -0.0016843080520629883, -0.0016126632690429688, -0.0015410184860229492, -0.0014693737030029297, -0.0013977289199829102, -0.0013260841369628906, -0.001254439353942871, -0.0011827945709228516, -0.001111149787902832, -0.0010395050048828125, -0.000967860221862793, -0.0008962154388427734, -0.0008245706558227539, -0.0007529258728027344, -0.0006812810897827148, -0.0006096363067626953, -0.0005379915237426758, -0.00046634674072265625, -0.0003947019577026367, -0.0003230571746826172, -0.00025141239166259766, -0.00017976760864257812, -0.0001081228256225586, -3.647804260253906e-05, 3.516674041748047e-05, 0.0001068115234375, 0.00017845630645751953, 0.00025010108947753906, 0.0003217458724975586, 0.0003933906555175781, 0.00046503543853759766, 0.0005366802215576172, 0.0006083250045776367, 0.0006799697875976562, 0.0007516145706176758, 0.0008232593536376953, 0.0008949041366577148, 0.0009665489196777344, 0.001038193702697754, 0.0011098384857177734, 0.001181483268737793, 0.0012531280517578125, 0.001324772834777832, 0.0013964176177978516, 0.001468062400817871, 0.0015397071838378906, 0.0016113519668579102, 0.0016829967498779297, 0.0017546415328979492, 0.0018262863159179688, 0.0018979310989379883, 0.001969575881958008, 0.0020412206649780273, 0.002112865447998047, 0.0021845102310180664, 0.002256155014038086, 0.0023277997970581055, 0.002399444580078125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 13.0, 45.0, 99.0, 332.0, 347.0, 126.0, 37.0, 10.0, 5.0, 2.0, 2.0], "bins": [-0.062192708253860474, -0.06110205501317978, -0.060011398047208786, -0.05892074480652809, -0.0578300915658474, -0.056739434599876404, -0.05564878135919571, -0.054558128118515015, -0.05346747487783432, -0.052376821637153625, -0.05128616467118263, -0.05019551143050194, -0.04910485818982124, -0.04801420122385025, -0.046923547983169556, -0.04583289474248886, -0.04474223777651787, -0.04365158453583717, -0.04256092756986618, -0.041470274329185486, -0.04037962108850479, -0.0392889678478241, -0.038198310881853104, -0.03710765764117241, -0.036017000675201416, -0.03492634743452072, -0.03383569046854973, -0.032745037227869034, -0.03165438398718834, -0.030563728883862495, -0.02947307378053665, -0.028382420539855957, -0.027291767299175262, -0.02620111219584942, -0.025110458955168724, -0.02401980385184288, -0.022929150611162186, -0.021838495507836342, -0.020747840404510498, -0.019657187163829803, -0.01856653206050396, -0.017475876957178116, -0.01638522371649742, -0.015294568613171577, -0.014203914441168308, -0.013113260269165039, -0.012022605165839195, -0.010931950993835926, -0.009841296821832657, -0.008750642649829388, -0.007659988012164831, -0.006569333374500275, -0.0054786792024970055, -0.004388025030493736, -0.0032973703928291798, -0.0022067157551646233, -0.001116061583161354, -2.5407178327441216e-05, 0.0010652472265064716, 0.0021559016313403845, 0.0032465560361742973, 0.0043372102081775665, 0.005427864845842123, 0.0065185194835066795, 0.007609173655509949]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 6.0, 9.0, 9.0, 16.0, 15.0, 29.0, 36.0, 38.0, 37.0, 47.0, 46.0, 56.0, 66.0, 53.0, 65.0, 71.0, 69.0, 67.0, 41.0, 41.0, 30.0, 39.0, 30.0, 18.0, 20.0, 9.0, 8.0, 8.0, 11.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0059243300929665565, -0.005690362770110369, -0.005456395447254181, -0.00522242859005928, -0.004988461267203093, -0.004754493944346905, -0.004520526621490717, -0.004286559298634529, -0.004052592441439629, -0.0038186251185834408, -0.0035846580285578966, -0.003350690705701709, -0.0031167236156761646, -0.002882756292819977, -0.002648788969963789, -0.002414821647107601, -0.0021808543242514133, -0.0019468871178105474, -0.0017129199113696814, -0.0014789525885134935, -0.0012449853820726275, -0.0010110181756317616, -0.0007770508527755737, -0.0005430836463347077, -0.00030911643989384174, -7.51492043491453e-05, 0.00015881803119555116, 0.00039278529584407806, 0.0006267525022849441, 0.00086071970872581, 0.0010946870315819979, 0.0013286542380228639, 0.0015626214444637299, 0.0017965886509045959, 0.002030555857345462, 0.0022645231802016497, 0.002498490270227194, 0.0027324575930833817, 0.0029664249159395695, 0.0032003922387957573, 0.0034343593288213015, 0.0036683266516774893, 0.0039022937417030334, 0.004136261064559221, 0.004370228387415409, 0.00460419524461031, 0.004838163033127785, 0.005072129890322685, 0.005306097213178873, 0.005540064536035061, 0.005774031858891249, 0.0060079991817474365, 0.006241966038942337, 0.006475933361798525, 0.006709900684654713, 0.0069438680075109005, 0.007177835330367088, 0.007411802653223276, 0.007645769976079464, 0.007879736833274364, 0.00811370462179184, 0.00834767147898674, 0.00858163833618164, 0.008815606124699116, 0.009049572981894016]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 6.0, 9.0, 24.0, 24.0, 59.0, 79.0, 156.0, 288.0, 522.0, 910.0, 1718.0, 3156.0, 5787.0, 11341.0, 21796.0, 47266.0, 128121.0, 610525.0, 2913806.0, 296615.0, 81231.0, 34455.0, 16777.0, 8569.0, 4676.0, 2715.0, 1520.0, 851.0, 535.0, 289.0, 175.0, 101.0, 78.0, 42.0, 23.0, 18.0, 10.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00537109375, -0.005130410194396973, -0.004889726638793945, -0.004649043083190918, -0.004408359527587891, -0.004167675971984863, -0.003926992416381836, -0.0036863088607788086, -0.0034456253051757812, -0.003204941749572754, -0.0029642581939697266, -0.0027235746383666992, -0.002482891082763672, -0.0022422075271606445, -0.002001523971557617, -0.0017608404159545898, -0.0015201568603515625, -0.0012794733047485352, -0.0010387897491455078, -0.0007981061935424805, -0.0005574226379394531, -0.0003167390823364258, -7.605552673339844e-05, 0.0001646280288696289, 0.00040531158447265625, 0.0006459951400756836, 0.0008866786956787109, 0.0011273622512817383, 0.0013680458068847656, 0.001608729362487793, 0.0018494129180908203, 0.0020900964736938477, 0.002330780029296875, 0.0025714635848999023, 0.0028121471405029297, 0.003052830696105957, 0.0032935142517089844, 0.0035341978073120117, 0.003774881362915039, 0.004015564918518066, 0.004256248474121094, 0.004496932029724121, 0.0047376155853271484, 0.004978299140930176, 0.005218982696533203, 0.0054596662521362305, 0.005700349807739258, 0.005941033363342285, 0.0061817169189453125, 0.00642240047454834, 0.006663084030151367, 0.0069037675857543945, 0.007144451141357422, 0.007385134696960449, 0.0076258182525634766, 0.007866501808166504, 0.008107185363769531, 0.008347868919372559, 0.008588552474975586, 0.008829236030578613, 0.00906991958618164, 0.009310603141784668, 0.009551286697387695, 0.009791970252990723, 0.01003265380859375]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 8.0, 7.0, 19.0, 14.0, 30.0, 27.0, 29.0, 37.0, 35.0, 39.0, 41.0, 64.0, 52.0, 45.0, 59.0, 60.0, 57.0, 57.0, 50.0, 37.0, 35.0, 28.0, 29.0, 20.0, 23.0, 16.0, 14.0, 12.0, 9.0, 11.0, 9.0, 6.0, 5.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004474639892578125, -0.004299819469451904, -0.004124999046325684, -0.003950178623199463, -0.003775358200073242, -0.0036005377769470215, -0.0034257173538208008, -0.00325089693069458, -0.0030760765075683594, -0.0029012560844421387, -0.002726435661315918, -0.0025516152381896973, -0.0023767948150634766, -0.002201974391937256, -0.002027153968811035, -0.0018523335456848145, -0.0016775131225585938, -0.001502692699432373, -0.0013278722763061523, -0.0011530518531799316, -0.000978231430053711, -0.0008034110069274902, -0.0006285905838012695, -0.00045377016067504883, -0.0002789497375488281, -0.00010412931442260742, 7.069110870361328e-05, 0.000245511531829834, 0.0004203319549560547, 0.0005951523780822754, 0.0007699728012084961, 0.0009447932243347168, 0.0011196136474609375, 0.0012944340705871582, 0.001469254493713379, 0.0016440749168395996, 0.0018188953399658203, 0.001993715763092041, 0.0021685361862182617, 0.0023433566093444824, 0.002518177032470703, 0.002692997455596924, 0.0028678178787231445, 0.0030426383018493652, 0.003217458724975586, 0.0033922791481018066, 0.0035670995712280273, 0.003741919994354248, 0.003916740417480469, 0.0040915608406066895, 0.00426638126373291, 0.004441201686859131, 0.0046160221099853516, 0.004790842533111572, 0.004965662956237793, 0.005140483379364014, 0.005315303802490234, 0.005490124225616455, 0.005664944648742676, 0.0058397650718688965, 0.006014585494995117, 0.006189405918121338, 0.006364226341247559, 0.006539046764373779, 0.0067138671875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 5.0, 11.0, 12.0, 8.0, 20.0, 28.0, 78.0, 204.0, 723.0, 4057.0, 220951.0, 3956520.0, 9784.0, 1368.0, 324.0, 100.0, 35.0, 18.0, 9.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061614990234375, -0.06008148193359375, -0.0585479736328125, -0.05701446533203125, -0.05548095703125, -0.05394744873046875, -0.0524139404296875, -0.05088043212890625, -0.049346923828125, -0.04781341552734375, -0.0462799072265625, -0.04474639892578125, -0.043212890625, -0.04167938232421875, -0.0401458740234375, -0.03861236572265625, -0.037078857421875, -0.03554534912109375, -0.0340118408203125, -0.03247833251953125, -0.03094482421875, -0.02941131591796875, -0.0278778076171875, -0.02634429931640625, -0.024810791015625, -0.02327728271484375, -0.0217437744140625, -0.02021026611328125, -0.0186767578125, -0.01714324951171875, -0.0156097412109375, -0.01407623291015625, -0.012542724609375, -0.01100921630859375, -0.0094757080078125, -0.00794219970703125, -0.00640869140625, -0.00487518310546875, -0.0033416748046875, -0.00180816650390625, -0.000274658203125, 0.00125885009765625, 0.0027923583984375, 0.00432586669921875, 0.005859375, 0.00739288330078125, 0.0089263916015625, 0.01045989990234375, 0.011993408203125, 0.01352691650390625, 0.0150604248046875, 0.01659393310546875, 0.01812744140625, 0.01966094970703125, 0.0211944580078125, 0.02272796630859375, 0.024261474609375, 0.02579498291015625, 0.0273284912109375, 0.02886199951171875, 0.0303955078125, 0.03192901611328125, 0.0334625244140625, 0.03499603271484375, 0.036529541015625]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 12.0, 10.0, 27.0, 54.0, 110.0, 222.0, 368.0, 901.0, 1441.0, 460.0, 210.0, 109.0, 61.0, 27.0, 15.0, 15.0, 10.0, 6.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0041351318359375, -0.004023909568786621, -0.003912687301635742, -0.0038014650344848633, -0.0036902427673339844, -0.0035790205001831055, -0.0034677982330322266, -0.0033565759658813477, -0.0032453536987304688, -0.00313413143157959, -0.003022909164428711, -0.002911686897277832, -0.002800464630126953, -0.0026892423629760742, -0.0025780200958251953, -0.0024667978286743164, -0.0023555755615234375, -0.0022443532943725586, -0.0021331310272216797, -0.0020219087600708008, -0.0019106864929199219, -0.001799464225769043, -0.001688241958618164, -0.0015770196914672852, -0.0014657974243164062, -0.0013545751571655273, -0.0012433528900146484, -0.0011321306228637695, -0.0010209083557128906, -0.0009096860885620117, -0.0007984638214111328, -0.0006872415542602539, -0.000576019287109375, -0.0004647970199584961, -0.0003535747528076172, -0.00024235248565673828, -0.00013113021850585938, -1.990795135498047e-05, 9.131431579589844e-05, 0.00020253658294677734, 0.00031375885009765625, 0.00042498111724853516, 0.0005362033843994141, 0.000647425651550293, 0.0007586479187011719, 0.0008698701858520508, 0.0009810924530029297, 0.0010923147201538086, 0.0012035369873046875, 0.0013147592544555664, 0.0014259815216064453, 0.0015372037887573242, 0.0016484260559082031, 0.001759648323059082, 0.001870870590209961, 0.00198209285736084, 0.0020933151245117188, 0.0022045373916625977, 0.0023157596588134766, 0.0024269819259643555, 0.0025382041931152344, 0.0026494264602661133, 0.002760648727416992, 0.002871870994567871, 0.00298309326171875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 8.0, 4.0, 8.0, 16.0, 21.0, 21.0, 61.0, 79.0, 132.0, 120.0, 150.0, 127.0, 99.0, 56.0, 35.0, 31.0, 13.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010381083004176617, -0.010067419148981571, -0.0097537562251091, -0.009440092369914055, -0.00912642851471901, -0.008812765590846539, -0.008499101735651493, -0.008185438811779022, -0.007871774956583977, -0.007558111567050219, -0.00724444817751646, -0.006930784322321415, -0.006617120932787657, -0.006303457543253899, -0.005989793688058853, -0.005676130298525095, -0.005362466908991337, -0.005048803519457579, -0.0047351401299238205, -0.004421476274728775, -0.004107812885195017, -0.0037941494956612587, -0.003480485873296857, -0.003166822250932455, -0.002853158861398697, -0.0025394954718649387, -0.002225831849500537, -0.001912168343551457, -0.001598504837602377, -0.001284841331653297, -0.000971177825704217, -0.0006575142033398151, -0.00034384988248348236, -3.018637653440237e-05, 0.0002834771294146776, 0.0005971406353637576, 0.0009108041413128376, 0.0012244676472619176, 0.0015381311532109976, 0.0018517947755753994, 0.0021654581651091576, 0.0024791215546429157, 0.0027927851770073175, 0.0031064487993717194, 0.0034201121889054775, 0.0037337755784392357, 0.004047439433634281, 0.004361102823168039, 0.0046747662127017975, 0.004988429602235556, 0.005302092991769314, 0.005615756846964359, 0.0059294202364981174, 0.006243083626031876, 0.006556747481226921, 0.006870410870760679, 0.007184074260294437, 0.007497737649828196, 0.007811401039361954, 0.008125064894557, 0.008438728749752045, 0.008752391673624516, 0.009066055528819561, 0.009379718452692032, 0.009693382307887077]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 6.0, 6.0, 4.0, 5.0, 10.0, 8.0, 10.0, 12.0, 19.0, 23.0, 20.0, 21.0, 31.0, 28.0, 36.0, 41.0, 43.0, 42.0, 52.0, 44.0, 46.0, 53.0, 50.0, 53.0, 35.0, 39.0, 33.0, 22.0, 28.0, 29.0, 22.0, 24.0, 19.0, 23.0, 14.0, 11.0, 6.0, 7.0, 9.0, 9.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.004575618077069521, -0.004423396196216345, -0.004271174781024456, -0.00411895290017128, -0.003966731484979391, -0.003814509604126215, -0.0036622879561036825, -0.00351006630808115, -0.0033578446600586176, -0.003205623012036085, -0.0030534013640135527, -0.00290117971599102, -0.002748957835137844, -0.0025967364199459553, -0.002444514539092779, -0.0022922928910702467, -0.0021400712430477142, -0.0019878495950251818, -0.0018356279470026493, -0.001683406182564795, -0.0015311845345422626, -0.00137896288651973, -0.0012267411220818758, -0.0010745194740593433, -0.0009222978260368109, -0.0007700761780142784, -0.000617854471784085, -0.0004656327946577221, -0.0003134111175313592, -0.00016118946950882673, -8.967763278633356e-06, 0.00014325394295156002, 0.0002954751253128052, 0.0004476968024391681, 0.000599918479565531, 0.0007521401857957244, 0.0009043618338182569, 0.0010565834818407893, 0.0012088052462786436, 0.001361026894301176, 0.0015132485423237085, 0.001665470190346241, 0.0018176918383687735, 0.001969913486391306, 0.002122135367244482, 0.002274356782436371, 0.002426578663289547, 0.0025788003113120794, 0.002731021959334612, 0.0028832436073571444, 0.003035465255379677, 0.0031876869034022093, 0.0033399085514247417, 0.003492130432277918, 0.0036443520803004503, 0.003796573728322983, 0.003948795609176159, 0.004101017490029335, 0.004253238905221224, 0.0044054607860744, 0.004557682201266289, 0.004709904082119465, 0.004862125497311354, 0.00501434737816453, 0.005166568793356419]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 4.0, 7.0, 13.0, 14.0, 28.0, 40.0, 64.0, 90.0, 139.0, 250.0, 335.0, 496.0, 827.0, 1371.0, 2067.0, 3203.0, 5402.0, 8919.0, 14978.0, 25708.0, 46134.0, 83740.0, 156531.0, 255659.0, 198058.0, 107132.0, 57692.0, 32588.0, 18778.0, 10945.0, 6577.0, 3945.0, 2440.0, 1598.0, 1003.0, 639.0, 399.0, 248.0, 166.0, 118.0, 68.0, 52.0, 25.0, 26.0, 17.0, 10.0, 8.0, 0.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012989044189453125, -0.0012551695108413696, -0.0012114346027374268, -0.0011676996946334839, -0.001123964786529541, -0.0010802298784255981, -0.0010364949703216553, -0.0009927600622177124, -0.0009490251541137695, -0.0009052902460098267, -0.0008615553379058838, -0.0008178204298019409, -0.000774085521697998, -0.0007303506135940552, -0.0006866157054901123, -0.0006428807973861694, -0.0005991458892822266, -0.0005554109811782837, -0.0005116760730743408, -0.00046794116497039795, -0.0004242062568664551, -0.0003804713487625122, -0.00033673644065856934, -0.00029300153255462646, -0.0002492666244506836, -0.00020553171634674072, -0.00016179680824279785, -0.00011806190013885498, -7.432699203491211e-05, -3.059208393096924e-05, 1.3142824172973633e-05, 5.6877732276916504e-05, 0.00010061264038085938, 0.00014434754848480225, 0.00018808245658874512, 0.000231817364692688, 0.00027555227279663086, 0.00031928718090057373, 0.0003630220890045166, 0.00040675699710845947, 0.00045049190521240234, 0.0004942268133163452, 0.0005379617214202881, 0.000581696629524231, 0.0006254315376281738, 0.0006691664457321167, 0.0007129013538360596, 0.0007566362619400024, 0.0008003711700439453, 0.0008441060781478882, 0.0008878409862518311, 0.0009315758943557739, 0.0009753108024597168, 0.0010190457105636597, 0.0010627806186676025, 0.0011065155267715454, 0.0011502504348754883, 0.0011939853429794312, 0.001237720251083374, 0.001281455159187317, 0.0013251900672912598, 0.0013689249753952026, 0.0014126598834991455, 0.0014563947916030884, 0.0015001296997070312]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 3.0, 9.0, 8.0, 7.0, 10.0, 20.0, 17.0, 25.0, 16.0, 30.0, 34.0, 26.0, 43.0, 36.0, 43.0, 37.0, 49.0, 68.0, 64.0, 47.0, 43.0, 30.0, 41.0, 35.0, 36.0, 35.0, 21.0, 26.0, 14.0, 23.0, 24.0, 16.0, 11.0, 9.0, 6.0, 6.0, 14.0, 5.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.004474639892578125, -0.004332363605499268, -0.00419008731842041, -0.004047811031341553, -0.0039055347442626953, -0.003763258457183838, -0.0036209821701049805, -0.003478705883026123, -0.0033364295959472656, -0.003194153308868408, -0.0030518770217895508, -0.0029096007347106934, -0.002767324447631836, -0.0026250481605529785, -0.002482771873474121, -0.0023404955863952637, -0.0021982192993164062, -0.002055943012237549, -0.0019136667251586914, -0.001771390438079834, -0.0016291141510009766, -0.0014868378639221191, -0.0013445615768432617, -0.0012022852897644043, -0.0010600090026855469, -0.0009177327156066895, -0.000775456428527832, -0.0006331801414489746, -0.0004909038543701172, -0.00034862756729125977, -0.00020635128021240234, -6.407499313354492e-05, 7.82012939453125e-05, 0.00022047758102416992, 0.00036275386810302734, 0.0005050301551818848, 0.0006473064422607422, 0.0007895827293395996, 0.000931859016418457, 0.0010741353034973145, 0.0012164115905761719, 0.0013586878776550293, 0.0015009641647338867, 0.0016432404518127441, 0.0017855167388916016, 0.001927793025970459, 0.0020700693130493164, 0.002212345600128174, 0.0023546218872070312, 0.0024968981742858887, 0.002639174461364746, 0.0027814507484436035, 0.002923727035522461, 0.0030660033226013184, 0.0032082796096801758, 0.003350555896759033, 0.0034928321838378906, 0.003635108470916748, 0.0037773847579956055, 0.003919661045074463, 0.00406193733215332, 0.004204213619232178, 0.004346489906311035, 0.004488766193389893, 0.00463104248046875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 7.0, 5.0, 8.0, 10.0, 26.0, 29.0, 52.0, 93.0, 134.0, 197.0, 267.0, 453.0, 694.0, 1056.0, 1663.0, 2661.0, 4084.0, 6317.0, 10122.0, 16038.0, 26111.0, 43147.0, 73174.0, 133614.0, 266153.0, 205069.0, 104544.0, 59286.0, 35337.0, 21225.0, 13717.0, 8382.0, 5384.0, 3361.0, 2212.0, 1395.0, 896.0, 572.0, 382.0, 246.0, 154.0, 100.0, 65.0, 30.0, 34.0, 22.0, 15.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0011806488037109375, -0.0011423230171203613, -0.0011039972305297852, -0.001065671443939209, -0.0010273456573486328, -0.0009890198707580566, -0.0009506940841674805, -0.0009123682975769043, -0.0008740425109863281, -0.000835716724395752, -0.0007973909378051758, -0.0007590651512145996, -0.0007207393646240234, -0.0006824135780334473, -0.0006440877914428711, -0.0006057620048522949, -0.0005674362182617188, -0.0005291104316711426, -0.0004907846450805664, -0.00045245885848999023, -0.00041413307189941406, -0.0003758072853088379, -0.0003374814987182617, -0.00029915571212768555, -0.0002608299255371094, -0.0002225041389465332, -0.00018417835235595703, -0.00014585256576538086, -0.00010752677917480469, -6.920099258422852e-05, -3.0875205993652344e-05, 7.450580596923828e-06, 4.57763671875e-05, 8.410215377807617e-05, 0.00012242794036865234, 0.00016075372695922852, 0.0001990795135498047, 0.00023740530014038086, 0.00027573108673095703, 0.0003140568733215332, 0.0003523826599121094, 0.00039070844650268555, 0.0004290342330932617, 0.0004673600196838379, 0.0005056858062744141, 0.0005440115928649902, 0.0005823373794555664, 0.0006206631660461426, 0.0006589889526367188, 0.0006973147392272949, 0.0007356405258178711, 0.0007739663124084473, 0.0008122920989990234, 0.0008506178855895996, 0.0008889436721801758, 0.000927269458770752, 0.0009655952453613281, 0.0010039210319519043, 0.0010422468185424805, 0.0010805726051330566, 0.0011188983917236328, 0.001157224178314209, 0.0011955499649047852, 0.0012338757514953613, 0.0012722015380859375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 6.0, 5.0, 7.0, 19.0, 16.0, 15.0, 9.0, 25.0, 27.0, 17.0, 32.0, 29.0, 31.0, 34.0, 32.0, 35.0, 52.0, 37.0, 43.0, 42.0, 40.0, 41.0, 46.0, 37.0, 29.0, 27.0, 30.0, 25.0, 30.0, 28.0, 19.0, 20.0, 12.0, 24.0, 6.0, 9.0, 10.0, 10.0, 9.0, 12.0, 5.0, 1.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00244140625, -0.0023629367351531982, -0.0022844672203063965, -0.0022059977054595947, -0.002127528190612793, -0.002049058675765991, -0.0019705891609191895, -0.0018921196460723877, -0.001813650131225586, -0.0017351806163787842, -0.0016567111015319824, -0.0015782415866851807, -0.001499772071838379, -0.0014213025569915771, -0.0013428330421447754, -0.0012643635272979736, -0.0011858940124511719, -0.0011074244976043701, -0.0010289549827575684, -0.0009504854679107666, -0.0008720159530639648, -0.0007935464382171631, -0.0007150769233703613, -0.0006366074085235596, -0.0005581378936767578, -0.00047966837882995605, -0.0004011988639831543, -0.00032272934913635254, -0.0002442598342895508, -0.00016579031944274902, -8.732080459594727e-05, -8.851289749145508e-06, 6.961822509765625e-05, 0.000148087739944458, 0.00022655725479125977, 0.0003050267696380615, 0.0003834962844848633, 0.00046196579933166504, 0.0005404353141784668, 0.0006189048290252686, 0.0006973743438720703, 0.0007758438587188721, 0.0008543133735656738, 0.0009327828884124756, 0.0010112524032592773, 0.001089721918106079, 0.0011681914329528809, 0.0012466609477996826, 0.0013251304626464844, 0.0014035999774932861, 0.0014820694923400879, 0.0015605390071868896, 0.0016390085220336914, 0.0017174780368804932, 0.001795947551727295, 0.0018744170665740967, 0.0019528865814208984, 0.0020313560962677, 0.002109825611114502, 0.0021882951259613037, 0.0022667646408081055, 0.0023452341556549072, 0.002423703670501709, 0.0025021731853485107, 0.0025806427001953125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 6.0, 5.0, 2.0, 10.0, 13.0, 15.0, 25.0, 42.0, 50.0, 66.0, 97.0, 135.0, 198.0, 288.0, 424.0, 667.0, 1075.0, 1759.0, 2904.0, 5215.0, 9158.0, 17482.0, 36415.0, 90530.0, 474836.0, 274123.0, 70405.0, 29151.0, 14555.0, 7673.0, 4385.0, 2503.0, 1521.0, 946.0, 591.0, 384.0, 265.0, 191.0, 128.0, 88.0, 84.0, 35.0, 31.0, 27.0, 17.0, 9.0, 12.0, 6.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.98377799987793e-05, -9.67998057603836e-05, -9.376183152198792e-05, -9.072385728359222e-05, -8.768588304519653e-05, -8.464790880680084e-05, -8.160993456840515e-05, -7.857196033000946e-05, -7.553398609161377e-05, -7.249601185321808e-05, -6.945803761482239e-05, -6.64200633764267e-05, -6.3382089138031e-05, -6.0344114899635315e-05, -5.7306140661239624e-05, -5.426816642284393e-05, -5.123019218444824e-05, -4.819221794605255e-05, -4.515424370765686e-05, -4.211626946926117e-05, -3.907829523086548e-05, -3.604032099246979e-05, -3.30023467540741e-05, -2.9964372515678406e-05, -2.6926398277282715e-05, -2.3888424038887024e-05, -2.0850449800491333e-05, -1.7812475562095642e-05, -1.4774501323699951e-05, -1.173652708530426e-05, -8.69855284690857e-06, -5.660578608512878e-06, -2.6226043701171875e-06, 4.153698682785034e-07, 3.4533441066741943e-06, 6.491318345069885e-06, 9.529292583465576e-06, 1.2567266821861267e-05, 1.5605241060256958e-05, 1.864321529865265e-05, 2.168118953704834e-05, 2.471916377544403e-05, 2.775713801383972e-05, 3.079511225223541e-05, 3.3833086490631104e-05, 3.6871060729026794e-05, 3.9909034967422485e-05, 4.2947009205818176e-05, 4.598498344421387e-05, 4.902295768260956e-05, 5.206093192100525e-05, 5.509890615940094e-05, 5.813688039779663e-05, 6.117485463619232e-05, 6.421282887458801e-05, 6.72508031129837e-05, 7.02887773513794e-05, 7.332675158977509e-05, 7.636472582817078e-05, 7.940270006656647e-05, 8.244067430496216e-05, 8.547864854335785e-05, 8.851662278175354e-05, 9.155459702014923e-05, 9.459257125854492e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 7.0, 2.0, 5.0, 7.0, 9.0, 9.0, 9.0, 12.0, 17.0, 25.0, 16.0, 33.0, 41.0, 51.0, 46.0, 60.0, 61.0, 43.0, 74.0, 61.0, 45.0, 47.0, 53.0, 45.0, 40.0, 34.0, 25.0, 30.0, 24.0, 10.0, 16.0, 21.0, 8.0, 5.0, 5.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.735324859619141e-06, -6.455928087234497e-06, -6.1765313148498535e-06, -5.89713454246521e-06, -5.617737770080566e-06, -5.338340997695923e-06, -5.058944225311279e-06, -4.779547452926636e-06, -4.500150680541992e-06, -4.220753908157349e-06, -3.941357135772705e-06, -3.6619603633880615e-06, -3.382563591003418e-06, -3.1031668186187744e-06, -2.823770046234131e-06, -2.5443732738494873e-06, -2.2649765014648438e-06, -1.9855797290802e-06, -1.7061829566955566e-06, -1.426786184310913e-06, -1.1473894119262695e-06, -8.67992639541626e-07, -5.885958671569824e-07, -3.0919909477233887e-07, -2.9802322387695312e-08, 2.4959444999694824e-07, 5.289912223815918e-07, 8.083879947662354e-07, 1.087784767150879e-06, 1.3671815395355225e-06, 1.646578311920166e-06, 1.9259750843048096e-06, 2.205371856689453e-06, 2.4847686290740967e-06, 2.7641654014587402e-06, 3.043562173843384e-06, 3.3229589462280273e-06, 3.602355718612671e-06, 3.8817524909973145e-06, 4.161149263381958e-06, 4.4405460357666016e-06, 4.719942808151245e-06, 4.999339580535889e-06, 5.278736352920532e-06, 5.558133125305176e-06, 5.837529897689819e-06, 6.116926670074463e-06, 6.3963234424591064e-06, 6.67572021484375e-06, 6.9551169872283936e-06, 7.234513759613037e-06, 7.513910531997681e-06, 7.793307304382324e-06, 8.072704076766968e-06, 8.352100849151611e-06, 8.631497621536255e-06, 8.910894393920898e-06, 9.190291166305542e-06, 9.469687938690186e-06, 9.749084711074829e-06, 1.0028481483459473e-05, 1.0307878255844116e-05, 1.058727502822876e-05, 1.0866671800613403e-05, 1.1146068572998047e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 6.0, 13.0, 12.0, 13.0, 30.0, 28.0, 36.0, 58.0, 110.0, 364.0, 1776.0, 15254.0, 474884.0, 537684.0, 15631.0, 1909.0, 388.0, 100.0, 64.0, 33.0, 22.0, 19.0, 13.0, 20.0, 20.0, 7.0, 11.0, 6.0, 3.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0004642009735107422, -0.00044969841837882996, -0.0004351958632469177, -0.0004206933081150055, -0.00040619075298309326, -0.00039168819785118103, -0.0003771856427192688, -0.00036268308758735657, -0.00034818053245544434, -0.0003336779773235321, -0.0003191754221916199, -0.00030467286705970764, -0.0002901703119277954, -0.0002756677567958832, -0.00026116520166397095, -0.0002466626465320587, -0.00023216009140014648, -0.00021765753626823425, -0.00020315498113632202, -0.0001886524260044098, -0.00017414987087249756, -0.00015964731574058533, -0.0001451447606086731, -0.00013064220547676086, -0.00011613965034484863, -0.0001016370952129364, -8.713454008102417e-05, -7.263198494911194e-05, -5.812942981719971e-05, -4.3626874685287476e-05, -2.9124319553375244e-05, -1.4621764421463013e-05, -1.1920928955078125e-07, 1.438334584236145e-05, 2.888590097427368e-05, 4.338845610618591e-05, 5.7891011238098145e-05, 7.239356637001038e-05, 8.689612150192261e-05, 0.00010139867663383484, 0.00011590123176574707, 0.0001304037868976593, 0.00014490634202957153, 0.00015940889716148376, 0.000173911452293396, 0.00018841400742530823, 0.00020291656255722046, 0.0002174191176891327, 0.00023192167282104492, 0.00024642422795295715, 0.0002609267830848694, 0.0002754293382167816, 0.00028993189334869385, 0.0003044344484806061, 0.0003189370036125183, 0.00033343955874443054, 0.0003479421138763428, 0.000362444669008255, 0.00037694722414016724, 0.00039144977927207947, 0.0004059523344039917, 0.00042045488953590393, 0.00043495744466781616, 0.0004494599997997284, 0.0004639625549316406]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 11.0, 12.0, 10.0, 23.0, 13.0, 42.0, 27.0, 68.0, 80.0, 120.0, 120.0, 114.0, 75.0, 64.0, 37.0, 41.0, 27.0, 18.0, 14.0, 14.0, 11.0, 10.0, 16.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.7954578399658203e-05, -2.70698219537735e-05, -2.6185065507888794e-05, -2.530030906200409e-05, -2.4415552616119385e-05, -2.353079617023468e-05, -2.2646039724349976e-05, -2.176128327846527e-05, -2.0876526832580566e-05, -1.9991770386695862e-05, -1.9107013940811157e-05, -1.8222257494926453e-05, -1.7337501049041748e-05, -1.6452744603157043e-05, -1.556798815727234e-05, -1.4683231711387634e-05, -1.379847526550293e-05, -1.2913718819618225e-05, -1.202896237373352e-05, -1.1144205927848816e-05, -1.0259449481964111e-05, -9.374693036079407e-06, -8.489936590194702e-06, -7.6051801443099976e-06, -6.720423698425293e-06, -5.835667252540588e-06, -4.950910806655884e-06, -4.066154360771179e-06, -3.1813979148864746e-06, -2.29664146900177e-06, -1.4118850231170654e-06, -5.271285772323608e-07, 3.5762786865234375e-07, 1.2423843145370483e-06, 2.127140760421753e-06, 3.0118972063064575e-06, 3.896653652191162e-06, 4.781410098075867e-06, 5.666166543960571e-06, 6.550922989845276e-06, 7.4356794357299805e-06, 8.320435881614685e-06, 9.20519232749939e-06, 1.0089948773384094e-05, 1.0974705219268799e-05, 1.1859461665153503e-05, 1.2744218111038208e-05, 1.3628974556922913e-05, 1.4513731002807617e-05, 1.5398487448692322e-05, 1.6283243894577026e-05, 1.716800034046173e-05, 1.8052756786346436e-05, 1.893751323223114e-05, 1.9822269678115845e-05, 2.070702612400055e-05, 2.1591782569885254e-05, 2.247653901576996e-05, 2.3361295461654663e-05, 2.4246051907539368e-05, 2.5130808353424072e-05, 2.6015564799308777e-05, 2.690032124519348e-05, 2.7785077691078186e-05, 2.866983413696289e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 3.0, 10.0, 7.0, 7.0, 9.0, 13.0, 10.0, 20.0, 36.0, 46.0, 53.0, 57.0, 79.0, 68.0, 72.0, 86.0, 91.0, 65.0, 65.0, 42.0, 32.0, 28.0, 26.0, 20.0, 9.0, 11.0, 10.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.005957295652478933, -0.0057692439295351505, -0.00558119174093008, -0.005393140017986298, -0.0052050878293812275, -0.005017036106437445, -0.004828983917832375, -0.004640932194888592, -0.004452880006283522, -0.004264828283339739, -0.004076776094734669, -0.0038887241389602423, -0.003700672183185816, -0.0035126202274113894, -0.003324568271636963, -0.00313651654869318, -0.0029484645929187536, -0.002760412637144327, -0.0025723606813699007, -0.0023843087255954742, -0.0021962567698210478, -0.0020082048140466213, -0.0018201529746875167, -0.0016321010189130902, -0.0014440490631386638, -0.0012559971073642373, -0.0010679451515898108, -0.0008798932540230453, -0.0006918412982486188, -0.0005037893424741924, -0.00031573744490742683, -0.00012768548913300037, 6.0366466641426086e-05, 0.00024841842241585255, 0.00043647034908644855, 0.0006245222757570446, 0.000812574231531471, 0.0010006262455135584, 0.001188678084872663, 0.0013767300406470895, 0.001564781996421516, 0.0017528339521959424, 0.0019408859079703689, 0.0021289377473294735, 0.0023169897031039, 0.0025050416588783264, 0.002693093614652753, 0.0028811455704271793, 0.003069197526201606, 0.0032572494819760323, 0.0034453014377504587, 0.003633353393524885, 0.0038214053492993116, 0.004009457305073738, 0.004197509028017521, 0.004385561216622591, 0.004573612939566374, 0.004761664662510157, 0.004949716851115227, 0.0051377685740590096, 0.00532582076266408, 0.0055138724856078625, 0.005701924674212933, 0.005889976397156715, 0.0060780285857617855]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 6.0, 7.0, 10.0, 6.0, 16.0, 15.0, 19.0, 20.0, 20.0, 22.0, 23.0, 39.0, 32.0, 41.0, 47.0, 38.0, 45.0, 56.0, 49.0, 44.0, 54.0, 48.0, 40.0, 37.0, 26.0, 27.0, 21.0, 26.0, 20.0, 31.0, 23.0, 17.0, 11.0, 13.0, 8.0, 10.0, 6.0, 9.0, 7.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0038565758150070906, -0.003727301023900509, -0.0035980259999632835, -0.003468751208856702, -0.00333947641775012, -0.003210201393812895, -0.003080926602706313, -0.0029516518115997314, -0.002822376787662506, -0.0026931019965559244, -0.002563826972618699, -0.0024345521815121174, -0.0023052773904055357, -0.002176002599298954, -0.0020467275753617287, -0.001917452784255147, -0.0017881779931485653, -0.0016589030856266618, -0.00152962829452008, -0.0014003533869981766, -0.0012710785958915949, -0.0011418036883696914, -0.0010125287808477879, -0.0008832539315335453, -0.0007539790822193027, -0.00062470423290506, -0.0004954293835908175, -0.00036615447606891394, -0.00023687962675467134, -0.00010760477744042873, 2.167013008147478e-05, 0.00015094497939571738, 0.00028021959587931633, 0.00040949444519355893, 0.0005387692945078015, 0.000668044202029705, 0.0007973190513439476, 0.0009265939006581903, 0.0010558688081800938, 0.0011851435992866755, 0.001314418506808579, 0.0014436934143304825, 0.0015729682054370642, 0.0017022431129589677, 0.0018315180204808712, 0.001960792811587453, 0.0020900676026940346, 0.00221934262663126, 0.0023486174177378416, 0.0024778922088444233, 0.0026071672327816486, 0.0027364420238882303, 0.002865716814994812, 0.0029949918389320374, 0.003124266630038619, 0.0032535414211452007, 0.003382816445082426, 0.0035120912361890078, 0.003641366260126233, 0.003770641051232815, 0.0038999158423393965, 0.004029190633445978, 0.0041584656573832035, 0.004287740681320429, 0.004417015239596367]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 11.0, 6.0, 9.0, 13.0, 23.0, 31.0, 52.0, 74.0, 171.0, 291.0, 575.0, 1121.0, 2332.0, 5050.0, 11578.0, 28199.0, 74872.0, 218403.0, 409616.0, 187383.0, 64901.0, 24723.0, 10365.0, 4564.0, 2068.0, 1003.0, 492.0, 251.0, 169.0, 74.0, 40.0, 39.0, 20.0, 14.0, 3.0, 8.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01995849609375, -0.0193026065826416, -0.018646717071533203, -0.017990827560424805, -0.017334938049316406, -0.016679048538208008, -0.01602315902709961, -0.015367269515991211, -0.014711380004882812, -0.014055490493774414, -0.013399600982666016, -0.012743711471557617, -0.012087821960449219, -0.01143193244934082, -0.010776042938232422, -0.010120153427124023, -0.009464263916015625, -0.008808374404907227, -0.008152484893798828, -0.00749659538269043, -0.006840705871582031, -0.006184816360473633, -0.005528926849365234, -0.004873037338256836, -0.0042171478271484375, -0.003561258316040039, -0.0029053688049316406, -0.002249479293823242, -0.0015935897827148438, -0.0009377002716064453, -0.0002818107604980469, 0.00037407875061035156, 0.00102996826171875, 0.0016858577728271484, 0.002341747283935547, 0.0029976367950439453, 0.0036535263061523438, 0.004309415817260742, 0.004965305328369141, 0.005621194839477539, 0.0062770843505859375, 0.006932973861694336, 0.007588863372802734, 0.008244752883911133, 0.008900642395019531, 0.00955653190612793, 0.010212421417236328, 0.010868310928344727, 0.011524200439453125, 0.012180089950561523, 0.012835979461669922, 0.01349186897277832, 0.014147758483886719, 0.014803647994995117, 0.015459537506103516, 0.016115427017211914, 0.016771316528320312, 0.01742720603942871, 0.01808309555053711, 0.018738985061645508, 0.019394874572753906, 0.020050764083862305, 0.020706653594970703, 0.0213625431060791, 0.0220184326171875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 11.0, 9.0, 13.0, 14.0, 21.0, 28.0, 37.0, 48.0, 50.0, 48.0, 63.0, 71.0, 73.0, 64.0, 70.0, 60.0, 55.0, 48.0, 45.0, 43.0, 34.0, 20.0, 22.0, 13.0, 19.0, 10.0, 7.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003543853759765625, -0.003398597240447998, -0.003253340721130371, -0.003108084201812744, -0.002962827682495117, -0.0028175711631774902, -0.0026723146438598633, -0.0025270581245422363, -0.0023818016052246094, -0.0022365450859069824, -0.0020912885665893555, -0.0019460320472717285, -0.0018007755279541016, -0.0016555190086364746, -0.0015102624893188477, -0.0013650059700012207, -0.0012197494506835938, -0.0010744929313659668, -0.0009292364120483398, -0.0007839798927307129, -0.0006387233734130859, -0.000493466854095459, -0.00034821033477783203, -0.00020295381546020508, -5.7697296142578125e-05, 8.755922317504883e-05, 0.00023281574249267578, 0.00037807226181030273, 0.0005233287811279297, 0.0006685853004455566, 0.0008138418197631836, 0.0009590983390808105, 0.0011043548583984375, 0.0012496113777160645, 0.0013948678970336914, 0.0015401244163513184, 0.0016853809356689453, 0.0018306374549865723, 0.0019758939743041992, 0.002121150493621826, 0.002266407012939453, 0.00241166353225708, 0.002556920051574707, 0.002702176570892334, 0.002847433090209961, 0.002992689609527588, 0.003137946128845215, 0.003283202648162842, 0.0034284591674804688, 0.0035737156867980957, 0.0037189722061157227, 0.0038642287254333496, 0.0040094852447509766, 0.0041547417640686035, 0.0042999982833862305, 0.004445254802703857, 0.004590511322021484, 0.004735767841339111, 0.004881024360656738, 0.005026280879974365, 0.005171537399291992, 0.005316793918609619, 0.005462050437927246, 0.005607306957244873, 0.0057525634765625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 5.0, 10.0, 6.0, 10.0, 15.0, 26.0, 30.0, 55.0, 43.0, 75.0, 104.0, 180.0, 222.0, 345.0, 540.0, 748.0, 1174.0, 1797.0, 2865.0, 4407.0, 7334.0, 12068.0, 20401.0, 35976.0, 64469.0, 118696.0, 205830.0, 235054.0, 147000.0, 80951.0, 44502.0, 25156.0, 14699.0, 8674.0, 5352.0, 3407.0, 2106.0, 1332.0, 917.0, 615.0, 428.0, 285.0, 191.0, 127.0, 107.0, 59.0, 62.0, 35.0, 22.0, 17.0, 10.0, 8.0, 8.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.007762908935546875, -0.007513940334320068, -0.007264971733093262, -0.007016003131866455, -0.0067670345306396484, -0.006518065929412842, -0.006269097328186035, -0.0060201287269592285, -0.005771160125732422, -0.005522191524505615, -0.005273222923278809, -0.005024254322052002, -0.004775285720825195, -0.004526317119598389, -0.004277348518371582, -0.004028379917144775, -0.0037794113159179688, -0.003530442714691162, -0.0032814741134643555, -0.003032505512237549, -0.002783536911010742, -0.0025345683097839355, -0.002285599708557129, -0.0020366311073303223, -0.0017876625061035156, -0.001538693904876709, -0.0012897253036499023, -0.0010407567024230957, -0.0007917881011962891, -0.0005428194999694824, -0.0002938508987426758, -4.488229751586914e-05, 0.0002040863037109375, 0.00045305490493774414, 0.0007020235061645508, 0.0009509921073913574, 0.001199960708618164, 0.0014489293098449707, 0.0016978979110717773, 0.001946866512298584, 0.0021958351135253906, 0.0024448037147521973, 0.002693772315979004, 0.0029427409172058105, 0.003191709518432617, 0.003440678119659424, 0.0036896467208862305, 0.003938615322113037, 0.004187583923339844, 0.00443655252456665, 0.004685521125793457, 0.004934489727020264, 0.00518345832824707, 0.005432426929473877, 0.005681395530700684, 0.00593036413192749, 0.006179332733154297, 0.0064283013343811035, 0.00667726993560791, 0.006926238536834717, 0.0071752071380615234, 0.00742417573928833, 0.007673144340515137, 0.007922112941741943, 0.00817108154296875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 7.0, 5.0, 6.0, 5.0, 12.0, 9.0, 12.0, 11.0, 16.0, 21.0, 18.0, 27.0, 28.0, 35.0, 28.0, 26.0, 35.0, 31.0, 39.0, 38.0, 54.0, 46.0, 37.0, 34.0, 52.0, 51.0, 38.0, 33.0, 36.0, 29.0, 24.0, 29.0, 14.0, 12.0, 13.0, 16.0, 12.0, 9.0, 11.0, 11.0, 8.0, 5.0, 4.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0025424957275390625, -0.0024600625038146973, -0.002377629280090332, -0.002295196056365967, -0.0022127628326416016, -0.0021303296089172363, -0.002047896385192871, -0.001965463161468506, -0.0018830299377441406, -0.0018005967140197754, -0.0017181634902954102, -0.001635730266571045, -0.0015532970428466797, -0.0014708638191223145, -0.0013884305953979492, -0.001305997371673584, -0.0012235641479492188, -0.0011411309242248535, -0.0010586977005004883, -0.000976264476776123, -0.0008938312530517578, -0.0008113980293273926, -0.0007289648056030273, -0.0006465315818786621, -0.0005640983581542969, -0.00048166513442993164, -0.0003992319107055664, -0.00031679868698120117, -0.00023436546325683594, -0.0001519322395324707, -6.949901580810547e-05, 1.2934207916259766e-05, 9.5367431640625e-05, 0.00017780065536499023, 0.00026023387908935547, 0.0003426671028137207, 0.00042510032653808594, 0.0005075335502624512, 0.0005899667739868164, 0.0006723999977111816, 0.0007548332214355469, 0.0008372664451599121, 0.0009196996688842773, 0.0010021328926086426, 0.0010845661163330078, 0.001166999340057373, 0.0012494325637817383, 0.0013318657875061035, 0.0014142990112304688, 0.001496732234954834, 0.0015791654586791992, 0.0016615986824035645, 0.0017440319061279297, 0.001826465129852295, 0.0019088983535766602, 0.0019913315773010254, 0.0020737648010253906, 0.002156198024749756, 0.002238631248474121, 0.0023210644721984863, 0.0024034976959228516, 0.002485930919647217, 0.002568364143371582, 0.0026507973670959473, 0.0027332305908203125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 11.0, 10.0, 10.0, 31.0, 35.0, 45.0, 76.0, 89.0, 142.0, 171.0, 242.0, 273.0, 359.0, 499.0, 641.0, 913.0, 1230.0, 1877.0, 2793.0, 4645.0, 8535.0, 20876.0, 81696.0, 770664.0, 104040.0, 24386.0, 9475.0, 4899.0, 3001.0, 1908.0, 1256.0, 928.0, 669.0, 480.0, 409.0, 319.0, 210.0, 172.0, 149.0, 107.0, 84.0, 63.0, 35.0, 36.0, 12.0, 16.0, 14.0, 6.0, 6.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.01024627685546875, -0.009921669960021973, -0.009597063064575195, -0.009272456169128418, -0.00894784927368164, -0.008623242378234863, -0.008298635482788086, -0.007974028587341309, -0.007649421691894531, -0.007324814796447754, -0.0070002079010009766, -0.006675601005554199, -0.006350994110107422, -0.0060263872146606445, -0.005701780319213867, -0.00537717342376709, -0.0050525665283203125, -0.004727959632873535, -0.004403352737426758, -0.0040787458419799805, -0.003754138946533203, -0.0034295320510864258, -0.0031049251556396484, -0.002780318260192871, -0.0024557113647460938, -0.0021311044692993164, -0.001806497573852539, -0.0014818906784057617, -0.0011572837829589844, -0.000832676887512207, -0.0005080699920654297, -0.00018346309661865234, 0.000141143798828125, 0.00046575069427490234, 0.0007903575897216797, 0.001114964485168457, 0.0014395713806152344, 0.0017641782760620117, 0.002088785171508789, 0.0024133920669555664, 0.0027379989624023438, 0.003062605857849121, 0.0033872127532958984, 0.0037118196487426758, 0.004036426544189453, 0.0043610334396362305, 0.004685640335083008, 0.005010247230529785, 0.0053348541259765625, 0.00565946102142334, 0.005984067916870117, 0.0063086748123168945, 0.006633281707763672, 0.006957888603210449, 0.0072824954986572266, 0.007607102394104004, 0.007931709289550781, 0.008256316184997559, 0.008580923080444336, 0.008905529975891113, 0.00923013687133789, 0.009554743766784668, 0.009879350662231445, 0.010203957557678223, 0.010528564453125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 11.0, 6.0, 7.0, 10.0, 7.0, 12.0, 15.0, 13.0, 26.0, 37.0, 53.0, 89.0, 112.0, 114.0, 110.0, 111.0, 74.0, 44.0, 31.0, 21.0, 17.0, 11.0, 3.0, 11.0, 7.0, 8.0, 5.0, 5.0, 1.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1563301086425781e-05, -1.1199153959751129e-05, -1.0835006833076477e-05, -1.0470859706401825e-05, -1.0106712579727173e-05, -9.74256545305252e-06, -9.378418326377869e-06, -9.014271199703217e-06, -8.650124073028564e-06, -8.285976946353912e-06, -7.92182981967926e-06, -7.557682693004608e-06, -7.193535566329956e-06, -6.829388439655304e-06, -6.465241312980652e-06, -6.101094186306e-06, -5.736947059631348e-06, -5.3727999329566956e-06, -5.0086528062820435e-06, -4.644505679607391e-06, -4.280358552932739e-06, -3.916211426258087e-06, -3.552064299583435e-06, -3.187917172908783e-06, -2.823770046234131e-06, -2.4596229195594788e-06, -2.0954757928848267e-06, -1.7313286662101746e-06, -1.3671815395355225e-06, -1.0030344128608704e-06, -6.388872861862183e-07, -2.7474015951156616e-07, 8.940696716308594e-08, 4.5355409383773804e-07, 8.177012205123901e-07, 1.1818483471870422e-06, 1.5459954738616943e-06, 1.9101426005363464e-06, 2.2742897272109985e-06, 2.6384368538856506e-06, 3.0025839805603027e-06, 3.366731107234955e-06, 3.730878233909607e-06, 4.095025360584259e-06, 4.459172487258911e-06, 4.823319613933563e-06, 5.187466740608215e-06, 5.5516138672828674e-06, 5.9157609939575195e-06, 6.279908120632172e-06, 6.644055247306824e-06, 7.008202373981476e-06, 7.372349500656128e-06, 7.73649662733078e-06, 8.100643754005432e-06, 8.464790880680084e-06, 8.828938007354736e-06, 9.193085134029388e-06, 9.55723226070404e-06, 9.921379387378693e-06, 1.0285526514053345e-05, 1.0649673640727997e-05, 1.1013820767402649e-05, 1.1377967894077301e-05, 1.1742115020751953e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 6.0, 16.0, 17.0, 24.0, 28.0, 31.0, 72.0, 79.0, 133.0, 195.0, 314.0, 503.0, 814.0, 1443.0, 2428.0, 4568.0, 9701.0, 29688.0, 209661.0, 718336.0, 45223.0, 12624.0, 5452.0, 2989.0, 1658.0, 933.0, 571.0, 340.0, 211.0, 154.0, 100.0, 80.0, 47.0, 42.0, 18.0, 19.0, 6.0, 6.0, 9.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01361083984375, -0.013187289237976074, -0.012763738632202148, -0.012340188026428223, -0.011916637420654297, -0.011493086814880371, -0.011069536209106445, -0.01064598560333252, -0.010222434997558594, -0.009798884391784668, -0.009375333786010742, -0.008951783180236816, -0.00852823257446289, -0.008104681968688965, -0.007681131362915039, -0.007257580757141113, -0.0068340301513671875, -0.006410479545593262, -0.005986928939819336, -0.00556337833404541, -0.005139827728271484, -0.004716277122497559, -0.004292726516723633, -0.003869175910949707, -0.0034456253051757812, -0.0030220746994018555, -0.0025985240936279297, -0.002174973487854004, -0.0017514228820800781, -0.0013278722763061523, -0.0009043216705322266, -0.0004807710647583008, -5.7220458984375e-05, 0.0003663301467895508, 0.0007898807525634766, 0.0012134313583374023, 0.0016369819641113281, 0.002060532569885254, 0.0024840831756591797, 0.0029076337814331055, 0.0033311843872070312, 0.003754734992980957, 0.004178285598754883, 0.004601836204528809, 0.005025386810302734, 0.00544893741607666, 0.005872488021850586, 0.006296038627624512, 0.0067195892333984375, 0.007143139839172363, 0.007566690444946289, 0.007990241050720215, 0.00841379165649414, 0.008837342262268066, 0.009260892868041992, 0.009684443473815918, 0.010107994079589844, 0.01053154468536377, 0.010955095291137695, 0.011378645896911621, 0.011802196502685547, 0.012225747108459473, 0.012649297714233398, 0.013072848320007324, 0.01349639892578125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 6.0, 5.0, 8.0, 17.0, 30.0, 44.0, 83.0, 379.0, 212.0, 80.0, 49.0, 19.0, 6.0, 13.0, 8.0, 7.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0042877197265625, -0.004164665937423706, -0.004041612148284912, -0.003918558359146118, -0.0037955045700073242, -0.0036724507808685303, -0.0035493969917297363, -0.0034263432025909424, -0.0033032894134521484, -0.0031802356243133545, -0.0030571818351745605, -0.0029341280460357666, -0.0028110742568969727, -0.0026880204677581787, -0.0025649666786193848, -0.002441912889480591, -0.002318859100341797, -0.002195805311203003, -0.002072751522064209, -0.001949697732925415, -0.001826643943786621, -0.0017035901546478271, -0.0015805363655090332, -0.0014574825763702393, -0.0013344287872314453, -0.0012113749980926514, -0.0010883212089538574, -0.0009652674198150635, -0.0008422136306762695, -0.0007191598415374756, -0.0005961060523986816, -0.0004730522632598877, -0.00034999847412109375, -0.0002269446849822998, -0.00010389089584350586, 1.9162893295288086e-05, 0.00014221668243408203, 0.000265270471572876, 0.0003883242607116699, 0.0005113780498504639, 0.0006344318389892578, 0.0007574856281280518, 0.0008805394172668457, 0.0010035932064056396, 0.0011266469955444336, 0.0012497007846832275, 0.0013727545738220215, 0.0014958083629608154, 0.0016188621520996094, 0.0017419159412384033, 0.0018649697303771973, 0.001988023519515991, 0.002111077308654785, 0.002234131097793579, 0.002357184886932373, 0.002480238676071167, 0.002603292465209961, 0.002726346254348755, 0.002849400043487549, 0.0029724538326263428, 0.0030955076217651367, 0.0032185614109039307, 0.0033416152000427246, 0.0034646689891815186, 0.0035877227783203125]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 10.0, 20.0, 83.0, 245.0, 401.0, 180.0, 48.0, 23.0, 5.0, 4.0], "bins": [-0.06226911395788193, -0.06120150536298752, -0.06013390049338341, -0.059066291898489, -0.05799868702888489, -0.05693107843399048, -0.05586347356438637, -0.05479586496949196, -0.05372826009988785, -0.05266065150499344, -0.05159304663538933, -0.05052543804049492, -0.04945783317089081, -0.0483902245759964, -0.04732261970639229, -0.04625501111149788, -0.04518740624189377, -0.04411979764699936, -0.04305219277739525, -0.04198458418250084, -0.04091697931289673, -0.03984937071800232, -0.03878176584839821, -0.0377141572535038, -0.03664654865860939, -0.03557894006371498, -0.03451133519411087, -0.03344372659921646, -0.03237612172961235, -0.03130851313471794, -0.03024090826511383, -0.02917329967021942, -0.02810569293797016, -0.0270380862057209, -0.02597047947347164, -0.02490287274122238, -0.02383526600897312, -0.02276765927672386, -0.021700050681829453, -0.020632445812225342, -0.019564837217330933, -0.018497230485081673, -0.017429623752832413, -0.016362017020583153, -0.015294410288333893, -0.014226803556084633, -0.013159195892512798, -0.012091589160263538, -0.011023983359336853, -0.009956376627087593, -0.008888769894838333, -0.007821163162589073, -0.006753555964678526, -0.005685949232429266, -0.004618342034518719, -0.0035507353022694588, -0.0024831281043589115, -0.0014155212556943297, -0.00034791440702974796, 0.0007196925580501556, 0.0017872992902994156, 0.0028549060225486755, 0.003922513220459223, 0.004990119952708483, 0.006057726684957743]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 4.0, 11.0, 3.0, 9.0, 6.0, 14.0, 19.0, 11.0, 21.0, 25.0, 29.0, 25.0, 29.0, 36.0, 44.0, 53.0, 49.0, 54.0, 47.0, 32.0, 55.0, 38.0, 51.0, 46.0, 33.0, 34.0, 38.0, 30.0, 22.0, 28.0, 27.0, 14.0, 15.0, 13.0, 15.0, 5.0, 12.0, 5.0, 5.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0049187131226062775, -0.0047861626371741295, -0.004653612617403269, -0.004521062597632408, -0.00438851211220026, -0.004255961626768112, -0.0041234116069972515, -0.003990861587226391, -0.003858311101794243, -0.0037257608491927385, -0.003593210596591234, -0.00346066034398973, -0.0033281100913882256, -0.0031955598387867212, -0.003063009586185217, -0.0029304593335837126, -0.0027979090809822083, -0.002665358828380704, -0.0025328085757791996, -0.0024002583231776953, -0.002267708070576191, -0.0021351578179746866, -0.0020026075653731823, -0.001870057312771678, -0.0017375070601701736, -0.0016049568075686693, -0.001472406554967165, -0.0013398563023656607, -0.0012073060497641563, -0.001074755797162652, -0.0009422055445611477, -0.0008096552919596434, -0.0006771045736968517, -0.0005445543210953474, -0.0004120040684938431, -0.00027945381589233875, -0.00014690356329083443, -1.4353310689330101e-05, 0.00011819694191217422, 0.00025074719451367855, 0.0003832974471151829, 0.0005158476997166872, 0.0006483979523181915, 0.0007809482049196959, 0.0009134984575212002, 0.0010460487101227045, 0.0011785989627242088, 0.0013111492153257132, 0.0014436994679272175, 0.0015762497205287218, 0.0017087999731302261, 0.0018413502257317305, 0.001973900478333235, 0.002106450730934739, 0.0022390009835362434, 0.0023715512361377478, 0.002504101488739252, 0.0026366517413407564, 0.0027692019939422607, 0.002901752246543765, 0.0030343024991452694, 0.0031668527517467737, 0.003299403004348278, 0.0034319532569497824, 0.0035645035095512867]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 8.0, 5.0, 10.0, 6.0, 16.0, 26.0, 39.0, 46.0, 65.0, 109.0, 140.0, 247.0, 390.0, 579.0, 1020.0, 1757.0, 3047.0, 6034.0, 14032.0, 70864.0, 886308.0, 2893294.0, 264913.0, 31309.0, 9654.0, 4553.0, 2331.0, 1354.0, 772.0, 471.0, 300.0, 184.0, 109.0, 76.0, 75.0, 37.0, 21.0, 17.0, 19.0, 12.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.015716552734375, -0.015244007110595703, -0.014771461486816406, -0.01429891586303711, -0.013826370239257812, -0.013353824615478516, -0.012881278991699219, -0.012408733367919922, -0.011936187744140625, -0.011463642120361328, -0.010991096496582031, -0.010518550872802734, -0.010046005249023438, -0.00957345962524414, -0.009100914001464844, -0.008628368377685547, -0.00815582275390625, -0.007683277130126953, -0.007210731506347656, -0.006738185882568359, -0.0062656402587890625, -0.005793094635009766, -0.005320549011230469, -0.004848003387451172, -0.004375457763671875, -0.003902912139892578, -0.0034303665161132812, -0.0029578208923339844, -0.0024852752685546875, -0.0020127296447753906, -0.0015401840209960938, -0.0010676383972167969, -0.0005950927734375, -0.00012254714965820312, 0.00034999847412109375, 0.0008225440979003906, 0.0012950897216796875, 0.0017676353454589844, 0.0022401809692382812, 0.002712726593017578, 0.003185272216796875, 0.003657817840576172, 0.004130363464355469, 0.004602909088134766, 0.0050754547119140625, 0.005548000335693359, 0.006020545959472656, 0.006493091583251953, 0.00696563720703125, 0.007438182830810547, 0.007910728454589844, 0.00838327407836914, 0.008855819702148438, 0.009328365325927734, 0.009800910949707031, 0.010273456573486328, 0.010746002197265625, 0.011218547821044922, 0.011691093444824219, 0.012163639068603516, 0.012636184692382812, 0.01310873031616211, 0.013581275939941406, 0.014053821563720703, 0.0145263671875]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 11.0, 3.0, 10.0, 5.0, 17.0, 12.0, 16.0, 16.0, 19.0, 32.0, 25.0, 25.0, 32.0, 41.0, 39.0, 36.0, 34.0, 39.0, 42.0, 41.0, 40.0, 47.0, 43.0, 44.0, 31.0, 25.0, 28.0, 39.0, 21.0, 28.0, 26.0, 13.0, 22.0, 21.0, 16.0, 9.0, 9.0, 7.0, 5.0, 7.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0028514862060546875, -0.002767026424407959, -0.0026825666427612305, -0.002598106861114502, -0.0025136470794677734, -0.002429187297821045, -0.0023447275161743164, -0.002260267734527588, -0.0021758079528808594, -0.002091348171234131, -0.0020068883895874023, -0.0019224286079406738, -0.0018379688262939453, -0.0017535090446472168, -0.0016690492630004883, -0.0015845894813537598, -0.0015001296997070312, -0.0014156699180603027, -0.0013312101364135742, -0.0012467503547668457, -0.0011622905731201172, -0.0010778307914733887, -0.0009933710098266602, -0.0009089112281799316, -0.0008244514465332031, -0.0007399916648864746, -0.0006555318832397461, -0.0005710721015930176, -0.00048661231994628906, -0.00040215253829956055, -0.00031769275665283203, -0.00023323297500610352, -0.000148773193359375, -6.431341171264648e-05, 2.014636993408203e-05, 0.00010460615158081055, 0.00018906593322753906, 0.0002735257148742676, 0.0003579854965209961, 0.0004424452781677246, 0.0005269050598144531, 0.0006113648414611816, 0.0006958246231079102, 0.0007802844047546387, 0.0008647441864013672, 0.0009492039680480957, 0.0010336637496948242, 0.0011181235313415527, 0.0012025833129882812, 0.0012870430946350098, 0.0013715028762817383, 0.0014559626579284668, 0.0015404224395751953, 0.0016248822212219238, 0.0017093420028686523, 0.0017938017845153809, 0.0018782615661621094, 0.001962721347808838, 0.0020471811294555664, 0.002131640911102295, 0.0022161006927490234, 0.002300560474395752, 0.0023850202560424805, 0.002469480037689209, 0.0025539398193359375]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 9.0, 18.0, 25.0, 35.0, 56.0, 102.0, 210.0, 499.0, 1368.0, 3759.0, 12764.0, 57031.0, 1737817.0, 2299068.0, 61723.0, 13484.0, 3967.0, 1326.0, 545.0, 206.0, 108.0, 55.0, 34.0, 19.0, 11.0, 6.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022705078125, -0.021973133087158203, -0.021241188049316406, -0.02050924301147461, -0.019777297973632812, -0.019045352935791016, -0.01831340789794922, -0.017581462860107422, -0.016849517822265625, -0.016117572784423828, -0.015385627746582031, -0.014653682708740234, -0.013921737670898438, -0.01318979263305664, -0.012457847595214844, -0.011725902557373047, -0.01099395751953125, -0.010262012481689453, -0.009530067443847656, -0.00879812240600586, -0.008066177368164062, -0.007334232330322266, -0.006602287292480469, -0.005870342254638672, -0.005138397216796875, -0.004406452178955078, -0.0036745071411132812, -0.0029425621032714844, -0.0022106170654296875, -0.0014786720275878906, -0.0007467269897460938, -1.4781951904296875e-05, 0.0007171630859375, 0.0014491081237792969, 0.0021810531616210938, 0.0029129981994628906, 0.0036449432373046875, 0.004376888275146484, 0.005108833312988281, 0.005840778350830078, 0.006572723388671875, 0.007304668426513672, 0.008036613464355469, 0.008768558502197266, 0.009500503540039062, 0.01023244857788086, 0.010964393615722656, 0.011696338653564453, 0.01242828369140625, 0.013160228729248047, 0.013892173767089844, 0.01462411880493164, 0.015356063842773438, 0.016088008880615234, 0.01681995391845703, 0.017551898956298828, 0.018283843994140625, 0.019015789031982422, 0.01974773406982422, 0.020479679107666016, 0.021211624145507812, 0.02194356918334961, 0.022675514221191406, 0.023407459259033203, 0.024139404296875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 8.0, 5.0, 14.0, 8.0, 11.0, 17.0, 23.0, 34.0, 38.0, 41.0, 113.0, 219.0, 421.0, 726.0, 862.0, 664.0, 314.0, 196.0, 103.0, 50.0, 37.0, 30.0, 25.0, 18.0, 15.0, 17.0, 10.0, 9.0, 8.0, 5.0, 5.0, 4.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026569366455078125, -0.0025749504566192627, -0.002492964267730713, -0.002410978078842163, -0.0023289918899536133, -0.0022470057010650635, -0.0021650195121765137, -0.002083033323287964, -0.002001047134399414, -0.0019190609455108643, -0.0018370747566223145, -0.0017550885677337646, -0.0016731023788452148, -0.001591116189956665, -0.0015091300010681152, -0.0014271438121795654, -0.0013451576232910156, -0.0012631714344024658, -0.001181185245513916, -0.0010991990566253662, -0.0010172128677368164, -0.0009352266788482666, -0.0008532404899597168, -0.000771254301071167, -0.0006892681121826172, -0.0006072819232940674, -0.0005252957344055176, -0.0004433095455169678, -0.00036132335662841797, -0.00027933716773986816, -0.00019735097885131836, -0.00011536478996276855, -3.337860107421875e-05, 4.8607587814331055e-05, 0.00013059377670288086, 0.00021257996559143066, 0.00029456615447998047, 0.0003765523433685303, 0.0004585385322570801, 0.0005405247211456299, 0.0006225109100341797, 0.0007044970989227295, 0.0007864832878112793, 0.0008684694766998291, 0.0009504556655883789, 0.0010324418544769287, 0.0011144280433654785, 0.0011964142322540283, 0.0012784004211425781, 0.001360386610031128, 0.0014423727989196777, 0.0015243589878082275, 0.0016063451766967773, 0.0016883313655853271, 0.001770317554473877, 0.0018523037433624268, 0.0019342899322509766, 0.0020162761211395264, 0.002098262310028076, 0.002180248498916626, 0.0022622346878051758, 0.0023442208766937256, 0.0024262070655822754, 0.002508193254470825, 0.002590179443359375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 6.0, 9.0, 19.0, 28.0, 56.0, 84.0, 117.0, 203.0, 186.0, 121.0, 79.0, 37.0, 20.0, 19.0, 7.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.016909023746848106, -0.016539962962269783, -0.01617090031504631, -0.015801839530467987, -0.015432776883244514, -0.015063715167343616, -0.014694653451442719, -0.01432559173554182, -0.013956530019640923, -0.013587468303740025, -0.013218406587839127, -0.012849344871938229, -0.01248028315603733, -0.012111221440136433, -0.011742159724235535, -0.011373098008334637, -0.011004036292433739, -0.01063497457653284, -0.010265912860631943, -0.009896851144731045, -0.009527789428830147, -0.009158727712929249, -0.00878966599702835, -0.008420604281127453, -0.00805154349654913, -0.0076824817806482315, -0.0073134200647473335, -0.0069443583488464355, -0.006575296632945538, -0.00620623491704464, -0.005837173201143742, -0.005468111485242844, -0.005099049303680658, -0.00472998758777976, -0.004360925871878862, -0.003991864155977964, -0.0036228024400770664, -0.0032537407241761684, -0.002884679241105914, -0.002515617525205016, -0.002146555809304118, -0.0017774940934032202, -0.0014084323775023222, -0.001039370778016746, -0.0006703090621158481, -0.0003012473462149501, 6.781425327062607e-05, 0.00043687596917152405, 0.000805937685072422, 0.00117499940097332, 0.001544061116874218, 0.0019131227163597941, 0.002282184548676014, 0.002651246264576912, 0.0030203077476471663, 0.0033893694635480642, 0.003758431179448962, 0.0041274926625192165, 0.0044965543784201145, 0.0048656160943210125, 0.0052346778102219105, 0.0056037395261228085, 0.0059728012420237064, 0.006341862957924604, 0.006710924673825502]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 9.0, 16.0, 13.0, 13.0, 16.0, 9.0, 20.0, 20.0, 18.0, 32.0, 26.0, 38.0, 30.0, 31.0, 30.0, 29.0, 45.0, 49.0, 44.0, 35.0, 51.0, 35.0, 39.0, 31.0, 35.0, 35.0, 29.0, 35.0, 23.0, 23.0, 24.0, 21.0, 10.0, 12.0, 12.0, 12.0, 13.0, 7.0, 7.0, 6.0, 0.0, 0.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0033469628542661667, -0.003238585777580738, -0.0031302087008953094, -0.003021831624209881, -0.002913454547524452, -0.0028050774708390236, -0.002696700394153595, -0.0025883233174681664, -0.0024799462407827377, -0.002371569164097309, -0.0022631920874118805, -0.002154815010726452, -0.0020464379340410233, -0.0019380608573555946, -0.0018296838970854878, -0.0017213068204000592, -0.0016129298601299524, -0.0015045527834445238, -0.0013961757067590952, -0.0012877986300736666, -0.001179421553388238, -0.0010710444767028093, -0.0009626675164327025, -0.0008542904397472739, -0.0007459133630618453, -0.0006375362863764167, -0.0005291592096909881, -0.00042078219121322036, -0.00031240511452779174, -0.00020402803784236312, -9.565101936459541e-05, 1.2726057320833206e-05, 0.00012110336683690548, 0.00022948042897041887, 0.00033785749110393226, 0.0004462345386855304, 0.000554611615370959, 0.0006629886920563877, 0.0007713657105341554, 0.000879742787219584, 0.0009881198639050126, 0.0010964969405904412, 0.0012048740172758698, 0.0013132509775459766, 0.0014216280542314053, 0.0015300051309168339, 0.0016383822076022625, 0.0017467592842876911, 0.0018551363609731197, 0.0019635134376585484, 0.002071890514343977, 0.0021802675910294056, 0.002288644667714834, 0.002397021744400263, 0.0025053988210856915, 0.00261377589777112, 0.0027221529744565487, 0.0028305300511419773, 0.002938907127827406, 0.0030472842045128345, 0.003155661281198263, 0.003264038357883692, 0.0033724154345691204, 0.003480792511254549, 0.003589169355109334]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 8.0, 9.0, 25.0, 27.0, 32.0, 52.0, 95.0, 135.0, 190.0, 268.0, 390.0, 518.0, 852.0, 1159.0, 1757.0, 2440.0, 3566.0, 5164.0, 7436.0, 11020.0, 16069.0, 23347.0, 33470.0, 49360.0, 71329.0, 105119.0, 151347.0, 168666.0, 124409.0, 84688.0, 57937.0, 40098.0, 27339.0, 18832.0, 13134.0, 8858.0, 6038.0, 4257.0, 2844.0, 2019.0, 1383.0, 911.0, 604.0, 433.0, 315.0, 213.0, 140.0, 83.0, 60.0, 40.0, 22.0, 27.0, 11.0, 10.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0], "bins": [-0.0008578300476074219, -0.0008303523063659668, -0.0008028745651245117, -0.0007753968238830566, -0.0007479190826416016, -0.0007204413414001465, -0.0006929636001586914, -0.0006654858589172363, -0.0006380081176757812, -0.0006105303764343262, -0.0005830526351928711, -0.000555574893951416, -0.0005280971527099609, -0.0005006194114685059, -0.0004731416702270508, -0.0004456639289855957, -0.0004181861877441406, -0.00039070844650268555, -0.00036323070526123047, -0.0003357529640197754, -0.0003082752227783203, -0.00028079748153686523, -0.00025331974029541016, -0.00022584199905395508, -0.0001983642578125, -0.00017088651657104492, -0.00014340877532958984, -0.00011593103408813477, -8.845329284667969e-05, -6.097555160522461e-05, -3.349781036376953e-05, -6.020069122314453e-06, 2.1457672119140625e-05, 4.89354133605957e-05, 7.641315460205078e-05, 0.00010389089584350586, 0.00013136863708496094, 0.00015884637832641602, 0.0001863241195678711, 0.00021380186080932617, 0.00024127960205078125, 0.00026875734329223633, 0.0002962350845336914, 0.0003237128257751465, 0.00035119056701660156, 0.00037866830825805664, 0.0004061460494995117, 0.0004336237907409668, 0.0004611015319824219, 0.000488579273223877, 0.000516057014465332, 0.0005435347557067871, 0.0005710124969482422, 0.0005984902381896973, 0.0006259679794311523, 0.0006534457206726074, 0.0006809234619140625, 0.0007084012031555176, 0.0007358789443969727, 0.0007633566856384277, 0.0007908344268798828, 0.0008183121681213379, 0.000845789909362793, 0.000873267650604248, 0.0009007453918457031]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 7.0, 6.0, 13.0, 10.0, 8.0, 9.0, 11.0, 15.0, 15.0, 22.0, 24.0, 22.0, 14.0, 33.0, 35.0, 40.0, 27.0, 25.0, 37.0, 41.0, 44.0, 31.0, 44.0, 39.0, 35.0, 36.0, 39.0, 34.0, 38.0, 34.0, 21.0, 28.0, 20.0, 16.0, 25.0, 16.0, 15.0, 14.0, 8.0, 15.0, 9.0, 6.0, 7.0, 4.0, 6.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.003662109375, -0.0035542547702789307, -0.0034464001655578613, -0.003338545560836792, -0.0032306909561157227, -0.0031228363513946533, -0.003014981746673584, -0.0029071271419525146, -0.0027992725372314453, -0.002691417932510376, -0.0025835633277893066, -0.0024757087230682373, -0.002367854118347168, -0.0022599995136260986, -0.0021521449089050293, -0.00204429030418396, -0.0019364356994628906, -0.0018285810947418213, -0.001720726490020752, -0.0016128718852996826, -0.0015050172805786133, -0.001397162675857544, -0.0012893080711364746, -0.0011814534664154053, -0.001073598861694336, -0.0009657442569732666, -0.0008578896522521973, -0.0007500350475311279, -0.0006421804428100586, -0.0005343258380889893, -0.0004264712333679199, -0.0003186166286468506, -0.00021076202392578125, -0.00010290741920471191, 4.947185516357422e-06, 0.00011280179023742676, 0.0002206563949584961, 0.00032851099967956543, 0.00043636560440063477, 0.0005442202091217041, 0.0006520748138427734, 0.0007599294185638428, 0.0008677840232849121, 0.0009756386280059814, 0.0010834932327270508, 0.0011913478374481201, 0.0012992024421691895, 0.0014070570468902588, 0.0015149116516113281, 0.0016227662563323975, 0.0017306208610534668, 0.0018384754657745361, 0.0019463300704956055, 0.002054184675216675, 0.002162039279937744, 0.0022698938846588135, 0.002377748489379883, 0.002485603094100952, 0.0025934576988220215, 0.002701312303543091, 0.00280916690826416, 0.0029170215129852295, 0.003024876117706299, 0.003132730722427368, 0.0032405853271484375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 7.0, 8.0, 21.0, 31.0, 24.0, 39.0, 87.0, 126.0, 192.0, 274.0, 464.0, 668.0, 991.0, 1496.0, 2267.0, 3546.0, 5436.0, 8498.0, 13366.0, 21372.0, 34360.0, 55732.0, 93646.0, 168647.0, 257558.0, 153514.0, 86902.0, 52089.0, 31601.0, 20073.0, 12713.0, 8165.0, 5258.0, 3252.0, 2156.0, 1394.0, 857.0, 600.0, 400.0, 250.0, 146.0, 108.0, 70.0, 47.0, 40.0, 27.0, 11.0, 13.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010061264038085938, -0.0009730607271194458, -0.0009399950504302979, -0.0009069293737411499, -0.000873863697052002, -0.000840798020362854, -0.0008077323436737061, -0.0007746666669845581, -0.0007416009902954102, -0.0007085353136062622, -0.0006754696369171143, -0.0006424039602279663, -0.0006093382835388184, -0.0005762726068496704, -0.0005432069301605225, -0.0005101412534713745, -0.00047707557678222656, -0.0004440099000930786, -0.00041094422340393066, -0.0003778785467147827, -0.00034481287002563477, -0.0003117471933364868, -0.00027868151664733887, -0.0002456158399581909, -0.00021255016326904297, -0.00017948448657989502, -0.00014641880989074707, -0.00011335313320159912, -8.028745651245117e-05, -4.722177982330322e-05, -1.4156103134155273e-05, 1.8909573554992676e-05, 5.1975250244140625e-05, 8.504092693328857e-05, 0.00011810660362243652, 0.00015117228031158447, 0.00018423795700073242, 0.00021730363368988037, 0.0002503693103790283, 0.00028343498706817627, 0.0003165006637573242, 0.00034956634044647217, 0.0003826320171356201, 0.00041569769382476807, 0.000448763370513916, 0.00048182904720306396, 0.0005148947238922119, 0.0005479604005813599, 0.0005810260772705078, 0.0006140917539596558, 0.0006471574306488037, 0.0006802231073379517, 0.0007132887840270996, 0.0007463544607162476, 0.0007794201374053955, 0.0008124858140945435, 0.0008455514907836914, 0.0008786171674728394, 0.0009116828441619873, 0.0009447485208511353, 0.0009778141975402832, 0.0010108798742294312, 0.001043945550918579, 0.001077011227607727, 0.001110076904296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 8.0, 7.0, 11.0, 10.0, 14.0, 17.0, 24.0, 26.0, 27.0, 28.0, 24.0, 27.0, 28.0, 31.0, 34.0, 40.0, 36.0, 32.0, 41.0, 36.0, 38.0, 41.0, 44.0, 43.0, 25.0, 32.0, 35.0, 20.0, 27.0, 27.0, 32.0, 23.0, 16.0, 16.0, 13.0, 13.0, 7.0, 8.0, 8.0, 8.0, 2.0, 2.0, 5.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0022640228271484375, -0.0021918118000030518, -0.002119600772857666, -0.0020473897457122803, -0.0019751787185668945, -0.0019029676914215088, -0.001830756664276123, -0.0017585456371307373, -0.0016863346099853516, -0.0016141235828399658, -0.00154191255569458, -0.0014697015285491943, -0.0013974905014038086, -0.0013252794742584229, -0.0012530684471130371, -0.0011808574199676514, -0.0011086463928222656, -0.0010364353656768799, -0.0009642243385314941, -0.0008920133113861084, -0.0008198022842407227, -0.0007475912570953369, -0.0006753802299499512, -0.0006031692028045654, -0.0005309581756591797, -0.00045874714851379395, -0.0003865361213684082, -0.00031432509422302246, -0.00024211406707763672, -0.00016990303993225098, -9.769201278686523e-05, -2.5480985641479492e-05, 4.673004150390625e-05, 0.00011894106864929199, 0.00019115209579467773, 0.0002633631229400635, 0.0003355741500854492, 0.00040778517723083496, 0.0004799962043762207, 0.0005522072315216064, 0.0006244182586669922, 0.0006966292858123779, 0.0007688403129577637, 0.0008410513401031494, 0.0009132623672485352, 0.000985473394393921, 0.0010576844215393066, 0.0011298954486846924, 0.0012021064758300781, 0.0012743175029754639, 0.0013465285301208496, 0.0014187395572662354, 0.001490950584411621, 0.0015631616115570068, 0.0016353726387023926, 0.0017075836658477783, 0.001779794692993164, 0.0018520057201385498, 0.0019242167472839355, 0.0019964277744293213, 0.002068638801574707, 0.0021408498287200928, 0.0022130608558654785, 0.0022852718830108643, 0.00235748291015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 7.0, 9.0, 10.0, 15.0, 22.0, 22.0, 47.0, 62.0, 89.0, 128.0, 175.0, 241.0, 376.0, 561.0, 894.0, 1472.0, 2459.0, 4137.0, 7450.0, 14150.0, 31050.0, 82328.0, 365120.0, 388665.0, 83406.0, 32400.0, 15035.0, 7543.0, 4093.0, 2386.0, 1474.0, 930.0, 593.0, 387.0, 240.0, 151.0, 133.0, 75.0, 63.0, 33.0, 40.0, 29.0, 16.0, 16.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.432699203491211e-05, -7.193069905042648e-05, -6.953440606594086e-05, -6.713811308145523e-05, -6.47418200969696e-05, -6.234552711248398e-05, -5.994923412799835e-05, -5.7552941143512726e-05, -5.51566481590271e-05, -5.2760355174541473e-05, -5.036406219005585e-05, -4.796776920557022e-05, -4.5571476221084595e-05, -4.317518323659897e-05, -4.077889025211334e-05, -3.8382597267627716e-05, -3.598630428314209e-05, -3.3590011298656464e-05, -3.119371831417084e-05, -2.879742532968521e-05, -2.6401132345199585e-05, -2.400483936071396e-05, -2.1608546376228333e-05, -1.9212253391742706e-05, -1.681596040725708e-05, -1.4419667422771454e-05, -1.2023374438285828e-05, -9.627081453800201e-06, -7.230788469314575e-06, -4.834495484828949e-06, -2.4382025003433228e-06, -4.190951585769653e-08, 2.3543834686279297e-06, 4.750676453113556e-06, 7.146969437599182e-06, 9.543262422084808e-06, 1.1939555406570435e-05, 1.433584839105606e-05, 1.6732141375541687e-05, 1.9128434360027313e-05, 2.152472734451294e-05, 2.3921020328998566e-05, 2.6317313313484192e-05, 2.8713606297969818e-05, 3.1109899282455444e-05, 3.350619226694107e-05, 3.59024852514267e-05, 3.829877823591232e-05, 4.069507122039795e-05, 4.3091364204883575e-05, 4.54876571893692e-05, 4.788395017385483e-05, 5.0280243158340454e-05, 5.267653614282608e-05, 5.5072829127311707e-05, 5.746912211179733e-05, 5.986541509628296e-05, 6.226170808076859e-05, 6.465800106525421e-05, 6.705429404973984e-05, 6.945058703422546e-05, 7.184688001871109e-05, 7.424317300319672e-05, 7.663946598768234e-05, 7.903575897216797e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 14.0, 5.0, 12.0, 19.0, 24.0, 17.0, 26.0, 27.0, 28.0, 31.0, 41.0, 55.0, 38.0, 40.0, 68.0, 66.0, 69.0, 51.0, 53.0, 41.0, 42.0, 42.0, 19.0, 28.0, 19.0, 20.0, 18.0, 17.0, 13.0, 11.0, 6.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-1.138448715209961e-05, -1.1052936315536499e-05, -1.0721385478973389e-05, -1.0389834642410278e-05, -1.0058283805847168e-05, -9.726732969284058e-06, -9.395182132720947e-06, -9.063631296157837e-06, -8.732080459594727e-06, -8.400529623031616e-06, -8.068978786468506e-06, -7.737427949905396e-06, -7.405877113342285e-06, -7.074326276779175e-06, -6.7427754402160645e-06, -6.411224603652954e-06, -6.079673767089844e-06, -5.748122930526733e-06, -5.416572093963623e-06, -5.085021257400513e-06, -4.753470420837402e-06, -4.421919584274292e-06, -4.090368747711182e-06, -3.7588179111480713e-06, -3.427267074584961e-06, -3.0957162380218506e-06, -2.7641654014587402e-06, -2.43261456489563e-06, -2.1010637283325195e-06, -1.7695128917694092e-06, -1.4379620552062988e-06, -1.1064112186431885e-06, -7.748603820800781e-07, -4.4330954551696777e-07, -1.1175870895385742e-07, 2.1979212760925293e-07, 5.513429641723633e-07, 8.828938007354736e-07, 1.214444637298584e-06, 1.5459954738616943e-06, 1.8775463104248047e-06, 2.209097146987915e-06, 2.5406479835510254e-06, 2.8721988201141357e-06, 3.203749656677246e-06, 3.5353004932403564e-06, 3.866851329803467e-06, 4.198402166366577e-06, 4.5299530029296875e-06, 4.861503839492798e-06, 5.193054676055908e-06, 5.5246055126190186e-06, 5.856156349182129e-06, 6.187707185745239e-06, 6.51925802230835e-06, 6.85080885887146e-06, 7.18235969543457e-06, 7.513910531997681e-06, 7.845461368560791e-06, 8.177012205123901e-06, 8.508563041687012e-06, 8.840113878250122e-06, 9.171664714813232e-06, 9.503215551376343e-06, 9.834766387939453e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 8.0, 17.0, 15.0, 44.0, 68.0, 99.0, 177.0, 327.0, 617.0, 1177.0, 2390.0, 4974.0, 11774.0, 30558.0, 98163.0, 484291.0, 303780.0, 69680.0, 23156.0, 9192.0, 4004.0, 1872.0, 916.0, 524.0, 277.0, 165.0, 95.0, 49.0, 40.0, 28.0, 13.0, 14.0, 3.0, 6.0, 7.0, 1.0, 4.0, 6.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.00011742115020751953, -0.00011414662003517151, -0.00011087208986282349, -0.00010759755969047546, -0.00010432302951812744, -0.00010104849934577942, -9.77739691734314e-05, -9.449943900108337e-05, -9.122490882873535e-05, -8.795037865638733e-05, -8.46758484840393e-05, -8.140131831169128e-05, -7.812678813934326e-05, -7.485225796699524e-05, -7.157772779464722e-05, -6.83031976222992e-05, -6.502866744995117e-05, -6.175413727760315e-05, -5.847960710525513e-05, -5.5205076932907104e-05, -5.193054676055908e-05, -4.865601658821106e-05, -4.538148641586304e-05, -4.2106956243515015e-05, -3.883242607116699e-05, -3.555789589881897e-05, -3.228336572647095e-05, -2.9008835554122925e-05, -2.5734305381774902e-05, -2.245977520942688e-05, -1.9185245037078857e-05, -1.5910714864730835e-05, -1.2636184692382812e-05, -9.36165452003479e-06, -6.087124347686768e-06, -2.812594175338745e-06, 4.6193599700927734e-07, 3.7364661693573e-06, 7.010996341705322e-06, 1.0285526514053345e-05, 1.3560056686401367e-05, 1.683458685874939e-05, 2.0109117031097412e-05, 2.3383647203445435e-05, 2.6658177375793457e-05, 2.993270754814148e-05, 3.32072377204895e-05, 3.6481767892837524e-05, 3.975629806518555e-05, 4.303082823753357e-05, 4.630535840988159e-05, 4.9579888582229614e-05, 5.285441875457764e-05, 5.612894892692566e-05, 5.940347909927368e-05, 6.26780092716217e-05, 6.595253944396973e-05, 6.922706961631775e-05, 7.250159978866577e-05, 7.57761299610138e-05, 7.905066013336182e-05, 8.232519030570984e-05, 8.559972047805786e-05, 8.887425065040588e-05, 9.21487808227539e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 8.0, 5.0, 2.0, 2.0, 5.0, 7.0, 11.0, 12.0, 16.0, 19.0, 23.0, 21.0, 28.0, 48.0, 44.0, 62.0, 83.0, 79.0, 99.0, 62.0, 53.0, 54.0, 57.0, 34.0, 28.0, 30.0, 26.0, 16.0, 16.0, 5.0, 10.0, 8.0, 7.0, 3.0, 6.0, 6.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.7642974853515625e-05, -1.7142854630947113e-05, -1.66427344083786e-05, -1.614261418581009e-05, -1.5642493963241577e-05, -1.5142373740673065e-05, -1.4642253518104553e-05, -1.4142133295536041e-05, -1.364201307296753e-05, -1.3141892850399017e-05, -1.2641772627830505e-05, -1.2141652405261993e-05, -1.1641532182693481e-05, -1.114141196012497e-05, -1.0641291737556458e-05, -1.0141171514987946e-05, -9.641051292419434e-06, -9.140931069850922e-06, -8.64081084728241e-06, -8.140690624713898e-06, -7.640570402145386e-06, -7.140450179576874e-06, -6.640329957008362e-06, -6.14020973443985e-06, -5.640089511871338e-06, -5.139969289302826e-06, -4.639849066734314e-06, -4.139728844165802e-06, -3.63960862159729e-06, -3.139488399028778e-06, -2.639368176460266e-06, -2.139247953891754e-06, -1.6391277313232422e-06, -1.1390075087547302e-06, -6.388872861862183e-07, -1.387670636177063e-07, 3.6135315895080566e-07, 8.614733815193176e-07, 1.3615936040878296e-06, 1.8617138266563416e-06, 2.3618340492248535e-06, 2.8619542717933655e-06, 3.3620744943618774e-06, 3.862194716930389e-06, 4.362314939498901e-06, 4.862435162067413e-06, 5.362555384635925e-06, 5.862675607204437e-06, 6.362795829772949e-06, 6.862916052341461e-06, 7.363036274909973e-06, 7.863156497478485e-06, 8.363276720046997e-06, 8.863396942615509e-06, 9.363517165184021e-06, 9.863637387752533e-06, 1.0363757610321045e-05, 1.0863877832889557e-05, 1.1363998055458069e-05, 1.186411827802658e-05, 1.2364238500595093e-05, 1.2864358723163605e-05, 1.3364478945732117e-05, 1.3864599168300629e-05, 1.436471939086914e-05]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 9.0, 5.0, 10.0, 15.0, 16.0, 24.0, 28.0, 48.0, 34.0, 62.0, 74.0, 102.0, 112.0, 102.0, 85.0, 73.0, 47.0, 38.0, 27.0, 19.0, 14.0, 10.0, 6.0, 5.0, 12.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005620893556624651, -0.005422908812761307, -0.005224923603236675, -0.005026938393712044, -0.0048289536498487, -0.004630968905985355, -0.004432983696460724, -0.004234998486936092, -0.004037013743072748, -0.0038390287663787603, -0.0036410437896847725, -0.0034430588129907846, -0.003245073836296797, -0.003047088859602809, -0.002849103882908821, -0.0026511189062148333, -0.0024531339295208454, -0.0022551489528268576, -0.0020571639761328697, -0.0018591789994388819, -0.001661194022744894, -0.0014632090460509062, -0.0012652240693569183, -0.0010672390926629305, -0.0008692541159689426, -0.0006712691392749548, -0.00047328416258096695, -0.0002752991858869791, -7.731420919299126e-05, 0.00012067076750099659, 0.00031865574419498444, 0.0005166407208889723, 0.0007146256975829601, 0.000912610674276948, 0.0011105956509709358, 0.0013085806276649237, 0.0015065656043589115, 0.0017045505810528994, 0.0019025355577468872, 0.002100520534440875, 0.002298505511134863, 0.0024964904878288507, 0.0026944754645228386, 0.0028924604412168264, 0.0030904454179108143, 0.003288430394604802, 0.00348641537129879, 0.003684400347992778, 0.0038823853246867657, 0.00408037006855011, 0.004278355278074741, 0.004476340487599373, 0.004674325231462717, 0.004872309975326061, 0.005070295184850693, 0.005268280394375324, 0.0054662651382386684, 0.005664249882102013, 0.005862235091626644, 0.006060220301151276, 0.00625820504501462, 0.006456189788877964, 0.0066541749984025955, 0.006852160207927227, 0.007050144951790571]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 10.0, 7.0, 8.0, 16.0, 14.0, 14.0, 13.0, 10.0, 22.0, 17.0, 20.0, 29.0, 29.0, 36.0, 33.0, 26.0, 32.0, 37.0, 39.0, 48.0, 40.0, 37.0, 43.0, 41.0, 42.0, 33.0, 31.0, 31.0, 32.0, 36.0, 25.0, 21.0, 26.0, 19.0, 10.0, 15.0, 11.0, 13.0, 12.0, 7.0, 7.0, 6.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0033098396379500628, -0.003202778287231922, -0.0030957169365137815, -0.002988655585795641, -0.0028815942350775003, -0.0027745328843593597, -0.002667471533641219, -0.0025604101829230785, -0.002453348832204938, -0.0023462874814867973, -0.0022392261307686567, -0.002132164780050516, -0.0020251034293323755, -0.001918042078614235, -0.0018109807278960943, -0.0017039193771779537, -0.0015968580264598131, -0.0014897966757416725, -0.001382735325023532, -0.0012756739743053913, -0.0011686126235872507, -0.00106155127286911, -0.0009544899221509695, -0.0008474285714328289, -0.0007403672207146883, -0.0006333058699965477, -0.0005262445192784071, -0.0004191831685602665, -0.0003121218178421259, -0.0002050604671239853, -9.799911640584469e-05, 9.062234312295914e-06, 0.00011612358503043652, 0.00022318493574857712, 0.0003302462864667177, 0.0004373076371848583, 0.0005443689879029989, 0.0006514303386211395, 0.0007584916893392801, 0.0008655530400574207, 0.0009726143907755613, 0.001079675741493702, 0.0011867370922118425, 0.0012937984429299831, 0.0014008597936481237, 0.0015079211443662643, 0.001614982495084405, 0.0017220438458025455, 0.0018291051965206861, 0.0019361665472388268, 0.0020432278979569674, 0.002150289248675108, 0.0022573505993932486, 0.002364411950111389, 0.0024714733008295298, 0.0025785346515476704, 0.002685596002265811, 0.0027926573529839516, 0.002899718703702092, 0.0030067800544202328, 0.0031138414051383734, 0.003220902755856514, 0.0033279641065746546, 0.003435025457292795, 0.003542086808010936]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 8.0, 10.0, 7.0, 12.0, 23.0, 32.0, 53.0, 66.0, 83.0, 138.0, 185.0, 290.0, 460.0, 724.0, 1196.0, 2016.0, 3828.0, 7656.0, 16152.0, 38703.0, 106932.0, 346202.0, 345207.0, 107027.0, 38464.0, 16306.0, 7576.0, 3859.0, 2061.0, 1200.0, 717.0, 472.0, 290.0, 183.0, 133.0, 87.0, 44.0, 47.0, 35.0, 33.0, 21.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01367950439453125, -0.013207793235778809, -0.012736082077026367, -0.012264370918273926, -0.011792659759521484, -0.011320948600769043, -0.010849237442016602, -0.01037752628326416, -0.009905815124511719, -0.009434103965759277, -0.008962392807006836, -0.008490681648254395, -0.008018970489501953, -0.007547259330749512, -0.00707554817199707, -0.006603837013244629, -0.0061321258544921875, -0.005660414695739746, -0.005188703536987305, -0.004716992378234863, -0.004245281219482422, -0.0037735700607299805, -0.003301858901977539, -0.0028301477432250977, -0.0023584365844726562, -0.0018867254257202148, -0.0014150142669677734, -0.000943303108215332, -0.0004715919494628906, 1.1920928955078125e-07, 0.0004718303680419922, 0.0009435415267944336, 0.001415252685546875, 0.0018869638442993164, 0.002358675003051758, 0.0028303861618041992, 0.0033020973205566406, 0.003773808479309082, 0.0042455196380615234, 0.004717230796813965, 0.005188941955566406, 0.005660653114318848, 0.006132364273071289, 0.0066040754318237305, 0.007075786590576172, 0.007547497749328613, 0.008019208908081055, 0.008490920066833496, 0.008962631225585938, 0.009434342384338379, 0.00990605354309082, 0.010377764701843262, 0.010849475860595703, 0.011321187019348145, 0.011792898178100586, 0.012264609336853027, 0.012736320495605469, 0.01320803165435791, 0.013679742813110352, 0.014151453971862793, 0.014623165130615234, 0.015094876289367676, 0.015566587448120117, 0.01603829860687256, 0.016510009765625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 10.0, 7.0, 9.0, 15.0, 9.0, 18.0, 16.0, 18.0, 20.0, 23.0, 24.0, 38.0, 32.0, 41.0, 33.0, 46.0, 43.0, 69.0, 55.0, 48.0, 43.0, 55.0, 40.0, 39.0, 30.0, 43.0, 22.0, 28.0, 21.0, 23.0, 17.0, 18.0, 11.0, 13.0, 10.0, 8.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0029697418212890625, -0.0028857290744781494, -0.0028017163276672363, -0.0027177035808563232, -0.00263369083404541, -0.002549678087234497, -0.002465665340423584, -0.002381652593612671, -0.002297639846801758, -0.0022136270999908447, -0.0021296143531799316, -0.0020456016063690186, -0.0019615888595581055, -0.0018775761127471924, -0.0017935633659362793, -0.0017095506191253662, -0.0016255378723144531, -0.00154152512550354, -0.001457512378692627, -0.0013734996318817139, -0.0012894868850708008, -0.0012054741382598877, -0.0011214613914489746, -0.0010374486446380615, -0.0009534358978271484, -0.0008694231510162354, -0.0007854104042053223, -0.0007013976573944092, -0.0006173849105834961, -0.000533372163772583, -0.0004493594169616699, -0.00036534667015075684, -0.00028133392333984375, -0.00019732117652893066, -0.00011330842971801758, -2.9295682907104492e-05, 5.4717063903808594e-05, 0.00013872981071472168, 0.00022274255752563477, 0.00030675530433654785, 0.00039076805114746094, 0.000474780797958374, 0.0005587935447692871, 0.0006428062915802002, 0.0007268190383911133, 0.0008108317852020264, 0.0008948445320129395, 0.0009788572788238525, 0.0010628700256347656, 0.0011468827724456787, 0.0012308955192565918, 0.0013149082660675049, 0.001398921012878418, 0.001482933759689331, 0.0015669465065002441, 0.0016509592533111572, 0.0017349720001220703, 0.0018189847469329834, 0.0019029974937438965, 0.0019870102405548096, 0.0020710229873657227, 0.0021550357341766357, 0.002239048480987549, 0.002323061227798462, 0.002407073974609375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 9.0, 10.0, 18.0, 19.0, 32.0, 47.0, 51.0, 82.0, 143.0, 203.0, 419.0, 601.0, 999.0, 1650.0, 2615.0, 4601.0, 7919.0, 14037.0, 26093.0, 51140.0, 105364.0, 234314.0, 302978.0, 148633.0, 68582.0, 34817.0, 18426.0, 10249.0, 5765.0, 3415.0, 1983.0, 1219.0, 759.0, 491.0, 307.0, 176.0, 130.0, 74.0, 44.0, 38.0, 17.0, 21.0, 17.0, 9.0, 9.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.008544921875, -0.008287668228149414, -0.008030414581298828, -0.007773160934448242, -0.007515907287597656, -0.00725865364074707, -0.007001399993896484, -0.0067441463470458984, -0.0064868927001953125, -0.0062296390533447266, -0.005972385406494141, -0.005715131759643555, -0.005457878112792969, -0.005200624465942383, -0.004943370819091797, -0.004686117172241211, -0.004428863525390625, -0.004171609878540039, -0.003914356231689453, -0.003657102584838867, -0.0033998489379882812, -0.0031425952911376953, -0.0028853416442871094, -0.0026280879974365234, -0.0023708343505859375, -0.0021135807037353516, -0.0018563270568847656, -0.0015990734100341797, -0.0013418197631835938, -0.0010845661163330078, -0.0008273124694824219, -0.0005700588226318359, -0.00031280517578125, -5.555152893066406e-05, 0.00020170211791992188, 0.0004589557647705078, 0.0007162094116210938, 0.0009734630584716797, 0.0012307167053222656, 0.0014879703521728516, 0.0017452239990234375, 0.0020024776458740234, 0.0022597312927246094, 0.0025169849395751953, 0.0027742385864257812, 0.003031492233276367, 0.003288745880126953, 0.003545999526977539, 0.003803253173828125, 0.004060506820678711, 0.004317760467529297, 0.004575014114379883, 0.004832267761230469, 0.005089521408081055, 0.005346775054931641, 0.0056040287017822266, 0.0058612823486328125, 0.0061185359954833984, 0.006375789642333984, 0.00663304328918457, 0.006890296936035156, 0.007147550582885742, 0.007404804229736328, 0.007662057876586914, 0.0079193115234375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 2.0, 10.0, 11.0, 10.0, 16.0, 13.0, 14.0, 26.0, 14.0, 27.0, 32.0, 37.0, 33.0, 34.0, 40.0, 50.0, 53.0, 49.0, 63.0, 52.0, 36.0, 41.0, 57.0, 46.0, 24.0, 33.0, 28.0, 24.0, 22.0, 17.0, 17.0, 12.0, 9.0, 13.0, 7.0, 3.0, 4.0, 5.0, 2.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00222015380859375, -0.002146512269973755, -0.0020728707313537598, -0.0019992291927337646, -0.0019255876541137695, -0.0018519461154937744, -0.0017783045768737793, -0.0017046630382537842, -0.001631021499633789, -0.001557379961013794, -0.0014837384223937988, -0.0014100968837738037, -0.0013364553451538086, -0.0012628138065338135, -0.0011891722679138184, -0.0011155307292938232, -0.0010418891906738281, -0.000968247652053833, -0.0008946061134338379, -0.0008209645748138428, -0.0007473230361938477, -0.0006736814975738525, -0.0006000399589538574, -0.0005263984203338623, -0.0004527568817138672, -0.00037911534309387207, -0.00030547380447387695, -0.00023183226585388184, -0.00015819072723388672, -8.45491886138916e-05, -1.0907649993896484e-05, 6.273388862609863e-05, 0.00013637542724609375, 0.00021001696586608887, 0.000283658504486084, 0.0003573000431060791, 0.0004309415817260742, 0.0005045831203460693, 0.0005782246589660645, 0.0006518661975860596, 0.0007255077362060547, 0.0007991492748260498, 0.0008727908134460449, 0.00094643235206604, 0.0010200738906860352, 0.0010937154293060303, 0.0011673569679260254, 0.0012409985065460205, 0.0013146400451660156, 0.0013882815837860107, 0.0014619231224060059, 0.001535564661026001, 0.001609206199645996, 0.0016828477382659912, 0.0017564892768859863, 0.0018301308155059814, 0.0019037723541259766, 0.0019774138927459717, 0.002051055431365967, 0.002124696969985962, 0.002198338508605957, 0.002271980047225952, 0.0023456215858459473, 0.0024192631244659424, 0.0024929046630859375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 10.0, 5.0, 13.0, 20.0, 20.0, 20.0, 31.0, 48.0, 76.0, 96.0, 118.0, 202.0, 312.0, 475.0, 739.0, 1193.0, 1901.0, 3270.0, 5590.0, 10227.0, 21187.0, 75477.0, 842794.0, 46843.0, 16856.0, 8677.0, 4836.0, 2736.0, 1658.0, 1095.0, 619.0, 429.0, 316.0, 203.0, 118.0, 99.0, 71.0, 56.0, 31.0, 26.0, 15.0, 11.0, 16.0, 3.0, 9.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.008209228515625, -0.007970333099365234, -0.007731437683105469, -0.007492542266845703, -0.0072536468505859375, -0.007014751434326172, -0.006775856018066406, -0.006536960601806641, -0.006298065185546875, -0.006059169769287109, -0.005820274353027344, -0.005581378936767578, -0.0053424835205078125, -0.005103588104248047, -0.004864692687988281, -0.004625797271728516, -0.00438690185546875, -0.004148006439208984, -0.003909111022949219, -0.003670215606689453, -0.0034313201904296875, -0.003192424774169922, -0.0029535293579101562, -0.0027146339416503906, -0.002475738525390625, -0.0022368431091308594, -0.0019979476928710938, -0.0017590522766113281, -0.0015201568603515625, -0.0012812614440917969, -0.0010423660278320312, -0.0008034706115722656, -0.0005645751953125, -0.0003256797790527344, -8.678436279296875e-05, 0.00015211105346679688, 0.0003910064697265625, 0.0006299018859863281, 0.0008687973022460938, 0.0011076927185058594, 0.001346588134765625, 0.0015854835510253906, 0.0018243789672851562, 0.002063274383544922, 0.0023021697998046875, 0.002541065216064453, 0.0027799606323242188, 0.0030188560485839844, 0.00325775146484375, 0.0034966468811035156, 0.0037355422973632812, 0.003974437713623047, 0.0042133331298828125, 0.004452228546142578, 0.004691123962402344, 0.004930019378662109, 0.005168914794921875, 0.005407810211181641, 0.005646705627441406, 0.005885601043701172, 0.0061244964599609375, 0.006363391876220703, 0.006602287292480469, 0.006841182708740234, 0.007080078125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 3.0, 7.0, 17.0, 13.0, 22.0, 29.0, 30.0, 63.0, 91.0, 133.0, 197.0, 127.0, 76.0, 48.0, 46.0, 19.0, 23.0, 12.0, 10.0, 8.0, 5.0, 8.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0967254638671875e-05, -1.0591931641101837e-05, -1.02166086435318e-05, -9.841285645961761e-06, -9.465962648391724e-06, -9.090639650821686e-06, -8.715316653251648e-06, -8.33999365568161e-06, -7.964670658111572e-06, -7.5893476605415344e-06, -7.214024662971497e-06, -6.838701665401459e-06, -6.463378667831421e-06, -6.088055670261383e-06, -5.712732672691345e-06, -5.337409675121307e-06, -4.9620866775512695e-06, -4.586763679981232e-06, -4.211440682411194e-06, -3.836117684841156e-06, -3.460794687271118e-06, -3.0854716897010803e-06, -2.7101486921310425e-06, -2.3348256945610046e-06, -1.959502696990967e-06, -1.584179699420929e-06, -1.2088567018508911e-06, -8.335337042808533e-07, -4.5821070671081543e-07, -8.288770914077759e-08, 2.9243528842926025e-07, 6.677582859992981e-07, 1.043081283569336e-06, 1.4184042811393738e-06, 1.7937272787094116e-06, 2.1690502762794495e-06, 2.5443732738494873e-06, 2.919696271419525e-06, 3.295019268989563e-06, 3.670342266559601e-06, 4.045665264129639e-06, 4.4209882616996765e-06, 4.796311259269714e-06, 5.171634256839752e-06, 5.54695725440979e-06, 5.922280251979828e-06, 6.297603249549866e-06, 6.6729262471199036e-06, 7.048249244689941e-06, 7.423572242259979e-06, 7.798895239830017e-06, 8.174218237400055e-06, 8.549541234970093e-06, 8.92486423254013e-06, 9.300187230110168e-06, 9.675510227680206e-06, 1.0050833225250244e-05, 1.0426156222820282e-05, 1.080147922039032e-05, 1.1176802217960358e-05, 1.1552125215530396e-05, 1.1927448213100433e-05, 1.2302771210670471e-05, 1.2678094208240509e-05, 1.3053417205810547e-05]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 11.0, 16.0, 21.0, 30.0, 44.0, 86.0, 123.0, 222.0, 356.0, 650.0, 1309.0, 2810.0, 6645.0, 18462.0, 118408.0, 857127.0, 26315.0, 8732.0, 3645.0, 1688.0, 823.0, 408.0, 230.0, 149.0, 87.0, 61.0, 32.0, 23.0, 16.0, 3.0, 7.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01412200927734375, -0.013720273971557617, -0.013318538665771484, -0.012916803359985352, -0.012515068054199219, -0.012113332748413086, -0.011711597442626953, -0.01130986213684082, -0.010908126831054688, -0.010506391525268555, -0.010104656219482422, -0.009702920913696289, -0.009301185607910156, -0.008899450302124023, -0.00849771499633789, -0.008095979690551758, -0.007694244384765625, -0.007292509078979492, -0.006890773773193359, -0.0064890384674072266, -0.006087303161621094, -0.005685567855834961, -0.005283832550048828, -0.004882097244262695, -0.0044803619384765625, -0.00407862663269043, -0.003676891326904297, -0.003275156021118164, -0.0028734207153320312, -0.0024716854095458984, -0.0020699501037597656, -0.0016682147979736328, -0.0012664794921875, -0.0008647441864013672, -0.0004630088806152344, -6.127357482910156e-05, 0.00034046173095703125, 0.0007421970367431641, 0.0011439323425292969, 0.0015456676483154297, 0.0019474029541015625, 0.0023491382598876953, 0.002750873565673828, 0.003152608871459961, 0.0035543441772460938, 0.0039560794830322266, 0.004357814788818359, 0.004759550094604492, 0.005161285400390625, 0.005563020706176758, 0.005964756011962891, 0.0063664913177490234, 0.006768226623535156, 0.007169961929321289, 0.007571697235107422, 0.007973432540893555, 0.008375167846679688, 0.00877690315246582, 0.009178638458251953, 0.009580373764038086, 0.009982109069824219, 0.010383844375610352, 0.010785579681396484, 0.011187314987182617, 0.01158905029296875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 3.0, 9.0, 10.0, 9.0, 15.0, 20.0, 28.0, 111.0, 557.0, 108.0, 40.0, 15.0, 11.0, 10.0, 9.0, 2.0, 4.0, 4.0, 7.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0034160614013671875, -0.0033224523067474365, -0.0032288432121276855, -0.0031352341175079346, -0.0030416250228881836, -0.0029480159282684326, -0.0028544068336486816, -0.0027607977390289307, -0.0026671886444091797, -0.0025735795497894287, -0.0024799704551696777, -0.0023863613605499268, -0.0022927522659301758, -0.002199143171310425, -0.002105534076690674, -0.002011924982070923, -0.0019183158874511719, -0.001824706792831421, -0.00173109769821167, -0.001637488603591919, -0.001543879508972168, -0.001450270414352417, -0.001356661319732666, -0.001263052225112915, -0.001169443130493164, -0.001075834035873413, -0.0009822249412536621, -0.0008886158466339111, -0.0007950067520141602, -0.0007013976573944092, -0.0006077885627746582, -0.0005141794681549072, -0.00042057037353515625, -0.0003269612789154053, -0.0002333521842956543, -0.00013974308967590332, -4.6133995056152344e-05, 4.747509956359863e-05, 0.0001410841941833496, 0.00023469328880310059, 0.00032830238342285156, 0.00042191147804260254, 0.0005155205726623535, 0.0006091296672821045, 0.0007027387619018555, 0.0007963478565216064, 0.0008899569511413574, 0.0009835660457611084, 0.0010771751403808594, 0.0011707842350006104, 0.0012643933296203613, 0.0013580024242401123, 0.0014516115188598633, 0.0015452206134796143, 0.0016388297080993652, 0.0017324388027191162, 0.0018260478973388672, 0.0019196569919586182, 0.002013266086578369, 0.00210687518119812, 0.002200484275817871, 0.002294093370437622, 0.002387702465057373, 0.002481311559677124, 0.002574920654296875]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 16.0, 25.0, 115.0, 362.0, 309.0, 129.0, 44.0, 6.0, 5.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.04648544266819954, -0.045640118420124054, -0.04479479417204857, -0.043949466198682785, -0.0431041419506073, -0.042258817702531815, -0.04141349345445633, -0.040568165481090546, -0.03972284123301506, -0.038877516984939575, -0.03803219273686409, -0.037186864763498306, -0.03634154051542282, -0.035496216267347336, -0.03465089201927185, -0.03380556404590607, -0.03296024352312088, -0.032114919275045395, -0.03126959502696991, -0.030424268916249275, -0.02957894280552864, -0.028733618557453156, -0.02788829430937767, -0.027042968198657036, -0.0261976420879364, -0.025352317839860916, -0.02450699172914028, -0.023661667481064796, -0.022816341370344162, -0.021971017122268677, -0.02112569287419319, -0.020280366763472557, -0.019435040652751923, -0.018589716404676437, -0.017744390293955803, -0.016899066045880318, -0.016053739935159683, -0.015208415687084198, -0.014363090507686138, -0.013517765328288078, -0.012672440148890018, -0.011827114969491959, -0.010981789790093899, -0.010136464610695839, -0.009291140362620354, -0.00844581425189972, -0.007600490003824234, -0.006755164824426174, -0.005909839645028114, -0.0050645144656300545, -0.004219189286231995, -0.003373864572495222, -0.0025285393930971622, -0.0016832142136991024, -0.0008378894999623299, 7.4356794357299805e-06, 0.0008527608588337898, 0.0016980859218165278, 0.002543410984799266, 0.003388735931366682, 0.004234061110764742, 0.005079386290162802, 0.005924711003899574, 0.006770036183297634, 0.007615361362695694]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 9.0, 6.0, 12.0, 9.0, 10.0, 12.0, 13.0, 22.0, 33.0, 21.0, 24.0, 21.0, 28.0, 35.0, 40.0, 33.0, 43.0, 41.0, 38.0, 44.0, 39.0, 35.0, 41.0, 37.0, 33.0, 33.0, 21.0, 30.0, 27.0, 33.0, 25.0, 29.0, 20.0, 9.0, 10.0, 18.0, 20.0, 9.0, 11.0, 4.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002789224497973919, -0.0026965944562107325, -0.002603964414447546, -0.0025113343726843596, -0.002418704330921173, -0.0023260745219886303, -0.0022334442473948, -0.0021408144384622574, -0.002048184396699071, -0.0019555543549358845, -0.001862924313172698, -0.0017702942714095116, -0.001677664346061647, -0.0015850343042984605, -0.001492404262535274, -0.0013997743371874094, -0.0013071441790089011, -0.0012145141372457147, -0.0011218840954825282, -0.0010292541701346636, -0.0009366241283714771, -0.0008439940866082907, -0.0007513640448451042, -0.0006587340612895787, -0.0005661040195263922, -0.0004734740068670362, -0.0003808439942076802, -0.00028821395244449377, -0.00019558393978513777, -0.00010295392712578177, -1.032388536259532e-05, 8.230609819293022e-05, 0.00017493613995611668, 0.0002675661526154727, 0.00036019616527482867, 0.00045282620703801513, 0.0005454561905935407, 0.0006380862323567271, 0.0007307162741199136, 0.0008233462576754391, 0.0009159762994386256, 0.0010086062829941511, 0.0011012363247573376, 0.001193866366520524, 0.0012864964082837105, 0.001379126450046897, 0.0014717564918100834, 0.001564386417157948, 0.0016570164589211345, 0.001749646500684321, 0.0018422765424475074, 0.001934906467795372, 0.0020275365095585585, 0.002120166551321745, 0.0022127965930849314, 0.002305426634848118, 0.0023980566766113043, 0.0024906867183744907, 0.002583316760137677, 0.0026759468019008636, 0.00276857684366405, 0.0028612068854272366, 0.0029538366943597794, 0.003046466736122966, 0.0031390967778861523]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 14.0, 19.0, 19.0, 23.0, 33.0, 45.0, 64.0, 86.0, 133.0, 173.0, 237.0, 332.0, 527.0, 817.0, 1493.0, 3133.0, 8067.0, 24098.0, 79044.0, 332673.0, 2576536.0, 938577.0, 159443.0, 43238.0, 14375.0, 5409.0, 2357.0, 1150.0, 671.0, 434.0, 254.0, 219.0, 154.0, 115.0, 68.0, 74.0, 50.0, 35.0, 21.0, 19.0, 18.0, 11.0, 5.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.00772857666015625, -0.007506310939788818, -0.007284045219421387, -0.007061779499053955, -0.0068395137786865234, -0.006617248058319092, -0.00639498233795166, -0.0061727166175842285, -0.005950450897216797, -0.005728185176849365, -0.005505919456481934, -0.005283653736114502, -0.00506138801574707, -0.004839122295379639, -0.004616856575012207, -0.004394590854644775, -0.004172325134277344, -0.003950059413909912, -0.0037277936935424805, -0.003505527973175049, -0.003283262252807617, -0.0030609965324401855, -0.002838730812072754, -0.0026164650917053223, -0.0023941993713378906, -0.002171933650970459, -0.0019496679306030273, -0.0017274022102355957, -0.001505136489868164, -0.0012828707695007324, -0.0010606050491333008, -0.0008383393287658691, -0.0006160736083984375, -0.00039380788803100586, -0.00017154216766357422, 5.072355270385742e-05, 0.00027298927307128906, 0.0004952549934387207, 0.0007175207138061523, 0.000939786434173584, 0.0011620521545410156, 0.0013843178749084473, 0.001606583595275879, 0.0018288493156433105, 0.002051115036010742, 0.002273380756378174, 0.0024956464767456055, 0.002717912197113037, 0.0029401779174804688, 0.0031624436378479004, 0.003384709358215332, 0.0036069750785827637, 0.0038292407989501953, 0.004051506519317627, 0.004273772239685059, 0.00449603796005249, 0.004718303680419922, 0.0049405694007873535, 0.005162835121154785, 0.005385100841522217, 0.0056073665618896484, 0.00582963228225708, 0.006051898002624512, 0.006274163722991943, 0.006496429443359375]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 1.0, 5.0, 6.0, 11.0, 7.0, 10.0, 21.0, 15.0, 22.0, 15.0, 15.0, 28.0, 36.0, 30.0, 33.0, 51.0, 50.0, 49.0, 50.0, 39.0, 51.0, 39.0, 49.0, 62.0, 40.0, 36.0, 35.0, 21.0, 20.0, 23.0, 25.0, 21.0, 19.0, 15.0, 12.0, 9.0, 9.0, 5.0, 8.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003070831298828125, -0.0029752254486083984, -0.002879619598388672, -0.0027840137481689453, -0.0026884078979492188, -0.002592802047729492, -0.0024971961975097656, -0.002401590347290039, -0.0023059844970703125, -0.002210378646850586, -0.0021147727966308594, -0.002019166946411133, -0.0019235610961914062, -0.0018279552459716797, -0.0017323493957519531, -0.0016367435455322266, -0.0015411376953125, -0.0014455318450927734, -0.0013499259948730469, -0.0012543201446533203, -0.0011587142944335938, -0.0010631084442138672, -0.0009675025939941406, -0.0008718967437744141, -0.0007762908935546875, -0.0006806850433349609, -0.0005850791931152344, -0.0004894733428955078, -0.00039386749267578125, -0.0002982616424560547, -0.00020265579223632812, -0.00010704994201660156, -1.1444091796875e-05, 8.416175842285156e-05, 0.00017976760864257812, 0.0002753734588623047, 0.00037097930908203125, 0.0004665851593017578, 0.0005621910095214844, 0.0006577968597412109, 0.0007534027099609375, 0.0008490085601806641, 0.0009446144104003906, 0.0010402202606201172, 0.0011358261108398438, 0.0012314319610595703, 0.0013270378112792969, 0.0014226436614990234, 0.00151824951171875, 0.0016138553619384766, 0.0017094612121582031, 0.0018050670623779297, 0.0019006729125976562, 0.001996278762817383, 0.0020918846130371094, 0.002187490463256836, 0.0022830963134765625, 0.002378702163696289, 0.0024743080139160156, 0.002569913864135742, 0.0026655197143554688, 0.0027611255645751953, 0.002856731414794922, 0.0029523372650146484, 0.003047943115234375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 13.0, 17.0, 30.0, 76.0, 187.0, 599.0, 2434.0, 32553.0, 4131366.0, 24025.0, 2195.0, 492.0, 164.0, 51.0, 39.0, 13.0, 5.0, 6.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0303955078125, -0.028749465942382812, -0.027103424072265625, -0.025457382202148438, -0.02381134033203125, -0.022165298461914062, -0.020519256591796875, -0.018873214721679688, -0.0172271728515625, -0.015581130981445312, -0.013935089111328125, -0.012289047241210938, -0.01064300537109375, -0.008996963500976562, -0.007350921630859375, -0.0057048797607421875, -0.004058837890625, -0.0024127960205078125, -0.000766754150390625, 0.0008792877197265625, 0.00252532958984375, 0.0041713714599609375, 0.005817413330078125, 0.0074634552001953125, 0.0091094970703125, 0.010755538940429688, 0.012401580810546875, 0.014047622680664062, 0.01569366455078125, 0.017339706420898438, 0.018985748291015625, 0.020631790161132812, 0.02227783203125, 0.023923873901367188, 0.025569915771484375, 0.027215957641601562, 0.02886199951171875, 0.030508041381835938, 0.032154083251953125, 0.03380012512207031, 0.0354461669921875, 0.03709220886230469, 0.038738250732421875, 0.04038429260253906, 0.04203033447265625, 0.04367637634277344, 0.045322418212890625, 0.04696846008300781, 0.048614501953125, 0.05026054382324219, 0.051906585693359375, 0.05355262756347656, 0.05519866943359375, 0.05684471130371094, 0.058490753173828125, 0.06013679504394531, 0.0617828369140625, 0.06342887878417969, 0.06507492065429688, 0.06672096252441406, 0.06836700439453125, 0.07001304626464844, 0.07165908813476562, 0.07330513000488281, 0.074951171875]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 8.0, 10.0, 19.0, 55.0, 127.0, 233.0, 565.0, 1163.0, 1020.0, 455.0, 212.0, 98.0, 31.0, 25.0, 14.0, 6.0, 8.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00220489501953125, -0.002088308334350586, -0.001971721649169922, -0.0018551349639892578, -0.0017385482788085938, -0.0016219615936279297, -0.0015053749084472656, -0.0013887882232666016, -0.0012722015380859375, -0.0011556148529052734, -0.0010390281677246094, -0.0009224414825439453, -0.0008058547973632812, -0.0006892681121826172, -0.0005726814270019531, -0.00045609474182128906, -0.000339508056640625, -0.00022292137145996094, -0.00010633468627929688, 1.0251998901367188e-05, 0.00012683868408203125, 0.0002434253692626953, 0.0003600120544433594, 0.00047659873962402344, 0.0005931854248046875, 0.0007097721099853516, 0.0008263587951660156, 0.0009429454803466797, 0.0010595321655273438, 0.0011761188507080078, 0.0012927055358886719, 0.001409292221069336, 0.00152587890625, 0.001642465591430664, 0.0017590522766113281, 0.0018756389617919922, 0.0019922256469726562, 0.0021088123321533203, 0.0022253990173339844, 0.0023419857025146484, 0.0024585723876953125, 0.0025751590728759766, 0.0026917457580566406, 0.0028083324432373047, 0.0029249191284179688, 0.003041505813598633, 0.003158092498779297, 0.003274679183959961, 0.003391265869140625, 0.003507852554321289, 0.003624439239501953, 0.003741025924682617, 0.0038576126098632812, 0.003974199295043945, 0.004090785980224609, 0.0042073726654052734, 0.0043239593505859375, 0.0044405460357666016, 0.004557132720947266, 0.00467371940612793, 0.004790306091308594, 0.004906892776489258, 0.005023479461669922, 0.005140066146850586, 0.00525665283203125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 11.0, 19.0, 26.0, 45.0, 74.0, 100.0, 159.0, 187.0, 142.0, 89.0, 51.0, 30.0, 23.0, 20.0, 8.0, 5.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.013825763948261738, -0.01352679543197155, -0.013227826915681362, -0.012928859330713749, -0.012629890814423561, -0.012330922298133373, -0.012031953781843185, -0.011732986196875572, -0.011434017680585384, -0.011135049164295197, -0.010836080648005009, -0.010537113063037395, -0.010238144546747208, -0.00993917603045702, -0.009640207514166832, -0.009341239929199219, -0.009042270481586456, -0.008743301965296268, -0.00844433344900608, -0.008145365864038467, -0.00784639734774828, -0.007547428831458092, -0.007248460315167904, -0.006949492264539003, -0.006650524213910103, -0.006351555697619915, -0.0060525876469910145, -0.005753619130700827, -0.005454651080071926, -0.005155682563781738, -0.0048567140474915504, -0.00455774599686265, -0.004258777946233749, -0.0039598094299435616, -0.003660841379314661, -0.003361872863024473, -0.0030629048123955727, -0.002763936296105385, -0.0024649680126458406, -0.0021659997291862965, -0.0018670314457267523, -0.001568063162267208, -0.001269094878807664, -0.0009701264789327979, -0.0006711581954732537, -0.00037218991201370955, -7.322151213884354e-05, 0.00022574677132070065, 0.0005247150547802448, 0.000823683338239789, 0.0011226516216993332, 0.0014216200215741992, 0.0017205883050337434, 0.0020195567049086094, 0.0023185249883681536, 0.0026174932718276978, 0.002916461555287242, 0.003215429838746786, 0.0035143981222063303, 0.0038133664056658745, 0.004112334921956062, 0.004411302972584963, 0.004710271488875151, 0.005009239539504051, 0.005308208055794239]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 4.0, 11.0, 9.0, 11.0, 8.0, 16.0, 13.0, 19.0, 19.0, 25.0, 27.0, 27.0, 36.0, 36.0, 32.0, 47.0, 48.0, 38.0, 32.0, 42.0, 48.0, 35.0, 38.0, 33.0, 39.0, 38.0, 30.0, 40.0, 29.0, 25.0, 18.0, 15.0, 22.0, 15.0, 13.0, 16.0, 14.0, 6.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0035127419978380203, -0.003406031057238579, -0.0032993201166391373, -0.0031926091760396957, -0.003085898235440254, -0.0029791872948408127, -0.002872476354241371, -0.0027657654136419296, -0.002659054473042488, -0.0025523435324430466, -0.002445632591843605, -0.0023389216512441635, -0.002232210710644722, -0.0021254997700452805, -0.002018788829445839, -0.0019120778888463974, -0.0018053669482469559, -0.0016986560076475143, -0.0015919450670480728, -0.0014852341264486313, -0.0013785231858491898, -0.0012718122452497482, -0.0011651013046503067, -0.0010583903640508652, -0.0009516794234514236, -0.0008449684828519821, -0.0007382575422525406, -0.0006315466016530991, -0.0005248356610536575, -0.000418124720454216, -0.0003114137798547745, -0.00020470283925533295, -9.799189865589142e-05, 8.71904194355011e-06, 0.00011542998254299164, 0.00022214092314243317, 0.0003288518637418747, 0.0004355628043413162, 0.0005422737449407578, 0.0006489846855401993, 0.0007556956261396408, 0.0008624065667390823, 0.0009691175073385239, 0.0010758284479379654, 0.001182539388537407, 0.0012892503291368484, 0.00139596126973629, 0.0015026722103357315, 0.001609383150935173, 0.0017160940915346146, 0.001822805032134056, 0.0019295159727334976, 0.002036226913332939, 0.0021429378539323807, 0.002249648794531822, 0.0023563597351312637, 0.0024630706757307053, 0.002569781616330147, 0.0026764925569295883, 0.00278320349752903, 0.0028899144381284714, 0.002996625378727913, 0.0031033363193273544, 0.003210047259926796, 0.0033167582005262375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 7.0, 13.0, 31.0, 32.0, 57.0, 70.0, 95.0, 142.0, 220.0, 298.0, 428.0, 669.0, 902.0, 1431.0, 2069.0, 3096.0, 4643.0, 7245.0, 11085.0, 17461.0, 27462.0, 43798.0, 69259.0, 108777.0, 165389.0, 192670.0, 141173.0, 91269.0, 57729.0, 35990.0, 22900.0, 14508.0, 9334.0, 6116.0, 3939.0, 2703.0, 1761.0, 1207.0, 790.0, 534.0, 411.0, 279.0, 175.0, 126.0, 78.0, 65.0, 41.0, 18.0, 18.0, 8.0, 13.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0008416175842285156, -0.0008147284388542175, -0.0007878392934799194, -0.0007609501481056213, -0.0007340610027313232, -0.0007071718573570251, -0.000680282711982727, -0.000653393566608429, -0.0006265044212341309, -0.0005996152758598328, -0.0005727261304855347, -0.0005458369851112366, -0.0005189478397369385, -0.0004920586943626404, -0.0004651695489883423, -0.0004382804036140442, -0.0004113912582397461, -0.000384502112865448, -0.0003576129674911499, -0.0003307238221168518, -0.0003038346767425537, -0.0002769455313682556, -0.0002500563859939575, -0.00022316724061965942, -0.00019627809524536133, -0.00016938894987106323, -0.00014249980449676514, -0.00011561065912246704, -8.872151374816895e-05, -6.183236837387085e-05, -3.4943222999572754e-05, -8.054077625274658e-06, 1.8835067749023438e-05, 4.572421312332153e-05, 7.261335849761963e-05, 9.950250387191772e-05, 0.00012639164924621582, 0.00015328079462051392, 0.000180169939994812, 0.0002070590853691101, 0.0002339482307434082, 0.0002608373761177063, 0.0002877265214920044, 0.0003146156668663025, 0.0003415048122406006, 0.0003683939576148987, 0.0003952831029891968, 0.0004221722483634949, 0.00044906139373779297, 0.00047595053911209106, 0.0005028396844863892, 0.0005297288298606873, 0.0005566179752349854, 0.0005835071206092834, 0.0006103962659835815, 0.0006372854113578796, 0.0006641745567321777, 0.0006910637021064758, 0.0007179528474807739, 0.000744841992855072, 0.0007717311382293701, 0.0007986202836036682, 0.0008255094289779663, 0.0008523985743522644, 0.0008792877197265625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 7.0, 6.0, 8.0, 12.0, 9.0, 13.0, 15.0, 19.0, 18.0, 22.0, 32.0, 39.0, 37.0, 27.0, 34.0, 54.0, 46.0, 43.0, 43.0, 50.0, 40.0, 39.0, 33.0, 52.0, 38.0, 31.0, 35.0, 27.0, 32.0, 17.0, 26.0, 17.0, 15.0, 7.0, 14.0, 13.0, 9.0, 9.0, 4.0, 2.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0036563873291015625, -0.0035467445850372314, -0.0034371018409729004, -0.0033274590969085693, -0.0032178163528442383, -0.0031081736087799072, -0.002998530864715576, -0.002888888120651245, -0.002779245376586914, -0.002669602632522583, -0.002559959888458252, -0.002450317144393921, -0.00234067440032959, -0.002231031656265259, -0.0021213889122009277, -0.0020117461681365967, -0.0019021034240722656, -0.0017924606800079346, -0.0016828179359436035, -0.0015731751918792725, -0.0014635324478149414, -0.0013538897037506104, -0.0012442469596862793, -0.0011346042156219482, -0.0010249614715576172, -0.0009153187274932861, -0.0008056759834289551, -0.000696033239364624, -0.000586390495300293, -0.0004767477512359619, -0.00036710500717163086, -0.0002574622631072998, -0.00014781951904296875, -3.8176774978637695e-05, 7.146596908569336e-05, 0.00018110871315002441, 0.00029075145721435547, 0.0004003942012786865, 0.0005100369453430176, 0.0006196796894073486, 0.0007293224334716797, 0.0008389651775360107, 0.0009486079216003418, 0.0010582506656646729, 0.001167893409729004, 0.001277536153793335, 0.001387178897857666, 0.001496821641921997, 0.0016064643859863281, 0.0017161071300506592, 0.0018257498741149902, 0.0019353926181793213, 0.0020450353622436523, 0.0021546781063079834, 0.0022643208503723145, 0.0023739635944366455, 0.0024836063385009766, 0.0025932490825653076, 0.0027028918266296387, 0.0028125345706939697, 0.0029221773147583008, 0.003031820058822632, 0.003141462802886963, 0.003251105546951294, 0.003360748291015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 7.0, 10.0, 23.0, 35.0, 51.0, 72.0, 107.0, 145.0, 203.0, 361.0, 505.0, 835.0, 1305.0, 1908.0, 3128.0, 4836.0, 7818.0, 12291.0, 20443.0, 34084.0, 58917.0, 106589.0, 211586.0, 269001.0, 135320.0, 72262.0, 41924.0, 24561.0, 14839.0, 9242.0, 5742.0, 3705.0, 2340.0, 1507.0, 969.0, 586.0, 476.0, 283.0, 177.0, 132.0, 80.0, 59.0, 35.0, 18.0, 18.0, 1.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.001049041748046875, -0.0010174289345741272, -0.0009858161211013794, -0.0009542033076286316, -0.0009225904941558838, -0.000890977680683136, -0.0008593648672103882, -0.0008277520537376404, -0.0007961392402648926, -0.0007645264267921448, -0.000732913613319397, -0.0007013007998466492, -0.0006696879863739014, -0.0006380751729011536, -0.0006064623594284058, -0.000574849545955658, -0.0005432367324829102, -0.0005116239190101624, -0.00048001110553741455, -0.00044839829206466675, -0.00041678547859191895, -0.00038517266511917114, -0.00035355985164642334, -0.00032194703817367554, -0.00029033422470092773, -0.00025872141122817993, -0.00022710859775543213, -0.00019549578428268433, -0.00016388297080993652, -0.00013227015733718872, -0.00010065734386444092, -6.904453039169312e-05, -3.743171691894531e-05, -5.81890344619751e-06, 2.5793910026550293e-05, 5.7406723499298096e-05, 8.90195369720459e-05, 0.0001206323504447937, 0.0001522451639175415, 0.0001838579773902893, 0.0002154707908630371, 0.0002470836043357849, 0.0002786964178085327, 0.0003103092312812805, 0.0003419220447540283, 0.0003735348582267761, 0.0004051476716995239, 0.00043676048517227173, 0.00046837329864501953, 0.0004999861121177673, 0.0005315989255905151, 0.0005632117390632629, 0.0005948245525360107, 0.0006264373660087585, 0.0006580501794815063, 0.0006896629929542542, 0.000721275806427002, 0.0007528886198997498, 0.0007845014333724976, 0.0008161142468452454, 0.0008477270603179932, 0.000879339873790741, 0.0009109526872634888, 0.0009425655007362366, 0.0009741783142089844]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 14.0, 6.0, 10.0, 6.0, 12.0, 16.0, 13.0, 13.0, 16.0, 21.0, 16.0, 30.0, 28.0, 30.0, 23.0, 34.0, 41.0, 51.0, 47.0, 42.0, 44.0, 43.0, 30.0, 38.0, 54.0, 26.0, 33.0, 22.0, 36.0, 26.0, 28.0, 30.0, 18.0, 15.0, 15.0, 16.0, 14.0, 14.0, 6.0, 5.0, 4.0, 5.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.0021457672119140625, -0.002078711986541748, -0.0020116567611694336, -0.0019446015357971191, -0.0018775463104248047, -0.0018104910850524902, -0.0017434358596801758, -0.0016763806343078613, -0.0016093254089355469, -0.0015422701835632324, -0.001475214958190918, -0.0014081597328186035, -0.001341104507446289, -0.0012740492820739746, -0.0012069940567016602, -0.0011399388313293457, -0.0010728836059570312, -0.0010058283805847168, -0.0009387731552124023, -0.0008717179298400879, -0.0008046627044677734, -0.000737607479095459, -0.0006705522537231445, -0.0006034970283508301, -0.0005364418029785156, -0.00046938657760620117, -0.0004023313522338867, -0.00033527612686157227, -0.0002682209014892578, -0.00020116567611694336, -0.0001341104507446289, -6.705522537231445e-05, 0.0, 6.705522537231445e-05, 0.0001341104507446289, 0.00020116567611694336, 0.0002682209014892578, 0.00033527612686157227, 0.0004023313522338867, 0.00046938657760620117, 0.0005364418029785156, 0.0006034970283508301, 0.0006705522537231445, 0.000737607479095459, 0.0008046627044677734, 0.0008717179298400879, 0.0009387731552124023, 0.0010058283805847168, 0.0010728836059570312, 0.0011399388313293457, 0.0012069940567016602, 0.0012740492820739746, 0.001341104507446289, 0.0014081597328186035, 0.001475214958190918, 0.0015422701835632324, 0.0016093254089355469, 0.0016763806343078613, 0.0017434358596801758, 0.0018104910850524902, 0.0018775463104248047, 0.0019446015357971191, 0.0020116567611694336, 0.002078711986541748, 0.0021457672119140625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 7.0, 7.0, 5.0, 16.0, 19.0, 28.0, 34.0, 44.0, 71.0, 106.0, 154.0, 202.0, 347.0, 502.0, 765.0, 1191.0, 1991.0, 2922.0, 5034.0, 9098.0, 16340.0, 32885.0, 76533.0, 304526.0, 422246.0, 92097.0, 38759.0, 18256.0, 9688.0, 5540.0, 3373.0, 2026.0, 1241.0, 884.0, 516.0, 336.0, 238.0, 147.0, 118.0, 78.0, 66.0, 35.0, 33.0, 21.0, 8.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.799531936645508e-05, -5.6129880249500275e-05, -5.426444113254547e-05, -5.239900201559067e-05, -5.0533562898635864e-05, -4.866812378168106e-05, -4.680268466472626e-05, -4.4937245547771454e-05, -4.307180643081665e-05, -4.120636731386185e-05, -3.9340928196907043e-05, -3.747548907995224e-05, -3.5610049962997437e-05, -3.374461084604263e-05, -3.187917172908783e-05, -3.0013732612133026e-05, -2.8148293495178223e-05, -2.628285437822342e-05, -2.4417415261268616e-05, -2.2551976144313812e-05, -2.068653702735901e-05, -1.8821097910404205e-05, -1.6955658793449402e-05, -1.5090219676494598e-05, -1.3224780559539795e-05, -1.1359341442584991e-05, -9.493902325630188e-06, -7.6284632086753845e-06, -5.763024091720581e-06, -3.897584974765778e-06, -2.032145857810974e-06, -1.6670674085617065e-07, 1.6987323760986328e-06, 3.5641714930534363e-06, 5.42961061000824e-06, 7.295049726963043e-06, 9.160488843917847e-06, 1.102592796087265e-05, 1.2891367077827454e-05, 1.4756806194782257e-05, 1.662224531173706e-05, 1.8487684428691864e-05, 2.0353123545646667e-05, 2.221856266260147e-05, 2.4084001779556274e-05, 2.5949440896511078e-05, 2.781488001346588e-05, 2.9680319130420685e-05, 3.154575824737549e-05, 3.341119736433029e-05, 3.5276636481285095e-05, 3.71420755982399e-05, 3.90075147151947e-05, 4.0872953832149506e-05, 4.273839294910431e-05, 4.460383206605911e-05, 4.6469271183013916e-05, 4.833471029996872e-05, 5.020014941692352e-05, 5.2065588533878326e-05, 5.393102765083313e-05, 5.579646676778793e-05, 5.766190588474274e-05, 5.952734500169754e-05, 6.139278411865234e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 1.0, 5.0, 3.0, 5.0, 10.0, 8.0, 16.0, 5.0, 18.0, 18.0, 31.0, 21.0, 25.0, 37.0, 49.0, 54.0, 68.0, 36.0, 55.0, 53.0, 64.0, 59.0, 56.0, 46.0, 29.0, 34.0, 37.0, 34.0, 17.0, 23.0, 18.0, 14.0, 10.0, 7.0, 5.0, 3.0, 7.0, 7.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.775161743164062e-06, -9.482726454734802e-06, -9.190291166305542e-06, -8.897855877876282e-06, -8.605420589447021e-06, -8.312985301017761e-06, -8.020550012588501e-06, -7.72811472415924e-06, -7.4356794357299805e-06, -7.14324414730072e-06, -6.85080885887146e-06, -6.5583735704422e-06, -6.2659382820129395e-06, -5.973502993583679e-06, -5.681067705154419e-06, -5.388632416725159e-06, -5.0961971282958984e-06, -4.803761839866638e-06, -4.511326551437378e-06, -4.218891263008118e-06, -3.926455974578857e-06, -3.634020686149597e-06, -3.341585397720337e-06, -3.0491501092910767e-06, -2.7567148208618164e-06, -2.464279532432556e-06, -2.171844244003296e-06, -1.8794089555740356e-06, -1.5869736671447754e-06, -1.2945383787155151e-06, -1.0021030902862549e-06, -7.096678018569946e-07, -4.172325134277344e-07, -1.2479722499847412e-07, 1.6763806343078613e-07, 4.600733518600464e-07, 7.525086402893066e-07, 1.044943928718567e-06, 1.3373792171478271e-06, 1.6298145055770874e-06, 1.9222497940063477e-06, 2.214685082435608e-06, 2.507120370864868e-06, 2.7995556592941284e-06, 3.0919909477233887e-06, 3.384426236152649e-06, 3.676861524581909e-06, 3.9692968130111694e-06, 4.26173210144043e-06, 4.55416738986969e-06, 4.84660267829895e-06, 5.1390379667282104e-06, 5.431473255157471e-06, 5.723908543586731e-06, 6.016343832015991e-06, 6.3087791204452515e-06, 6.601214408874512e-06, 6.893649697303772e-06, 7.186084985733032e-06, 7.4785202741622925e-06, 7.770955562591553e-06, 8.063390851020813e-06, 8.355826139450073e-06, 8.648261427879333e-06, 8.940696716308594e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 6.0, 5.0, 9.0, 17.0, 24.0, 38.0, 65.0, 214.0, 1132.0, 9085.0, 146932.0, 851248.0, 35718.0, 3227.0, 553.0, 113.0, 56.0, 29.0, 13.0, 11.0, 13.0, 6.0, 4.0, 3.0, 2.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024962425231933594, -0.00024047121405601501, -0.0002313181757926941, -0.00022216513752937317, -0.00021301209926605225, -0.00020385906100273132, -0.0001947060227394104, -0.00018555298447608948, -0.00017639994621276855, -0.00016724690794944763, -0.0001580938696861267, -0.00014894083142280579, -0.00013978779315948486, -0.00013063475489616394, -0.00012148171663284302, -0.0001123286783695221, -0.00010317564010620117, -9.402260184288025e-05, -8.486956357955933e-05, -7.57165253162384e-05, -6.656348705291748e-05, -5.741044878959656e-05, -4.8257410526275635e-05, -3.910437226295471e-05, -2.995133399963379e-05, -2.0798295736312866e-05, -1.1645257472991943e-05, -2.4922192096710205e-06, 6.660819053649902e-06, 1.5813857316970825e-05, 2.4966895580291748e-05, 3.411993384361267e-05, 4.3272972106933594e-05, 5.2426010370254517e-05, 6.157904863357544e-05, 7.073208689689636e-05, 7.988512516021729e-05, 8.903816342353821e-05, 9.819120168685913e-05, 0.00010734423995018005, 0.00011649727821350098, 0.0001256503164768219, 0.00013480335474014282, 0.00014395639300346375, 0.00015310943126678467, 0.0001622624695301056, 0.00017141550779342651, 0.00018056854605674744, 0.00018972158432006836, 0.00019887462258338928, 0.0002080276608467102, 0.00021718069911003113, 0.00022633373737335205, 0.00023548677563667297, 0.0002446398138999939, 0.0002537928521633148, 0.00026294589042663574, 0.00027209892868995667, 0.0002812519669532776, 0.0002904050052165985, 0.00029955804347991943, 0.00030871108174324036, 0.0003178641200065613, 0.0003270171582698822, 0.0003361701965332031]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 2.0, 7.0, 5.0, 11.0, 15.0, 12.0, 17.0, 18.0, 24.0, 42.0, 53.0, 53.0, 75.0, 145.0, 163.0, 78.0, 53.0, 36.0, 43.0, 35.0, 22.0, 19.0, 14.0, 9.0, 12.0, 4.0, 6.0, 3.0, 7.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.621246337890625e-05, -1.5615485608577728e-05, -1.5018507838249207e-05, -1.4421530067920685e-05, -1.3824552297592163e-05, -1.3227574527263641e-05, -1.263059675693512e-05, -1.2033618986606598e-05, -1.1436641216278076e-05, -1.0839663445949554e-05, -1.0242685675621033e-05, -9.645707905292511e-06, -9.04873013496399e-06, -8.451752364635468e-06, -7.854774594306946e-06, -7.257796823978424e-06, -6.660819053649902e-06, -6.063841283321381e-06, -5.466863512992859e-06, -4.869885742664337e-06, -4.2729079723358154e-06, -3.6759302020072937e-06, -3.078952431678772e-06, -2.4819746613502502e-06, -1.8849968910217285e-06, -1.2880191206932068e-06, -6.910413503646851e-07, -9.406358003616333e-08, 5.029141902923584e-07, 1.0998919606208801e-06, 1.6968697309494019e-06, 2.2938475012779236e-06, 2.8908252716064453e-06, 3.487803041934967e-06, 4.084780812263489e-06, 4.6817585825920105e-06, 5.278736352920532e-06, 5.875714123249054e-06, 6.472691893577576e-06, 7.069669663906097e-06, 7.666647434234619e-06, 8.263625204563141e-06, 8.860602974891663e-06, 9.457580745220184e-06, 1.0054558515548706e-05, 1.0651536285877228e-05, 1.124851405620575e-05, 1.1845491826534271e-05, 1.2442469596862793e-05, 1.3039447367191315e-05, 1.3636425137519836e-05, 1.4233402907848358e-05, 1.483038067817688e-05, 1.54273584485054e-05, 1.6024336218833923e-05, 1.6621313989162445e-05, 1.7218291759490967e-05, 1.781526952981949e-05, 1.841224730014801e-05, 1.9009225070476532e-05, 1.9606202840805054e-05, 2.0203180611133575e-05, 2.0800158381462097e-05, 2.139713615179062e-05, 2.199411392211914e-05]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 5.0, 7.0, 15.0, 19.0, 17.0, 20.0, 30.0, 47.0, 45.0, 74.0, 87.0, 90.0, 102.0, 99.0, 75.0, 73.0, 43.0, 29.0, 26.0, 17.0, 17.0, 11.0, 10.0, 16.0, 4.0, 3.0, 1.0, 6.0, 8.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005124259274452925, -0.004955008160322905, -0.0047857570461928844, -0.004616505466401577, -0.004447254352271557, -0.004278003238141537, -0.004108752124011517, -0.003939501009881496, -0.0037702496629208326, -0.0036009985487908125, -0.0034317472018301487, -0.0032624960877001286, -0.0030932449735701084, -0.0029239936266094446, -0.0027547425124794245, -0.0025854911655187607, -0.0024162400513887405, -0.0022469889372587204, -0.0020777375902980566, -0.0019084864761680365, -0.0017392352456226945, -0.0015699840150773525, -0.0014007329009473324, -0.0012314816704019904, -0.0010622304398566484, -0.0008929792093113065, -0.0007237280369736254, -0.0005544768646359444, -0.0003852256340906024, -0.00021597440354526043, -4.672328941524029e-05, 0.00012252794113010168, 0.00029177870601415634, 0.00046102990745566785, 0.0006302811088971794, 0.0007995322812348604, 0.0009687835117802024, 0.0011380347423255444, 0.0013072858564555645, 0.0014765370870009065, 0.0016457883175462484, 0.0018150395480915904, 0.0019842907786369324, 0.0021535418927669525, 0.0023227930068969727, 0.0024920443538576365, 0.0026612954679876566, 0.0028305468149483204, 0.0029997979290783405, 0.0031690490432083607, 0.0033383003901690245, 0.0035075515042990446, 0.0036768028512597084, 0.0038460539653897285, 0.004015305079519749, 0.004184556193649769, 0.004353807307779789, 0.004523058421909809, 0.004692309536039829, 0.004861560650169849, 0.005030812229961157, 0.005200063344091177, 0.005369314458221197, 0.005538565572351217, 0.005707817152142525]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 11.0, 10.0, 15.0, 10.0, 21.0, 21.0, 16.0, 21.0, 28.0, 35.0, 42.0, 29.0, 43.0, 39.0, 52.0, 31.0, 42.0, 42.0, 46.0, 36.0, 33.0, 43.0, 35.0, 28.0, 37.0, 41.0, 27.0, 20.0, 14.0, 17.0, 19.0, 16.0, 12.0, 15.0, 10.0, 8.0, 5.0, 3.0, 2.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0032984104473143816, -0.003199760103598237, -0.003101109527051449, -0.0030024591833353043, -0.0029038088396191597, -0.002805158495903015, -0.002706507919356227, -0.0026078575756400824, -0.002509206999093294, -0.0024105566553771496, -0.0023119060788303614, -0.002213255735114217, -0.0021146053913980722, -0.002015954814851284, -0.0019173044711351395, -0.001818654127418995, -0.0017200037837028503, -0.001621353323571384, -0.0015227029798552394, -0.001424052519723773, -0.0013254021760076284, -0.001226751715876162, -0.0011281012557446957, -0.001029450912028551, -0.0009308004518970847, -0.0008321500499732792, -0.0007334996480494738, -0.0006348491879180074, -0.0005361987859942019, -0.0004375483840703964, -0.00033889792393893003, -0.00024024752201512456, -0.00014159688726067543, -4.294647078495473e-05, 5.570394569076598e-05, 0.0001543543767184019, 0.0002530047786422074, 0.00035165518056601286, 0.00045030564069747925, 0.0005489560426212847, 0.0006476064445450902, 0.0007462568464688957, 0.0008449072483927011, 0.0009435577085241675, 0.001042208168655634, 0.0011408585123717785, 0.0012395089725032449, 0.0013381594326347113, 0.0014368097763508558, 0.0015354602364823222, 0.0016341105801984668, 0.0017327610403299332, 0.0018314113840460777, 0.0019300618441775441, 0.0020287123043090105, 0.002127362648025155, 0.0022260132245719433, 0.002324663568288088, 0.002423314144834876, 0.0025219644885510206, 0.002620614832267165, 0.0027192654088139534, 0.002817915752530098, 0.0029165660962462425, 0.003015216439962387]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 8.0, 6.0, 9.0, 19.0, 18.0, 24.0, 39.0, 67.0, 73.0, 124.0, 234.0, 349.0, 537.0, 878.0, 1624.0, 2852.0, 5185.0, 9809.0, 19178.0, 40177.0, 90774.0, 211463.0, 327468.0, 185810.0, 79044.0, 35608.0, 17382.0, 8854.0, 4666.0, 2609.0, 1399.0, 873.0, 473.0, 319.0, 201.0, 139.0, 75.0, 52.0, 40.0, 29.0, 21.0, 13.0, 10.0, 9.0, 7.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.0128326416015625, -0.012448668479919434, -0.012064695358276367, -0.0116807222366333, -0.011296749114990234, -0.010912775993347168, -0.010528802871704102, -0.010144829750061035, -0.009760856628417969, -0.009376883506774902, -0.008992910385131836, -0.00860893726348877, -0.008224964141845703, -0.007840991020202637, -0.00745701789855957, -0.007073044776916504, -0.0066890716552734375, -0.006305098533630371, -0.005921125411987305, -0.005537152290344238, -0.005153179168701172, -0.0047692060470581055, -0.004385232925415039, -0.004001259803771973, -0.0036172866821289062, -0.00323331356048584, -0.0028493404388427734, -0.002465367317199707, -0.0020813941955566406, -0.0016974210739135742, -0.0013134479522705078, -0.0009294748306274414, -0.000545501708984375, -0.0001615285873413086, 0.0002224445343017578, 0.0006064176559448242, 0.0009903907775878906, 0.001374363899230957, 0.0017583370208740234, 0.00214231014251709, 0.0025262832641601562, 0.0029102563858032227, 0.003294229507446289, 0.0036782026290893555, 0.004062175750732422, 0.004446148872375488, 0.004830121994018555, 0.005214095115661621, 0.0055980682373046875, 0.005982041358947754, 0.00636601448059082, 0.006749987602233887, 0.007133960723876953, 0.0075179338455200195, 0.007901906967163086, 0.008285880088806152, 0.008669853210449219, 0.009053826332092285, 0.009437799453735352, 0.009821772575378418, 0.010205745697021484, 0.01058971881866455, 0.010973691940307617, 0.011357665061950684, 0.01174163818359375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 1.0, 5.0, 11.0, 9.0, 11.0, 9.0, 16.0, 16.0, 18.0, 21.0, 35.0, 35.0, 42.0, 47.0, 48.0, 49.0, 47.0, 49.0, 54.0, 44.0, 39.0, 49.0, 42.0, 41.0, 29.0, 50.0, 28.0, 28.0, 20.0, 20.0, 21.0, 15.0, 13.0, 12.0, 10.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0035724639892578125, -0.003475099802017212, -0.0033777356147766113, -0.0032803714275360107, -0.00318300724029541, -0.0030856430530548096, -0.002988278865814209, -0.0028909146785736084, -0.002793550491333008, -0.0026961863040924072, -0.0025988221168518066, -0.002501457929611206, -0.0024040937423706055, -0.002306729555130005, -0.0022093653678894043, -0.0021120011806488037, -0.002014636993408203, -0.0019172728061676025, -0.001819908618927002, -0.0017225444316864014, -0.0016251802444458008, -0.0015278160572052002, -0.0014304518699645996, -0.001333087682723999, -0.0012357234954833984, -0.0011383593082427979, -0.0010409951210021973, -0.0009436309337615967, -0.0008462667465209961, -0.0007489025592803955, -0.0006515383720397949, -0.0005541741847991943, -0.00045680999755859375, -0.00035944581031799316, -0.0002620816230773926, -0.000164717435836792, -6.73532485961914e-05, 3.001093864440918e-05, 0.00012737512588500977, 0.00022473931312561035, 0.00032210350036621094, 0.0004194676876068115, 0.0005168318748474121, 0.0006141960620880127, 0.0007115602493286133, 0.0008089244365692139, 0.0009062886238098145, 0.001003652811050415, 0.0011010169982910156, 0.0011983811855316162, 0.0012957453727722168, 0.0013931095600128174, 0.001490473747253418, 0.0015878379344940186, 0.0016852021217346191, 0.0017825663089752197, 0.0018799304962158203, 0.001977294683456421, 0.0020746588706970215, 0.002172023057937622, 0.0022693872451782227, 0.0023667514324188232, 0.002464115619659424, 0.0025614798069000244, 0.002658843994140625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 7.0, 5.0, 9.0, 9.0, 14.0, 13.0, 30.0, 40.0, 71.0, 137.0, 259.0, 551.0, 1341.0, 3204.0, 8579.0, 23598.0, 69237.0, 230015.0, 461283.0, 168089.0, 52787.0, 17911.0, 6699.0, 2600.0, 1096.0, 482.0, 227.0, 95.0, 51.0, 30.0, 26.0, 9.0, 10.0, 14.0, 11.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015167236328125, -0.01469874382019043, -0.01423025131225586, -0.013761758804321289, -0.013293266296386719, -0.012824773788452148, -0.012356281280517578, -0.011887788772583008, -0.011419296264648438, -0.010950803756713867, -0.010482311248779297, -0.010013818740844727, -0.009545326232910156, -0.009076833724975586, -0.008608341217041016, -0.008139848709106445, -0.007671356201171875, -0.007202863693237305, -0.006734371185302734, -0.006265878677368164, -0.005797386169433594, -0.0053288936614990234, -0.004860401153564453, -0.004391908645629883, -0.0039234161376953125, -0.003454923629760742, -0.002986431121826172, -0.0025179386138916016, -0.0020494461059570312, -0.001580953598022461, -0.0011124610900878906, -0.0006439685821533203, -0.00017547607421875, 0.0002930164337158203, 0.0007615089416503906, 0.001230001449584961, 0.0016984939575195312, 0.0021669864654541016, 0.002635478973388672, 0.003103971481323242, 0.0035724639892578125, 0.004040956497192383, 0.004509449005126953, 0.0049779415130615234, 0.005446434020996094, 0.005914926528930664, 0.006383419036865234, 0.006851911544799805, 0.007320404052734375, 0.007788896560668945, 0.008257389068603516, 0.008725881576538086, 0.009194374084472656, 0.009662866592407227, 0.010131359100341797, 0.010599851608276367, 0.011068344116210938, 0.011536836624145508, 0.012005329132080078, 0.012473821640014648, 0.012942314147949219, 0.013410806655883789, 0.01387929916381836, 0.01434779167175293, 0.0148162841796875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 8.0, 7.0, 10.0, 11.0, 7.0, 13.0, 15.0, 18.0, 14.0, 20.0, 25.0, 26.0, 22.0, 33.0, 30.0, 32.0, 36.0, 44.0, 35.0, 43.0, 32.0, 52.0, 42.0, 34.0, 41.0, 32.0, 39.0, 30.0, 34.0, 25.0, 24.0, 33.0, 19.0, 14.0, 16.0, 13.0, 8.0, 6.0, 14.0, 5.0, 7.0, 5.0, 4.0, 2.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.002410888671875, -0.002336740493774414, -0.002262592315673828, -0.002188444137573242, -0.0021142959594726562, -0.0020401477813720703, -0.0019659996032714844, -0.0018918514251708984, -0.0018177032470703125, -0.0017435550689697266, -0.0016694068908691406, -0.0015952587127685547, -0.0015211105346679688, -0.0014469623565673828, -0.0013728141784667969, -0.001298666000366211, -0.001224517822265625, -0.001150369644165039, -0.0010762214660644531, -0.0010020732879638672, -0.0009279251098632812, -0.0008537769317626953, -0.0007796287536621094, -0.0007054805755615234, -0.0006313323974609375, -0.0005571842193603516, -0.0004830360412597656, -0.0004088878631591797, -0.00033473968505859375, -0.0002605915069580078, -0.00018644332885742188, -0.00011229515075683594, -3.814697265625e-05, 3.600120544433594e-05, 0.00011014938354492188, 0.0001842975616455078, 0.00025844573974609375, 0.0003325939178466797, 0.0004067420959472656, 0.00048089027404785156, 0.0005550384521484375, 0.0006291866302490234, 0.0007033348083496094, 0.0007774829864501953, 0.0008516311645507812, 0.0009257793426513672, 0.0009999275207519531, 0.001074075698852539, 0.001148223876953125, 0.001222372055053711, 0.0012965202331542969, 0.0013706684112548828, 0.0014448165893554688, 0.0015189647674560547, 0.0015931129455566406, 0.0016672611236572266, 0.0017414093017578125, 0.0018155574798583984, 0.0018897056579589844, 0.0019638538360595703, 0.0020380020141601562, 0.002112150192260742, 0.002186298370361328, 0.002260446548461914, 0.0023345947265625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 3.0, 16.0, 17.0, 18.0, 54.0, 72.0, 77.0, 97.0, 159.0, 229.0, 321.0, 442.0, 686.0, 946.0, 1399.0, 2102.0, 3391.0, 5921.0, 10932.0, 24676.0, 70679.0, 655837.0, 188394.0, 43508.0, 17290.0, 8227.0, 4509.0, 2872.0, 1755.0, 1201.0, 816.0, 558.0, 398.0, 281.0, 199.0, 148.0, 111.0, 53.0, 43.0, 37.0, 24.0, 16.0, 13.0, 6.0, 6.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00780487060546875, -0.0075337886810302734, -0.007262706756591797, -0.00699162483215332, -0.006720542907714844, -0.006449460983276367, -0.006178379058837891, -0.005907297134399414, -0.0056362152099609375, -0.005365133285522461, -0.005094051361083984, -0.004822969436645508, -0.004551887512207031, -0.004280805587768555, -0.004009723663330078, -0.0037386417388916016, -0.003467559814453125, -0.0031964778900146484, -0.002925395965576172, -0.0026543140411376953, -0.0023832321166992188, -0.002112150192260742, -0.0018410682678222656, -0.001569986343383789, -0.0012989044189453125, -0.001027822494506836, -0.0007567405700683594, -0.0004856586456298828, -0.00021457672119140625, 5.650520324707031e-05, 0.0003275871276855469, 0.0005986690521240234, 0.0008697509765625, 0.0011408329010009766, 0.0014119148254394531, 0.0016829967498779297, 0.0019540786743164062, 0.002225160598754883, 0.0024962425231933594, 0.002767324447631836, 0.0030384063720703125, 0.003309488296508789, 0.0035805702209472656, 0.003851652145385742, 0.004122734069824219, 0.004393815994262695, 0.004664897918701172, 0.0049359798431396484, 0.005207061767578125, 0.0054781436920166016, 0.005749225616455078, 0.006020307540893555, 0.006291389465332031, 0.006562471389770508, 0.006833553314208984, 0.007104635238647461, 0.0073757171630859375, 0.007646799087524414, 0.00791788101196289, 0.008188962936401367, 0.008460044860839844, 0.00873112678527832, 0.009002208709716797, 0.009273290634155273, 0.00954437255859375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 10.0, 13.0, 19.0, 24.0, 34.0, 52.0, 57.0, 77.0, 92.0, 136.0, 107.0, 88.0, 82.0, 62.0, 45.0, 27.0, 27.0, 16.0, 11.0, 2.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0907649993896484e-05, -1.0533258318901062e-05, -1.015886664390564e-05, -9.784474968910217e-06, -9.410083293914795e-06, -9.035691618919373e-06, -8.66129994392395e-06, -8.286908268928528e-06, -7.912516593933105e-06, -7.538124918937683e-06, -7.163733243942261e-06, -6.789341568946838e-06, -6.414949893951416e-06, -6.040558218955994e-06, -5.666166543960571e-06, -5.291774868965149e-06, -4.9173831939697266e-06, -4.542991518974304e-06, -4.168599843978882e-06, -3.7942081689834595e-06, -3.419816493988037e-06, -3.0454248189926147e-06, -2.6710331439971924e-06, -2.29664146900177e-06, -1.9222497940063477e-06, -1.5478581190109253e-06, -1.173466444015503e-06, -7.990747690200806e-07, -4.246830940246582e-07, -5.029141902923584e-08, 3.241002559661865e-07, 6.984919309616089e-07, 1.0728836059570312e-06, 1.4472752809524536e-06, 1.821666955947876e-06, 2.1960586309432983e-06, 2.5704503059387207e-06, 2.944841980934143e-06, 3.3192336559295654e-06, 3.693625330924988e-06, 4.06801700592041e-06, 4.4424086809158325e-06, 4.816800355911255e-06, 5.191192030906677e-06, 5.5655837059021e-06, 5.939975380897522e-06, 6.314367055892944e-06, 6.688758730888367e-06, 7.063150405883789e-06, 7.4375420808792114e-06, 7.811933755874634e-06, 8.186325430870056e-06, 8.560717105865479e-06, 8.935108780860901e-06, 9.309500455856323e-06, 9.683892130851746e-06, 1.0058283805847168e-05, 1.043267548084259e-05, 1.0807067155838013e-05, 1.1181458830833435e-05, 1.1555850505828857e-05, 1.193024218082428e-05, 1.2304633855819702e-05, 1.2679025530815125e-05, 1.3053417205810547e-05]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 5.0, 4.0, 9.0, 13.0, 27.0, 36.0, 56.0, 89.0, 159.0, 266.0, 416.0, 702.0, 1086.0, 1817.0, 2925.0, 4997.0, 9912.0, 21305.0, 62326.0, 683281.0, 188369.0, 37897.0, 15156.0, 7407.0, 4103.0, 2374.0, 1479.0, 900.0, 543.0, 322.0, 199.0, 135.0, 86.0, 56.0, 33.0, 28.0, 10.0, 11.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0102081298828125, -0.009865522384643555, -0.00952291488647461, -0.009180307388305664, -0.008837699890136719, -0.008495092391967773, -0.008152484893798828, -0.007809877395629883, -0.0074672698974609375, -0.007124662399291992, -0.006782054901123047, -0.0064394474029541016, -0.006096839904785156, -0.005754232406616211, -0.005411624908447266, -0.00506901741027832, -0.004726409912109375, -0.00438380241394043, -0.004041194915771484, -0.003698587417602539, -0.0033559799194335938, -0.0030133724212646484, -0.002670764923095703, -0.002328157424926758, -0.0019855499267578125, -0.0016429424285888672, -0.0013003349304199219, -0.0009577274322509766, -0.0006151199340820312, -0.00027251243591308594, 7.009506225585938e-05, 0.0004127025604248047, 0.00075531005859375, 0.0010979175567626953, 0.0014405250549316406, 0.001783132553100586, 0.0021257400512695312, 0.0024683475494384766, 0.002810955047607422, 0.003153562545776367, 0.0034961700439453125, 0.003838777542114258, 0.004181385040283203, 0.0045239925384521484, 0.004866600036621094, 0.005209207534790039, 0.005551815032958984, 0.00589442253112793, 0.006237030029296875, 0.00657963752746582, 0.006922245025634766, 0.007264852523803711, 0.007607460021972656, 0.007950067520141602, 0.008292675018310547, 0.008635282516479492, 0.008977890014648438, 0.009320497512817383, 0.009663105010986328, 0.010005712509155273, 0.010348320007324219, 0.010690927505493164, 0.01103353500366211, 0.011376142501831055, 0.01171875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 3.0, 6.0, 3.0, 2.0, 6.0, 6.0, 8.0, 14.0, 12.0, 11.0, 15.0, 20.0, 41.0, 74.0, 143.0, 285.0, 130.0, 56.0, 47.0, 24.0, 19.0, 17.0, 12.0, 6.0, 7.0, 4.0, 4.0, 4.0, 4.0, 7.0, 2.0, 5.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025653839111328125, -0.0024719834327697754, -0.0023785829544067383, -0.002285182476043701, -0.002191781997680664, -0.002098381519317627, -0.00200498104095459, -0.0019115805625915527, -0.0018181800842285156, -0.0017247796058654785, -0.0016313791275024414, -0.0015379786491394043, -0.0014445781707763672, -0.00135117769241333, -0.001257777214050293, -0.0011643767356872559, -0.0010709762573242188, -0.0009775757789611816, -0.0008841753005981445, -0.0007907748222351074, -0.0006973743438720703, -0.0006039738655090332, -0.0005105733871459961, -0.000417172908782959, -0.0003237724304199219, -0.00023037195205688477, -0.00013697147369384766, -4.357099533081055e-05, 4.982948303222656e-05, 0.00014322996139526367, 0.00023663043975830078, 0.0003300309181213379, 0.000423431396484375, 0.0005168318748474121, 0.0006102323532104492, 0.0007036328315734863, 0.0007970333099365234, 0.0008904337882995605, 0.0009838342666625977, 0.0010772347450256348, 0.0011706352233886719, 0.001264035701751709, 0.001357436180114746, 0.0014508366584777832, 0.0015442371368408203, 0.0016376376152038574, 0.0017310380935668945, 0.0018244385719299316, 0.0019178390502929688, 0.002011239528656006, 0.002104640007019043, 0.00219804048538208, 0.002291440963745117, 0.0023848414421081543, 0.0024782419204711914, 0.0025716423988342285, 0.0026650428771972656, 0.0027584433555603027, 0.00285184383392334, 0.002945244312286377, 0.003038644790649414, 0.003132045269012451, 0.0032254457473754883, 0.0033188462257385254, 0.0034122467041015625]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 9.0, 14.0, 18.0, 26.0, 65.0, 105.0, 184.0, 228.0, 166.0, 86.0, 37.0, 27.0, 15.0, 9.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01304792519658804, -0.012486757710576057, -0.011925590224564075, -0.011364422738552094, -0.010803255252540112, -0.01024208776652813, -0.009680919349193573, -0.009119752794504166, -0.008558584377169609, -0.007997416891157627, -0.007436249405145645, -0.006875081919133663, -0.006313914433121681, -0.005752746947109699, -0.00519157899543643, -0.004630411509424448, -0.004069244489073753, -0.0035080770030617714, -0.0029469095170497894, -0.002385741798207164, -0.0018245743121951818, -0.0012634068261831999, -0.0007022391073405743, -0.0001410716213285923, 0.00042009586468338966, 0.0009812633506953716, 0.0015424309531226754, 0.002103598555549979, 0.002664766041561961, 0.003225933527573943, 0.0037871012464165688, 0.004348268732428551, 0.004909435287117958, 0.00547060277312994, 0.006031770259141922, 0.006592937745153904, 0.007154105231165886, 0.007715272717177868, 0.00827644020318985, 0.008837608620524406, 0.009398775175213814, 0.009959942661225796, 0.010521110147237778, 0.01108227763324976, 0.011643445119261742, 0.012204612605273724, 0.012765780091285706, 0.013326948508620262, 0.013888115994632244, 0.014449283480644226, 0.015010450966656208, 0.01557161845266819, 0.016132786870002747, 0.016693953424692154, 0.01725512184202671, 0.017816288396716118, 0.018377456814050674, 0.01893862523138523, 0.01949979178607464, 0.020060960203409195, 0.020622126758098602, 0.02118329517543316, 0.021744461730122566, 0.022305630147457123, 0.02286679670214653]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 6.0, 4.0, 6.0, 7.0, 7.0, 8.0, 15.0, 18.0, 28.0, 19.0, 26.0, 26.0, 23.0, 24.0, 28.0, 24.0, 46.0, 42.0, 33.0, 44.0, 34.0, 33.0, 44.0, 49.0, 36.0, 48.0, 35.0, 35.0, 35.0, 32.0, 38.0, 23.0, 24.0, 18.0, 21.0, 8.0, 12.0, 7.0, 8.0, 5.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0038122236728668213, -0.0036950267385691404, -0.0035778300371021032, -0.0034606331028044224, -0.003343436401337385, -0.0032262394670397043, -0.003109042765572667, -0.0029918458312749863, -0.002874649129807949, -0.002757452195510268, -0.002640255494043231, -0.00252305855974555, -0.002405861858278513, -0.002288664923980832, -0.002171468222513795, -0.002054271288216114, -0.001937074470333755, -0.001819877652451396, -0.001702680834569037, -0.001585484016686678, -0.001468287198804319, -0.0013510903809219599, -0.001233893446624279, -0.0011166967451572418, -0.000999499810859561, -0.0008823029929772019, -0.0007651061750948429, -0.0006479093572124839, -0.0005307125393301249, -0.0004135156632401049, -0.0002963188453577459, -0.00017912202747538686, -6.192526780068874e-05, 5.52715573576279e-05, 0.00017246838251594454, 0.0002896652149502188, 0.0004068620328325778, 0.0005240588798187673, 0.0006412556977011263, 0.0007584525155834854, 0.0008756493334658444, 0.0009928462095558643, 0.0011100430274382234, 0.0012272398453205824, 0.0013444366632029414, 0.0014616334810853004, 0.0015788302989676595, 0.0016960271168500185, 0.0018132239347323775, 0.0019304207526147366, 0.0020476176869124174, 0.0021648143883794546, 0.0022820113226771355, 0.0023992080241441727, 0.0025164049584418535, 0.0026336016599088907, 0.0027507985942065716, 0.0028679955285042524, 0.0029851922299712896, 0.0031023891642689705, 0.0032195858657360077, 0.0033367828000336885, 0.0034539795015007257, 0.0035711764357984066, 0.003688373137265444]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [5.0, 3.0, 1.0, 3.0, 1.0, 8.0, 2.0, 6.0, 1.0, 3.0, 12.0, 6.0, 10.0, 12.0, 11.0, 15.0, 23.0, 23.0, 22.0, 32.0, 42.0, 38.0, 88.0, 153.0, 304.0, 633.0, 2129.0, 11231.0, 124357.0, 3595643.0, 424335.0, 29190.0, 3988.0, 975.0, 376.0, 190.0, 106.0, 65.0, 58.0, 33.0, 27.0, 24.0, 17.0, 15.0, 15.0, 10.0, 10.0, 9.0, 3.0, 9.0, 3.0, 4.0, 5.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.015869140625, -0.015334844589233398, -0.014800548553466797, -0.014266252517700195, -0.013731956481933594, -0.013197660446166992, -0.01266336441040039, -0.012129068374633789, -0.011594772338867188, -0.011060476303100586, -0.010526180267333984, -0.009991884231567383, -0.009457588195800781, -0.00892329216003418, -0.008388996124267578, -0.007854700088500977, -0.007320404052734375, -0.0067861080169677734, -0.006251811981201172, -0.00571751594543457, -0.005183219909667969, -0.004648923873901367, -0.004114627838134766, -0.003580331802368164, -0.0030460357666015625, -0.002511739730834961, -0.0019774436950683594, -0.0014431476593017578, -0.0009088516235351562, -0.0003745555877685547, 0.00015974044799804688, 0.0006940364837646484, 0.00122833251953125, 0.0017626285552978516, 0.002296924591064453, 0.0028312206268310547, 0.0033655166625976562, 0.003899812698364258, 0.004434108734130859, 0.004968404769897461, 0.0055027008056640625, 0.006036996841430664, 0.006571292877197266, 0.007105588912963867, 0.007639884948730469, 0.00817418098449707, 0.008708477020263672, 0.009242773056030273, 0.009777069091796875, 0.010311365127563477, 0.010845661163330078, 0.01137995719909668, 0.011914253234863281, 0.012448549270629883, 0.012982845306396484, 0.013517141342163086, 0.014051437377929688, 0.014585733413696289, 0.01512002944946289, 0.015654325485229492, 0.016188621520996094, 0.016722917556762695, 0.017257213592529297, 0.0177915096282959, 0.0183258056640625]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [6.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 2.0, 4.0, 8.0, 6.0, 9.0, 13.0, 8.0, 13.0, 18.0, 16.0, 18.0, 19.0, 24.0, 30.0, 28.0, 24.0, 23.0, 27.0, 36.0, 36.0, 45.0, 38.0, 39.0, 39.0, 33.0, 39.0, 35.0, 29.0, 40.0, 28.0, 29.0, 38.0, 33.0, 30.0, 17.0, 15.0, 21.0, 11.0, 11.0, 16.0, 5.0, 7.0, 8.0, 7.0, 5.0, 6.0, 1.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.003173828125, -0.0030683577060699463, -0.0029628872871398926, -0.002857416868209839, -0.002751946449279785, -0.0026464760303497314, -0.0025410056114196777, -0.002435535192489624, -0.0023300647735595703, -0.0022245943546295166, -0.002119123935699463, -0.002013653516769409, -0.0019081830978393555, -0.0018027126789093018, -0.001697242259979248, -0.0015917718410491943, -0.0014863014221191406, -0.001380831003189087, -0.0012753605842590332, -0.0011698901653289795, -0.0010644197463989258, -0.0009589493274688721, -0.0008534789085388184, -0.0007480084896087646, -0.0006425380706787109, -0.0005370676517486572, -0.0004315972328186035, -0.0003261268138885498, -0.0002206563949584961, -0.00011518597602844238, -9.715557098388672e-06, 9.575486183166504e-05, 0.00020122528076171875, 0.00030669569969177246, 0.00041216611862182617, 0.0005176365375518799, 0.0006231069564819336, 0.0007285773754119873, 0.000834047794342041, 0.0009395182132720947, 0.0010449886322021484, 0.0011504590511322021, 0.0012559294700622559, 0.0013613998889923096, 0.0014668703079223633, 0.001572340726852417, 0.0016778111457824707, 0.0017832815647125244, 0.0018887519836425781, 0.001994222402572632, 0.0020996928215026855, 0.0022051632404327393, 0.002310633659362793, 0.0024161040782928467, 0.0025215744972229004, 0.002627044916152954, 0.002732515335083008, 0.0028379857540130615, 0.0029434561729431152, 0.003048926591873169, 0.0031543970108032227, 0.0032598674297332764, 0.00336533784866333, 0.003470808267593384, 0.0035762786865234375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 9.0, 10.0, 19.0, 23.0, 28.0, 25.0, 36.0, 57.0, 117.0, 214.0, 474.0, 1121.0, 3461.0, 19203.0, 1472980.0, 2669098.0, 21685.0, 3521.0, 1203.0, 457.0, 202.0, 107.0, 66.0, 46.0, 26.0, 29.0, 14.0, 8.0, 11.0, 7.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0302276611328125, -0.029364585876464844, -0.028501510620117188, -0.02763843536376953, -0.026775360107421875, -0.02591228485107422, -0.025049209594726562, -0.024186134338378906, -0.02332305908203125, -0.022459983825683594, -0.021596908569335938, -0.02073383331298828, -0.019870758056640625, -0.01900768280029297, -0.018144607543945312, -0.017281532287597656, -0.01641845703125, -0.015555381774902344, -0.014692306518554688, -0.013829231262207031, -0.012966156005859375, -0.012103080749511719, -0.011240005493164062, -0.010376930236816406, -0.00951385498046875, -0.008650779724121094, -0.0077877044677734375, -0.006924629211425781, -0.006061553955078125, -0.005198478698730469, -0.0043354034423828125, -0.0034723281860351562, -0.0026092529296875, -0.0017461776733398438, -0.0008831024169921875, -2.002716064453125e-05, 0.000843048095703125, 0.0017061233520507812, 0.0025691986083984375, 0.0034322738647460938, 0.00429534912109375, 0.005158424377441406, 0.0060214996337890625, 0.006884574890136719, 0.007747650146484375, 0.008610725402832031, 0.009473800659179688, 0.010336875915527344, 0.011199951171875, 0.012063026428222656, 0.012926101684570312, 0.013789176940917969, 0.014652252197265625, 0.015515327453613281, 0.016378402709960938, 0.017241477966308594, 0.01810455322265625, 0.018967628479003906, 0.019830703735351562, 0.02069377899169922, 0.021556854248046875, 0.02241992950439453, 0.023283004760742188, 0.024146080017089844, 0.0250091552734375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 2.0, 10.0, 14.0, 37.0, 69.0, 229.0, 519.0, 1659.0, 945.0, 316.0, 129.0, 71.0, 31.0, 15.0, 14.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.00677490234375, -0.006636172533035278, -0.006497442722320557, -0.006358712911605835, -0.006219983100891113, -0.006081253290176392, -0.00594252347946167, -0.005803793668746948, -0.0056650638580322266, -0.005526334047317505, -0.005387604236602783, -0.0052488744258880615, -0.00511014461517334, -0.004971414804458618, -0.0048326849937438965, -0.004693955183029175, -0.004555225372314453, -0.0044164955615997314, -0.00427776575088501, -0.004139035940170288, -0.004000306129455566, -0.0038615763187408447, -0.003722846508026123, -0.0035841166973114014, -0.0034453868865966797, -0.003306657075881958, -0.0031679272651672363, -0.0030291974544525146, -0.002890467643737793, -0.0027517378330230713, -0.0026130080223083496, -0.002474278211593628, -0.0023355484008789062, -0.0021968185901641846, -0.002058088779449463, -0.0019193589687347412, -0.0017806291580200195, -0.0016418993473052979, -0.0015031695365905762, -0.0013644397258758545, -0.0012257099151611328, -0.0010869801044464111, -0.0009482502937316895, -0.0008095204830169678, -0.0006707906723022461, -0.0005320608615875244, -0.00039333105087280273, -0.00025460124015808105, -0.00011587142944335938, 2.2858381271362305e-05, 0.00016158819198608398, 0.00030031800270080566, 0.00043904781341552734, 0.000577777624130249, 0.0007165074348449707, 0.0008552372455596924, 0.000993967056274414, 0.0011326968669891357, 0.0012714266777038574, 0.001410156488418579, 0.0015488862991333008, 0.0016876161098480225, 0.0018263459205627441, 0.001965075731277466, 0.0021038055419921875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 11.0, 7.0, 20.0, 18.0, 16.0, 15.0, 29.0, 39.0, 41.0, 79.0, 78.0, 76.0, 102.0, 73.0, 87.0, 68.0, 46.0, 35.0, 27.0, 19.0, 25.0, 18.0, 16.0, 8.0, 3.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.005276018753647804, -0.005097667220979929, -0.004919315222650766, -0.004740963689982891, -0.0045626116916537285, -0.004384260158985853, -0.004205908626317978, -0.004027556627988815, -0.0038492048624902964, -0.0036708530969917774, -0.0034925013314932585, -0.0033141495659947395, -0.0031357980333268642, -0.0029574460349977016, -0.0027790945023298264, -0.0026007427368313074, -0.0024223909713327885, -0.0022440392058342695, -0.0020656874403357506, -0.0018873357912525535, -0.0017089840257540345, -0.0015306322602555156, -0.0013522806111723185, -0.0011739288456737995, -0.0009955770801752806, -0.0008172253146767616, -0.0006388736073859036, -0.00046052190009504557, -0.0002821701345965266, -0.00010381836909800768, 7.453327998518944e-05, 0.0002528850454837084, 0.00043123634532094, 0.000609588110819459, 0.000787939818110317, 0.000966291525401175, 0.001144643290899694, 0.001322995056398213, 0.00150134670548141, 0.001679698470979929, 0.001858050236478448, 0.002036402001976967, 0.002214753767475486, 0.0023931055329740047, 0.00257145706564188, 0.0027498090639710426, 0.002928160596638918, 0.003106512362137437, 0.003284864127635956, 0.0034632158931344748, 0.0036415676586329937, 0.003819919191300869, 0.003998271189630032, 0.004176622722297907, 0.004354974254965782, 0.004533326253294945, 0.004711678251624107, 0.004890029784291983, 0.005068381782621145, 0.0052467333152890205, 0.005425085313618183, 0.005603436846286058, 0.005781788378953934, 0.005960140377283096, 0.006138491909950972]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 3.0, 2.0, 11.0, 7.0, 5.0, 12.0, 19.0, 9.0, 14.0, 17.0, 26.0, 18.0, 25.0, 25.0, 31.0, 25.0, 29.0, 30.0, 33.0, 43.0, 37.0, 32.0, 42.0, 38.0, 31.0, 31.0, 41.0, 29.0, 31.0, 30.0, 27.0, 31.0, 25.0, 23.0, 32.0, 26.0, 11.0, 15.0, 18.0, 11.0, 10.0, 8.0, 2.0, 8.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.003483766922727227, -0.003381410613656044, -0.0032790545374155045, -0.0031766982283443213, -0.003074341919273138, -0.0029719858430325985, -0.0028696295339614153, -0.002767273224890232, -0.0026649171486496925, -0.0025625608395785093, -0.0024602047633379698, -0.0023578484542667866, -0.002255492378026247, -0.002153136068955064, -0.0020507797598838806, -0.0019484235672280192, -0.0018460673745721579, -0.0017437111819162965, -0.001641354989260435, -0.001538998680189252, -0.0014366424875333905, -0.0013342862948775291, -0.001231929985806346, -0.0011295737931504846, -0.0010272176004946232, -0.0009248614078387618, -0.0008225051569752395, -0.0007201489061117172, -0.0006177927134558558, -0.0005154365207999945, -0.0004130802699364722, -0.0003107240190729499, -0.0002083678264170885, -0.00010601160465739667, -3.6553828977048397e-06, 9.8700838861987e-05, 0.00020105706062167883, 0.0003034132532775402, 0.0004057695041410625, 0.0005081257550045848, 0.0006104819476604462, 0.0007128381403163075, 0.0008151943911798298, 0.0009175506420433521, 0.0010199068346992135, 0.0011222630273550749, 0.001224619336426258, 0.0013269755290821195, 0.0014293317217379808, 0.0015316879143938422, 0.0016340441070497036, 0.0017364004161208868, 0.0018387566087767482, 0.0019411128014326096, 0.0020434691105037928, 0.002145825419574976, 0.0022481814958155155, 0.0023505378048866987, 0.0024528938811272383, 0.0025552501901984215, 0.002657606266438961, 0.0027599625755101442, 0.0028623188845813274, 0.002964674960821867, 0.00306703126989305]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 8.0, 10.0, 14.0, 19.0, 34.0, 40.0, 73.0, 68.0, 159.0, 209.0, 308.0, 508.0, 716.0, 1119.0, 1700.0, 2586.0, 3987.0, 6383.0, 9929.0, 15992.0, 25330.0, 40709.0, 66006.0, 106572.0, 170928.0, 212610.0, 144930.0, 89668.0, 55211.0, 34093.0, 21147.0, 13568.0, 8511.0, 5327.0, 3558.0, 2157.0, 1496.0, 990.0, 621.0, 416.0, 295.0, 151.0, 133.0, 96.0, 45.0, 41.0, 33.0, 18.0, 12.0, 12.0, 4.0, 3.0, 2.0, 5.0, 4.0], "bins": [-0.0010194778442382812, -0.000989772379398346, -0.0009600669145584106, -0.0009303614497184753, -0.00090065598487854, -0.0008709505200386047, -0.0008412450551986694, -0.0008115395903587341, -0.0007818341255187988, -0.0007521286606788635, -0.0007224231958389282, -0.0006927177309989929, -0.0006630122661590576, -0.0006333068013191223, -0.000603601336479187, -0.0005738958716392517, -0.0005441904067993164, -0.0005144849419593811, -0.0004847794771194458, -0.0004550740122795105, -0.0004253685474395752, -0.0003956630825996399, -0.0003659576177597046, -0.0003362521529197693, -0.000306546688079834, -0.0002768412232398987, -0.0002471357583999634, -0.00021743029356002808, -0.00018772482872009277, -0.00015801936388015747, -0.00012831389904022217, -9.860843420028687e-05, -6.890296936035156e-05, -3.919750452041626e-05, -9.492039680480957e-06, 2.0213425159454346e-05, 4.991888999938965e-05, 7.962435483932495e-05, 0.00010932981967926025, 0.00013903528451919556, 0.00016874074935913086, 0.00019844621419906616, 0.00022815167903900146, 0.00025785714387893677, 0.00028756260871887207, 0.0003172680735588074, 0.0003469735383987427, 0.000376679003238678, 0.0004063844680786133, 0.0004360899329185486, 0.0004657953977584839, 0.0004955008625984192, 0.0005252063274383545, 0.0005549117922782898, 0.0005846172571182251, 0.0006143227219581604, 0.0006440281867980957, 0.000673733651638031, 0.0007034391164779663, 0.0007331445813179016, 0.0007628500461578369, 0.0007925555109977722, 0.0008222609758377075, 0.0008519664406776428, 0.0008816719055175781]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 5.0, 7.0, 8.0, 3.0, 17.0, 10.0, 14.0, 16.0, 14.0, 20.0, 17.0, 15.0, 29.0, 29.0, 31.0, 24.0, 27.0, 38.0, 49.0, 29.0, 37.0, 45.0, 31.0, 40.0, 45.0, 33.0, 25.0, 34.0, 32.0, 29.0, 32.0, 37.0, 20.0, 26.0, 18.0, 16.0, 22.0, 16.0, 8.0, 12.0, 9.0, 9.0, 3.0, 2.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00347900390625, -0.0033746659755706787, -0.0032703280448913574, -0.003165990114212036, -0.003061652183532715, -0.0029573142528533936, -0.0028529763221740723, -0.002748638391494751, -0.0026443004608154297, -0.0025399625301361084, -0.002435624599456787, -0.002331286668777466, -0.0022269487380981445, -0.0021226108074188232, -0.002018272876739502, -0.0019139349460601807, -0.0018095970153808594, -0.001705259084701538, -0.0016009211540222168, -0.0014965832233428955, -0.0013922452926635742, -0.001287907361984253, -0.0011835694313049316, -0.0010792315006256104, -0.0009748935699462891, -0.0008705556392669678, -0.0007662177085876465, -0.0006618797779083252, -0.0005575418472290039, -0.0004532039165496826, -0.00034886598587036133, -0.00024452805519104004, -0.00014019012451171875, -3.585219383239746e-05, 6.848573684692383e-05, 0.00017282366752624512, 0.0002771615982055664, 0.0003814995288848877, 0.000485837459564209, 0.0005901753902435303, 0.0006945133209228516, 0.0007988512516021729, 0.0009031891822814941, 0.0010075271129608154, 0.0011118650436401367, 0.001216202974319458, 0.0013205409049987793, 0.0014248788356781006, 0.0015292167663574219, 0.0016335546970367432, 0.0017378926277160645, 0.0018422305583953857, 0.001946568489074707, 0.0020509064197540283, 0.0021552443504333496, 0.002259582281112671, 0.002363920211791992, 0.0024682581424713135, 0.0025725960731506348, 0.002676934003829956, 0.0027812719345092773, 0.0028856098651885986, 0.00298994779586792, 0.003094285726547241, 0.0031986236572265625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 16.0, 23.0, 34.0, 56.0, 100.0, 142.0, 212.0, 409.0, 643.0, 1033.0, 1732.0, 2838.0, 4652.0, 7899.0, 13972.0, 25115.0, 45995.0, 89375.0, 187799.0, 328646.0, 163838.0, 78925.0, 41543.0, 22635.0, 12657.0, 7215.0, 4289.0, 2621.0, 1574.0, 997.0, 567.0, 383.0, 254.0, 130.0, 90.0, 42.0, 35.0, 16.0, 21.0, 9.0, 5.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001201629638671875, -0.001164555549621582, -0.001127481460571289, -0.001090407371520996, -0.0010533332824707031, -0.0010162591934204102, -0.0009791851043701172, -0.0009421110153198242, -0.0009050369262695312, -0.0008679628372192383, -0.0008308887481689453, -0.0007938146591186523, -0.0007567405700683594, -0.0007196664810180664, -0.0006825923919677734, -0.0006455183029174805, -0.0006084442138671875, -0.0005713701248168945, -0.0005342960357666016, -0.0004972219467163086, -0.0004601478576660156, -0.00042307376861572266, -0.0003859996795654297, -0.0003489255905151367, -0.00031185150146484375, -0.0002747774124145508, -0.0002377033233642578, -0.00020062923431396484, -0.00016355514526367188, -0.0001264810562133789, -8.940696716308594e-05, -5.233287811279297e-05, -1.52587890625e-05, 2.181529998779297e-05, 5.888938903808594e-05, 9.59634780883789e-05, 0.00013303756713867188, 0.00017011165618896484, 0.0002071857452392578, 0.0002442598342895508, 0.00028133392333984375, 0.0003184080123901367, 0.0003554821014404297, 0.00039255619049072266, 0.0004296302795410156, 0.0004667043685913086, 0.0005037784576416016, 0.0005408525466918945, 0.0005779266357421875, 0.0006150007247924805, 0.0006520748138427734, 0.0006891489028930664, 0.0007262229919433594, 0.0007632970809936523, 0.0008003711700439453, 0.0008374452590942383, 0.0008745193481445312, 0.0009115934371948242, 0.0009486675262451172, 0.0009857416152954102, 0.0010228157043457031, 0.001059889793395996, 0.001096963882446289, 0.001134037971496582, 0.001171112060546875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 6.0, 6.0, 9.0, 8.0, 11.0, 13.0, 9.0, 20.0, 12.0, 8.0, 19.0, 25.0, 27.0, 29.0, 39.0, 44.0, 38.0, 43.0, 36.0, 43.0, 33.0, 41.0, 42.0, 54.0, 33.0, 36.0, 37.0, 30.0, 27.0, 29.0, 28.0, 24.0, 19.0, 24.0, 9.0, 18.0, 9.0, 12.0, 7.0, 12.0, 6.0, 4.0, 8.0, 3.0, 3.0, 0.0, 4.0, 4.0], "bins": [-0.0026760101318359375, -0.0026044994592666626, -0.0025329887866973877, -0.002461478114128113, -0.002389967441558838, -0.002318456768989563, -0.002246946096420288, -0.002175435423851013, -0.0021039247512817383, -0.0020324140787124634, -0.0019609034061431885, -0.0018893927335739136, -0.0018178820610046387, -0.0017463713884353638, -0.0016748607158660889, -0.001603350043296814, -0.001531839370727539, -0.0014603286981582642, -0.0013888180255889893, -0.0013173073530197144, -0.0012457966804504395, -0.0011742860078811646, -0.0011027753353118896, -0.0010312646627426147, -0.0009597539901733398, -0.0008882433176040649, -0.00081673264503479, -0.0007452219724655151, -0.0006737112998962402, -0.0006022006273269653, -0.0005306899547576904, -0.00045917928218841553, -0.0003876686096191406, -0.0003161579370498657, -0.0002446472644805908, -0.00017313659191131592, -0.00010162591934204102, -3.0115246772766113e-05, 4.139542579650879e-05, 0.00011290609836578369, 0.0001844167709350586, 0.0002559274435043335, 0.0003274381160736084, 0.0003989487886428833, 0.0004704594612121582, 0.0005419701337814331, 0.000613480806350708, 0.0006849914789199829, 0.0007565021514892578, 0.0008280128240585327, 0.0008995234966278076, 0.0009710341691970825, 0.0010425448417663574, 0.0011140555143356323, 0.0011855661869049072, 0.0012570768594741821, 0.001328587532043457, 0.001400098204612732, 0.0014716088771820068, 0.0015431195497512817, 0.0016146302223205566, 0.0016861408948898315, 0.0017576515674591064, 0.0018291622400283813, 0.0019006729125976562]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 7.0, 13.0, 20.0, 35.0, 24.0, 47.0, 75.0, 114.0, 167.0, 249.0, 318.0, 503.0, 690.0, 1054.0, 1700.0, 2405.0, 4028.0, 6713.0, 11349.0, 19662.0, 36502.0, 72987.0, 186261.0, 445277.0, 129732.0, 57374.0, 29632.0, 16448.0, 9450.0, 5764.0, 3448.0, 2119.0, 1433.0, 931.0, 602.0, 427.0, 269.0, 189.0, 135.0, 93.0, 72.0, 71.0, 42.0, 40.0, 17.0, 19.0, 11.0, 11.0, 4.0, 4.0, 7.0, 1.0, 3.0], "bins": [-6.335973739624023e-05, -6.151478737592697e-05, -5.966983735561371e-05, -5.7824887335300446e-05, -5.597993731498718e-05, -5.413498729467392e-05, -5.229003727436066e-05, -5.0445087254047394e-05, -4.860013723373413e-05, -4.675518721342087e-05, -4.4910237193107605e-05, -4.306528717279434e-05, -4.122033715248108e-05, -3.9375387132167816e-05, -3.753043711185455e-05, -3.568548709154129e-05, -3.384053707122803e-05, -3.1995587050914764e-05, -3.01506370306015e-05, -2.830568701028824e-05, -2.6460736989974976e-05, -2.4615786969661713e-05, -2.277083694934845e-05, -2.0925886929035187e-05, -1.9080936908721924e-05, -1.723598688840866e-05, -1.5391036868095398e-05, -1.3546086847782135e-05, -1.1701136827468872e-05, -9.856186807155609e-06, -8.011236786842346e-06, -6.166286766529083e-06, -4.32133674621582e-06, -2.4763867259025574e-06, -6.314367055892944e-07, 1.2135133147239685e-06, 3.0584633350372314e-06, 4.903413355350494e-06, 6.748363375663757e-06, 8.59331339597702e-06, 1.0438263416290283e-05, 1.2283213436603546e-05, 1.4128163456916809e-05, 1.5973113477230072e-05, 1.7818063497543335e-05, 1.9663013517856598e-05, 2.150796353816986e-05, 2.3352913558483124e-05, 2.5197863578796387e-05, 2.704281359910965e-05, 2.8887763619422913e-05, 3.0732713639736176e-05, 3.257766366004944e-05, 3.44226136803627e-05, 3.6267563700675964e-05, 3.811251372098923e-05, 3.995746374130249e-05, 4.180241376161575e-05, 4.3647363781929016e-05, 4.549231380224228e-05, 4.733726382255554e-05, 4.9182213842868805e-05, 5.102716386318207e-05, 5.287211388349533e-05, 5.4717063903808594e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 2.0, 11.0, 3.0, 6.0, 9.0, 7.0, 13.0, 19.0, 10.0, 20.0, 18.0, 38.0, 28.0, 22.0, 45.0, 23.0, 31.0, 56.0, 52.0, 46.0, 29.0, 44.0, 49.0, 27.0, 60.0, 38.0, 37.0, 39.0, 42.0, 23.0, 33.0, 23.0, 11.0, 20.0, 14.0, 6.0, 11.0, 7.0, 8.0, 6.0, 4.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.781650543212891e-06, -5.585141479969025e-06, -5.388632416725159e-06, -5.192123353481293e-06, -4.995614290237427e-06, -4.799105226993561e-06, -4.602596163749695e-06, -4.406087100505829e-06, -4.209578037261963e-06, -4.013068974018097e-06, -3.816559910774231e-06, -3.620050847530365e-06, -3.423541784286499e-06, -3.227032721042633e-06, -3.030523657798767e-06, -2.834014594554901e-06, -2.637505531311035e-06, -2.440996468067169e-06, -2.2444874048233032e-06, -2.0479783415794373e-06, -1.8514692783355713e-06, -1.6549602150917053e-06, -1.4584511518478394e-06, -1.2619420886039734e-06, -1.0654330253601074e-06, -8.689239621162415e-07, -6.724148988723755e-07, -4.759058356285095e-07, -2.7939677238464355e-07, -8.288770914077759e-08, 1.1362135410308838e-07, 3.1013041734695435e-07, 5.066394805908203e-07, 7.031485438346863e-07, 8.996576070785522e-07, 1.0961666703224182e-06, 1.2926757335662842e-06, 1.4891847968101501e-06, 1.6856938600540161e-06, 1.882202923297882e-06, 2.078711986541748e-06, 2.275221049785614e-06, 2.47173011302948e-06, 2.668239176273346e-06, 2.864748239517212e-06, 3.061257302761078e-06, 3.257766366004944e-06, 3.45427542924881e-06, 3.6507844924926758e-06, 3.847293555736542e-06, 4.043802618980408e-06, 4.240311682224274e-06, 4.43682074546814e-06, 4.633329808712006e-06, 4.829838871955872e-06, 5.0263479351997375e-06, 5.2228569984436035e-06, 5.4193660616874695e-06, 5.6158751249313354e-06, 5.812384188175201e-06, 6.008893251419067e-06, 6.205402314662933e-06, 6.401911377906799e-06, 6.598420441150665e-06, 6.794929504394531e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 10.0, 8.0, 5.0, 4.0, 6.0, 6.0, 12.0, 24.0, 33.0, 75.0, 160.0, 412.0, 1026.0, 3176.0, 10893.0, 44502.0, 274124.0, 612385.0, 77022.0, 17270.0, 4847.0, 1572.0, 508.0, 225.0, 95.0, 42.0, 24.0, 12.0, 15.0, 9.0, 9.0, 6.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.00018835067749023438, -0.00018283911049365997, -0.00017732754349708557, -0.00017181597650051117, -0.00016630440950393677, -0.00016079284250736237, -0.00015528127551078796, -0.00014976970851421356, -0.00014425814151763916, -0.00013874657452106476, -0.00013323500752449036, -0.00012772344052791595, -0.00012221187353134155, -0.00011670030653476715, -0.00011118873953819275, -0.00010567717254161835, -0.00010016560554504395, -9.465403854846954e-05, -8.914247155189514e-05, -8.363090455532074e-05, -7.811933755874634e-05, -7.260777056217194e-05, -6.709620356559753e-05, -6.158463656902313e-05, -5.607306957244873e-05, -5.056150257587433e-05, -4.504993557929993e-05, -3.9538368582725525e-05, -3.402680158615112e-05, -2.851523458957672e-05, -2.300366759300232e-05, -1.7492100596427917e-05, -1.1980533599853516e-05, -6.468966603279114e-06, -9.57399606704712e-07, 4.55416738986969e-06, 1.0065734386444092e-05, 1.5577301383018494e-05, 2.1088868379592896e-05, 2.6600435376167297e-05, 3.21120023727417e-05, 3.76235693693161e-05, 4.31351363658905e-05, 4.8646703362464905e-05, 5.415827035903931e-05, 5.966983735561371e-05, 6.518140435218811e-05, 7.069297134876251e-05, 7.620453834533691e-05, 8.171610534191132e-05, 8.722767233848572e-05, 9.273923933506012e-05, 9.825080633163452e-05, 0.00010376237332820892, 0.00010927394032478333, 0.00011478550732135773, 0.00012029707431793213, 0.00012580864131450653, 0.00013132020831108093, 0.00013683177530765533, 0.00014234334230422974, 0.00014785490930080414, 0.00015336647629737854, 0.00015887804329395294, 0.00016438961029052734]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 3.0, 2.0, 5.0, 10.0, 2.0, 7.0, 10.0, 19.0, 13.0, 24.0, 34.0, 31.0, 39.0, 44.0, 61.0, 74.0, 63.0, 85.0, 65.0, 77.0, 60.0, 55.0, 44.0, 42.0, 21.0, 25.0, 19.0, 15.0, 9.0, 10.0, 4.0, 7.0, 5.0, 10.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6391277313232422e-05, -1.5819445252418518e-05, -1.5247613191604614e-05, -1.467578113079071e-05, -1.4103949069976807e-05, -1.3532117009162903e-05, -1.2960284948348999e-05, -1.2388452887535095e-05, -1.1816620826721191e-05, -1.1244788765907288e-05, -1.0672956705093384e-05, -1.010112464427948e-05, -9.529292583465576e-06, -8.957460522651672e-06, -8.385628461837769e-06, -7.813796401023865e-06, -7.241964340209961e-06, -6.670132279396057e-06, -6.098300218582153e-06, -5.5264681577682495e-06, -4.954636096954346e-06, -4.382804036140442e-06, -3.810971975326538e-06, -3.2391399145126343e-06, -2.6673078536987305e-06, -2.0954757928848267e-06, -1.5236437320709229e-06, -9.51811671257019e-07, -3.7997961044311523e-07, 1.9185245037078857e-07, 7.636845111846924e-07, 1.3355165719985962e-06, 1.9073486328125e-06, 2.479180693626404e-06, 3.0510127544403076e-06, 3.6228448152542114e-06, 4.194676876068115e-06, 4.766508936882019e-06, 5.338340997695923e-06, 5.910173058509827e-06, 6.4820051193237305e-06, 7.053837180137634e-06, 7.625669240951538e-06, 8.197501301765442e-06, 8.769333362579346e-06, 9.34116542339325e-06, 9.912997484207153e-06, 1.0484829545021057e-05, 1.1056661605834961e-05, 1.1628493666648865e-05, 1.2200325727462769e-05, 1.2772157788276672e-05, 1.3343989849090576e-05, 1.391582190990448e-05, 1.4487653970718384e-05, 1.5059486031532288e-05, 1.563131809234619e-05, 1.6203150153160095e-05, 1.6774982213974e-05, 1.7346814274787903e-05, 1.7918646335601807e-05, 1.849047839641571e-05, 1.9062310457229614e-05, 1.9634142518043518e-05, 2.0205974578857422e-05]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 6.0, 15.0, 11.0, 25.0, 20.0, 22.0, 39.0, 41.0, 69.0, 82.0, 77.0, 101.0, 94.0, 87.0, 77.0, 49.0, 39.0, 18.0, 24.0, 26.0, 13.0, 12.0, 8.0, 8.0, 6.0, 1.0, 3.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.005751760210841894, -0.005565279629081488, -0.005378798581659794, -0.005192317999899387, -0.0050058369524776936, -0.004819356370717287, -0.004632875323295593, -0.004446394741535187, -0.00425991415977478, -0.004073433578014374, -0.00388695253059268, -0.0037004719488322735, -0.0035139909014105797, -0.003327510319650173, -0.003141029505059123, -0.002954548690468073, -0.002768067643046379, -0.002581586828455329, -0.002395106013864279, -0.0022086254321038723, -0.0020221443846821785, -0.0018356636865064502, -0.0016491829883307219, -0.0014627021737396717, -0.0012762213591486216, -0.0010897405445575714, -0.0009032597881741822, -0.0007167790317907929, -0.0005302982171997428, -0.00034381740260869265, -0.00015733670443296432, 2.9144110158085823e-05, 0.00021562492474913597, 0.00040210571023635566, 0.0005885864957235754, 0.0007750672521069646, 0.0009615480666980147, 0.0011480288812890649, 0.0013345095794647932, 0.0015209903940558434, 0.0017074712086468935, 0.0018939520232379436, 0.002080432837828994, 0.002266913652420044, 0.0024533942341804504, 0.0026398752816021442, 0.0028263558633625507, 0.003012836677953601, 0.003199317492544651, 0.003385798307135701, 0.0035722791217267513, 0.003758759703487158, 0.003945240750908852, 0.004131721332669258, 0.004318201914429665, 0.004504682961851358, 0.004691164009273052, 0.004877644591033459, 0.0050641256384551525, 0.005250606220215559, 0.005437087267637253, 0.005623567849397659, 0.005810048431158066, 0.00599652947857976, 0.006183010060340166]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 5.0, 1.0, 6.0, 1.0, 10.0, 8.0, 3.0, 14.0, 15.0, 14.0, 10.0, 20.0, 22.0, 18.0, 27.0, 25.0, 29.0, 25.0, 30.0, 30.0, 30.0, 45.0, 40.0, 25.0, 46.0, 44.0, 30.0, 32.0, 37.0, 30.0, 29.0, 31.0, 27.0, 34.0, 25.0, 26.0, 29.0, 20.0, 18.0, 15.0, 14.0, 14.0, 11.0, 7.0, 4.0, 5.0, 9.0, 3.0, 4.0, 4.0, 1.0, 5.0, 1.0, 0.0, 2.0], "bins": [-0.0033013676293194294, -0.003204216016456485, -0.00310706440359354, -0.0030099130235612392, -0.0029127614106982946, -0.00281560979783535, -0.002718458417803049, -0.0026213068049401045, -0.00252415519207716, -0.0024270035792142153, -0.0023298519663512707, -0.0022327005863189697, -0.002135548973456025, -0.0020383973605930805, -0.0019412458641454577, -0.001844094367697835, -0.0017469427548348904, -0.0016497911419719458, -0.001552639645524323, -0.0014554881490767002, -0.0013583365362137556, -0.001261184923350811, -0.0011640334269031882, -0.0010668819304555655, -0.0009697303175926208, -0.0008725787629373372, -0.0007754272082820535, -0.0006782756536267698, -0.0005811240989714861, -0.0004839725443162024, -0.0003868209896609187, -0.000289669435005635, -0.00019251788035035133, -9.536632569506764e-05, 1.7852289602160454e-06, 9.893678361549973e-05, 0.00019608833827078342, 0.0002932398929260671, 0.0003903914475813508, 0.0004875430022366345, 0.0005846945568919182, 0.0006818461115472019, 0.0007789976662024856, 0.0008761492208577693, 0.0009733007755130529, 0.0010704523883759975, 0.0011676038848236203, 0.001264755381271243, 0.0013619069941341877, 0.0014590586069971323, 0.001556210103444755, 0.0016533615998923779, 0.0017505132127553225, 0.001847664825618267, 0.0019448163220658898, 0.0020419678185135126, 0.002139119431376457, 0.002236271044239402, 0.0023334226571023464, 0.0024305740371346474, 0.002527725649997592, 0.0026248772628605366, 0.0027220286428928375, 0.002819180255755782, 0.0029163318686187267]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 8.0, 9.0, 13.0, 31.0, 30.0, 52.0, 78.0, 117.0, 218.0, 348.0, 665.0, 1300.0, 2478.0, 5187.0, 11325.0, 25701.0, 62918.0, 175252.0, 440257.0, 200498.0, 69856.0, 28666.0, 12309.0, 5601.0, 2612.0, 1335.0, 705.0, 388.0, 208.0, 121.0, 95.0, 62.0, 40.0, 28.0, 22.0, 12.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169219970703125, -0.016402244567871094, -0.015882492065429688, -0.015362739562988281, -0.014842987060546875, -0.014323234558105469, -0.013803482055664062, -0.013283729553222656, -0.01276397705078125, -0.012244224548339844, -0.011724472045898438, -0.011204719543457031, -0.010684967041015625, -0.010165214538574219, -0.009645462036132812, -0.009125709533691406, -0.00860595703125, -0.008086204528808594, -0.0075664520263671875, -0.007046699523925781, -0.006526947021484375, -0.006007194519042969, -0.0054874420166015625, -0.004967689514160156, -0.00444793701171875, -0.003928184509277344, -0.0034084320068359375, -0.0028886795043945312, -0.002368927001953125, -0.0018491744995117188, -0.0013294219970703125, -0.0008096694946289062, -0.0002899169921875, 0.00022983551025390625, 0.0007495880126953125, 0.0012693405151367188, 0.001789093017578125, 0.0023088455200195312, 0.0028285980224609375, 0.0033483505249023438, 0.00386810302734375, 0.004387855529785156, 0.0049076080322265625, 0.005427360534667969, 0.005947113037109375, 0.006466865539550781, 0.0069866180419921875, 0.007506370544433594, 0.008026123046875, 0.008545875549316406, 0.009065628051757812, 0.009585380554199219, 0.010105133056640625, 0.010624885559082031, 0.011144638061523438, 0.011664390563964844, 0.01218414306640625, 0.012703895568847656, 0.013223648071289062, 0.013743400573730469, 0.014263153076171875, 0.014782905578613281, 0.015302658081054688, 0.015822410583496094, 0.0163421630859375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 8.0, 11.0, 11.0, 14.0, 10.0, 17.0, 18.0, 22.0, 33.0, 30.0, 35.0, 36.0, 41.0, 51.0, 60.0, 54.0, 43.0, 57.0, 58.0, 46.0, 38.0, 36.0, 35.0, 34.0, 41.0, 30.0, 17.0, 29.0, 20.0, 17.0, 11.0, 10.0, 6.0, 5.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003620147705078125, -0.003491342067718506, -0.0033625364303588867, -0.0032337307929992676, -0.0031049251556396484, -0.0029761195182800293, -0.00284731388092041, -0.002718508243560791, -0.002589702606201172, -0.0024608969688415527, -0.0023320913314819336, -0.0022032856941223145, -0.0020744800567626953, -0.0019456744194030762, -0.001816868782043457, -0.0016880631446838379, -0.0015592575073242188, -0.0014304518699645996, -0.0013016462326049805, -0.0011728405952453613, -0.0010440349578857422, -0.000915229320526123, -0.0007864236831665039, -0.0006576180458068848, -0.0005288124084472656, -0.0004000067710876465, -0.00027120113372802734, -0.0001423954963684082, -1.3589859008789062e-05, 0.00011521577835083008, 0.00024402141571044922, 0.00037282705307006836, 0.0005016326904296875, 0.0006304383277893066, 0.0007592439651489258, 0.0008880496025085449, 0.001016855239868164, 0.0011456608772277832, 0.0012744665145874023, 0.0014032721519470215, 0.0015320777893066406, 0.0016608834266662598, 0.001789689064025879, 0.001918494701385498, 0.002047300338745117, 0.0021761059761047363, 0.0023049116134643555, 0.0024337172508239746, 0.0025625228881835938, 0.002691328525543213, 0.002820134162902832, 0.002948939800262451, 0.0030777454376220703, 0.0032065510749816895, 0.0033353567123413086, 0.0034641623497009277, 0.003592967987060547, 0.003721773624420166, 0.003850579261779785, 0.003979384899139404, 0.0041081905364990234, 0.004236996173858643, 0.004365801811218262, 0.004494607448577881, 0.0046234130859375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 10.0, 6.0, 9.0, 8.0, 17.0, 27.0, 27.0, 49.0, 84.0, 143.0, 315.0, 723.0, 2147.0, 7620.0, 36401.0, 276416.0, 638735.0, 68090.0, 12668.0, 3184.0, 1010.0, 401.0, 188.0, 111.0, 51.0, 41.0, 23.0, 10.0, 18.0, 5.0, 7.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0279998779296875, -0.02693009376525879, -0.025860309600830078, -0.024790525436401367, -0.023720741271972656, -0.022650957107543945, -0.021581172943115234, -0.020511388778686523, -0.019441604614257812, -0.0183718204498291, -0.01730203628540039, -0.01623225212097168, -0.015162467956542969, -0.014092683792114258, -0.013022899627685547, -0.011953115463256836, -0.010883331298828125, -0.009813547134399414, -0.008743762969970703, -0.007673978805541992, -0.006604194641113281, -0.00553441047668457, -0.004464626312255859, -0.0033948421478271484, -0.0023250579833984375, -0.0012552738189697266, -0.00018548965454101562, 0.0008842945098876953, 0.0019540786743164062, 0.003023862838745117, 0.004093647003173828, 0.005163431167602539, 0.00623321533203125, 0.007302999496459961, 0.008372783660888672, 0.009442567825317383, 0.010512351989746094, 0.011582136154174805, 0.012651920318603516, 0.013721704483032227, 0.014791488647460938, 0.01586127281188965, 0.01693105697631836, 0.01800084114074707, 0.01907062530517578, 0.020140409469604492, 0.021210193634033203, 0.022279977798461914, 0.023349761962890625, 0.024419546127319336, 0.025489330291748047, 0.026559114456176758, 0.02762889862060547, 0.02869868278503418, 0.02976846694946289, 0.0308382511138916, 0.03190803527832031, 0.03297781944274902, 0.034047603607177734, 0.035117387771606445, 0.036187171936035156, 0.03725695610046387, 0.03832674026489258, 0.03939652442932129, 0.04046630859375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 12.0, 17.0, 10.0, 15.0, 20.0, 29.0, 34.0, 37.0, 42.0, 38.0, 53.0, 56.0, 56.0, 72.0, 52.0, 57.0, 51.0, 38.0, 41.0, 47.0, 44.0, 38.0, 29.0, 26.0, 22.0, 17.0, 14.0, 7.0, 5.0, 6.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0038738250732421875, -0.003731757402420044, -0.0035896897315979004, -0.003447622060775757, -0.0033055543899536133, -0.0031634867191314697, -0.003021419048309326, -0.0028793513774871826, -0.002737283706665039, -0.0025952160358428955, -0.002453148365020752, -0.0023110806941986084, -0.002169013023376465, -0.0020269453525543213, -0.0018848776817321777, -0.0017428100109100342, -0.0016007423400878906, -0.001458674669265747, -0.0013166069984436035, -0.00117453932762146, -0.0010324716567993164, -0.0008904039859771729, -0.0007483363151550293, -0.0006062686443328857, -0.0004642009735107422, -0.00032213330268859863, -0.00018006563186645508, -3.7997961044311523e-05, 0.00010406970977783203, 0.0002461373805999756, 0.00038820505142211914, 0.0005302727222442627, 0.0006723403930664062, 0.0008144080638885498, 0.0009564757347106934, 0.001098543405532837, 0.0012406110763549805, 0.001382678747177124, 0.0015247464179992676, 0.0016668140888214111, 0.0018088817596435547, 0.0019509494304656982, 0.002093017101287842, 0.0022350847721099854, 0.002377152442932129, 0.0025192201137542725, 0.002661287784576416, 0.0028033554553985596, 0.002945423126220703, 0.0030874907970428467, 0.0032295584678649902, 0.003371626138687134, 0.0035136938095092773, 0.003655761480331421, 0.0037978291511535645, 0.003939896821975708, 0.0040819644927978516, 0.004224032163619995, 0.004366099834442139, 0.004508167505264282, 0.004650235176086426, 0.004792302846908569, 0.004934370517730713, 0.0050764381885528564, 0.005218505859375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 8.0, 5.0, 9.0, 18.0, 14.0, 21.0, 21.0, 37.0, 53.0, 72.0, 101.0, 137.0, 174.0, 249.0, 391.0, 605.0, 897.0, 1172.0, 1691.0, 2845.0, 5210.0, 13685.0, 882538.0, 116498.0, 9963.0, 4449.0, 2545.0, 1558.0, 1068.0, 776.0, 510.0, 354.0, 260.0, 181.0, 138.0, 77.0, 65.0, 40.0, 29.0, 26.0, 17.0, 14.0, 8.0, 9.0, 7.0, 3.0, 6.0, 3.0, 2.0, 3.0, 2.0], "bins": [-0.01151275634765625, -0.011191844940185547, -0.010870933532714844, -0.01055002212524414, -0.010229110717773438, -0.009908199310302734, -0.009587287902832031, -0.009266376495361328, -0.008945465087890625, -0.008624553680419922, -0.008303642272949219, -0.007982730865478516, -0.0076618194580078125, -0.007340908050537109, -0.007019996643066406, -0.006699085235595703, -0.006378173828125, -0.006057262420654297, -0.005736351013183594, -0.005415439605712891, -0.0050945281982421875, -0.004773616790771484, -0.004452705383300781, -0.004131793975830078, -0.003810882568359375, -0.003489971160888672, -0.0031690597534179688, -0.0028481483459472656, -0.0025272369384765625, -0.0022063255310058594, -0.0018854141235351562, -0.0015645027160644531, -0.00124359130859375, -0.0009226799011230469, -0.0006017684936523438, -0.0002808570861816406, 4.00543212890625e-05, 0.0003609657287597656, 0.0006818771362304688, 0.0010027885437011719, 0.001323699951171875, 0.0016446113586425781, 0.0019655227661132812, 0.0022864341735839844, 0.0026073455810546875, 0.0029282569885253906, 0.0032491683959960938, 0.003570079803466797, 0.0038909912109375, 0.004211902618408203, 0.004532814025878906, 0.004853725433349609, 0.0051746368408203125, 0.005495548248291016, 0.005816459655761719, 0.006137371063232422, 0.006458282470703125, 0.006779193878173828, 0.007100105285644531, 0.007421016693115234, 0.0077419281005859375, 0.00806283950805664, 0.008383750915527344, 0.008704662322998047, 0.00902557373046875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 6.0, 4.0, 16.0, 12.0, 24.0, 26.0, 45.0, 34.0, 46.0, 57.0, 71.0, 119.0, 69.0, 113.0, 68.0, 68.0, 45.0, 48.0, 20.0, 26.0, 13.0, 14.0, 13.0, 8.0, 6.0, 3.0, 7.0, 0.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.092952728271484e-06, -6.887130439281464e-06, -6.681308150291443e-06, -6.475485861301422e-06, -6.269663572311401e-06, -6.063841283321381e-06, -5.85801899433136e-06, -5.652196705341339e-06, -5.446374416351318e-06, -5.240552127361298e-06, -5.034729838371277e-06, -4.828907549381256e-06, -4.623085260391235e-06, -4.417262971401215e-06, -4.211440682411194e-06, -4.005618393421173e-06, -3.7997961044311523e-06, -3.5939738154411316e-06, -3.388151526451111e-06, -3.18232923746109e-06, -2.9765069484710693e-06, -2.7706846594810486e-06, -2.564862370491028e-06, -2.359040081501007e-06, -2.1532177925109863e-06, -1.9473955035209656e-06, -1.7415732145309448e-06, -1.535750925540924e-06, -1.3299286365509033e-06, -1.1241063475608826e-06, -9.182840585708618e-07, -7.124617695808411e-07, -5.066394805908203e-07, -3.0081719160079956e-07, -9.499490261077881e-08, 1.1082738637924194e-07, 3.166496753692627e-07, 5.224719643592834e-07, 7.282942533493042e-07, 9.34116542339325e-07, 1.1399388313293457e-06, 1.3457611203193665e-06, 1.5515834093093872e-06, 1.757405698299408e-06, 1.9632279872894287e-06, 2.1690502762794495e-06, 2.3748725652694702e-06, 2.580694854259491e-06, 2.7865171432495117e-06, 2.9923394322395325e-06, 3.1981617212295532e-06, 3.403984010219574e-06, 3.6098062992095947e-06, 3.8156285881996155e-06, 4.021450877189636e-06, 4.227273166179657e-06, 4.433095455169678e-06, 4.6389177441596985e-06, 4.844740033149719e-06, 5.05056232213974e-06, 5.256384611129761e-06, 5.4622069001197815e-06, 5.668029189109802e-06, 5.873851478099823e-06, 6.079673767089844e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 10.0, 9.0, 15.0, 24.0, 25.0, 21.0, 39.0, 48.0, 80.0, 114.0, 145.0, 313.0, 617.0, 1384.0, 3395.0, 8980.0, 55323.0, 952118.0, 16532.0, 5278.0, 2074.0, 934.0, 407.0, 234.0, 113.0, 93.0, 49.0, 44.0, 28.0, 26.0, 14.0, 19.0, 14.0, 11.0, 7.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0143280029296875, -0.013854026794433594, -0.013380050659179688, -0.012906074523925781, -0.012432098388671875, -0.011958122253417969, -0.011484146118164062, -0.011010169982910156, -0.01053619384765625, -0.010062217712402344, -0.009588241577148438, -0.009114265441894531, -0.008640289306640625, -0.008166313171386719, -0.0076923370361328125, -0.007218360900878906, -0.006744384765625, -0.006270408630371094, -0.0057964324951171875, -0.005322456359863281, -0.004848480224609375, -0.004374504089355469, -0.0039005279541015625, -0.0034265518188476562, -0.00295257568359375, -0.0024785995483398438, -0.0020046234130859375, -0.0015306472778320312, -0.001056671142578125, -0.0005826950073242188, -0.0001087188720703125, 0.00036525726318359375, 0.0008392333984375, 0.0013132095336914062, 0.0017871856689453125, 0.0022611618041992188, 0.002735137939453125, 0.0032091140747070312, 0.0036830902099609375, 0.004157066345214844, 0.00463104248046875, 0.005105018615722656, 0.0055789947509765625, 0.006052970886230469, 0.006526947021484375, 0.007000923156738281, 0.0074748992919921875, 0.007948875427246094, 0.0084228515625, 0.008896827697753906, 0.009370803833007812, 0.009844779968261719, 0.010318756103515625, 0.010792732238769531, 0.011266708374023438, 0.011740684509277344, 0.01221466064453125, 0.012688636779785156, 0.013162612915039062, 0.013636589050292969, 0.014110565185546875, 0.014584541320800781, 0.015058517456054688, 0.015532493591308594, 0.0160064697265625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 2.0, 4.0, 8.0, 6.0, 8.0, 16.0, 49.0, 614.0, 204.0, 26.0, 18.0, 7.0, 9.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00257110595703125, -0.0024718046188354492, -0.0023725032806396484, -0.0022732019424438477, -0.002173900604248047, -0.002074599266052246, -0.0019752979278564453, -0.0018759965896606445, -0.0017766952514648438, -0.001677393913269043, -0.0015780925750732422, -0.0014787912368774414, -0.0013794898986816406, -0.0012801885604858398, -0.001180887222290039, -0.0010815858840942383, -0.0009822845458984375, -0.0008829832077026367, -0.0007836818695068359, -0.0006843805313110352, -0.0005850791931152344, -0.0004857778549194336, -0.0003864765167236328, -0.00028717517852783203, -0.00018787384033203125, -8.857250213623047e-05, 1.0728836059570312e-05, 0.0001100301742553711, 0.00020933151245117188, 0.00030863285064697266, 0.00040793418884277344, 0.0005072355270385742, 0.000606536865234375, 0.0007058382034301758, 0.0008051395416259766, 0.0009044408798217773, 0.0010037422180175781, 0.001103043556213379, 0.0012023448944091797, 0.0013016462326049805, 0.0014009475708007812, 0.001500248908996582, 0.0015995502471923828, 0.0016988515853881836, 0.0017981529235839844, 0.0018974542617797852, 0.001996755599975586, 0.0020960569381713867, 0.0021953582763671875, 0.0022946596145629883, 0.002393960952758789, 0.00249326229095459, 0.0025925636291503906, 0.0026918649673461914, 0.002791166305541992, 0.002890467643737793, 0.0029897689819335938, 0.0030890703201293945, 0.0031883716583251953, 0.003287672996520996, 0.003386974334716797, 0.0034862756729125977, 0.0035855770111083984, 0.0036848783493041992, 0.0037841796875]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 11.0, 8.0, 9.0, 24.0, 28.0, 44.0, 71.0, 126.0, 176.0, 173.0, 123.0, 72.0, 47.0, 30.0, 24.0, 12.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013542495667934418, -0.013105195015668869, -0.012667895294725895, -0.012230594642460346, -0.011793294921517372, -0.011355994269251823, -0.010918693616986275, -0.0104813938960433, -0.010044094175100327, -0.009606793522834778, -0.009169493801891804, -0.008732193149626255, -0.008294893428683281, -0.007857592776417732, -0.007420292589813471, -0.0069829924032092094, -0.006545691750943661, -0.006108391564339399, -0.005671091377735138, -0.005233790725469589, -0.004796491004526615, -0.0043591903522610664, -0.003921890165656805, -0.0034845899790525436, -0.0030472897924482822, -0.002609989605844021, -0.0021726894192397594, -0.0017353889998048544, -0.001298088813200593, -0.0008607886265963316, -0.00042348820716142654, 1.3811979442834854e-05, 0.00045111216604709625, 0.0008884124108590186, 0.0013257126556709409, 0.001763012958690524, 0.0022003131452947855, 0.002637613331899047, 0.003074913751333952, 0.0035122139379382133, 0.003949514124542475, 0.004386814311146736, 0.0048241144977509975, 0.005261414684355259, 0.005698715336620808, 0.006136015057563782, 0.0065733157098293304, 0.007010615896433592, 0.007447916083037853, 0.007885216735303402, 0.008322516456246376, 0.008759817108511925, 0.009197116829454899, 0.009634417481720448, 0.010071717202663422, 0.01050901785492897, 0.010946318507194519, 0.011383619159460068, 0.011820918880403042, 0.01225821953266859, 0.012695519253611565, 0.013132819905877113, 0.013570120558142662, 0.014007420279085636, 0.01444472000002861]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 6.0, 10.0, 15.0, 10.0, 13.0, 17.0, 19.0, 15.0, 32.0, 21.0, 33.0, 29.0, 28.0, 44.0, 40.0, 40.0, 55.0, 36.0, 43.0, 54.0, 45.0, 33.0, 32.0, 42.0, 31.0, 38.0, 29.0, 29.0, 23.0, 26.0, 19.0, 11.0, 9.0, 14.0, 8.0, 9.0, 10.0, 7.0, 6.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004152177833020687, -0.004019753076136112, -0.003887328552082181, -0.0037549040280282497, -0.003622479271143675, -0.0034900547470897436, -0.0033576302230358124, -0.0032252054661512375, -0.0030927809420973063, -0.002960356418043375, -0.0028279316611588, -0.002695507137104869, -0.0025630826130509377, -0.0024306578561663628, -0.0022982333321124315, -0.0021658088080585003, -0.0020333840511739254, -0.0019009594107046723, -0.0017685347702354193, -0.001636110246181488, -0.001503685605712235, -0.001371260965242982, -0.0012388364411890507, -0.0011064118007197976, -0.0009739871602505445, -0.0008415625197812915, -0.0007091379375196993, -0.0005767133552581072, -0.0004442887147888541, -0.00031186407431960106, -0.0001794394920580089, -4.701490979641676e-05, 8.5409265011549e-05, 0.0002178338763769716, 0.0003502584877423942, 0.0004826830991078168, 0.0006151077104732394, 0.0007475323509424925, 0.0008799569332040846, 0.0010123815154656768, 0.0011448061559349298, 0.001277230796404183, 0.001409655436873436, 0.0015420799609273672, 0.0016745046013966203, 0.0018069292418658733, 0.0019393537659198046, 0.002071778289973736, 0.0022042030468583107, 0.002336627570912242, 0.002469052327796817, 0.002601476851850748, 0.002733901608735323, 0.002866326132789254, 0.0029987506568431854, 0.0031311754137277603, 0.0032635999377816916, 0.003396024461835623, 0.0035284492187201977, 0.003660873742774129, 0.00379329826682806, 0.003925723023712635, 0.00405814778059721, 0.0041905720718204975, 0.004322996828705072]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 11.0, 5.0, 10.0, 10.0, 13.0, 19.0, 20.0, 32.0, 41.0, 42.0, 67.0, 91.0, 125.0, 214.0, 349.0, 558.0, 938.0, 1765.0, 3501.0, 8183.0, 33187.0, 271515.0, 2989247.0, 793852.0, 68886.0, 12319.0, 4511.0, 2115.0, 1068.0, 602.0, 370.0, 187.0, 124.0, 102.0, 59.0, 27.0, 33.0, 19.0, 23.0, 9.0, 8.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.017578125, -0.017040729522705078, -0.016503334045410156, -0.015965938568115234, -0.015428543090820312, -0.01489114761352539, -0.014353752136230469, -0.013816356658935547, -0.013278961181640625, -0.012741565704345703, -0.012204170227050781, -0.01166677474975586, -0.011129379272460938, -0.010591983795166016, -0.010054588317871094, -0.009517192840576172, -0.00897979736328125, -0.008442401885986328, -0.007905006408691406, -0.007367610931396484, -0.0068302154541015625, -0.006292819976806641, -0.005755424499511719, -0.005218029022216797, -0.004680633544921875, -0.004143238067626953, -0.0036058425903320312, -0.0030684471130371094, -0.0025310516357421875, -0.0019936561584472656, -0.0014562606811523438, -0.0009188652038574219, -0.0003814697265625, 0.00015592575073242188, 0.0006933212280273438, 0.0012307167053222656, 0.0017681121826171875, 0.0023055076599121094, 0.0028429031372070312, 0.003380298614501953, 0.003917694091796875, 0.004455089569091797, 0.004992485046386719, 0.005529880523681641, 0.0060672760009765625, 0.006604671478271484, 0.007142066955566406, 0.007679462432861328, 0.00821685791015625, 0.008754253387451172, 0.009291648864746094, 0.009829044342041016, 0.010366439819335938, 0.01090383529663086, 0.011441230773925781, 0.011978626251220703, 0.012516021728515625, 0.013053417205810547, 0.013590812683105469, 0.01412820816040039, 0.014665603637695312, 0.015202999114990234, 0.015740394592285156, 0.016277790069580078, 0.016815185546875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 10.0, 5.0, 8.0, 5.0, 7.0, 10.0, 10.0, 18.0, 18.0, 23.0, 20.0, 29.0, 30.0, 23.0, 35.0, 34.0, 43.0, 41.0, 41.0, 58.0, 47.0, 36.0, 36.0, 41.0, 47.0, 35.0, 41.0, 38.0, 34.0, 25.0, 27.0, 26.0, 24.0, 17.0, 11.0, 10.0, 10.0, 7.0, 3.0, 4.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.003612518310546875, -0.003510773181915283, -0.0034090280532836914, -0.0033072829246520996, -0.003205537796020508, -0.003103792667388916, -0.0030020475387573242, -0.0029003024101257324, -0.0027985572814941406, -0.002696812152862549, -0.002595067024230957, -0.0024933218955993652, -0.0023915767669677734, -0.0022898316383361816, -0.00218808650970459, -0.002086341381072998, -0.0019845962524414062, -0.0018828511238098145, -0.0017811059951782227, -0.0016793608665466309, -0.001577615737915039, -0.0014758706092834473, -0.0013741254806518555, -0.0012723803520202637, -0.0011706352233886719, -0.00106889009475708, -0.0009671449661254883, -0.0008653998374938965, -0.0007636547088623047, -0.0006619095802307129, -0.0005601644515991211, -0.0004584193229675293, -0.0003566741943359375, -0.0002549290657043457, -0.0001531839370727539, -5.143880844116211e-05, 5.030632019042969e-05, 0.00015205144882202148, 0.0002537965774536133, 0.0003555417060852051, 0.0004572868347167969, 0.0005590319633483887, 0.0006607770919799805, 0.0007625222206115723, 0.0008642673492431641, 0.0009660124778747559, 0.0010677576065063477, 0.0011695027351379395, 0.0012712478637695312, 0.001372992992401123, 0.0014747381210327148, 0.0015764832496643066, 0.0016782283782958984, 0.0017799735069274902, 0.001881718635559082, 0.001983463764190674, 0.0020852088928222656, 0.0021869540214538574, 0.0022886991500854492, 0.002390444278717041, 0.002492189407348633, 0.0025939345359802246, 0.0026956796646118164, 0.002797424793243408, 0.002899169921875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 8.0, 2.0, 2.0, 3.0, 9.0, 6.0, 10.0, 17.0, 20.0, 20.0, 45.0, 86.0, 159.0, 479.0, 2400.0, 33039.0, 4123662.0, 31596.0, 1939.0, 380.0, 142.0, 75.0, 57.0, 35.0, 30.0, 32.0, 15.0, 7.0, 1.0, 6.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07379150390625, -0.07187461853027344, -0.06995773315429688, -0.06804084777832031, -0.06612396240234375, -0.06420707702636719, -0.062290191650390625, -0.06037330627441406, -0.0584564208984375, -0.05653953552246094, -0.054622650146484375, -0.05270576477050781, -0.05078887939453125, -0.04887199401855469, -0.046955108642578125, -0.04503822326660156, -0.043121337890625, -0.04120445251464844, -0.039287567138671875, -0.03737068176269531, -0.03545379638671875, -0.03353691101074219, -0.031620025634765625, -0.029703140258789062, -0.0277862548828125, -0.025869369506835938, -0.023952484130859375, -0.022035598754882812, -0.02011871337890625, -0.018201828002929688, -0.016284942626953125, -0.014368057250976562, -0.012451171875, -0.010534286499023438, -0.008617401123046875, -0.0067005157470703125, -0.00478363037109375, -0.0028667449951171875, -0.000949859619140625, 0.0009670257568359375, 0.0028839111328125, 0.0048007965087890625, 0.006717681884765625, 0.008634567260742188, 0.01055145263671875, 0.012468338012695312, 0.014385223388671875, 0.016302108764648438, 0.018218994140625, 0.020135879516601562, 0.022052764892578125, 0.023969650268554688, 0.02588653564453125, 0.027803421020507812, 0.029720306396484375, 0.03163719177246094, 0.0335540771484375, 0.03547096252441406, 0.037387847900390625, 0.03930473327636719, 0.04122161865234375, 0.04313850402832031, 0.045055389404296875, 0.04697227478027344, 0.04888916015625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 7.0, 13.0, 15.0, 25.0, 35.0, 53.0, 69.0, 89.0, 170.0, 347.0, 711.0, 1039.0, 751.0, 355.0, 159.0, 65.0, 50.0, 21.0, 24.0, 12.0, 10.0, 5.0, 7.0, 14.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002323150634765625, -0.0022136569023132324, -0.00210416316986084, -0.0019946694374084473, -0.0018851757049560547, -0.0017756819725036621, -0.0016661882400512695, -0.001556694507598877, -0.0014472007751464844, -0.0013377070426940918, -0.0012282133102416992, -0.0011187195777893066, -0.001009225845336914, -0.0008997321128845215, -0.0007902383804321289, -0.0006807446479797363, -0.0005712509155273438, -0.00046175718307495117, -0.0003522634506225586, -0.00024276971817016602, -0.00013327598571777344, -2.378225326538086e-05, 8.571147918701172e-05, 0.0001952052116394043, 0.0003046989440917969, 0.00041419267654418945, 0.000523686408996582, 0.0006331801414489746, 0.0007426738739013672, 0.0008521676063537598, 0.0009616613388061523, 0.001071155071258545, 0.0011806488037109375, 0.00129014253616333, 0.0013996362686157227, 0.0015091300010681152, 0.0016186237335205078, 0.0017281174659729004, 0.001837611198425293, 0.0019471049308776855, 0.002056598663330078, 0.0021660923957824707, 0.0022755861282348633, 0.002385079860687256, 0.0024945735931396484, 0.002604067325592041, 0.0027135610580444336, 0.002823054790496826, 0.0029325485229492188, 0.0030420422554016113, 0.003151535987854004, 0.0032610297203063965, 0.003370523452758789, 0.0034800171852111816, 0.0035895109176635742, 0.003699004650115967, 0.0038084983825683594, 0.003917992115020752, 0.0040274858474731445, 0.004136979579925537, 0.00424647331237793, 0.004355967044830322, 0.004465460777282715, 0.004574954509735107, 0.0046844482421875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 15.0, 16.0, 33.0, 49.0, 109.0, 269.0, 265.0, 118.0, 64.0, 29.0, 12.0, 8.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009239403530955315, -0.00872760359197855, -0.008215803653001785, -0.007704002782702446, -0.007192202843725681, -0.006680402904748917, -0.006168602500110865, -0.005656802095472813, -0.005145002156496048, -0.004633202217519283, -0.004121401812881231, -0.003609601641073823, -0.0030978014692664146, -0.0025860012974590063, -0.002074201125651598, -0.0015624009538441896, -0.0010506007820367813, -0.000538800610229373, -2.7000438421964645e-05, 0.0004847997333854437, 0.000996599905192852, 0.0015084000770002604, 0.0020202002488076687, 0.002532000420615077, 0.0030438005924224854, 0.0035556007642298937, 0.004067400936037302, 0.004579201340675354, 0.005091001279652119, 0.005602801218628883, 0.006114601623266935, 0.006626402027904987, 0.007138200104236603, 0.0076500000432133675, 0.008161799982190132, 0.008673600852489471, 0.009185400791466236, 0.009697200730443, 0.01020900160074234, 0.010720801539719105, 0.01123260147869587, 0.011744401417672634, 0.012256201356649399, 0.012768002226948738, 0.013279802165925503, 0.013791602104902267, 0.014303402975201607, 0.014815202914178371, 0.015327002853155136, 0.015838803723454475, 0.016350602731108665, 0.016862403601408005, 0.017374202609062195, 0.017886003479361534, 0.018397804349660873, 0.018909603357315063, 0.019421404227614403, 0.019933205097913742, 0.020445004105567932, 0.02095680497586727, 0.02146860584616661, 0.0219804048538208, 0.02249220572412014, 0.02300400473177433, 0.02351580560207367]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 9.0, 6.0, 10.0, 15.0, 15.0, 30.0, 27.0, 35.0, 30.0, 27.0, 32.0, 40.0, 53.0, 45.0, 61.0, 53.0, 56.0, 48.0, 45.0, 47.0, 63.0, 43.0, 32.0, 32.0, 27.0, 24.0, 23.0, 16.0, 13.0, 10.0, 13.0, 6.0, 5.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005774387624114752, -0.005598601885139942, -0.0054228161461651325, -0.005247030407190323, -0.005071244668215513, -0.004895458929240704, -0.004719672724604607, -0.004543887451291084, -0.004368101246654987, -0.004192315507680178, -0.004016529768705368, -0.0038407440297305584, -0.0036649582907557487, -0.003489172551780939, -0.003313386579975486, -0.003137600841000676, -0.00296181533485651, -0.0027860295958817005, -0.002610243856906891, -0.0024344581179320812, -0.0022586723789572716, -0.002082886639982462, -0.0019071006681770086, -0.001731314929202199, -0.0015555291902273893, -0.0013797434512525797, -0.00120395771227777, -0.0010281718568876386, -0.0008523861179128289, -0.0006766003789380193, -0.0005008145235478878, -0.00032502878457307816, -0.0001492430455982685, 2.6542722480371594e-05, 0.0002023284905590117, 0.00037811428774148226, 0.0005539000267162919, 0.0007296857656911016, 0.000905471621081233, 0.0010812573600560427, 0.0012570430990308523, 0.001432828838005662, 0.0016086145769804716, 0.001784400432370603, 0.0019601862877607346, 0.002135972026735544, 0.002311757765710354, 0.0024875435046851635, 0.002663329243659973, 0.002839114982634783, 0.0030149007216095924, 0.003190686460584402, 0.0033664721995592117, 0.0035422579385340214, 0.0037180439103394747, 0.0038938296493142843, 0.00406961515545845, 0.00424540089443326, 0.00442118663340807, 0.004596972372382879, 0.004772758111357689, 0.0049485438503324986, 0.005124329589307308, 0.005300115793943405, 0.005475901532918215]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 19.0, 24.0, 37.0, 57.0, 88.0, 147.0, 196.0, 272.0, 407.0, 716.0, 1117.0, 2076.0, 3410.0, 6111.0, 10879.0, 20153.0, 37629.0, 69801.0, 134087.0, 272708.0, 236207.0, 116948.0, 61619.0, 33151.0, 17788.0, 9766.0, 5419.0, 3076.0, 1717.0, 1076.0, 677.0, 405.0, 255.0, 159.0, 108.0, 57.0, 35.0, 32.0, 29.0, 25.0, 13.0, 9.0, 10.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0013484954833984375, -0.0013062208890914917, -0.001263946294784546, -0.0012216717004776, -0.0011793971061706543, -0.0011371225118637085, -0.0010948479175567627, -0.001052573323249817, -0.001010298728942871, -0.0009680241346359253, -0.0009257495403289795, -0.0008834749460220337, -0.0008412003517150879, -0.0007989257574081421, -0.0007566511631011963, -0.0007143765687942505, -0.0006721019744873047, -0.0006298273801803589, -0.0005875527858734131, -0.0005452781915664673, -0.0005030035972595215, -0.0004607290029525757, -0.0004184544086456299, -0.0003761798143386841, -0.0003339052200317383, -0.0002916306257247925, -0.0002493560314178467, -0.00020708143711090088, -0.00016480684280395508, -0.00012253224849700928, -8.025765419006348e-05, -3.7983059883117676e-05, 4.291534423828125e-06, 4.6566128730773926e-05, 8.884072303771973e-05, 0.00013111531734466553, 0.00017338991165161133, 0.00021566450595855713, 0.00025793910026550293, 0.00030021369457244873, 0.00034248828887939453, 0.00038476288318634033, 0.00042703747749328613, 0.00046931207180023193, 0.0005115866661071777, 0.0005538612604141235, 0.0005961358547210693, 0.0006384104490280151, 0.0006806850433349609, 0.0007229596376419067, 0.0007652342319488525, 0.0008075088262557983, 0.0008497834205627441, 0.0008920580148696899, 0.0009343326091766357, 0.0009766072034835815, 0.0010188817977905273, 0.0010611563920974731, 0.001103430986404419, 0.0011457055807113647, 0.0011879801750183105, 0.0012302547693252563, 0.0012725293636322021, 0.001314803957939148, 0.0013570785522460938]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 6.0, 14.0, 17.0, 23.0, 26.0, 36.0, 25.0, 32.0, 41.0, 35.0, 56.0, 56.0, 63.0, 63.0, 56.0, 55.0, 51.0, 44.0, 48.0, 47.0, 34.0, 27.0, 31.0, 19.0, 19.0, 15.0, 18.0, 10.0, 8.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00522613525390625, -0.005066990852355957, -0.004907846450805664, -0.004748702049255371, -0.004589557647705078, -0.004430413246154785, -0.004271268844604492, -0.004112124443054199, -0.003952980041503906, -0.0037938356399536133, -0.0036346912384033203, -0.0034755468368530273, -0.0033164024353027344, -0.0031572580337524414, -0.0029981136322021484, -0.0028389692306518555, -0.0026798248291015625, -0.0025206804275512695, -0.0023615360260009766, -0.0022023916244506836, -0.0020432472229003906, -0.0018841028213500977, -0.0017249584197998047, -0.0015658140182495117, -0.0014066696166992188, -0.0012475252151489258, -0.0010883808135986328, -0.0009292364120483398, -0.0007700920104980469, -0.0006109476089477539, -0.00045180320739746094, -0.00029265880584716797, -0.000133514404296875, 2.562999725341797e-05, 0.00018477439880371094, 0.0003439188003540039, 0.0005030632019042969, 0.0006622076034545898, 0.0008213520050048828, 0.0009804964065551758, 0.0011396408081054688, 0.0012987852096557617, 0.0014579296112060547, 0.0016170740127563477, 0.0017762184143066406, 0.0019353628158569336, 0.0020945072174072266, 0.0022536516189575195, 0.0024127960205078125, 0.0025719404220581055, 0.0027310848236083984, 0.0028902292251586914, 0.0030493736267089844, 0.0032085180282592773, 0.0033676624298095703, 0.0035268068313598633, 0.0036859512329101562, 0.0038450956344604492, 0.004004240036010742, 0.004163384437561035, 0.004322528839111328, 0.004481673240661621, 0.004640817642211914, 0.004799962043762207, 0.0049591064453125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 10.0, 6.0, 7.0, 8.0, 26.0, 31.0, 45.0, 84.0, 122.0, 205.0, 348.0, 604.0, 955.0, 1605.0, 2699.0, 4571.0, 7970.0, 14317.0, 25830.0, 48229.0, 93426.0, 207010.0, 335972.0, 147695.0, 71767.0, 37657.0, 20339.0, 11424.0, 6311.0, 3750.0, 2254.0, 1313.0, 804.0, 435.0, 264.0, 177.0, 107.0, 63.0, 41.0, 30.0, 23.0, 10.0, 13.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013208389282226562, -0.0012811720371246338, -0.0012415051460266113, -0.0012018382549285889, -0.0011621713638305664, -0.001122504472732544, -0.0010828375816345215, -0.001043170690536499, -0.0010035037994384766, -0.0009638369083404541, -0.0009241700172424316, -0.0008845031261444092, -0.0008448362350463867, -0.0008051693439483643, -0.0007655024528503418, -0.0007258355617523193, -0.0006861686706542969, -0.0006465017795562744, -0.000606834888458252, -0.0005671679973602295, -0.000527501106262207, -0.00048783421516418457, -0.0004481673240661621, -0.00040850043296813965, -0.0003688335418701172, -0.0003291666507720947, -0.00028949975967407227, -0.0002498328685760498, -0.00021016597747802734, -0.00017049908638000488, -0.00013083219528198242, -9.116530418395996e-05, -5.14984130859375e-05, -1.1831521987915039e-05, 2.7835369110107422e-05, 6.750226020812988e-05, 0.00010716915130615234, 0.0001468360424041748, 0.00018650293350219727, 0.00022616982460021973, 0.0002658367156982422, 0.00030550360679626465, 0.0003451704978942871, 0.00038483738899230957, 0.00042450428009033203, 0.0004641711711883545, 0.000503838062286377, 0.0005435049533843994, 0.0005831718444824219, 0.0006228387355804443, 0.0006625056266784668, 0.0007021725177764893, 0.0007418394088745117, 0.0007815062999725342, 0.0008211731910705566, 0.0008608400821685791, 0.0009005069732666016, 0.000940173864364624, 0.0009798407554626465, 0.001019507646560669, 0.0010591745376586914, 0.0010988414287567139, 0.0011385083198547363, 0.0011781752109527588, 0.0012178421020507812]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 11.0, 10.0, 10.0, 13.0, 18.0, 23.0, 30.0, 35.0, 33.0, 44.0, 49.0, 43.0, 31.0, 58.0, 43.0, 61.0, 53.0, 40.0, 37.0, 46.0, 47.0, 37.0, 39.0, 39.0, 18.0, 25.0, 18.0, 14.0, 10.0, 16.0, 13.0, 10.0, 9.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003101348876953125, -0.0030083060264587402, -0.0029152631759643555, -0.0028222203254699707, -0.002729177474975586, -0.002636134624481201, -0.0025430917739868164, -0.0024500489234924316, -0.002357006072998047, -0.002263963222503662, -0.0021709203720092773, -0.0020778775215148926, -0.001984834671020508, -0.001891791820526123, -0.0017987489700317383, -0.0017057061195373535, -0.0016126632690429688, -0.001519620418548584, -0.0014265775680541992, -0.0013335347175598145, -0.0012404918670654297, -0.001147449016571045, -0.0010544061660766602, -0.0009613633155822754, -0.0008683204650878906, -0.0007752776145935059, -0.0006822347640991211, -0.0005891919136047363, -0.0004961490631103516, -0.0004031062126159668, -0.00031006336212158203, -0.00021702051162719727, -0.0001239776611328125, -3.0934810638427734e-05, 6.210803985595703e-05, 0.0001551508903503418, 0.00024819374084472656, 0.00034123659133911133, 0.0004342794418334961, 0.0005273222923278809, 0.0006203651428222656, 0.0007134079933166504, 0.0008064508438110352, 0.0008994936943054199, 0.0009925365447998047, 0.0010855793952941895, 0.0011786222457885742, 0.001271665096282959, 0.0013647079467773438, 0.0014577507972717285, 0.0015507936477661133, 0.001643836498260498, 0.0017368793487548828, 0.0018299221992492676, 0.0019229650497436523, 0.002016007900238037, 0.002109050750732422, 0.0022020936012268066, 0.0022951364517211914, 0.002388179302215576, 0.002481222152709961, 0.0025742650032043457, 0.0026673078536987305, 0.0027603507041931152, 0.0028533935546875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 16.0, 25.0, 24.0, 43.0, 82.0, 86.0, 164.0, 219.0, 418.0, 797.0, 1382.0, 2657.0, 5790.0, 15658.0, 57379.0, 610457.0, 289230.0, 41653.0, 12261.0, 4978.0, 2294.0, 1226.0, 682.0, 364.0, 207.0, 154.0, 87.0, 64.0, 36.0, 32.0, 15.0, 25.0, 8.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002321004867553711, -0.00022482313215732574, -0.0002175457775592804, -0.00021026842296123505, -0.0002029910683631897, -0.00019571371376514435, -0.000188436359167099, -0.00018115900456905365, -0.0001738816499710083, -0.00016660429537296295, -0.0001593269407749176, -0.00015204958617687225, -0.0001447722315788269, -0.00013749487698078156, -0.0001302175223827362, -0.00012294016778469086, -0.00011566281318664551, -0.00010838545858860016, -0.00010110810399055481, -9.383074939250946e-05, -8.655339479446411e-05, -7.927604019641876e-05, -7.199868559837341e-05, -6.472133100032806e-05, -5.7443976402282715e-05, -5.0166621804237366e-05, -4.2889267206192017e-05, -3.561191260814667e-05, -2.833455801010132e-05, -2.105720341205597e-05, -1.377984881401062e-05, -6.502494215965271e-06, 7.748603820800781e-07, 8.052214980125427e-06, 1.5329569578170776e-05, 2.2606924176216125e-05, 2.9884278774261475e-05, 3.7161633372306824e-05, 4.443898797035217e-05, 5.171634256839752e-05, 5.899369716644287e-05, 6.627105176448822e-05, 7.354840636253357e-05, 8.082576096057892e-05, 8.810311555862427e-05, 9.538047015666962e-05, 0.00010265782475471497, 0.00010993517935276031, 0.00011721253395080566, 0.000124489888548851, 0.00013176724314689636, 0.0001390445977449417, 0.00014632195234298706, 0.0001535993069410324, 0.00016087666153907776, 0.0001681540161371231, 0.00017543137073516846, 0.0001827087253332138, 0.00018998607993125916, 0.0001972634345293045, 0.00020454078912734985, 0.0002118181437253952, 0.00021909549832344055, 0.0002263728529214859, 0.00023365020751953125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 8.0, 11.0, 12.0, 18.0, 12.0, 29.0, 23.0, 34.0, 62.0, 62.0, 44.0, 59.0, 55.0, 82.0, 60.0, 59.0, 63.0, 49.0, 54.0, 28.0, 31.0, 26.0, 15.0, 15.0, 16.0, 13.0, 5.0, 13.0, 4.0, 5.0, 5.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-1.2099742889404297e-05, -1.1730939149856567e-05, -1.1362135410308838e-05, -1.0993331670761108e-05, -1.0624527931213379e-05, -1.025572419166565e-05, -9.88692045211792e-06, -9.51811671257019e-06, -9.149312973022461e-06, -8.780509233474731e-06, -8.411705493927002e-06, -8.042901754379272e-06, -7.674098014831543e-06, -7.3052942752838135e-06, -6.936490535736084e-06, -6.5676867961883545e-06, -6.198883056640625e-06, -5.8300793170928955e-06, -5.461275577545166e-06, -5.0924718379974365e-06, -4.723668098449707e-06, -4.3548643589019775e-06, -3.986060619354248e-06, -3.6172568798065186e-06, -3.248453140258789e-06, -2.8796494007110596e-06, -2.51084566116333e-06, -2.1420419216156006e-06, -1.773238182067871e-06, -1.4044344425201416e-06, -1.0356307029724121e-06, -6.668269634246826e-07, -2.980232238769531e-07, 7.078051567077637e-08, 4.3958425521850586e-07, 8.083879947662354e-07, 1.1771917343139648e-06, 1.5459954738616943e-06, 1.914799213409424e-06, 2.2836029529571533e-06, 2.652406692504883e-06, 3.0212104320526123e-06, 3.390014171600342e-06, 3.7588179111480713e-06, 4.127621650695801e-06, 4.49642539024353e-06, 4.86522912979126e-06, 5.234032869338989e-06, 5.602836608886719e-06, 5.971640348434448e-06, 6.340444087982178e-06, 6.709247827529907e-06, 7.078051567077637e-06, 7.446855306625366e-06, 7.815659046173096e-06, 8.184462785720825e-06, 8.553266525268555e-06, 8.922070264816284e-06, 9.290874004364014e-06, 9.659677743911743e-06, 1.0028481483459473e-05, 1.0397285223007202e-05, 1.0766088962554932e-05, 1.1134892702102661e-05, 1.150369644165039e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 8.0, 7.0, 3.0, 10.0, 12.0, 29.0, 37.0, 129.0, 516.0, 3601.0, 77607.0, 948587.0, 16073.0, 1465.0, 278.0, 80.0, 39.0, 15.0, 9.0, 4.0, 5.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.0011205673217773438, -0.001086905598640442, -0.00105324387550354, -0.0010195821523666382, -0.0009859204292297363, -0.0009522587060928345, -0.0009185969829559326, -0.0008849352598190308, -0.0008512735366821289, -0.000817611813545227, -0.0007839500904083252, -0.0007502883672714233, -0.0007166266441345215, -0.0006829649209976196, -0.0006493031978607178, -0.0006156414747238159, -0.0005819797515869141, -0.0005483180284500122, -0.0005146563053131104, -0.0004809945821762085, -0.00044733285903930664, -0.0004136711359024048, -0.00038000941276550293, -0.0003463476896286011, -0.0003126859664916992, -0.00027902424335479736, -0.0002453625202178955, -0.00021170079708099365, -0.0001780390739440918, -0.00014437735080718994, -0.00011071562767028809, -7.705390453338623e-05, -4.3392181396484375e-05, -9.73045825958252e-06, 2.3931264877319336e-05, 5.759298801422119e-05, 9.125471115112305e-05, 0.0001249164342880249, 0.00015857815742492676, 0.0001922398805618286, 0.00022590160369873047, 0.0002595633268356323, 0.0002932250499725342, 0.00032688677310943604, 0.0003605484962463379, 0.00039421021938323975, 0.0004278719425201416, 0.00046153366565704346, 0.0004951953887939453, 0.0005288571119308472, 0.000562518835067749, 0.0005961805582046509, 0.0006298422813415527, 0.0006635040044784546, 0.0006971657276153564, 0.0007308274507522583, 0.0007644891738891602, 0.000798150897026062, 0.0008318126201629639, 0.0008654743432998657, 0.0008991360664367676, 0.0009327977895736694, 0.0009664595127105713, 0.0010001212358474731, 0.001033782958984375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 3.0, 3.0, 4.0, 9.0, 6.0, 13.0, 11.0, 18.0, 24.0, 35.0, 40.0, 62.0, 105.0, 216.0, 141.0, 93.0, 48.0, 41.0, 31.0, 27.0, 15.0, 7.0, 12.0, 6.0, 9.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.257129669189453e-05, -5.086418241262436e-05, -4.915706813335419e-05, -4.7449953854084015e-05, -4.574283957481384e-05, -4.403572529554367e-05, -4.23286110162735e-05, -4.0621496737003326e-05, -3.8914382457733154e-05, -3.720726817846298e-05, -3.550015389919281e-05, -3.379303961992264e-05, -3.2085925340652466e-05, -3.0378811061382294e-05, -2.867169678211212e-05, -2.696458250284195e-05, -2.5257468223571777e-05, -2.3550353944301605e-05, -2.1843239665031433e-05, -2.013612538576126e-05, -1.842901110649109e-05, -1.6721896827220917e-05, -1.5014782547950745e-05, -1.3307668268680573e-05, -1.16005539894104e-05, -9.893439710140228e-06, -8.186325430870056e-06, -6.479211151599884e-06, -4.772096872329712e-06, -3.06498259305954e-06, -1.3578683137893677e-06, 3.4924596548080444e-07, 2.0563602447509766e-06, 3.7634745240211487e-06, 5.470588803291321e-06, 7.177703082561493e-06, 8.884817361831665e-06, 1.0591931641101837e-05, 1.229904592037201e-05, 1.4006160199642181e-05, 1.5713274478912354e-05, 1.7420388758182526e-05, 1.9127503037452698e-05, 2.083461731672287e-05, 2.2541731595993042e-05, 2.4248845875263214e-05, 2.5955960154533386e-05, 2.766307443380356e-05, 2.937018871307373e-05, 3.10773029923439e-05, 3.2784417271614075e-05, 3.449153155088425e-05, 3.619864583015442e-05, 3.790576010942459e-05, 3.961287438869476e-05, 4.1319988667964935e-05, 4.302710294723511e-05, 4.473421722650528e-05, 4.644133150577545e-05, 4.8148445785045624e-05, 4.9855560064315796e-05, 5.156267434358597e-05, 5.326978862285614e-05, 5.497690290212631e-05, 5.6684017181396484e-05]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 11.0, 16.0, 16.0, 40.0, 50.0, 89.0, 190.0, 225.0, 145.0, 82.0, 49.0, 37.0, 18.0, 8.0, 6.0, 6.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007299551274627447, -0.006940724793821573, -0.006581898778676987, -0.006223072297871113, -0.005864245817065239, -0.005505419336259365, -0.0051465933211147785, -0.004787766840308905, -0.004428940825164318, -0.004070114344358444, -0.003711288096383214, -0.0033524618484079838, -0.00299363536760211, -0.0026348091196268797, -0.0022759828716516495, -0.0019171563908457756, -0.0015583299100399017, -0.0011995035456493497, -0.0008406772394664586, -0.00048185093328356743, -0.00012302456889301538, 0.00023580179549753666, 0.0005946280434727669, 0.0009534545242786407, 0.001312280772253871, 0.001671107136644423, 0.002029933501034975, 0.0023887597490102053, 0.0027475859969854355, 0.0031064124777913094, 0.0034652387257665396, 0.0038240652065724134, 0.004182890988886356, 0.00454171746969223, 0.004900543484836817, 0.005259369965642691, 0.0056181964464485645, 0.005977022461593151, 0.006335848942399025, 0.006694675423204899, 0.007053501904010773, 0.007412328384816647, 0.007771154399961233, 0.00812998041510582, 0.008488806895911694, 0.008847633376717567, 0.009206459857523441, 0.009565286338329315, 0.009924111887812614, 0.010282938368618488, 0.010641764849424362, 0.011000590398907661, 0.011359416879713535, 0.01171824336051941, 0.012077069841325283, 0.012435896322131157, 0.01279472280293703, 0.013153549283742905, 0.013512375764548779, 0.013871202245354652, 0.014230027794837952, 0.014588854275643826, 0.0149476807564497, 0.015306507237255573, 0.015665333718061447]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 9.0, 9.0, 8.0, 12.0, 17.0, 29.0, 26.0, 33.0, 33.0, 24.0, 28.0, 42.0, 48.0, 46.0, 65.0, 55.0, 51.0, 42.0, 58.0, 49.0, 51.0, 44.0, 37.0, 31.0, 29.0, 29.0, 26.0, 11.0, 13.0, 13.0, 7.0, 14.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004636884666979313, -0.00449325330555439, -0.004349621944129467, -0.004205991048365831, -0.004062359686940908, -0.0039187283255159855, -0.003775097196921706, -0.003631466068327427, -0.003487834706902504, -0.003344203345477581, -0.0032005722168833017, -0.0030569410882890224, -0.0029133097268640995, -0.0027696783654391766, -0.0026260472368448973, -0.002482416108250618, -0.002338784746825695, -0.002195153385400772, -0.002051522256806493, -0.0019078910117968917, -0.0017642597667872906, -0.0016206285217776895, -0.0014769972767680883, -0.0013333660317584872, -0.001189734786748886, -0.001046103541739285, -0.0009024722967296839, -0.0007588410517200828, -0.0006152098067104816, -0.00047157856170088053, -0.0003279473166912794, -0.0001843160716816783, -4.068436101078987e-05, 0.00010294688399881124, 0.00024657812900841236, 0.0003902093740180135, 0.0005338406190276146, 0.0006774718640372157, 0.0008211031090468168, 0.0009647343540564179, 0.001108365599066019, 0.0012519968440756202, 0.0013956280890852213, 0.0015392593340948224, 0.0016828905791044235, 0.0018265218241140246, 0.0019701530691236258, 0.002113784197717905, 0.002257415559142828, 0.002401046920567751, 0.0025446780491620302, 0.0026883091777563095, 0.0028319405391812325, 0.0029755719006061554, 0.0031192030292004347, 0.003262834157794714, 0.003406465519219637, 0.00355009688064456, 0.003693728009238839, 0.0038373591378331184, 0.003980990499258041, 0.004124621860682964, 0.004268253222107887, 0.004411884117871523, 0.004555515479296446]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 6.0, 6.0, 11.0, 10.0, 15.0, 28.0, 36.0, 49.0, 68.0, 123.0, 154.0, 244.0, 493.0, 925.0, 2334.0, 6209.0, 20264.0, 87233.0, 579521.0, 281084.0, 49390.0, 12688.0, 4259.0, 1714.0, 689.0, 354.0, 194.0, 147.0, 96.0, 62.0, 38.0, 31.0, 28.0, 13.0, 14.0, 9.0, 5.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0235595703125, -0.022819042205810547, -0.022078514099121094, -0.02133798599243164, -0.020597457885742188, -0.019856929779052734, -0.01911640167236328, -0.018375873565673828, -0.017635345458984375, -0.016894817352294922, -0.01615428924560547, -0.015413761138916016, -0.014673233032226562, -0.01393270492553711, -0.013192176818847656, -0.012451648712158203, -0.01171112060546875, -0.010970592498779297, -0.010230064392089844, -0.00948953628540039, -0.008749008178710938, -0.008008480072021484, -0.007267951965332031, -0.006527423858642578, -0.005786895751953125, -0.005046367645263672, -0.004305839538574219, -0.0035653114318847656, -0.0028247833251953125, -0.0020842552185058594, -0.0013437271118164062, -0.0006031990051269531, 0.0001373291015625, 0.0008778572082519531, 0.0016183853149414062, 0.0023589134216308594, 0.0030994415283203125, 0.0038399696350097656, 0.004580497741699219, 0.005321025848388672, 0.006061553955078125, 0.006802082061767578, 0.007542610168457031, 0.008283138275146484, 0.009023666381835938, 0.00976419448852539, 0.010504722595214844, 0.011245250701904297, 0.01198577880859375, 0.012726306915283203, 0.013466835021972656, 0.01420736312866211, 0.014947891235351562, 0.015688419342041016, 0.01642894744873047, 0.017169475555419922, 0.017910003662109375, 0.018650531768798828, 0.01939105987548828, 0.020131587982177734, 0.020872116088867188, 0.02161264419555664, 0.022353172302246094, 0.023093700408935547, 0.023834228515625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 4.0, 15.0, 12.0, 13.0, 21.0, 29.0, 23.0, 27.0, 26.0, 33.0, 41.0, 47.0, 49.0, 42.0, 61.0, 70.0, 51.0, 58.0, 48.0, 46.0, 46.0, 41.0, 34.0, 32.0, 32.0, 19.0, 19.0, 17.0, 7.0, 8.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0074005126953125, -0.007166624069213867, -0.006932735443115234, -0.0066988468170166016, -0.006464958190917969, -0.006231069564819336, -0.005997180938720703, -0.00576329231262207, -0.0055294036865234375, -0.005295515060424805, -0.005061626434326172, -0.004827737808227539, -0.004593849182128906, -0.0043599605560302734, -0.004126071929931641, -0.003892183303833008, -0.003658294677734375, -0.003424406051635742, -0.0031905174255371094, -0.0029566287994384766, -0.0027227401733398438, -0.002488851547241211, -0.002254962921142578, -0.0020210742950439453, -0.0017871856689453125, -0.0015532970428466797, -0.0013194084167480469, -0.001085519790649414, -0.0008516311645507812, -0.0006177425384521484, -0.0003838539123535156, -0.0001499652862548828, 8.392333984375e-05, 0.0003178119659423828, 0.0005517005920410156, 0.0007855892181396484, 0.0010194778442382812, 0.001253366470336914, 0.0014872550964355469, 0.0017211437225341797, 0.0019550323486328125, 0.0021889209747314453, 0.002422809600830078, 0.002656698226928711, 0.0028905868530273438, 0.0031244754791259766, 0.0033583641052246094, 0.003592252731323242, 0.003826141357421875, 0.004060029983520508, 0.004293918609619141, 0.0045278072357177734, 0.004761695861816406, 0.004995584487915039, 0.005229473114013672, 0.005463361740112305, 0.0056972503662109375, 0.00593113899230957, 0.006165027618408203, 0.006398916244506836, 0.006632804870605469, 0.0068666934967041016, 0.007100582122802734, 0.007334470748901367, 0.007568359375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 3.0, 12.0, 12.0, 16.0, 21.0, 31.0, 30.0, 32.0, 42.0, 53.0, 41.0, 124.0, 1203.0, 35984.0, 993802.0, 15975.0, 716.0, 174.0, 49.0, 44.0, 46.0, 33.0, 29.0, 15.0, 7.0, 19.0, 7.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08709716796875, -0.08391952514648438, -0.08074188232421875, -0.07756423950195312, -0.0743865966796875, -0.07120895385742188, -0.06803131103515625, -0.06485366821289062, -0.061676025390625, -0.058498382568359375, -0.05532073974609375, -0.052143096923828125, -0.0489654541015625, -0.045787811279296875, -0.04261016845703125, -0.039432525634765625, -0.0362548828125, -0.033077239990234375, -0.02989959716796875, -0.026721954345703125, -0.0235443115234375, -0.020366668701171875, -0.01718902587890625, -0.014011383056640625, -0.010833740234375, -0.007656097412109375, -0.00447845458984375, -0.001300811767578125, 0.0018768310546875, 0.005054473876953125, 0.00823211669921875, 0.011409759521484375, 0.01458740234375, 0.017765045166015625, 0.02094268798828125, 0.024120330810546875, 0.0272979736328125, 0.030475616455078125, 0.03365325927734375, 0.036830902099609375, 0.040008544921875, 0.043186187744140625, 0.04636383056640625, 0.049541473388671875, 0.0527191162109375, 0.055896759033203125, 0.05907440185546875, 0.062252044677734375, 0.0654296875, 0.06860733032226562, 0.07178497314453125, 0.07496261596679688, 0.0781402587890625, 0.08131790161132812, 0.08449554443359375, 0.08767318725585938, 0.090850830078125, 0.09402847290039062, 0.09720611572265625, 0.10038375854492188, 0.1035614013671875, 0.10673904418945312, 0.10991668701171875, 0.11309432983398438, 0.11627197265625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 8.0, 8.0, 14.0, 18.0, 23.0, 30.0, 25.0, 33.0, 42.0, 46.0, 41.0, 44.0, 52.0, 64.0, 75.0, 52.0, 65.0, 59.0, 49.0, 36.0, 44.0, 43.0, 23.0, 20.0, 20.0, 10.0, 12.0, 8.0, 9.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007232666015625, -0.006971001625061035, -0.00670933723449707, -0.0064476728439331055, -0.006186008453369141, -0.005924344062805176, -0.005662679672241211, -0.005401015281677246, -0.005139350891113281, -0.004877686500549316, -0.0046160221099853516, -0.004354357719421387, -0.004092693328857422, -0.003831028938293457, -0.003569364547729492, -0.0033077001571655273, -0.0030460357666015625, -0.0027843713760375977, -0.002522706985473633, -0.002261042594909668, -0.001999378204345703, -0.0017377138137817383, -0.0014760494232177734, -0.0012143850326538086, -0.0009527206420898438, -0.0006910562515258789, -0.00042939186096191406, -0.00016772747039794922, 9.393692016601562e-05, 0.00035560131072998047, 0.0006172657012939453, 0.0008789300918579102, 0.001140594482421875, 0.0014022588729858398, 0.0016639232635498047, 0.0019255876541137695, 0.0021872520446777344, 0.0024489164352416992, 0.002710580825805664, 0.002972245216369629, 0.0032339096069335938, 0.0034955739974975586, 0.0037572383880615234, 0.004018902778625488, 0.004280567169189453, 0.004542231559753418, 0.004803895950317383, 0.005065560340881348, 0.0053272247314453125, 0.005588889122009277, 0.005850553512573242, 0.006112217903137207, 0.006373882293701172, 0.006635546684265137, 0.0068972110748291016, 0.007158875465393066, 0.007420539855957031, 0.007682204246520996, 0.007943868637084961, 0.008205533027648926, 0.00846719741821289, 0.008728861808776855, 0.00899052619934082, 0.009252190589904785, 0.00951385498046875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 7.0, 5.0, 6.0, 10.0, 12.0, 23.0, 23.0, 44.0, 85.0, 141.0, 340.0, 955.0, 3078.0, 10621.0, 84756.0, 917976.0, 22595.0, 5198.0, 1660.0, 575.0, 203.0, 89.0, 65.0, 37.0, 25.0, 9.0, 8.0, 11.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012385845184326172, -0.00011706538498401642, -0.00011027231812477112, -0.00010347925126552582, -9.668618440628052e-05, -8.989311754703522e-05, -8.310005068778992e-05, -7.630698382854462e-05, -6.951391696929932e-05, -6.272085011005402e-05, -5.5927783250808716e-05, -4.9134716391563416e-05, -4.2341649532318115e-05, -3.5548582673072815e-05, -2.8755515813827515e-05, -2.1962448954582214e-05, -1.5169382095336914e-05, -8.376315236091614e-06, -1.5832483768463135e-06, 5.209818482398987e-06, 1.2002885341644287e-05, 1.8795952200889587e-05, 2.5589019060134888e-05, 3.238208591938019e-05, 3.917515277862549e-05, 4.596821963787079e-05, 5.276128649711609e-05, 5.955435335636139e-05, 6.634742021560669e-05, 7.314048707485199e-05, 7.993355393409729e-05, 8.672662079334259e-05, 9.351968765258789e-05, 0.00010031275451183319, 0.00010710582137107849, 0.00011389888823032379, 0.00012069195508956909, 0.0001274850219488144, 0.0001342780888080597, 0.000141071155667305, 0.0001478642225265503, 0.0001546572893857956, 0.0001614503562450409, 0.0001682434231042862, 0.0001750364899635315, 0.0001818295568227768, 0.0001886226236820221, 0.0001954156905412674, 0.0002022087574005127, 0.000209001824259758, 0.0002157948911190033, 0.0002225879579782486, 0.0002293810248374939, 0.0002361740916967392, 0.0002429671585559845, 0.0002497602254152298, 0.0002565532922744751, 0.0002633463591337204, 0.0002701394259929657, 0.000276932492852211, 0.0002837255597114563, 0.0002905186265707016, 0.0002973116934299469, 0.0003041047602891922, 0.0003108978271484375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 1.0, 5.0, 7.0, 3.0, 11.0, 4.0, 25.0, 13.0, 56.0, 85.0, 63.0, 378.0, 65.0, 96.0, 37.0, 56.0, 13.0, 27.0, 9.0, 6.0, 10.0, 4.0, 9.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5033950805664062e-06, -2.4102628231048584e-06, -2.3171305656433105e-06, -2.2239983081817627e-06, -2.130866050720215e-06, -2.037733793258667e-06, -1.944601535797119e-06, -1.8514692783355713e-06, -1.7583370208740234e-06, -1.6652047634124756e-06, -1.5720725059509277e-06, -1.4789402484893799e-06, -1.385807991027832e-06, -1.2926757335662842e-06, -1.1995434761047363e-06, -1.1064112186431885e-06, -1.0132789611816406e-06, -9.201467037200928e-07, -8.270144462585449e-07, -7.338821887969971e-07, -6.407499313354492e-07, -5.476176738739014e-07, -4.544854164123535e-07, -3.6135315895080566e-07, -2.682209014892578e-07, -1.7508864402770996e-07, -8.195638656616211e-08, 1.1175870895385742e-08, 1.043081283569336e-07, 1.9744038581848145e-07, 2.905726432800293e-07, 3.8370490074157715e-07, 4.76837158203125e-07, 5.699694156646729e-07, 6.631016731262207e-07, 7.562339305877686e-07, 8.493661880493164e-07, 9.424984455108643e-07, 1.0356307029724121e-06, 1.12876296043396e-06, 1.2218952178955078e-06, 1.3150274753570557e-06, 1.4081597328186035e-06, 1.5012919902801514e-06, 1.5944242477416992e-06, 1.687556505203247e-06, 1.780688762664795e-06, 1.8738210201263428e-06, 1.9669532775878906e-06, 2.0600855350494385e-06, 2.1532177925109863e-06, 2.246350049972534e-06, 2.339482307434082e-06, 2.43261456489563e-06, 2.5257468223571777e-06, 2.6188790798187256e-06, 2.7120113372802734e-06, 2.8051435947418213e-06, 2.898275852203369e-06, 2.991408109664917e-06, 3.084540367126465e-06, 3.1776726245880127e-06, 3.2708048820495605e-06, 3.3639371395111084e-06, 3.4570693969726562e-06]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 13.0, 7.0, 17.0, 25.0, 26.0, 55.0, 97.0, 130.0, 267.0, 525.0, 1162.0, 3108.0, 10949.0, 62656.0, 925626.0, 32348.0, 7313.0, 2375.0, 905.0, 414.0, 228.0, 121.0, 63.0, 43.0, 31.0, 23.0, 16.0, 8.0, 7.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002257823944091797, -0.00021721422672271729, -0.00020864605903625488, -0.00020007789134979248, -0.00019150972366333008, -0.00018294155597686768, -0.00017437338829040527, -0.00016580522060394287, -0.00015723705291748047, -0.00014866888523101807, -0.00014010071754455566, -0.00013153254985809326, -0.00012296438217163086, -0.00011439621448516846, -0.00010582804679870605, -9.725987911224365e-05, -8.869171142578125e-05, -8.012354373931885e-05, -7.155537605285645e-05, -6.298720836639404e-05, -5.441904067993164e-05, -4.585087299346924e-05, -3.7282705307006836e-05, -2.8714537620544434e-05, -2.014636993408203e-05, -1.1578202247619629e-05, -3.0100345611572266e-06, 5.558133125305176e-06, 1.4126300811767578e-05, 2.269446849822998e-05, 3.126263618469238e-05, 3.9830803871154785e-05, 4.839897155761719e-05, 5.696713924407959e-05, 6.553530693054199e-05, 7.41034746170044e-05, 8.26716423034668e-05, 9.12398099899292e-05, 9.98079776763916e-05, 0.000108376145362854, 0.0001169443130493164, 0.0001255124807357788, 0.0001340806484222412, 0.0001426488161087036, 0.00015121698379516602, 0.00015978515148162842, 0.00016835331916809082, 0.00017692148685455322, 0.00018548965454101562, 0.00019405782222747803, 0.00020262598991394043, 0.00021119415760040283, 0.00021976232528686523, 0.00022833049297332764, 0.00023689866065979004, 0.00024546682834625244, 0.00025403499603271484, 0.00026260316371917725, 0.00027117133140563965, 0.00027973949909210205, 0.00028830766677856445, 0.00029687583446502686, 0.00030544400215148926, 0.00031401216983795166, 0.00032258033752441406]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 7.0, 12.0, 15.0, 22.0, 68.0, 135.0, 586.0, 70.0, 34.0, 14.0, 9.0, 4.0, 5.0, 8.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3795833587646484e-05, -3.2271258533000946e-05, -3.074668347835541e-05, -2.922210842370987e-05, -2.769753336906433e-05, -2.6172958314418793e-05, -2.4648383259773254e-05, -2.3123808205127716e-05, -2.1599233150482178e-05, -2.007465809583664e-05, -1.85500830411911e-05, -1.7025507986545563e-05, -1.5500932931900024e-05, -1.3976357877254486e-05, -1.2451782822608948e-05, -1.092720776796341e-05, -9.402632713317871e-06, -7.878057658672333e-06, -6.3534826040267944e-06, -4.828907549381256e-06, -3.3043324947357178e-06, -1.7797574400901794e-06, -2.551823854446411e-07, 1.2693926692008972e-06, 2.7939677238464355e-06, 4.318542778491974e-06, 5.843117833137512e-06, 7.3676928877830505e-06, 8.892267942428589e-06, 1.0416842997074127e-05, 1.1941418051719666e-05, 1.3465993106365204e-05, 1.4990568161010742e-05, 1.651514321565628e-05, 1.803971827030182e-05, 1.9564293324947357e-05, 2.1088868379592896e-05, 2.2613443434238434e-05, 2.4138018488883972e-05, 2.566259354352951e-05, 2.718716859817505e-05, 2.8711743652820587e-05, 3.0236318707466125e-05, 3.1760893762111664e-05, 3.32854688167572e-05, 3.481004387140274e-05, 3.633461892604828e-05, 3.785919398069382e-05, 3.9383769035339355e-05, 4.0908344089984894e-05, 4.243291914463043e-05, 4.395749419927597e-05, 4.548206925392151e-05, 4.700664430856705e-05, 4.8531219363212585e-05, 5.0055794417858124e-05, 5.158036947250366e-05, 5.31049445271492e-05, 5.462951958179474e-05, 5.615409463644028e-05, 5.7678669691085815e-05, 5.9203244745731354e-05, 6.072781980037689e-05, 6.225239485502243e-05, 6.377696990966797e-05]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 6.0, 23.0, 33.0, 77.0, 203.0, 323.0, 189.0, 78.0, 40.0, 18.0, 7.0, 5.0, 1.0, 2.0], "bins": [-0.033837392926216125, -0.03322727978229523, -0.03261717036366463, -0.03200705721974373, -0.03139694407582283, -0.03078683279454708, -0.030176721513271332, -0.029566608369350433, -0.028956497088074684, -0.028346385806798935, -0.027736272662878036, -0.027126161381602287, -0.026516050100326538, -0.02590593695640564, -0.02529582567512989, -0.02468571439385414, -0.024075601249933243, -0.023465489968657494, -0.022855376824736595, -0.022245265543460846, -0.021635152399539948, -0.0210250411182642, -0.02041492983698845, -0.01980481669306755, -0.0191947054117918, -0.018584594130516052, -0.017974480986595154, -0.017364369705319405, -0.016754258424043655, -0.016144145280122757, -0.015534033998847008, -0.014923921786248684, -0.014313807711005211, -0.013703695498406887, -0.013093583285808563, -0.012483472004532814, -0.01187335979193449, -0.011263247579336166, -0.010653136298060417, -0.010043024085462093, -0.00943291187286377, -0.008822799660265446, -0.008212687447667122, -0.007602576166391373, -0.006992463953793049, -0.006382351741194725, -0.0057722399942576885, -0.005162128247320652, -0.004552016034722328, -0.003941903822124004, -0.003331792075186968, -0.0027216800954192877, -0.0021115681156516075, -0.0015014561358839273, -0.0008913441561162472, -0.00028123240917921066, 0.00032887980341911316, 0.0009389917831867933, 0.0015491037629544735, 0.0021592157427221537, 0.002769327722489834, 0.003379439702257514, 0.003989551682025194, 0.004599663428962231, 0.0052097756415605545]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 3.0, 8.0, 6.0, 12.0, 13.0, 13.0, 22.0, 15.0, 20.0, 17.0, 25.0, 28.0, 29.0, 37.0, 38.0, 46.0, 41.0, 24.0, 49.0, 33.0, 42.0, 43.0, 36.0, 38.0, 41.0, 34.0, 31.0, 31.0, 29.0, 27.0, 24.0, 24.0, 19.0, 14.0, 15.0, 16.0, 12.0, 7.0, 6.0, 5.0, 8.0, 5.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.008004965260624886, -0.007771429605782032, -0.007537894416600466, -0.007304358761757612, -0.007070823572576046, -0.0068372879177331924, -0.006603752262890339, -0.006370216608047485, -0.006136681418865919, -0.005903145764023066, -0.005669610574841499, -0.005436074919998646, -0.005202539265155792, -0.004969004075974226, -0.0047354684211313725, -0.004501933231949806, -0.004268397577106953, -0.004034861922264099, -0.003801326733082533, -0.0035677910782396793, -0.0033342556562274694, -0.0031007202342152596, -0.002867184579372406, -0.002633649157360196, -0.0024001137353479862, -0.0021665783133357763, -0.0019330427749082446, -0.0016995072364807129, -0.001465971814468503, -0.001232436392456293, -0.0009989008540287614, -0.0007653653156012297, -0.0005318298935890198, -0.00029829441336914897, -6.475893314927816e-05, 0.00016877654707059264, 0.00040231202729046345, 0.0006358474493026733, 0.0008693829877302051, 0.0011029185261577368, 0.0013364539481699467, 0.0015699893701821566, 0.0018035249086096883, 0.00203706044703722, 0.00227059586904943, 0.00250413129106164, 0.0027376669459044933, 0.0029712023679167032, 0.003204737789928913, 0.003438273211941123, 0.003671808633953333, 0.0039053442887961864, 0.004138879477977753, 0.004372415132820606, 0.00460595078766346, 0.004839486442506313, 0.0050730216316878796, 0.005306557286530733, 0.005540092475712299, 0.005773628130555153, 0.0060071637853980064, 0.006240698974579573, 0.006474234629422426, 0.0067077698186039925, 0.006941305473446846]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 10.0, 9.0, 7.0, 15.0, 17.0, 22.0, 19.0, 33.0, 38.0, 64.0, 90.0, 177.0, 350.0, 746.0, 1971.0, 8762.0, 118804.0, 3401273.0, 636492.0, 19537.0, 3576.0, 1070.0, 547.0, 228.0, 134.0, 73.0, 64.0, 33.0, 30.0, 15.0, 16.0, 16.0, 12.0, 9.0, 5.0, 3.0, 7.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.017822265625, -0.017260313034057617, -0.016698360443115234, -0.01613640785217285, -0.015574455261230469, -0.015012502670288086, -0.014450550079345703, -0.01388859748840332, -0.013326644897460938, -0.012764692306518555, -0.012202739715576172, -0.011640787124633789, -0.011078834533691406, -0.010516881942749023, -0.00995492935180664, -0.009392976760864258, -0.008831024169921875, -0.008269071578979492, -0.007707118988037109, -0.0071451663970947266, -0.006583213806152344, -0.006021261215209961, -0.005459308624267578, -0.004897356033325195, -0.0043354034423828125, -0.0037734508514404297, -0.003211498260498047, -0.002649545669555664, -0.0020875930786132812, -0.0015256404876708984, -0.0009636878967285156, -0.0004017353057861328, 0.00016021728515625, 0.0007221698760986328, 0.0012841224670410156, 0.0018460750579833984, 0.0024080276489257812, 0.002969980239868164, 0.003531932830810547, 0.00409388542175293, 0.0046558380126953125, 0.005217790603637695, 0.005779743194580078, 0.006341695785522461, 0.006903648376464844, 0.0074656009674072266, 0.00802755355834961, 0.008589506149291992, 0.009151458740234375, 0.009713411331176758, 0.01027536392211914, 0.010837316513061523, 0.011399269104003906, 0.011961221694946289, 0.012523174285888672, 0.013085126876831055, 0.013647079467773438, 0.01420903205871582, 0.014770984649658203, 0.015332937240600586, 0.01589488983154297, 0.01645684242248535, 0.017018795013427734, 0.017580747604370117, 0.0181427001953125]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 2.0, 8.0, 12.0, 9.0, 9.0, 13.0, 17.0, 14.0, 23.0, 12.0, 20.0, 21.0, 25.0, 35.0, 35.0, 31.0, 29.0, 41.0, 38.0, 27.0, 32.0, 35.0, 36.0, 50.0, 38.0, 37.0, 31.0, 25.0, 31.0, 26.0, 22.0, 26.0, 28.0, 21.0, 17.0, 16.0, 21.0, 17.0, 12.0, 10.0, 9.0, 4.0, 5.0, 5.0, 6.0, 4.0, 1.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.0038909912109375, -0.0037650465965270996, -0.0036391019821166992, -0.003513157367706299, -0.0033872127532958984, -0.003261268138885498, -0.0031353235244750977, -0.0030093789100646973, -0.002883434295654297, -0.0027574896812438965, -0.002631545066833496, -0.0025056004524230957, -0.0023796558380126953, -0.002253711223602295, -0.0021277666091918945, -0.002001821994781494, -0.0018758773803710938, -0.0017499327659606934, -0.001623988151550293, -0.0014980435371398926, -0.0013720989227294922, -0.0012461543083190918, -0.0011202096939086914, -0.000994265079498291, -0.0008683204650878906, -0.0007423758506774902, -0.0006164312362670898, -0.0004904866218566895, -0.00036454200744628906, -0.00023859739303588867, -0.00011265277862548828, 1.329183578491211e-05, 0.0001392364501953125, 0.0002651810646057129, 0.0003911256790161133, 0.0005170702934265137, 0.0006430149078369141, 0.0007689595222473145, 0.0008949041366577148, 0.0010208487510681152, 0.0011467933654785156, 0.001272737979888916, 0.0013986825942993164, 0.0015246272087097168, 0.0016505718231201172, 0.0017765164375305176, 0.001902461051940918, 0.0020284056663513184, 0.0021543502807617188, 0.002280294895172119, 0.0024062395095825195, 0.00253218412399292, 0.0026581287384033203, 0.0027840733528137207, 0.002910017967224121, 0.0030359625816345215, 0.003161907196044922, 0.0032878518104553223, 0.0034137964248657227, 0.003539741039276123, 0.0036656856536865234, 0.003791630268096924, 0.003917574882507324, 0.004043519496917725, 0.004169464111328125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 11.0, 12.0, 13.0, 36.0, 36.0, 61.0, 95.0, 114.0, 236.0, 367.0, 1486.0, 4185156.0, 5318.0, 521.0, 257.0, 163.0, 95.0, 74.0, 61.0, 41.0, 23.0, 18.0, 22.0, 20.0, 9.0, 8.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.101318359375, -0.09789562225341797, -0.09447288513183594, -0.0910501480102539, -0.08762741088867188, -0.08420467376708984, -0.08078193664550781, -0.07735919952392578, -0.07393646240234375, -0.07051372528076172, -0.06709098815917969, -0.06366825103759766, -0.060245513916015625, -0.056822776794433594, -0.05340003967285156, -0.04997730255126953, -0.0465545654296875, -0.04313182830810547, -0.03970909118652344, -0.036286354064941406, -0.032863616943359375, -0.029440879821777344, -0.026018142700195312, -0.02259540557861328, -0.01917266845703125, -0.01574993133544922, -0.012327194213867188, -0.008904457092285156, -0.005481719970703125, -0.0020589828491210938, 0.0013637542724609375, 0.004786491394042969, 0.008209228515625, 0.011631965637207031, 0.015054702758789062, 0.018477439880371094, 0.021900177001953125, 0.025322914123535156, 0.028745651245117188, 0.03216838836669922, 0.03559112548828125, 0.03901386260986328, 0.04243659973144531, 0.045859336853027344, 0.049282073974609375, 0.052704811096191406, 0.05612754821777344, 0.05955028533935547, 0.0629730224609375, 0.06639575958251953, 0.06981849670410156, 0.0732412338256836, 0.07666397094726562, 0.08008670806884766, 0.08350944519042969, 0.08693218231201172, 0.09035491943359375, 0.09377765655517578, 0.09720039367675781, 0.10062313079833984, 0.10404586791992188, 0.1074686050415039, 0.11089134216308594, 0.11431407928466797, 0.11773681640625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 13.0, 12.0, 14.0, 38.0, 39.0, 73.0, 84.0, 134.0, 241.0, 342.0, 530.0, 814.0, 610.0, 365.0, 215.0, 164.0, 87.0, 78.0, 61.0, 32.0, 21.0, 22.0, 24.0, 17.0, 7.0, 10.0, 7.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00341796875, -0.0033020377159118652, -0.0031861066818237305, -0.0030701756477355957, -0.002954244613647461, -0.002838313579559326, -0.0027223825454711914, -0.0026064515113830566, -0.002490520477294922, -0.002374589443206787, -0.0022586584091186523, -0.0021427273750305176, -0.002026796340942383, -0.001910865306854248, -0.0017949342727661133, -0.0016790032386779785, -0.0015630722045898438, -0.001447141170501709, -0.0013312101364135742, -0.0012152791023254395, -0.0010993480682373047, -0.00098341703414917, -0.0008674860000610352, -0.0007515549659729004, -0.0006356239318847656, -0.0005196928977966309, -0.0004037618637084961, -0.00028783082962036133, -0.00017189979553222656, -5.59687614440918e-05, 5.996227264404297e-05, 0.00017589330673217773, 0.0002918243408203125, 0.00040775537490844727, 0.000523686408996582, 0.0006396174430847168, 0.0007555484771728516, 0.0008714795112609863, 0.000987410545349121, 0.0011033415794372559, 0.0012192726135253906, 0.0013352036476135254, 0.0014511346817016602, 0.001567065715789795, 0.0016829967498779297, 0.0017989277839660645, 0.0019148588180541992, 0.002030789852142334, 0.0021467208862304688, 0.0022626519203186035, 0.0023785829544067383, 0.002494513988494873, 0.002610445022583008, 0.0027263760566711426, 0.0028423070907592773, 0.002958238124847412, 0.003074169158935547, 0.0031901001930236816, 0.0033060312271118164, 0.003421962261199951, 0.003537893295288086, 0.0036538243293762207, 0.0037697553634643555, 0.0038856863975524902, 0.004001617431640625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 18.0, 63.0, 286.0, 424.0, 129.0, 48.0, 15.0, 11.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017433365806937218, -0.016569560393691063, -0.015705754980444908, -0.014841949567198753, -0.013978144153952599, -0.013114338740706444, -0.012250534258782864, -0.011386728845536709, -0.010522923432290554, -0.0096591180190444, -0.008795312605798244, -0.007931508123874664, -0.007067702244967222, -0.006203896831721067, -0.0053400918841362, -0.004476286470890045, -0.0036124810576438904, -0.0027486756443977356, -0.0018848704639822245, -0.0010210652835667133, -0.00015725987032055855, 0.0007065455429255962, 0.0015703504905104637, 0.0024341559037566185, 0.0032979613170027733, 0.004161766730248928, 0.005025572143495083, 0.00588937709107995, 0.006753182504326105, 0.00761698791757226, 0.008480792865157127, 0.009344598278403282, 0.010208401829004288, 0.011072207242250443, 0.011936012655496597, 0.012799818068742752, 0.013663623481988907, 0.014527428895235062, 0.015391233377158642, 0.01625503972172737, 0.017118845134973526, 0.01798265054821968, 0.018846455961465836, 0.01971026137471199, 0.020574066787958145, 0.0214378722012043, 0.022301677614450455, 0.02316548302769661, 0.024029286578297615, 0.02489309199154377, 0.025756897404789925, 0.02662070281803608, 0.027484508231282234, 0.02834831364452839, 0.029212117195129395, 0.03007592260837555, 0.030939728021621704, 0.03180353343486786, 0.032667338848114014, 0.03353114426136017, 0.03439494967460632, 0.03525875508785248, 0.03612256050109863, 0.03698636591434479, 0.03785017132759094]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 3.0, 4.0, 5.0, 5.0, 6.0, 14.0, 15.0, 13.0, 18.0, 19.0, 28.0, 24.0, 42.0, 32.0, 36.0, 51.0, 50.0, 56.0, 52.0, 57.0, 61.0, 51.0, 48.0, 46.0, 39.0, 27.0, 34.0, 29.0, 30.0, 24.0, 21.0, 17.0, 6.0, 7.0, 8.0, 5.0, 3.0, 5.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.012542599812150002, -0.012145341373980045, -0.011748082004487514, -0.011350823566317558, -0.010953564196825027, -0.010556305758655071, -0.010159047320485115, -0.009761787950992584, -0.009364529512822628, -0.008967271074652672, -0.008570011705160141, -0.008172753266990185, -0.007775494363158941, -0.007378235459327698, -0.0069809770211577415, -0.006583718117326498, -0.0061864592134952545, -0.005789200309664011, -0.0053919414058327675, -0.004994682967662811, -0.004597424063831568, -0.004200165160000324, -0.0038029064889997244, -0.0034056478179991245, -0.003008388914167881, -0.0026111300103366375, -0.0022138713393360376, -0.001816612551920116, -0.0014193537645041943, -0.0010220948606729507, -0.0006248361896723509, -0.00022757751867175102, 0.00016968045383691788, 0.0005669392412528396, 0.0009641980286687613, 0.001361456816084683, 0.0017587156035006046, 0.002155974507331848, 0.002553233178332448, 0.002950491849333048, 0.0033477507531642914, 0.003745009656995535, 0.004142268560826778, 0.004539526998996735, 0.004936785902827978, 0.005334044806659222, 0.005731303244829178, 0.006128562148660421, 0.006525821052491665, 0.006923079956322908, 0.007320338860154152, 0.007717597298324108, 0.008114855736494064, 0.008512115105986595, 0.008909373544156551, 0.009306631982326508, 0.009703891351819038, 0.010101149789988995, 0.010498409159481525, 0.010895667597651482, 0.011292926967144012, 0.011690185405313969, 0.012087443843483925, 0.012484703212976456, 0.012881961651146412]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 7.0, 16.0, 17.0, 30.0, 37.0, 44.0, 78.0, 93.0, 147.0, 190.0, 300.0, 442.0, 630.0, 997.0, 1593.0, 2332.0, 3708.0, 6245.0, 10720.0, 18498.0, 34017.0, 67074.0, 153127.0, 367346.0, 203713.0, 82946.0, 40877.0, 21558.0, 12496.0, 7078.0, 4391.0, 2702.0, 1718.0, 1065.0, 736.0, 511.0, 321.0, 230.0, 147.0, 116.0, 68.0, 67.0, 32.0, 29.0, 27.0, 8.0, 10.0, 7.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0], "bins": [-0.0016813278198242188, -0.0016313493251800537, -0.0015813708305358887, -0.0015313923358917236, -0.0014814138412475586, -0.0014314353466033936, -0.0013814568519592285, -0.0013314783573150635, -0.0012814998626708984, -0.0012315213680267334, -0.0011815428733825684, -0.0011315643787384033, -0.0010815858840942383, -0.0010316073894500732, -0.0009816288948059082, -0.0009316504001617432, -0.0008816719055175781, -0.0008316934108734131, -0.000781714916229248, -0.000731736421585083, -0.000681757926940918, -0.0006317794322967529, -0.0005818009376525879, -0.0005318224430084229, -0.0004818439483642578, -0.0004318654537200928, -0.00038188695907592773, -0.0003319084644317627, -0.00028192996978759766, -0.00023195147514343262, -0.00018197298049926758, -0.00013199448585510254, -8.20159912109375e-05, -3.203749656677246e-05, 1.7940998077392578e-05, 6.791949272155762e-05, 0.00011789798736572266, 0.0001678764820098877, 0.00021785497665405273, 0.0002678334712982178, 0.0003178119659423828, 0.00036779046058654785, 0.0004177689552307129, 0.00046774744987487793, 0.000517725944519043, 0.000567704439163208, 0.000617682933807373, 0.0006676614284515381, 0.0007176399230957031, 0.0007676184177398682, 0.0008175969123840332, 0.0008675754070281982, 0.0009175539016723633, 0.0009675323963165283, 0.0010175108909606934, 0.0010674893856048584, 0.0011174678802490234, 0.0011674463748931885, 0.0012174248695373535, 0.0012674033641815186, 0.0013173818588256836, 0.0013673603534698486, 0.0014173388481140137, 0.0014673173427581787, 0.0015172958374023438]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 9.0, 8.0, 21.0, 12.0, 14.0, 21.0, 25.0, 26.0, 25.0, 46.0, 44.0, 65.0, 53.0, 69.0, 66.0, 81.0, 52.0, 57.0, 40.0, 34.0, 36.0, 36.0, 23.0, 29.0, 24.0, 19.0, 15.0, 7.0, 7.0, 5.0, 8.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006175994873046875, -0.0059760212898254395, -0.005776047706604004, -0.005576074123382568, -0.005376100540161133, -0.005176126956939697, -0.004976153373718262, -0.004776179790496826, -0.004576206207275391, -0.004376232624053955, -0.0041762590408325195, -0.003976285457611084, -0.0037763118743896484, -0.003576338291168213, -0.0033763647079467773, -0.003176391124725342, -0.0029764175415039062, -0.0027764439582824707, -0.002576470375061035, -0.0023764967918395996, -0.002176523208618164, -0.0019765496253967285, -0.001776576042175293, -0.0015766024589538574, -0.0013766288757324219, -0.0011766552925109863, -0.0009766817092895508, -0.0007767081260681152, -0.0005767345428466797, -0.00037676095962524414, -0.0001767873764038086, 2.3186206817626953e-05, 0.0002231597900390625, 0.00042313337326049805, 0.0006231069564819336, 0.0008230805397033691, 0.0010230541229248047, 0.0012230277061462402, 0.0014230012893676758, 0.0016229748725891113, 0.0018229484558105469, 0.0020229220390319824, 0.002222895622253418, 0.0024228692054748535, 0.002622842788696289, 0.0028228163719177246, 0.00302278995513916, 0.0032227635383605957, 0.0034227371215820312, 0.003622710704803467, 0.0038226842880249023, 0.004022657871246338, 0.0042226314544677734, 0.004422605037689209, 0.0046225786209106445, 0.00482255220413208, 0.005022525787353516, 0.005222499370574951, 0.005422472953796387, 0.005622446537017822, 0.005822420120239258, 0.006022393703460693, 0.006222367286682129, 0.0064223408699035645, 0.006622314453125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 5.0, 4.0, 8.0, 23.0, 35.0, 48.0, 72.0, 102.0, 143.0, 201.0, 343.0, 465.0, 756.0, 1114.0, 1743.0, 2617.0, 4203.0, 6470.0, 10591.0, 17750.0, 30455.0, 55322.0, 111651.0, 282386.0, 279784.0, 110600.0, 54956.0, 30622.0, 17461.0, 10530.0, 6430.0, 4073.0, 2632.0, 1734.0, 1072.0, 726.0, 504.0, 326.0, 206.0, 136.0, 93.0, 53.0, 32.0, 30.0, 12.0, 12.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.0014848709106445312, -0.0014398694038391113, -0.0013948678970336914, -0.0013498663902282715, -0.0013048648834228516, -0.0012598633766174316, -0.0012148618698120117, -0.0011698603630065918, -0.0011248588562011719, -0.001079857349395752, -0.001034855842590332, -0.0009898543357849121, -0.0009448528289794922, -0.0008998513221740723, -0.0008548498153686523, -0.0008098483085632324, -0.0007648468017578125, -0.0007198452949523926, -0.0006748437881469727, -0.0006298422813415527, -0.0005848407745361328, -0.0005398392677307129, -0.000494837760925293, -0.00044983625411987305, -0.0004048347473144531, -0.0003598332405090332, -0.0003148317337036133, -0.00026983022689819336, -0.00022482872009277344, -0.00017982721328735352, -0.0001348257064819336, -8.982419967651367e-05, -4.482269287109375e-05, 1.7881393432617188e-07, 4.5180320739746094e-05, 9.018182754516602e-05, 0.00013518333435058594, 0.00018018484115600586, 0.00022518634796142578, 0.0002701878547668457, 0.0003151893615722656, 0.00036019086837768555, 0.00040519237518310547, 0.0004501938819885254, 0.0004951953887939453, 0.0005401968955993652, 0.0005851984024047852, 0.0006301999092102051, 0.000675201416015625, 0.0007202029228210449, 0.0007652044296264648, 0.0008102059364318848, 0.0008552074432373047, 0.0009002089500427246, 0.0009452104568481445, 0.0009902119636535645, 0.0010352134704589844, 0.0010802149772644043, 0.0011252164840698242, 0.0011702179908752441, 0.001215219497680664, 0.001260221004486084, 0.001305222511291504, 0.0013502240180969238, 0.0013952255249023438]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 9.0, 14.0, 5.0, 12.0, 12.0, 9.0, 25.0, 19.0, 21.0, 27.0, 24.0, 35.0, 33.0, 38.0, 34.0, 28.0, 46.0, 39.0, 45.0, 35.0, 42.0, 45.0, 44.0, 37.0, 25.0, 28.0, 30.0, 37.0, 31.0, 25.0, 16.0, 14.0, 20.0, 15.0, 10.0, 13.0, 13.0, 7.0, 4.0, 4.0, 5.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.003345489501953125, -0.0032472312450408936, -0.003148972988128662, -0.0030507147312164307, -0.0029524564743041992, -0.0028541982173919678, -0.0027559399604797363, -0.002657681703567505, -0.0025594234466552734, -0.002461165189743042, -0.0023629069328308105, -0.002264648675918579, -0.0021663904190063477, -0.002068132162094116, -0.0019698739051818848, -0.0018716156482696533, -0.0017733573913574219, -0.0016750991344451904, -0.001576840877532959, -0.0014785826206207275, -0.001380324363708496, -0.0012820661067962646, -0.0011838078498840332, -0.0010855495929718018, -0.0009872913360595703, -0.0008890330791473389, -0.0007907748222351074, -0.000692516565322876, -0.0005942583084106445, -0.0004960000514984131, -0.00039774179458618164, -0.0002994835376739502, -0.00020122528076171875, -0.0001029670238494873, -4.708766937255859e-06, 9.354948997497559e-05, 0.00019180774688720703, 0.0002900660037994385, 0.0003883242607116699, 0.00048658251762390137, 0.0005848407745361328, 0.0006830990314483643, 0.0007813572883605957, 0.0008796155452728271, 0.0009778738021850586, 0.00107613205909729, 0.0011743903160095215, 0.001272648572921753, 0.0013709068298339844, 0.0014691650867462158, 0.0015674233436584473, 0.0016656816005706787, 0.0017639398574829102, 0.0018621981143951416, 0.001960456371307373, 0.0020587146282196045, 0.002156972885131836, 0.0022552311420440674, 0.002353489398956299, 0.0024517476558685303, 0.0025500059127807617, 0.002648264169692993, 0.0027465224266052246, 0.002844780683517456, 0.0029430389404296875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 6.0, 6.0, 15.0, 21.0, 24.0, 39.0, 46.0, 94.0, 122.0, 197.0, 262.0, 365.0, 576.0, 934.0, 1449.0, 2375.0, 3634.0, 6199.0, 10573.0, 18971.0, 36867.0, 86756.0, 463064.0, 272071.0, 71140.0, 32143.0, 16525.0, 9144.0, 5652.0, 3355.0, 2081.0, 1316.0, 835.0, 548.0, 384.0, 250.0, 163.0, 112.0, 61.0, 39.0, 41.0, 26.0, 29.0, 11.0, 12.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.00018322467803955078, -0.00017781928181648254, -0.0001724138855934143, -0.00016700848937034607, -0.00016160309314727783, -0.0001561976969242096, -0.00015079230070114136, -0.00014538690447807312, -0.00013998150825500488, -0.00013457611203193665, -0.0001291707158088684, -0.00012376531958580017, -0.00011835992336273193, -0.0001129545271396637, -0.00010754913091659546, -0.00010214373469352722, -9.673833847045898e-05, -9.133294224739075e-05, -8.592754602432251e-05, -8.052214980125427e-05, -7.511675357818604e-05, -6.97113573551178e-05, -6.430596113204956e-05, -5.890056490898132e-05, -5.3495168685913086e-05, -4.808977246284485e-05, -4.268437623977661e-05, -3.7278980016708374e-05, -3.187358379364014e-05, -2.64681875705719e-05, -2.1062791347503662e-05, -1.5657395124435425e-05, -1.0251998901367188e-05, -4.84660267829895e-06, 5.587935447692871e-07, 5.964189767837524e-06, 1.1369585990905762e-05, 1.6774982213974e-05, 2.2180378437042236e-05, 2.7585774660110474e-05, 3.299117088317871e-05, 3.839656710624695e-05, 4.3801963329315186e-05, 4.920735955238342e-05, 5.461275577545166e-05, 6.00181519985199e-05, 6.542354822158813e-05, 7.082894444465637e-05, 7.623434066772461e-05, 8.163973689079285e-05, 8.704513311386108e-05, 9.245052933692932e-05, 9.785592555999756e-05, 0.0001032613217830658, 0.00010866671800613403, 0.00011407211422920227, 0.00011947751045227051, 0.00012488290667533875, 0.00013028830289840698, 0.00013569369912147522, 0.00014109909534454346, 0.0001465044915676117, 0.00015190988779067993, 0.00015731528401374817, 0.0001627206802368164]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 0.0, 0.0, 3.0, 6.0, 9.0, 13.0, 8.0, 12.0, 19.0, 24.0, 17.0, 33.0, 27.0, 38.0, 40.0, 63.0, 38.0, 68.0, 48.0, 67.0, 69.0, 49.0, 59.0, 31.0, 57.0, 37.0, 28.0, 25.0, 34.0, 22.0, 20.0, 10.0, 7.0, 4.0, 6.0, 3.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0371208190917969e-05, -1.0040588676929474e-05, -9.709969162940979e-06, -9.379349648952484e-06, -9.04873013496399e-06, -8.718110620975494e-06, -8.387491106987e-06, -8.056871592998505e-06, -7.72625207901001e-06, -7.395632565021515e-06, -7.06501305103302e-06, -6.734393537044525e-06, -6.40377402305603e-06, -6.073154509067535e-06, -5.7425349950790405e-06, -5.411915481090546e-06, -5.081295967102051e-06, -4.750676453113556e-06, -4.420056939125061e-06, -4.089437425136566e-06, -3.7588179111480713e-06, -3.4281983971595764e-06, -3.0975788831710815e-06, -2.7669593691825867e-06, -2.436339855194092e-06, -2.105720341205597e-06, -1.775100827217102e-06, -1.4444813132286072e-06, -1.1138617992401123e-06, -7.832422852516174e-07, -4.5262277126312256e-07, -1.2200325727462769e-07, 2.086162567138672e-07, 5.392357707023621e-07, 8.698552846908569e-07, 1.2004747986793518e-06, 1.5310943126678467e-06, 1.8617138266563416e-06, 2.1923333406448364e-06, 2.5229528546333313e-06, 2.853572368621826e-06, 3.184191882610321e-06, 3.514811396598816e-06, 3.845430910587311e-06, 4.176050424575806e-06, 4.5066699385643005e-06, 4.837289452552795e-06, 5.16790896654129e-06, 5.498528480529785e-06, 5.82914799451828e-06, 6.159767508506775e-06, 6.49038702249527e-06, 6.821006536483765e-06, 7.1516260504722595e-06, 7.482245564460754e-06, 7.81286507844925e-06, 8.143484592437744e-06, 8.474104106426239e-06, 8.804723620414734e-06, 9.135343134403229e-06, 9.465962648391724e-06, 9.796582162380219e-06, 1.0127201676368713e-05, 1.0457821190357208e-05, 1.0788440704345703e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 6.0, 9.0, 6.0, 11.0, 10.0, 9.0, 16.0, 21.0, 27.0, 15.0, 22.0, 45.0, 36.0, 59.0, 160.0, 926.0, 711020.0, 335074.0, 673.0, 145.0, 57.0, 48.0, 25.0, 16.0, 21.0, 17.0, 13.0, 15.0, 7.0, 11.0, 7.0, 3.0, 5.0, 6.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0015239715576171875, -0.0014763176441192627, -0.0014286637306213379, -0.001381009817123413, -0.0013333559036254883, -0.0012857019901275635, -0.0012380480766296387, -0.0011903941631317139, -0.001142740249633789, -0.0010950863361358643, -0.0010474324226379395, -0.0009997785091400146, -0.0009521245956420898, -0.000904470682144165, -0.0008568167686462402, -0.0008091628551483154, -0.0007615089416503906, -0.0007138550281524658, -0.000666201114654541, -0.0006185472011566162, -0.0005708932876586914, -0.0005232393741607666, -0.0004755854606628418, -0.000427931547164917, -0.0003802776336669922, -0.0003326237201690674, -0.0002849698066711426, -0.00023731589317321777, -0.00018966197967529297, -0.00014200806617736816, -9.435415267944336e-05, -4.6700239181518555e-05, 9.5367431640625e-07, 4.8607587814331055e-05, 9.626150131225586e-05, 0.00014391541481018066, 0.00019156932830810547, 0.00023922324180603027, 0.0002868771553039551, 0.0003345310688018799, 0.0003821849822998047, 0.0004298388957977295, 0.0004774928092956543, 0.0005251467227935791, 0.0005728006362915039, 0.0006204545497894287, 0.0006681084632873535, 0.0007157623767852783, 0.0007634162902832031, 0.0008110702037811279, 0.0008587241172790527, 0.0009063780307769775, 0.0009540319442749023, 0.0010016858577728271, 0.001049339771270752, 0.0010969936847686768, 0.0011446475982666016, 0.0011923015117645264, 0.0012399554252624512, 0.001287609338760376, 0.0013352632522583008, 0.0013829171657562256, 0.0014305710792541504, 0.0014782249927520752, 0.00152587890625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 7.0, 9.0, 7.0, 4.0, 8.0, 17.0, 13.0, 10.0, 19.0, 24.0, 21.0, 31.0, 29.0, 30.0, 52.0, 82.0, 121.0, 120.0, 94.0, 71.0, 45.0, 24.0, 27.0, 21.0, 20.0, 21.0, 10.0, 9.0, 16.0, 6.0, 8.0, 2.0, 7.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6702880859375e-05, -2.5900080800056458e-05, -2.5097280740737915e-05, -2.4294480681419373e-05, -2.349168062210083e-05, -2.2688880562782288e-05, -2.1886080503463745e-05, -2.1083280444145203e-05, -2.028048038482666e-05, -1.9477680325508118e-05, -1.8674880266189575e-05, -1.7872080206871033e-05, -1.706928014755249e-05, -1.6266480088233948e-05, -1.5463680028915405e-05, -1.4660879969596863e-05, -1.385807991027832e-05, -1.3055279850959778e-05, -1.2252479791641235e-05, -1.1449679732322693e-05, -1.064687967300415e-05, -9.844079613685608e-06, -9.041279554367065e-06, -8.238479495048523e-06, -7.4356794357299805e-06, -6.632879376411438e-06, -5.8300793170928955e-06, -5.027279257774353e-06, -4.2244791984558105e-06, -3.421679139137268e-06, -2.6188790798187256e-06, -1.816079020500183e-06, -1.0132789611816406e-06, -2.1047890186309814e-07, 5.923211574554443e-07, 1.3951212167739868e-06, 2.1979212760925293e-06, 3.0007213354110718e-06, 3.8035213947296143e-06, 4.606321454048157e-06, 5.409121513366699e-06, 6.211921572685242e-06, 7.014721632003784e-06, 7.817521691322327e-06, 8.620321750640869e-06, 9.423121809959412e-06, 1.0225921869277954e-05, 1.1028721928596497e-05, 1.1831521987915039e-05, 1.2634322047233582e-05, 1.3437122106552124e-05, 1.4239922165870667e-05, 1.5042722225189209e-05, 1.584552228450775e-05, 1.6648322343826294e-05, 1.7451122403144836e-05, 1.825392246246338e-05, 1.905672252178192e-05, 1.9859522581100464e-05, 2.0662322640419006e-05, 2.146512269973755e-05, 2.226792275905609e-05, 2.3070722818374634e-05, 2.3873522877693176e-05, 2.467632293701172e-05]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 76.0, 602.0, 234.0, 53.0, 17.0, 11.0, 6.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05051940679550171, -0.04921130836009979, -0.047903209924697876, -0.04659511148929596, -0.04528701305389404, -0.043978914618492126, -0.04267081618309021, -0.04136271774768829, -0.04005461931228638, -0.03874652087688446, -0.037438422441482544, -0.03613032400608063, -0.03482222557067871, -0.033514127135276794, -0.03220602869987488, -0.03089793212711811, -0.029589835554361343, -0.028281737118959427, -0.02697363868355751, -0.025665540248155594, -0.024357441812753677, -0.02304934337735176, -0.021741246804594994, -0.020433148369193077, -0.01912504993379116, -0.017816951498389244, -0.016508853062987328, -0.015200755558907986, -0.01389265712350607, -0.012584558688104153, -0.01127646118402481, -0.009968362748622894, -0.008660264313220978, -0.007352165877819061, -0.006044067908078432, -0.004735969938337803, -0.0034278715029358864, -0.00211977306753397, -0.000811675563454628, 0.0004964228719472885, 0.001804521307349205, 0.003112619509920478, 0.004420717712491751, 0.00572881568223238, 0.007036914117634296, 0.008345012553036213, 0.009653110057115555, 0.010961208492517471, 0.012269306927919388, 0.013577405363321304, 0.01488550379872322, 0.016193602234125137, 0.017501700669527054, 0.01880979910492897, 0.020117895677685738, 0.021425994113087654, 0.02273409254848957, 0.024042190983891487, 0.025350289419293404, 0.02665838599205017, 0.027966484427452087, 0.029274582862854004, 0.03058268129825592, 0.03189077973365784, 0.03319887816905975]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 9.0, 12.0, 14.0, 17.0, 17.0, 15.0, 28.0, 29.0, 38.0, 29.0, 39.0, 50.0, 52.0, 63.0, 46.0, 63.0, 59.0, 42.0, 53.0, 40.0, 41.0, 33.0, 31.0, 26.0, 31.0, 24.0, 19.0, 17.0, 8.0, 7.0, 8.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005402303300797939, -0.005225004628300667, -0.005047705490142107, -0.0048704068176448345, -0.004693108145147562, -0.004515809006989002, -0.00433851033449173, -0.004161211661994457, -0.003983912989497185, -0.0038066140841692686, -0.003629315411671996, -0.00345201650634408, -0.0032747178338468075, -0.0030974189285188913, -0.002920120023190975, -0.0027428213506937027, -0.002565522212535143, -0.0023882233072072268, -0.0022109246347099543, -0.002033625729382038, -0.0018563269404694438, -0.0016790281515568495, -0.0015017292462289333, -0.001324430457316339, -0.0011471316684037447, -0.0009698328794911504, -0.0007925340323708951, -0.0006152351852506399, -0.0004379363963380456, -0.0002606376074254513, -8.333870209753513e-05, 9.396008681505919e-05, 0.0002712588757276535, 0.0004485576937440783, 0.000625856511760503, 0.0008031553588807583, 0.0009804541477933526, 0.001157752936705947, 0.001335051842033863, 0.0015123506309464574, 0.0016896494198590517, 0.001866948208771646, 0.0020442469976842403, 0.0022215459030121565, 0.0023988448083400726, 0.002576143480837345, 0.0027534423861652613, 0.0029307412914931774, 0.00310803996399045, 0.003285338869318366, 0.0034626375418156385, 0.0036399364471435547, 0.003817235119640827, 0.0039945337921381, 0.0041718329302966595, 0.004349131602793932, 0.004526430740952492, 0.004703729413449764, 0.004881028551608324, 0.0050583272241055965, 0.005235625896602869, 0.005412925034761429, 0.005590223707258701, 0.005767522379755974, 0.005944821052253246]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 9.0, 18.0, 24.0, 44.0, 83.0, 218.0, 514.0, 1598.0, 9402.0, 171051.0, 833038.0, 27986.0, 3195.0, 730.0, 334.0, 128.0, 78.0, 32.0, 27.0, 11.0, 14.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061279296875, -0.05943489074707031, -0.057590484619140625, -0.05574607849121094, -0.05390167236328125, -0.05205726623535156, -0.050212860107421875, -0.04836845397949219, -0.0465240478515625, -0.04467964172363281, -0.042835235595703125, -0.04099082946777344, -0.03914642333984375, -0.03730201721191406, -0.035457611083984375, -0.03361320495605469, -0.031768798828125, -0.029924392700195312, -0.028079986572265625, -0.026235580444335938, -0.02439117431640625, -0.022546768188476562, -0.020702362060546875, -0.018857955932617188, -0.0170135498046875, -0.015169143676757812, -0.013324737548828125, -0.011480331420898438, -0.00963592529296875, -0.0077915191650390625, -0.005947113037109375, -0.0041027069091796875, -0.00225830078125, -0.0004138946533203125, 0.001430511474609375, 0.0032749176025390625, 0.00511932373046875, 0.0069637298583984375, 0.008808135986328125, 0.010652542114257812, 0.0124969482421875, 0.014341354370117188, 0.016185760498046875, 0.018030166625976562, 0.01987457275390625, 0.021718978881835938, 0.023563385009765625, 0.025407791137695312, 0.027252197265625, 0.029096603393554688, 0.030941009521484375, 0.03278541564941406, 0.03462982177734375, 0.03647422790527344, 0.038318634033203125, 0.04016304016113281, 0.0420074462890625, 0.04385185241699219, 0.045696258544921875, 0.04754066467285156, 0.04938507080078125, 0.05122947692871094, 0.053073883056640625, 0.05491828918457031, 0.0567626953125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 8.0, 22.0, 38.0, 35.0, 61.0, 79.0, 95.0, 125.0, 127.0, 113.0, 90.0, 73.0, 43.0, 37.0, 22.0, 14.0, 7.0, 5.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.04193115234375, -0.04096055030822754, -0.03998994827270508, -0.03901934623718262, -0.038048744201660156, -0.037078142166137695, -0.036107540130615234, -0.03513693809509277, -0.03416633605957031, -0.03319573402404785, -0.03222513198852539, -0.03125452995300293, -0.03028392791748047, -0.029313325881958008, -0.028342723846435547, -0.027372121810913086, -0.026401519775390625, -0.025430917739868164, -0.024460315704345703, -0.023489713668823242, -0.02251911163330078, -0.02154850959777832, -0.02057790756225586, -0.0196073055267334, -0.018636703491210938, -0.017666101455688477, -0.016695499420166016, -0.015724897384643555, -0.014754295349121094, -0.013783693313598633, -0.012813091278076172, -0.011842489242553711, -0.01087188720703125, -0.009901285171508789, -0.008930683135986328, -0.007960081100463867, -0.006989479064941406, -0.006018877029418945, -0.005048274993896484, -0.0040776729583740234, -0.0031070709228515625, -0.0021364688873291016, -0.0011658668518066406, -0.0001952648162841797, 0.0007753372192382812, 0.0017459392547607422, 0.002716541290283203, 0.003687143325805664, 0.004657745361328125, 0.005628347396850586, 0.006598949432373047, 0.007569551467895508, 0.008540153503417969, 0.00951075553894043, 0.01048135757446289, 0.011451959609985352, 0.012422561645507812, 0.013393163681030273, 0.014363765716552734, 0.015334367752075195, 0.016304969787597656, 0.017275571823120117, 0.018246173858642578, 0.01921677589416504, 0.0201873779296875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 13.0, 20.0, 27.0, 65.0, 99.0, 220.0, 477.0, 1323.0, 4296.0, 241758.0, 793337.0, 4707.0, 1224.0, 498.0, 200.0, 101.0, 50.0, 31.0, 22.0, 18.0, 10.0, 8.0, 8.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.162353515625, -0.1567668914794922, -0.15118026733398438, -0.14559364318847656, -0.14000701904296875, -0.13442039489746094, -0.12883377075195312, -0.12324714660644531, -0.1176605224609375, -0.11207389831542969, -0.10648727416992188, -0.10090065002441406, -0.09531402587890625, -0.08972740173339844, -0.08414077758789062, -0.07855415344238281, -0.072967529296875, -0.06738090515136719, -0.061794281005859375, -0.05620765686035156, -0.05062103271484375, -0.04503440856933594, -0.039447784423828125, -0.03386116027832031, -0.0282745361328125, -0.022687911987304688, -0.017101287841796875, -0.011514663696289062, -0.00592803955078125, -0.0003414154052734375, 0.005245208740234375, 0.010831832885742188, 0.01641845703125, 0.022005081176757812, 0.027591705322265625, 0.03317832946777344, 0.03876495361328125, 0.04435157775878906, 0.049938201904296875, 0.05552482604980469, 0.0611114501953125, 0.06669807434082031, 0.07228469848632812, 0.07787132263183594, 0.08345794677734375, 0.08904457092285156, 0.09463119506835938, 0.10021781921386719, 0.105804443359375, 0.11139106750488281, 0.11697769165039062, 0.12256431579589844, 0.12815093994140625, 0.13373756408691406, 0.13932418823242188, 0.1449108123779297, 0.1504974365234375, 0.1560840606689453, 0.16167068481445312, 0.16725730895996094, 0.17284393310546875, 0.17843055725097656, 0.18401718139648438, 0.1896038055419922, 0.1951904296875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 5.0, 7.0, 15.0, 31.0, 54.0, 79.0, 130.0, 154.0, 171.0, 109.0, 100.0, 58.0, 32.0, 28.0, 12.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.051422119140625, -0.04965829849243164, -0.04789447784423828, -0.04613065719604492, -0.04436683654785156, -0.0426030158996582, -0.040839195251464844, -0.039075374603271484, -0.037311553955078125, -0.035547733306884766, -0.033783912658691406, -0.03202009201049805, -0.030256271362304688, -0.028492450714111328, -0.02672863006591797, -0.02496480941772461, -0.02320098876953125, -0.02143716812133789, -0.01967334747314453, -0.017909526824951172, -0.016145706176757812, -0.014381885528564453, -0.012618064880371094, -0.010854244232177734, -0.009090423583984375, -0.007326602935791016, -0.005562782287597656, -0.003798961639404297, -0.0020351409912109375, -0.0002713203430175781, 0.0014925003051757812, 0.0032563209533691406, 0.0050201416015625, 0.006783962249755859, 0.008547782897949219, 0.010311603546142578, 0.012075424194335938, 0.013839244842529297, 0.015603065490722656, 0.017366886138916016, 0.019130706787109375, 0.020894527435302734, 0.022658348083496094, 0.024422168731689453, 0.026185989379882812, 0.027949810028076172, 0.02971363067626953, 0.03147745132446289, 0.03324127197265625, 0.03500509262084961, 0.03676891326904297, 0.03853273391723633, 0.04029655456542969, 0.04206037521362305, 0.043824195861816406, 0.045588016510009766, 0.047351837158203125, 0.049115657806396484, 0.050879478454589844, 0.0526432991027832, 0.05440711975097656, 0.05617094039916992, 0.05793476104736328, 0.05969858169555664, 0.06146240234375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 8.0, 8.0, 7.0, 11.0, 14.0, 10.0, 20.0, 21.0, 42.0, 37.0, 90.0, 140.0, 271.0, 603.0, 1147.0, 2195.0, 4596.0, 15737.0, 417949.0, 577633.0, 18050.0, 4890.0, 2297.0, 1238.0, 635.0, 349.0, 181.0, 113.0, 76.0, 42.0, 33.0, 15.0, 8.0, 9.0, 10.0, 14.0, 7.0, 7.0, 6.0, 8.0, 1.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.004535675048828125, -0.0044097900390625, -0.004283905029296875, -0.00415802001953125, -0.004032135009765625, -0.00390625, -0.003780364990234375, -0.00365447998046875, -0.003528594970703125, -0.0034027099609375, -0.003276824951171875, -0.00315093994140625, -0.003025054931640625, -0.002899169921875, -0.002773284912109375, -0.00264739990234375, -0.002521514892578125, -0.0023956298828125, -0.002269744873046875, -0.00214385986328125, -0.002017974853515625, -0.00189208984375, -0.001766204833984375, -0.00164031982421875, -0.001514434814453125, -0.0013885498046875, -0.001262664794921875, -0.00113677978515625, -0.001010894775390625, -0.000885009765625, -0.000759124755859375, -0.00063323974609375, -0.000507354736328125, -0.0003814697265625, -0.000255584716796875, -0.00012969970703125, -3.814697265625e-06, 0.0001220703125, 0.000247955322265625, 0.00037384033203125, 0.000499725341796875, 0.0006256103515625, 0.000751495361328125, 0.00087738037109375, 0.001003265380859375, 0.001129150390625, 0.001255035400390625, 0.00138092041015625, 0.001506805419921875, 0.0016326904296875, 0.001758575439453125, 0.00188446044921875, 0.002010345458984375, 0.00213623046875, 0.002262115478515625, 0.00238800048828125, 0.002513885498046875, 0.0026397705078125, 0.002765655517578125, 0.00289154052734375, 0.003017425537109375, 0.003143310546875, 0.003269195556640625, 0.00339508056640625, 0.003520965576171875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 12.0, 13.0, 16.0, 18.0, 38.0, 46.0, 59.0, 77.0, 47.0, 84.0, 106.0, 94.0, 75.0, 77.0, 37.0, 46.0, 37.0, 29.0, 28.0, 13.0, 11.0, 15.0, 8.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.198883056640625e-06, -6.030313670635223e-06, -5.861744284629822e-06, -5.69317489862442e-06, -5.5246055126190186e-06, -5.356036126613617e-06, -5.187466740608215e-06, -5.018897354602814e-06, -4.850327968597412e-06, -4.6817585825920105e-06, -4.513189196586609e-06, -4.344619810581207e-06, -4.176050424575806e-06, -4.007481038570404e-06, -3.8389116525650024e-06, -3.670342266559601e-06, -3.5017728805541992e-06, -3.3332034945487976e-06, -3.164634108543396e-06, -2.9960647225379944e-06, -2.8274953365325928e-06, -2.658925950527191e-06, -2.4903565645217896e-06, -2.321787178516388e-06, -2.1532177925109863e-06, -1.9846484065055847e-06, -1.816079020500183e-06, -1.6475096344947815e-06, -1.4789402484893799e-06, -1.3103708624839783e-06, -1.1418014764785767e-06, -9.73232090473175e-07, -8.046627044677734e-07, -6.360933184623718e-07, -4.675239324569702e-07, -2.989545464515686e-07, -1.30385160446167e-07, 3.818422555923462e-08, 2.0675361156463623e-07, 3.7532299757003784e-07, 5.438923835754395e-07, 7.124617695808411e-07, 8.810311555862427e-07, 1.0496005415916443e-06, 1.218169927597046e-06, 1.3867393136024475e-06, 1.5553086996078491e-06, 1.7238780856132507e-06, 1.8924474716186523e-06, 2.061016857624054e-06, 2.2295862436294556e-06, 2.398155629634857e-06, 2.566725015640259e-06, 2.7352944016456604e-06, 2.903863787651062e-06, 3.0724331736564636e-06, 3.2410025596618652e-06, 3.409571945667267e-06, 3.5781413316726685e-06, 3.74671071767807e-06, 3.915280103683472e-06, 4.083849489688873e-06, 4.252418875694275e-06, 4.4209882616996765e-06, 4.589557647705078e-06]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 2.0, 8.0, 3.0, 6.0, 13.0, 13.0, 17.0, 16.0, 28.0, 32.0, 34.0, 31.0, 51.0, 54.0, 62.0, 104.0, 150.0, 258.0, 513.0, 1682.0, 9368.0, 793958.0, 232557.0, 6938.0, 1394.0, 530.0, 251.0, 158.0, 68.0, 54.0, 32.0, 26.0, 25.0, 18.0, 23.0, 10.0, 12.0, 12.0, 11.0, 11.0, 8.0, 4.0, 1.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007801055908203125, -0.0075002312660217285, -0.007199406623840332, -0.0068985819816589355, -0.006597757339477539, -0.006296932697296143, -0.005996108055114746, -0.00569528341293335, -0.005394458770751953, -0.005093634128570557, -0.00479280948638916, -0.004491984844207764, -0.004191160202026367, -0.0038903355598449707, -0.0035895109176635742, -0.0032886862754821777, -0.0029878616333007812, -0.0026870369911193848, -0.0023862123489379883, -0.002085387706756592, -0.0017845630645751953, -0.0014837384223937988, -0.0011829137802124023, -0.0008820891380310059, -0.0005812644958496094, -0.0002804398536682129, 2.0384788513183594e-05, 0.0003212094306945801, 0.0006220340728759766, 0.000922858715057373, 0.0012236833572387695, 0.001524507999420166, 0.0018253326416015625, 0.002126157283782959, 0.0024269819259643555, 0.002727806568145752, 0.0030286312103271484, 0.003329455852508545, 0.0036302804946899414, 0.003931105136871338, 0.004231929779052734, 0.004532754421234131, 0.004833579063415527, 0.005134403705596924, 0.00543522834777832, 0.005736052989959717, 0.006036877632141113, 0.00633770227432251, 0.006638526916503906, 0.006939351558685303, 0.007240176200866699, 0.007541000843048096, 0.007841825485229492, 0.008142650127410889, 0.008443474769592285, 0.008744299411773682, 0.009045124053955078, 0.009345948696136475, 0.009646773338317871, 0.009947597980499268, 0.010248422622680664, 0.01054924726486206, 0.010850071907043457, 0.011150896549224854, 0.01145172119140625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 20.0, 58.0, 404.0, 409.0, 61.0, 24.0, 9.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00714111328125, -0.006989181041717529, -0.006837248802185059, -0.006685316562652588, -0.006533384323120117, -0.0063814520835876465, -0.006229519844055176, -0.006077587604522705, -0.005925655364990234, -0.005773723125457764, -0.005621790885925293, -0.005469858646392822, -0.0053179264068603516, -0.005165994167327881, -0.00501406192779541, -0.0048621296882629395, -0.004710197448730469, -0.004558265209197998, -0.004406332969665527, -0.004254400730133057, -0.004102468490600586, -0.003950536251068115, -0.0037986040115356445, -0.003646671772003174, -0.003494739532470703, -0.0033428072929382324, -0.0031908750534057617, -0.003038942813873291, -0.0028870105743408203, -0.0027350783348083496, -0.002583146095275879, -0.002431213855743408, -0.0022792816162109375, -0.002127349376678467, -0.001975417137145996, -0.0018234848976135254, -0.0016715526580810547, -0.001519620418548584, -0.0013676881790161133, -0.0012157559394836426, -0.0010638236999511719, -0.0009118914604187012, -0.0007599592208862305, -0.0006080269813537598, -0.00045609474182128906, -0.00030416250228881836, -0.00015223026275634766, -2.980232238769531e-07, 0.00015163421630859375, 0.00030356645584106445, 0.00045549869537353516, 0.0006074309349060059, 0.0007593631744384766, 0.0009112954139709473, 0.001063227653503418, 0.0012151598930358887, 0.0013670921325683594, 0.00151902437210083, 0.0016709566116333008, 0.0018228888511657715, 0.001974821090698242, 0.002126753330230713, 0.0022786855697631836, 0.0024306178092956543, 0.002582550048828125]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 257.0, 724.0, 16.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2762903571128845, -0.2697255611419678, -0.263160765171051, -0.25659599900245667, -0.2500312030315399, -0.24346640706062317, -0.23690161108970642, -0.23033681511878967, -0.22377203404903412, -0.21720723807811737, -0.21064245700836182, -0.20407766103744507, -0.19751286506652832, -0.19094808399677277, -0.18438328802585602, -0.17781850695610046, -0.17125371098518372, -0.16468891501426697, -0.1581241339445114, -0.15155933797359467, -0.1449945569038391, -0.13842976093292236, -0.13186496496200562, -0.12530016899108887, -0.11873538792133331, -0.11217059940099716, -0.10560581088066101, -0.09904101490974426, -0.09247622638940811, -0.08591143786907196, -0.07934664189815521, -0.07278185337781906, -0.0662170797586441, -0.05965229123830795, -0.0530874989926815, -0.046522706747055054, -0.0399579182267189, -0.03339312970638275, -0.026828337460756302, -0.020263545215129852, -0.013698756694793701, -0.007133966311812401, -0.0005691759288311005, 0.0059956144541502, 0.0125604048371315, 0.01912519335746765, 0.0256899856030941, 0.03225477784872055, 0.0388195663690567, 0.04538435488939285, 0.0519491471350193, 0.05851393938064575, 0.0650787279009819, 0.07164351642131805, 0.0782083123922348, 0.08477310091257095, 0.0913378894329071, 0.09790267795324326, 0.1044674664735794, 0.11103226244449615, 0.1175970509648323, 0.12416183948516846, 0.1307266354560852, 0.13729143142700195, 0.1438562124967575]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 6.0, 7.0, 6.0, 16.0, 11.0, 19.0, 14.0, 18.0, 21.0, 27.0, 18.0, 31.0, 50.0, 34.0, 40.0, 38.0, 49.0, 56.0, 68.0, 68.0, 67.0, 45.0, 45.0, 39.0, 28.0, 27.0, 19.0, 20.0, 30.0, 17.0, 13.0, 10.0, 12.0, 6.0, 9.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.036292288452386856, -0.035212405025959015, -0.034132521599531174, -0.03305263817310333, -0.03197275102138519, -0.0308928694576025, -0.02981298416852951, -0.02873310074210167, -0.027653217315673828, -0.026573333889245987, -0.025493450462818146, -0.024413565173745155, -0.023333681747317314, -0.022253798320889473, -0.021173913031816483, -0.02009402960538864, -0.0190141461789608, -0.01793426275253296, -0.016854379326105118, -0.015774494037032127, -0.014694610610604286, -0.013614727184176445, -0.01253484282642603, -0.011454958468675613, -0.010375075042247772, -0.009295191615819931, -0.008215307258069515, -0.007135423365980387, -0.006055539473891258, -0.00497565558180213, -0.0038957716897130013, -0.0028158877976238728, -0.0017360076308250427, -0.0006561237387359142, 0.00042376015335321426, 0.0015036440454423428, 0.0025835279375314713, 0.0036634118296205997, 0.004743295721709728, 0.005823179613798857, 0.006903063505887985, 0.007982946932315826, 0.009062831290066242, 0.010142715647816658, 0.0112225990742445, 0.01230248250067234, 0.013382366858422756, 0.014462251216173172, 0.015542134642601013, 0.016622018069028854, 0.017701901495456696, 0.018781786784529686, 0.019861670210957527, 0.02094155363738537, 0.02202143892645836, 0.0231013223528862, 0.02418120577931404, 0.025261089205741882, 0.026340972632169724, 0.027420857921242714, 0.028500741347670555, 0.029580624774098396, 0.030660510063171387, 0.03174039348959923, 0.03282027691602707]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 8.0, 6.0, 10.0, 20.0, 13.0, 10.0, 21.0, 19.0, 21.0, 24.0, 45.0, 43.0, 56.0, 86.0, 139.0, 167.0, 409.0, 522301.0, 228.0, 163.0, 116.0, 77.0, 61.0, 41.0, 23.0, 25.0, 16.0, 24.0, 17.0, 16.0, 13.0, 11.0, 4.0, 8.0, 7.0, 3.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1902363896369934, -0.18373820185661316, -0.17723999917507172, -0.17074181139469147, -0.16424362361431122, -0.15774542093276978, -0.15124723315238953, -0.14474904537200928, -0.13825084269046783, -0.13175265491008759, -0.12525445222854614, -0.1187562644481659, -0.11225806921720505, -0.1057598739862442, -0.09926168620586395, -0.0927634909749031, -0.08626530319452286, -0.07976710796356201, -0.07326892018318176, -0.06677072495222092, -0.06027252972126007, -0.05377433821558952, -0.047276146709918976, -0.04077795147895813, -0.03427975997328758, -0.027781566604971886, -0.02128337323665619, -0.014785181730985641, -0.008286988362669945, -0.001788794994354248, 0.0047093965113162994, 0.011207591742277145, 0.017705783247947693, 0.02420397661626339, 0.030702169984579086, 0.037200361490249634, 0.04369855672121048, 0.05019674822688103, 0.056694939732551575, 0.06319313496351242, 0.06969133019447327, 0.07618952542543411, 0.08268771320581436, 0.08918590843677521, 0.09568410366773605, 0.1021822988986969, 0.10868048667907715, 0.115178681910038, 0.12167686969041824, 0.1281750649213791, 0.13467325270175934, 0.14117145538330078, 0.14766964316368103, 0.15416783094406128, 0.16066601872444153, 0.16716422140598297, 0.17366240918636322, 0.18016059696674347, 0.1866587996482849, 0.19315698742866516, 0.1996551752090454, 0.20615337789058685, 0.2126515656709671, 0.21914976835250854, 0.2256479561328888]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 3.0, 10.0, 3.0, 7.0, 14.0, 22.0, 14.0, 16.0, 21.0, 21.0, 20.0, 34.0, 40.0, 58.0, 38.0, 58.0, 37.0, 1096.0, 63.0, 60.0, 64.0, 47.0, 45.0, 36.0, 35.0, 31.0, 20.0, 22.0, 17.0, 12.0, 18.0, 5.0, 10.0, 11.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.22894053161144257, -0.2219921052455902, -0.21504369378089905, -0.2080952674150467, -0.20114684104919434, -0.19419842958450317, -0.18725000321865082, -0.18030157685279846, -0.1733531653881073, -0.16640473902225494, -0.15945632755756378, -0.15250790119171143, -0.14555947482585907, -0.1386110484600067, -0.13166263699531555, -0.1247142106294632, -0.11776578426361084, -0.11081736534833908, -0.10386893898248672, -0.09692052006721497, -0.08997209370136261, -0.08302367478609085, -0.07607525587081909, -0.06912682950496674, -0.06217841058969498, -0.05522998794913292, -0.04828156530857086, -0.0413331463932991, -0.034384723752737045, -0.027436301112174988, -0.02048788219690323, -0.013539459556341171, -0.006591036915779114, 0.0003573847934603691, 0.007305806502699852, 0.01425422728061676, 0.021202649921178818, 0.028151072561740875, 0.035099491477012634, 0.04204791411757469, 0.04899633675813675, 0.05594475939869881, 0.06289318203926086, 0.06984160095453262, 0.07679001986980438, 0.08373844623565674, 0.0906868651509285, 0.09763528406620026, 0.10458371043205261, 0.11153212934732437, 0.11848055571317673, 0.1254289746284485, 0.13237740099430084, 0.1393258273601532, 0.14627423882484436, 0.15322266519069672, 0.16017109155654907, 0.16711951792240143, 0.1740679293870926, 0.18101635575294495, 0.1879647821187973, 0.19491320848464966, 0.20186161994934082, 0.20881004631519318, 0.21575845777988434]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 7.0, 18.0, 17.0, 21.0, 28.0, 41.0, 71.0, 93.0, 205.0, 397.0, 865.0, 2147.0, 7887.0, 55395.0, 31147300.0, 33422.0, 4240.0, 1256.0, 492.0, 272.0, 122.0, 64.0, 31.0, 27.0, 22.0, 14.0, 12.0, 13.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.28052520751953, -31.792743682861328, -30.304962158203125, -28.817180633544922, -27.32939910888672, -25.841617584228516, -24.353836059570312, -22.86605453491211, -21.378273010253906, -19.890491485595703, -18.4027099609375, -16.914928436279297, -15.427146911621094, -13.93936538696289, -12.451582908630371, -10.963801383972168, -9.476018905639648, -7.988237380981445, -6.500455856323242, -5.012673854827881, -3.5248923301696777, -2.0371108055114746, -0.5493288040161133, 0.9384527206420898, 2.426234245300293, 3.914015769958496, 5.401797294616699, 6.8895792961120605, 8.377361297607422, 9.865142822265625, 11.352924346923828, 12.840705871582031, 14.328487396240234, 15.816268920898438, 17.30405044555664, 18.791831970214844, 20.279613494873047, 21.76739501953125, 23.255176544189453, 24.742958068847656, 26.23073959350586, 27.718521118164062, 29.206302642822266, 30.69408416748047, 32.18186569213867, 33.669647216796875, 35.15742874145508, 36.64521026611328, 38.13299560546875, 39.62077713012695, 41.108558654785156, 42.59634017944336, 44.08412170410156, 45.571903228759766, 47.05968475341797, 48.54746627807617, 50.035247802734375, 51.52302932739258, 53.01081085205078, 54.498592376708984, 55.98637390136719, 57.47415542602539, 58.961936950683594, 60.4497184753418, 61.9375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 6.0, 3.0, 0.0, 9.0, 2.0, 7.0, 3.0, 32.0, 25.0, 44.0, 79.0, 75.0, 129.0, 202.0, 298.0, 435.0, 759.0, 1185.0, 1949.0, 3320.0, 5452.0, 9449.0, 17159.0, 31839.0, 61534.0, 128993.0, 300178.0, 1013039.0, 3775632.0, 539370.0, 204280.0, 93813.0, 45863.0, 24199.0, 13431.0, 7428.0, 4315.0, 2702.0, 1566.0, 927.0, 601.0, 402.0, 229.0, 172.0, 97.0, 75.0, 53.0, 37.0, 16.0, 12.0, 5.0, 6.0, 5.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.308349609375, -0.2978172302246094, -0.28728485107421875, -0.2767524719238281, -0.2662200927734375, -0.2556877136230469, -0.24515533447265625, -0.23462295532226562, -0.224090576171875, -0.21355819702148438, -0.20302581787109375, -0.19249343872070312, -0.1819610595703125, -0.17142868041992188, -0.16089630126953125, -0.15036392211914062, -0.13983154296875, -0.12929916381835938, -0.11876678466796875, -0.10823440551757812, -0.0977020263671875, -0.08716964721679688, -0.07663726806640625, -0.06610488891601562, -0.055572509765625, -0.045040130615234375, -0.03450775146484375, -0.023975372314453125, -0.0134429931640625, -0.002910614013671875, 0.00762176513671875, 0.018154144287109375, 0.0286865234375, 0.039218902587890625, 0.04975128173828125, 0.060283660888671875, 0.0708160400390625, 0.08134841918945312, 0.09188079833984375, 0.10241317749023438, 0.112945556640625, 0.12347793579101562, 0.13401031494140625, 0.14454269409179688, 0.1550750732421875, 0.16560745239257812, 0.17613983154296875, 0.18667221069335938, 0.19720458984375, 0.20773696899414062, 0.21826934814453125, 0.22880172729492188, 0.2393341064453125, 0.24986648559570312, 0.26039886474609375, 0.2709312438964844, 0.281463623046875, 0.2919960021972656, 0.30252838134765625, 0.3130607604980469, 0.3235931396484375, 0.3341255187988281, 0.34465789794921875, 0.3551902770996094, 0.36572265625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 3.0, 1.0, 7.0, 10.0, 11.0, 10.0, 14.0, 23.0, 22.0, 27.0, 26.0, 30.0, 33.0, 41.0, 60.0, 78.0, 121.0, 372.0, 447.0, 181.0, 116.0, 70.0, 60.0, 54.0, 41.0, 35.0, 29.0, 18.0, 14.0, 15.0, 8.0, 14.0, 12.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 7.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.67626953125, -0.6584701538085938, -0.6406707763671875, -0.6228713989257812, -0.605072021484375, -0.5872726440429688, -0.5694732666015625, -0.5516738891601562, -0.53387451171875, -0.5160751342773438, -0.4982757568359375, -0.48047637939453125, -0.462677001953125, -0.44487762451171875, -0.4270782470703125, -0.40927886962890625, -0.3914794921875, -0.37368011474609375, -0.3558807373046875, -0.33808135986328125, -0.320281982421875, -0.30248260498046875, -0.2846832275390625, -0.26688385009765625, -0.24908447265625, -0.23128509521484375, -0.2134857177734375, -0.19568634033203125, -0.177886962890625, -0.16008758544921875, -0.1422882080078125, -0.12448883056640625, -0.106689453125, -0.08889007568359375, -0.0710906982421875, -0.05329132080078125, -0.035491943359375, -0.01769256591796875, 0.0001068115234375, 0.01790618896484375, 0.03570556640625, 0.05350494384765625, 0.0713043212890625, 0.08910369873046875, 0.106903076171875, 0.12470245361328125, 0.1425018310546875, 0.16030120849609375, 0.1781005859375, 0.19589996337890625, 0.2136993408203125, 0.23149871826171875, 0.249298095703125, 0.26709747314453125, 0.2848968505859375, 0.30269622802734375, 0.32049560546875, 0.33829498291015625, 0.3560943603515625, 0.37389373779296875, 0.391693115234375, 0.40949249267578125, 0.4272918701171875, 0.44509124755859375, 0.462890625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [7.0, 2.0, 0.0, 4.0, 17.0, 16.0, 20.0, 29.0, 39.0, 33.0, 60.0, 61.0, 107.0, 163.0, 195.0, 282.0, 450.0, 698.0, 982.0, 1434.0, 2157.0, 3331.0, 5093.0, 8410.0, 13952.0, 24762.0, 45238.0, 90506.0, 211828.0, 699537.0, 4230681.0, 578714.0, 188207.0, 83473.0, 42183.0, 22834.0, 13382.0, 8135.0, 4842.0, 2970.0, 2167.0, 1446.0, 868.0, 599.0, 457.0, 292.0, 208.0, 166.0, 126.0, 85.0, 64.0, 34.0, 35.0, 30.0, 3.0, 13.0, 5.0, 7.0, 5.0, 8.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.40625, -0.3929023742675781, -0.37955474853515625, -0.3662071228027344, -0.3528594970703125, -0.3395118713378906, -0.32616424560546875, -0.3128166198730469, -0.299468994140625, -0.2861213684082031, -0.27277374267578125, -0.2594261169433594, -0.2460784912109375, -0.23273086547851562, -0.21938323974609375, -0.20603561401367188, -0.19268798828125, -0.17934036254882812, -0.16599273681640625, -0.15264511108398438, -0.1392974853515625, -0.12594985961914062, -0.11260223388671875, -0.09925460815429688, -0.085906982421875, -0.07255935668945312, -0.05921173095703125, -0.045864105224609375, -0.0325164794921875, -0.019168853759765625, -0.00582122802734375, 0.007526397705078125, 0.0208740234375, 0.034221649169921875, 0.04756927490234375, 0.060916900634765625, 0.0742645263671875, 0.08761215209960938, 0.10095977783203125, 0.11430740356445312, 0.127655029296875, 0.14100265502929688, 0.15435028076171875, 0.16769790649414062, 0.1810455322265625, 0.19439315795898438, 0.20774078369140625, 0.22108840942382812, 0.23443603515625, 0.24778366088867188, 0.26113128662109375, 0.2744789123535156, 0.2878265380859375, 0.3011741638183594, 0.31452178955078125, 0.3278694152832031, 0.341217041015625, 0.3545646667480469, 0.36791229248046875, 0.3812599182128906, 0.3946075439453125, 0.4079551696777344, 0.42130279541015625, 0.4346504211425781, 0.447998046875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 7.0, 7.0, 13.0, 14.0, 15.0, 32.0, 29.0, 37.0, 38.0, 49.0, 55.0, 76.0, 88.0, 325.0, 545.0, 215.0, 118.0, 66.0, 45.0, 51.0, 29.0, 30.0, 18.0, 24.0, 17.0, 15.0, 12.0, 8.0, 6.0, 5.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60888671875, -0.5886459350585938, -0.5684051513671875, -0.5481643676757812, -0.527923583984375, -0.5076828002929688, -0.4874420166015625, -0.46720123291015625, -0.44696044921875, -0.42671966552734375, -0.4064788818359375, -0.38623809814453125, -0.365997314453125, -0.34575653076171875, -0.3255157470703125, -0.30527496337890625, -0.2850341796875, -0.26479339599609375, -0.2445526123046875, -0.22431182861328125, -0.204071044921875, -0.18383026123046875, -0.1635894775390625, -0.14334869384765625, -0.12310791015625, -0.10286712646484375, -0.0826263427734375, -0.06238555908203125, -0.042144775390625, -0.02190399169921875, -0.0016632080078125, 0.01857757568359375, 0.038818359375, 0.05905914306640625, 0.0792999267578125, 0.09954071044921875, 0.119781494140625, 0.14002227783203125, 0.1602630615234375, 0.18050384521484375, 0.20074462890625, 0.22098541259765625, 0.2412261962890625, 0.26146697998046875, 0.281707763671875, 0.30194854736328125, 0.3221893310546875, 0.34243011474609375, 0.3626708984375, 0.38291168212890625, 0.4031524658203125, 0.42339324951171875, 0.443634033203125, 0.46387481689453125, 0.4841156005859375, 0.5043563842773438, 0.52459716796875, 0.5448379516601562, 0.5650787353515625, 0.5853195190429688, 0.605560302734375, 0.6258010864257812, 0.6460418701171875, 0.6662826538085938, 0.6865234375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [5.0, 3.0, 1.0, 8.0, 7.0, 17.0, 4.0, 6.0, 19.0, 10.0, 17.0, 32.0, 39.0, 54.0, 61.0, 70.0, 86.0, 131.0, 156.0, 230.0, 294.0, 359.0, 485.0, 654.0, 1012.0, 1529.0, 2537.0, 4606.0, 8629.0, 20186.0, 68024.0, 5982716.0, 143586.0, 29236.0, 11693.0, 5735.0, 3082.0, 1859.0, 1222.0, 816.0, 502.0, 458.0, 271.0, 230.0, 143.0, 118.0, 115.0, 77.0, 56.0, 63.0, 53.0, 28.0, 35.0, 23.0, 27.0, 3.0, 2.0, 5.0, 9.0, 10.0, 0.0, 3.0, 5.0, 4.0], "bins": [-2.408203125, -2.332183837890625, -2.25616455078125, -2.180145263671875, -2.1041259765625, -2.028106689453125, -1.95208740234375, -1.876068115234375, -1.800048828125, -1.724029541015625, -1.64801025390625, -1.571990966796875, -1.4959716796875, -1.419952392578125, -1.34393310546875, -1.267913818359375, -1.19189453125, -1.115875244140625, -1.03985595703125, -0.963836669921875, -0.8878173828125, -0.811798095703125, -0.73577880859375, -0.659759521484375, -0.583740234375, -0.507720947265625, -0.43170166015625, -0.355682373046875, -0.2796630859375, -0.203643798828125, -0.12762451171875, -0.051605224609375, 0.0244140625, 0.100433349609375, 0.17645263671875, 0.252471923828125, 0.3284912109375, 0.404510498046875, 0.48052978515625, 0.556549072265625, 0.632568359375, 0.708587646484375, 0.78460693359375, 0.860626220703125, 0.9366455078125, 1.012664794921875, 1.08868408203125, 1.164703369140625, 1.24072265625, 1.316741943359375, 1.39276123046875, 1.468780517578125, 1.5447998046875, 1.620819091796875, 1.69683837890625, 1.772857666015625, 1.848876953125, 1.924896240234375, 2.00091552734375, 2.076934814453125, 2.1529541015625, 2.228973388671875, 2.30499267578125, 2.381011962890625, 2.45703125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 2.0, 3.0, 5.0, 6.0, 3.0, 2.0, 8.0, 10.0, 15.0, 17.0, 13.0, 23.0, 20.0, 21.0, 27.0, 52.0, 59.0, 68.0, 116.0, 315.0, 550.0, 247.0, 105.0, 65.0, 41.0, 29.0, 27.0, 33.0, 24.0, 18.0, 13.0, 12.0, 16.0, 4.0, 11.0, 6.0, 10.0, 5.0, 2.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.83349609375, -0.8075103759765625, -0.781524658203125, -0.7555389404296875, -0.72955322265625, -0.7035675048828125, -0.677581787109375, -0.6515960693359375, -0.6256103515625, -0.5996246337890625, -0.573638916015625, -0.5476531982421875, -0.52166748046875, -0.4956817626953125, -0.469696044921875, -0.4437103271484375, -0.417724609375, -0.3917388916015625, -0.365753173828125, -0.3397674560546875, -0.31378173828125, -0.2877960205078125, -0.261810302734375, -0.2358245849609375, -0.2098388671875, -0.1838531494140625, -0.157867431640625, -0.1318817138671875, -0.10589599609375, -0.0799102783203125, -0.053924560546875, -0.0279388427734375, -0.001953125, 0.0240325927734375, 0.050018310546875, 0.0760040283203125, 0.10198974609375, 0.1279754638671875, 0.153961181640625, 0.1799468994140625, 0.2059326171875, 0.2319183349609375, 0.257904052734375, 0.2838897705078125, 0.30987548828125, 0.3358612060546875, 0.361846923828125, 0.3878326416015625, 0.413818359375, 0.4398040771484375, 0.465789794921875, 0.4917755126953125, 0.51776123046875, 0.5437469482421875, 0.569732666015625, 0.5957183837890625, 0.6217041015625, 0.6476898193359375, 0.673675537109375, 0.6996612548828125, 0.72564697265625, 0.7516326904296875, 0.777618408203125, 0.8036041259765625, 0.82958984375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 13.0, 47.0, 836.0, 64.0, 27.0, 11.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.892606258392334, -2.3565311431884766, -1.8204561471939087, -1.2843811511993408, -0.7483060359954834, -0.21223092079162598, 0.32384395599365234, 0.8599190711975098, 1.3959941864013672, 1.9320693016052246, 2.468144416809082, 3.0042192935943604, 3.5402944087982178, 4.076369285583496, 4.6124444007873535, 5.148519515991211, 5.684594631195068, 6.220669746398926, 6.756744861602783, 7.292819976806641, 7.82889461517334, 8.364970207214355, 8.901044845581055, 9.43712043762207, 9.97319507598877, 10.509269714355469, 11.045345306396484, 11.581419944763184, 12.1174955368042, 12.653570175170898, 13.189645767211914, 13.725720405578613, 14.261796951293945, 14.797871589660645, 15.33394718170166, 15.87002182006836, 16.406097412109375, 16.94217300415039, 17.478246688842773, 18.01432228088379, 18.550397872924805, 19.08647346496582, 19.622547149658203, 20.15862274169922, 20.694698333740234, 21.23077392578125, 21.766847610473633, 22.30292320251465, 22.83899688720703, 23.375072479248047, 23.91114616394043, 24.447221755981445, 24.98329734802246, 25.519372940063477, 26.05544662475586, 26.591522216796875, 27.12759780883789, 27.663673400878906, 28.19974708557129, 28.735822677612305, 29.27189826965332, 29.807973861694336, 30.34404754638672, 30.880123138427734, 31.41619873046875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 9.0, 10.0, 17.0, 18.0, 34.0, 72.0, 460.0, 234.0, 49.0, 21.0, 18.0, 13.0, 12.0, 8.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.841955184936523, -4.629395484924316, -4.416835308074951, -4.204275131225586, -3.991715431213379, -3.7791554927825928, -3.5665955543518066, -3.3540356159210205, -3.1414756774902344, -2.9289157390594482, -2.716355800628662, -2.503795862197876, -2.29123592376709, -2.0786759853363037, -1.8661160469055176, -1.6535561084747314, -1.4409961700439453, -1.2284362316131592, -1.015876293182373, -0.8033163547515869, -0.5907564163208008, -0.37819647789001465, -0.16563653945922852, 0.04692339897155762, 0.25948333740234375, 0.4720432758331299, 0.684603214263916, 0.8971631526947021, 1.1097230911254883, 1.3222830295562744, 1.5348429679870605, 1.7474029064178467, 1.9599628448486328, 2.172522783279419, 2.385082721710205, 2.597642660140991, 2.8102025985717773, 3.0227625370025635, 3.2353224754333496, 3.4478824138641357, 3.660442352294922, 3.873002290725708, 4.085562229156494, 4.298122406005859, 4.510682106018066, 4.723241806030273, 4.935801982879639, 5.148362159729004, 5.360921859741211, 5.573481559753418, 5.786041736602783, 5.998601913452148, 6.2111616134643555, 6.4237213134765625, 6.636281490325928, 6.848841667175293, 7.0614013671875, 7.273961067199707, 7.486521244049072, 7.6990814208984375, 7.9116411209106445, 8.124200820922852, 8.336761474609375, 8.549321174621582, 8.761880874633789]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 4.0, 5.0, 6.0, 12.0, 23.0, 33.0, 56.0, 95.0, 146.0, 231.0, 362.0, 633.0, 1321.0, 2820.0, 6910.0, 19978.0, 74322.0, 3936538.0, 108316.0, 23096.0, 9690.0, 4405.0, 2182.0, 1119.0, 639.0, 363.0, 211.0, 171.0, 105.0, 87.0, 82.0, 68.0, 35.0, 42.0, 21.0, 25.0, 19.0, 19.0, 16.0, 13.0, 10.0, 7.0, 9.0, 11.0, 4.0, 12.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.00687408447265625, -0.0065402984619140625, -0.006206512451171875, -0.0058727264404296875, -0.0055389404296875, -0.0052051544189453125, -0.004871368408203125, -0.0045375823974609375, -0.00420379638671875, -0.0038700103759765625, -0.003536224365234375, -0.0032024383544921875, -0.00286865234375, -0.0025348663330078125, -0.002201080322265625, -0.0018672943115234375, -0.00153350830078125, -0.0011997222900390625, -0.000865936279296875, -0.0005321502685546875, -0.0001983642578125, 0.0001354217529296875, 0.000469207763671875, 0.0008029937744140625, 0.00113677978515625, 0.0014705657958984375, 0.001804351806640625, 0.0021381378173828125, 0.002471923828125, 0.0028057098388671875, 0.003139495849609375, 0.0034732818603515625, 0.00380706787109375, 0.0041408538818359375, 0.004474639892578125, 0.0048084259033203125, 0.0051422119140625, 0.0054759979248046875, 0.005809783935546875, 0.0061435699462890625, 0.00647735595703125, 0.0068111419677734375, 0.007144927978515625, 0.0074787139892578125, 0.0078125, 0.008146286010742188, 0.008480072021484375, 0.008813858032226562, 0.00914764404296875, 0.009481430053710938, 0.009815216064453125, 0.010149002075195312, 0.0104827880859375, 0.010816574096679688, 0.011150360107421875, 0.011484146118164062, 0.01181793212890625, 0.012151718139648438, 0.012485504150390625, 0.012819290161132812, 0.013153076171875, 0.013486862182617188, 0.013820648193359375, 0.014154434204101562, 0.01448822021484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 6.0, 11.0, 16.0, 14.0, 20.0, 226.0, 568.0, 59.0, 19.0, 10.0, 10.0, 13.0, 6.0, 5.0, 2.0, 0.0, 1.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007481575012207031, -0.0007112547755241394, -0.0006743520498275757, -0.000637449324131012, -0.0006005465984344482, -0.0005636438727378845, -0.0005267411470413208, -0.0004898384213447571, -0.00045293569564819336, -0.00041603296995162964, -0.0003791302442550659, -0.0003422275185585022, -0.0003053247928619385, -0.00026842206716537476, -0.00023151934146881104, -0.00019461661577224731, -0.0001577138900756836, -0.00012081116437911987, -8.390843868255615e-05, -4.700571298599243e-05, -1.0102987289428711e-05, 2.679973840713501e-05, 6.370246410369873e-05, 0.00010060518980026245, 0.00013750791549682617, 0.0001744106411933899, 0.0002113133668899536, 0.00024821609258651733, 0.00028511881828308105, 0.0003220215439796448, 0.0003589242696762085, 0.0003958269953727722, 0.00043272972106933594, 0.00046963244676589966, 0.0005065351724624634, 0.0005434378981590271, 0.0005803406238555908, 0.0006172433495521545, 0.0006541460752487183, 0.000691048800945282, 0.0007279515266418457, 0.0007648542523384094, 0.0008017569780349731, 0.0008386597037315369, 0.0008755624294281006, 0.0009124651551246643, 0.000949367880821228, 0.0009862706065177917, 0.0010231733322143555, 0.0010600760579109192, 0.001096978783607483, 0.0011338815093040466, 0.0011707842350006104, 0.001207686960697174, 0.0012445896863937378, 0.0012814924120903015, 0.0013183951377868652, 0.001355297863483429, 0.0013922005891799927, 0.0014291033148765564, 0.0014660060405731201, 0.0015029087662696838, 0.0015398114919662476, 0.0015767142176628113, 0.001613616943359375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 13.0, 21.0, 21.0, 38.0, 61.0, 85.0, 149.0, 213.0, 372.0, 714.0, 1346.0, 3537.0, 15813.0, 471391.0, 3659583.0, 31282.0, 5477.0, 1923.0, 901.0, 508.0, 273.0, 185.0, 112.0, 80.0, 52.0, 36.0, 31.0, 20.0, 13.0, 7.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0189666748046875, -0.018337488174438477, -0.017708301544189453, -0.01707911491394043, -0.016449928283691406, -0.015820741653442383, -0.01519155502319336, -0.014562368392944336, -0.013933181762695312, -0.013303995132446289, -0.012674808502197266, -0.012045621871948242, -0.011416435241699219, -0.010787248611450195, -0.010158061981201172, -0.009528875350952148, -0.008899688720703125, -0.008270502090454102, -0.007641315460205078, -0.007012128829956055, -0.006382942199707031, -0.005753755569458008, -0.005124568939208984, -0.004495382308959961, -0.0038661956787109375, -0.003237009048461914, -0.0026078224182128906, -0.001978635787963867, -0.0013494491577148438, -0.0007202625274658203, -9.107589721679688e-05, 0.0005381107330322266, 0.00116729736328125, 0.0017964839935302734, 0.002425670623779297, 0.0030548572540283203, 0.0036840438842773438, 0.004313230514526367, 0.004942417144775391, 0.005571603775024414, 0.0062007904052734375, 0.006829977035522461, 0.007459163665771484, 0.008088350296020508, 0.008717536926269531, 0.009346723556518555, 0.009975910186767578, 0.010605096817016602, 0.011234283447265625, 0.011863470077514648, 0.012492656707763672, 0.013121843338012695, 0.013751029968261719, 0.014380216598510742, 0.015009403228759766, 0.01563858985900879, 0.016267776489257812, 0.016896963119506836, 0.01752614974975586, 0.018155336380004883, 0.018784523010253906, 0.01941370964050293, 0.020042896270751953, 0.020672082901000977, 0.02130126953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 3.0, 5.0, 8.0, 12.0, 22.0, 28.0, 35.0, 51.0, 65.0, 102.0, 125.0, 188.0, 295.0, 483.0, 1230.0, 450.0, 296.0, 219.0, 122.0, 98.0, 57.0, 45.0, 28.0, 33.0, 11.0, 16.0, 13.0, 9.0, 4.0, 3.0, 4.0, 6.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016107559204101562, -0.0015519708395004272, -0.0014931857585906982, -0.0014344006776809692, -0.0013756155967712402, -0.0013168305158615112, -0.0012580454349517822, -0.0011992603540420532, -0.0011404752731323242, -0.0010816901922225952, -0.0010229051113128662, -0.0009641200304031372, -0.0009053349494934082, -0.0008465498685836792, -0.0007877647876739502, -0.0007289797067642212, -0.0006701946258544922, -0.0006114095449447632, -0.0005526244640350342, -0.0004938393831253052, -0.00043505430221557617, -0.00037626922130584717, -0.00031748414039611816, -0.00025869905948638916, -0.00019991397857666016, -0.00014112889766693115, -8.234381675720215e-05, -2.3558735847473145e-05, 3.522634506225586e-05, 9.401142597198486e-05, 0.00015279650688171387, 0.00021158158779144287, 0.0002703666687011719, 0.0003291517496109009, 0.0003879368305206299, 0.0004467219114303589, 0.0005055069923400879, 0.0005642920732498169, 0.0006230771541595459, 0.0006818622350692749, 0.0007406473159790039, 0.0007994323968887329, 0.0008582174777984619, 0.0009170025587081909, 0.0009757876396179199, 0.001034572720527649, 0.001093357801437378, 0.001152142882347107, 0.001210927963256836, 0.001269713044166565, 0.001328498125076294, 0.001387283205986023, 0.001446068286895752, 0.001504853367805481, 0.00156363844871521, 0.001622423529624939, 0.001681208610534668, 0.001739993691444397, 0.001798778772354126, 0.001857563853263855, 0.001916348934173584, 0.001975134015083313, 0.002033919095993042, 0.002092704176902771, 0.0021514892578125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 18.0, 41.0, 125.0, 410.0, 318.0, 64.0, 21.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02318253368139267, -0.02124577760696411, -0.019309021532535553, -0.017372265458106995, -0.015435507521033287, -0.013498751446604729, -0.01156199537217617, -0.009625238366425037, -0.007688482291996479, -0.005751725751906633, -0.0038149694446474314, -0.0018782131373882294, 5.854340270161629e-05, 0.001995299942791462, 0.00393205601722002, 0.005868813022971153, 0.007805569097399712, 0.00974232517182827, 0.011679082177579403, 0.013615838252007961, 0.015552595257759094, 0.017489351332187653, 0.01942610740661621, 0.02136286348104477, 0.023299619555473328, 0.025236375629901886, 0.027173131704330444, 0.029109887778759003, 0.03104664571583271, 0.03298339992761612, 0.03492015600204468, 0.036856915801763535, 0.03879367187619209, 0.04073042795062065, 0.04266718402504921, 0.04460394009947777, 0.046540696173906326, 0.04847745597362518, 0.05041421204805374, 0.0523509681224823, 0.05428772419691086, 0.056224480271339417, 0.058161236345767975, 0.06009799242019653, 0.06203474849462509, 0.06397150456905365, 0.06590826064348221, 0.06784501671791077, 0.06978177279233932, 0.07171852886676788, 0.07365528494119644, 0.075592041015625, 0.07752879709005356, 0.07946555316448212, 0.08140230923891068, 0.08333906531333923, 0.08527582883834839, 0.08721258491277695, 0.0891493409872055, 0.09108609706163406, 0.09302285313606262, 0.09495960921049118, 0.09689636528491974, 0.0988331213593483, 0.10076987743377686]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 9.0, 7.0, 11.0, 9.0, 12.0, 12.0, 26.0, 26.0, 27.0, 25.0, 34.0, 33.0, 49.0, 40.0, 40.0, 67.0, 50.0, 50.0, 40.0, 60.0, 35.0, 38.0, 37.0, 32.0, 34.0, 38.0, 31.0, 27.0, 12.0, 14.0, 14.0, 16.0, 15.0, 12.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.008158683776855469, -0.007928579114377499, -0.0076984744518995285, -0.007468369789421558, -0.007238265126943588, -0.007008160464465618, -0.006778055801987648, -0.006547951139509678, -0.006317846477031708, -0.006087741814553738, -0.0058576371520757675, -0.005627532489597797, -0.005397427827119827, -0.005167323164641857, -0.004937218502163887, -0.004707113839685917, -0.004477009177207947, -0.004246904514729977, -0.0040167998522520065, -0.0037866951897740364, -0.0035565905272960663, -0.003326485864818096, -0.003096381202340126, -0.002866276539862156, -0.002636171877384186, -0.0024060672149062157, -0.0021759625524282455, -0.0019458578899502754, -0.0017157532274723053, -0.0014856485649943352, -0.001255543902516365, -0.001025439240038395, -0.0007953345775604248, -0.0005652299150824547, -0.00033512525260448456, -0.00010502059012651443, 0.0001250840723514557, 0.0003551887348294258, 0.0005852933973073959, 0.0008153980597853661, 0.0010455027222633362, 0.0012756073847413063, 0.0015057120472192764, 0.0017358167096972466, 0.0019659213721752167, 0.002196026034653187, 0.002426130697131157, 0.002656235359609127, 0.002886340022087097, 0.0031164446845650673, 0.0033465493470430374, 0.0035766540095210075, 0.0038067586719989777, 0.004036863334476948, 0.004266967996954918, 0.004497072659432888, 0.004727177321910858, 0.004957281984388828, 0.005187386646866798, 0.0054174913093447685, 0.005647595971822739, 0.005877700634300709, 0.006107805296778679, 0.006337909959256649, 0.006568014621734619]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 13.0, 13.0, 11.0, 15.0, 28.0, 30.0, 42.0, 66.0, 112.0, 176.0, 241.0, 355.0, 676.0, 1294.0, 2505.0, 5751.0, 17121.0, 304133.0, 683418.0, 20236.0, 6301.0, 2701.0, 1404.0, 727.0, 379.0, 249.0, 162.0, 121.0, 79.0, 58.0, 39.0, 21.0, 20.0, 11.0, 12.0, 7.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01117706298828125, -0.010817170143127441, -0.010457277297973633, -0.010097384452819824, -0.009737491607666016, -0.009377598762512207, -0.009017705917358398, -0.00865781307220459, -0.008297920227050781, -0.007938027381896973, -0.007578134536743164, -0.0072182416915893555, -0.006858348846435547, -0.006498456001281738, -0.00613856315612793, -0.005778670310974121, -0.0054187774658203125, -0.005058884620666504, -0.004698991775512695, -0.004339098930358887, -0.003979206085205078, -0.0036193132400512695, -0.003259420394897461, -0.0028995275497436523, -0.0025396347045898438, -0.002179741859436035, -0.0018198490142822266, -0.001459956169128418, -0.0011000633239746094, -0.0007401704788208008, -0.0003802776336669922, -2.0384788513183594e-05, 0.000339508056640625, 0.0006994009017944336, 0.0010592937469482422, 0.0014191865921020508, 0.0017790794372558594, 0.002138972282409668, 0.0024988651275634766, 0.002858757972717285, 0.0032186508178710938, 0.0035785436630249023, 0.003938436508178711, 0.0042983293533325195, 0.004658222198486328, 0.005018115043640137, 0.005378007888793945, 0.005737900733947754, 0.0060977935791015625, 0.006457686424255371, 0.00681757926940918, 0.007177472114562988, 0.007537364959716797, 0.007897257804870605, 0.008257150650024414, 0.008617043495178223, 0.008976936340332031, 0.00933682918548584, 0.009696722030639648, 0.010056614875793457, 0.010416507720947266, 0.010776400566101074, 0.011136293411254883, 0.011496186256408691, 0.0118560791015625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 5.0, 6.0, 7.0, 12.0, 5.0, 16.0, 16.0, 54.0, 179.0, 371.0, 209.0, 55.0, 17.0, 7.0, 10.0, 5.0, 5.0, 4.0, 4.0, 0.0, 4.0, 1.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007610321044921875, -0.0007322728633880615, -0.0007035136222839355, -0.0006747543811798096, -0.0006459951400756836, -0.0006172358989715576, -0.0005884766578674316, -0.0005597174167633057, -0.0005309581756591797, -0.0005021989345550537, -0.00047343969345092773, -0.00044468045234680176, -0.0004159212112426758, -0.0003871619701385498, -0.00035840272903442383, -0.00032964348793029785, -0.0003008842468261719, -0.0002721250057220459, -0.00024336576461791992, -0.00021460652351379395, -0.00018584728240966797, -0.000157088041305542, -0.00012832880020141602, -9.956955909729004e-05, -7.081031799316406e-05, -4.2051076889038086e-05, -1.329183578491211e-05, 1.5467405319213867e-05, 4.4226646423339844e-05, 7.298588752746582e-05, 0.0001017451286315918, 0.00013050436973571777, 0.00015926361083984375, 0.00018802285194396973, 0.0002167820930480957, 0.0002455413341522217, 0.00027430057525634766, 0.00030305981636047363, 0.0003318190574645996, 0.0003605782985687256, 0.00038933753967285156, 0.00041809678077697754, 0.0004468560218811035, 0.0004756152629852295, 0.0005043745040893555, 0.0005331337451934814, 0.0005618929862976074, 0.0005906522274017334, 0.0006194114685058594, 0.0006481707096099854, 0.0006769299507141113, 0.0007056891918182373, 0.0007344484329223633, 0.0007632076740264893, 0.0007919669151306152, 0.0008207261562347412, 0.0008494853973388672, 0.0008782446384429932, 0.0009070038795471191, 0.0009357631206512451, 0.0009645223617553711, 0.000993281602859497, 0.001022040843963623, 0.001050800085067749, 0.001079559326171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 6.0, 6.0, 8.0, 8.0, 9.0, 15.0, 12.0, 21.0, 26.0, 36.0, 49.0, 66.0, 86.0, 120.0, 162.0, 248.0, 377.0, 654.0, 1067.0, 2179.0, 4622.0, 12509.0, 52500.0, 704399.0, 226113.0, 27729.0, 8157.0, 3332.0, 1578.0, 865.0, 510.0, 344.0, 200.0, 114.0, 91.0, 76.0, 59.0, 39.0, 49.0, 30.0, 15.0, 20.0, 11.0, 6.0, 8.0, 7.0, 9.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.01000213623046875, -0.009706258773803711, -0.009410381317138672, -0.009114503860473633, -0.008818626403808594, -0.008522748947143555, -0.008226871490478516, -0.007930994033813477, -0.0076351165771484375, -0.0073392391204833984, -0.007043361663818359, -0.00674748420715332, -0.006451606750488281, -0.006155729293823242, -0.005859851837158203, -0.005563974380493164, -0.005268096923828125, -0.004972219467163086, -0.004676342010498047, -0.004380464553833008, -0.004084587097167969, -0.0037887096405029297, -0.0034928321838378906, -0.0031969547271728516, -0.0029010772705078125, -0.0026051998138427734, -0.0023093223571777344, -0.0020134449005126953, -0.0017175674438476562, -0.0014216899871826172, -0.0011258125305175781, -0.0008299350738525391, -0.0005340576171875, -0.00023818016052246094, 5.7697296142578125e-05, 0.0003535747528076172, 0.0006494522094726562, 0.0009453296661376953, 0.0012412071228027344, 0.0015370845794677734, 0.0018329620361328125, 0.0021288394927978516, 0.0024247169494628906, 0.0027205944061279297, 0.0030164718627929688, 0.003312349319458008, 0.003608226776123047, 0.003904104232788086, 0.004199981689453125, 0.004495859146118164, 0.004791736602783203, 0.005087614059448242, 0.005383491516113281, 0.00567936897277832, 0.005975246429443359, 0.0062711238861083984, 0.0065670013427734375, 0.0068628787994384766, 0.007158756256103516, 0.007454633712768555, 0.007750511169433594, 0.008046388626098633, 0.008342266082763672, 0.008638143539428711, 0.00893402099609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 10.0, 10.0, 11.0, 14.0, 10.0, 8.0, 10.0, 23.0, 20.0, 12.0, 25.0, 25.0, 33.0, 28.0, 34.0, 32.0, 39.0, 37.0, 38.0, 42.0, 42.0, 40.0, 35.0, 33.0, 49.0, 38.0, 43.0, 35.0, 39.0, 20.0, 17.0, 21.0, 17.0, 22.0, 16.0, 5.0, 15.0, 10.0, 11.0, 12.0, 3.0, 5.0, 4.0, 1.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002674102783203125, -0.002594888210296631, -0.0025156736373901367, -0.0024364590644836426, -0.0023572444915771484, -0.0022780299186706543, -0.00219881534576416, -0.002119600772857666, -0.002040386199951172, -0.0019611716270446777, -0.0018819570541381836, -0.0018027424812316895, -0.0017235279083251953, -0.0016443133354187012, -0.001565098762512207, -0.0014858841896057129, -0.0014066696166992188, -0.0013274550437927246, -0.0012482404708862305, -0.0011690258979797363, -0.0010898113250732422, -0.001010596752166748, -0.0009313821792602539, -0.0008521676063537598, -0.0007729530334472656, -0.0006937384605407715, -0.0006145238876342773, -0.0005353093147277832, -0.00045609474182128906, -0.0003768801689147949, -0.0002976655960083008, -0.00021845102310180664, -0.0001392364501953125, -6.002187728881836e-05, 1.919269561767578e-05, 9.840726852416992e-05, 0.00017762184143066406, 0.0002568364143371582, 0.00033605098724365234, 0.0004152655601501465, 0.0004944801330566406, 0.0005736947059631348, 0.0006529092788696289, 0.000732123851776123, 0.0008113384246826172, 0.0008905529975891113, 0.0009697675704956055, 0.0010489821434020996, 0.0011281967163085938, 0.0012074112892150879, 0.001286625862121582, 0.0013658404350280762, 0.0014450550079345703, 0.0015242695808410645, 0.0016034841537475586, 0.0016826987266540527, 0.0017619132995605469, 0.001841127872467041, 0.0019203424453735352, 0.0019995570182800293, 0.0020787715911865234, 0.0021579861640930176, 0.0022372007369995117, 0.002316415309906006, 0.0023956298828125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 6.0, 8.0, 12.0, 12.0, 18.0, 21.0, 50.0, 75.0, 187.0, 394.0, 1330.0, 6120.0, 598853.0, 433463.0, 5859.0, 1270.0, 438.0, 185.0, 84.0, 52.0, 27.0, 19.0, 16.0, 14.0, 9.0, 6.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05230712890625, -0.050768375396728516, -0.04922962188720703, -0.04769086837768555, -0.04615211486816406, -0.04461336135864258, -0.043074607849121094, -0.04153585433959961, -0.039997100830078125, -0.03845834732055664, -0.036919593811035156, -0.03538084030151367, -0.03384208679199219, -0.0323033332824707, -0.03076457977294922, -0.029225826263427734, -0.02768707275390625, -0.026148319244384766, -0.02460956573486328, -0.023070812225341797, -0.021532058715820312, -0.019993305206298828, -0.018454551696777344, -0.01691579818725586, -0.015377044677734375, -0.01383829116821289, -0.012299537658691406, -0.010760784149169922, -0.009222030639648438, -0.007683277130126953, -0.006144523620605469, -0.004605770111083984, -0.0030670166015625, -0.0015282630920410156, 1.049041748046875e-05, 0.0015492439270019531, 0.0030879974365234375, 0.004626750946044922, 0.006165504455566406, 0.007704257965087891, 0.009243011474609375, 0.01078176498413086, 0.012320518493652344, 0.013859272003173828, 0.015398025512695312, 0.016936779022216797, 0.01847553253173828, 0.020014286041259766, 0.02155303955078125, 0.023091793060302734, 0.02463054656982422, 0.026169300079345703, 0.027708053588867188, 0.029246807098388672, 0.030785560607910156, 0.03232431411743164, 0.033863067626953125, 0.03540182113647461, 0.036940574645996094, 0.03847932815551758, 0.04001808166503906, 0.04155683517456055, 0.04309558868408203, 0.044634342193603516, 0.046173095703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 4.0, 10.0, 6.0, 16.0, 5.0, 11.0, 21.0, 17.0, 25.0, 28.0, 36.0, 45.0, 41.0, 59.0, 154.0, 182.0, 79.0, 47.0, 35.0, 30.0, 25.0, 18.0, 19.0, 17.0, 11.0, 12.0, 3.0, 3.0, 11.0, 4.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0037822723388671875, -0.0036475956439971924, -0.0035129189491271973, -0.003378242254257202, -0.003243565559387207, -0.003108888864517212, -0.002974212169647217, -0.0028395354747772217, -0.0027048587799072266, -0.0025701820850372314, -0.0024355053901672363, -0.002300828695297241, -0.002166152000427246, -0.002031475305557251, -0.0018967986106872559, -0.0017621219158172607, -0.0016274452209472656, -0.0014927685260772705, -0.0013580918312072754, -0.0012234151363372803, -0.0010887384414672852, -0.00095406174659729, -0.0008193850517272949, -0.0006847083568572998, -0.0005500316619873047, -0.00041535496711730957, -0.00028067827224731445, -0.00014600157737731934, -1.1324882507324219e-05, 0.0001233518123626709, 0.000258028507232666, 0.00039270520210266113, 0.0005273818969726562, 0.0006620585918426514, 0.0007967352867126465, 0.0009314119815826416, 0.0010660886764526367, 0.0012007653713226318, 0.001335442066192627, 0.001470118761062622, 0.0016047954559326172, 0.0017394721508026123, 0.0018741488456726074, 0.0020088255405426025, 0.0021435022354125977, 0.0022781789302825928, 0.002412855625152588, 0.002547532320022583, 0.002682209014892578, 0.0028168857097625732, 0.0029515624046325684, 0.0030862390995025635, 0.0032209157943725586, 0.0033555924892425537, 0.003490269184112549, 0.003624945878982544, 0.003759622573852539, 0.003894299268722534, 0.004028975963592529, 0.004163652658462524, 0.0042983293533325195, 0.004433006048202515, 0.00456768274307251, 0.004702359437942505, 0.0048370361328125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 12.0, 12.0, 18.0, 23.0, 27.0, 49.0, 75.0, 136.0, 204.0, 412.0, 766.0, 1887.0, 5971.0, 55001.0, 956486.0, 20721.0, 3962.0, 1345.0, 617.0, 312.0, 194.0, 103.0, 81.0, 49.0, 26.0, 16.0, 17.0, 8.0, 6.0, 0.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.041534423828125, -0.04042196273803711, -0.03930950164794922, -0.03819704055786133, -0.03708457946777344, -0.03597211837768555, -0.034859657287597656, -0.033747196197509766, -0.032634735107421875, -0.031522274017333984, -0.030409812927246094, -0.029297351837158203, -0.028184890747070312, -0.027072429656982422, -0.02595996856689453, -0.02484750747680664, -0.02373504638671875, -0.02262258529663086, -0.02151012420654297, -0.020397663116455078, -0.019285202026367188, -0.018172740936279297, -0.017060279846191406, -0.015947818756103516, -0.014835357666015625, -0.013722896575927734, -0.012610435485839844, -0.011497974395751953, -0.010385513305664062, -0.009273052215576172, -0.008160591125488281, -0.007048130035400391, -0.0059356689453125, -0.004823207855224609, -0.0037107467651367188, -0.002598285675048828, -0.0014858245849609375, -0.0003733634948730469, 0.0007390975952148438, 0.0018515586853027344, 0.002964019775390625, 0.004076480865478516, 0.005188941955566406, 0.006301403045654297, 0.0074138641357421875, 0.008526325225830078, 0.009638786315917969, 0.01075124740600586, 0.01186370849609375, 0.01297616958618164, 0.014088630676269531, 0.015201091766357422, 0.016313552856445312, 0.017426013946533203, 0.018538475036621094, 0.019650936126708984, 0.020763397216796875, 0.021875858306884766, 0.022988319396972656, 0.024100780487060547, 0.025213241577148438, 0.026325702667236328, 0.02743816375732422, 0.02855062484741211, 0.0296630859375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 10.0, 5.0, 13.0, 15.0, 19.0, 17.0, 27.0, 44.0, 44.0, 65.0, 89.0, 124.0, 147.0, 89.0, 68.0, 39.0, 44.0, 29.0, 23.0, 25.0, 12.0, 11.0, 12.0, 7.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0080413818359375, -0.007818937301635742, -0.007596492767333984, -0.0073740482330322266, -0.007151603698730469, -0.006929159164428711, -0.006706714630126953, -0.006484270095825195, -0.0062618255615234375, -0.00603938102722168, -0.005816936492919922, -0.005594491958618164, -0.005372047424316406, -0.0051496028900146484, -0.004927158355712891, -0.004704713821411133, -0.004482269287109375, -0.004259824752807617, -0.004037380218505859, -0.0038149356842041016, -0.0035924911499023438, -0.003370046615600586, -0.003147602081298828, -0.0029251575469970703, -0.0027027130126953125, -0.0024802684783935547, -0.002257823944091797, -0.002035379409790039, -0.0018129348754882812, -0.0015904903411865234, -0.0013680458068847656, -0.0011456012725830078, -0.00092315673828125, -0.0007007122039794922, -0.0004782676696777344, -0.00025582313537597656, -3.337860107421875e-05, 0.00018906593322753906, 0.0004115104675292969, 0.0006339550018310547, 0.0008563995361328125, 0.0010788440704345703, 0.0013012886047363281, 0.001523733139038086, 0.0017461776733398438, 0.0019686222076416016, 0.0021910667419433594, 0.002413511276245117, 0.002635955810546875, 0.002858400344848633, 0.0030808448791503906, 0.0033032894134521484, 0.0035257339477539062, 0.003748178482055664, 0.003970623016357422, 0.00419306755065918, 0.0044155120849609375, 0.004637956619262695, 0.004860401153564453, 0.005082845687866211, 0.005305290222167969, 0.0055277347564697266, 0.005750179290771484, 0.005972623825073242, 0.006195068359375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 12.0, 13.0, 39.0, 118.0, 458.0, 262.0, 56.0, 20.0, 10.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.13949346542358398, -0.1338934451341629, -0.12829343974590302, -0.12269341945648193, -0.11709341406822205, -0.11149339377880096, -0.10589338093996048, -0.10029336810112, -0.09469335526227951, -0.08909334242343903, -0.08349332958459854, -0.07789331674575806, -0.07229329645633698, -0.06669329106807709, -0.061093270778656006, -0.05549325793981552, -0.04989324510097504, -0.04429323226213455, -0.03869321942329407, -0.033093202859163284, -0.0274931900203228, -0.021893177181482315, -0.016293160617351532, -0.010693147778511047, -0.005093134939670563, 0.0005068788304924965, 0.006106892600655556, 0.01170690730214119, 0.017306920140981674, 0.02290693297982216, 0.028506949543952942, 0.034106962382793427, 0.039706990122795105, 0.04530700296163559, 0.050907015800476074, 0.05650703236460686, 0.06210704520344734, 0.06770706176757812, 0.07330707460641861, 0.0789070874452591, 0.08450710028409958, 0.09010711312294006, 0.09570712596178055, 0.10130713880062103, 0.10690715909004211, 0.112507164478302, 0.11810718476772308, 0.12370719760656357, 0.12930721044540405, 0.13490723073482513, 0.14050723612308502, 0.1461072564125061, 0.151707261800766, 0.15730728209018707, 0.16290730237960815, 0.16850730776786804, 0.17410731315612793, 0.179707333445549, 0.1853073388338089, 0.19090735912322998, 0.19650736451148987, 0.20210738480091095, 0.20770740509033203, 0.21330741047859192, 0.218907430768013]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 7.0, 6.0, 8.0, 9.0, 7.0, 15.0, 24.0, 36.0, 51.0, 74.0, 85.0, 110.0, 106.0, 116.0, 94.0, 66.0, 52.0, 49.0, 29.0, 20.0, 15.0, 5.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07804703712463379, -0.07602675259113312, -0.07400646060705185, -0.07198617607355118, -0.06996588408946991, -0.06794559955596924, -0.06592531502246857, -0.0639050230383873, -0.06188473850488663, -0.05986445024609566, -0.05784416198730469, -0.055823877453804016, -0.053803589195013046, -0.051783300936222076, -0.049763016402721405, -0.047742728143930435, -0.045722439885139465, -0.043702151626348495, -0.041681863367557526, -0.039661578834056854, -0.037641290575265884, -0.035621002316474915, -0.03360071778297424, -0.03158042952418327, -0.029560141265392303, -0.027539853006601334, -0.025519566610455513, -0.023499280214309692, -0.021478991955518723, -0.019458703696727753, -0.017438417300581932, -0.015418129973113537, -0.013397842645645142, -0.011377555318176746, -0.009357267990708351, -0.007336980663239956, -0.005316693335771561, -0.0032964060083031654, -0.0012761186808347702, 0.000744168646633625, 0.0027644559741020203, 0.0047847433015704155, 0.006805030629038811, 0.008825317956507206, 0.010845605283975601, 0.012865892611443996, 0.014886179938912392, 0.016906466335058212, 0.018926754593849182, 0.020947042852640152, 0.022967329248785973, 0.024987615644931793, 0.027007903903722763, 0.029028192162513733, 0.031048478558659554, 0.033068764954805374, 0.035089053213596344, 0.037109341472387314, 0.039129629731178284, 0.041149914264678955, 0.043170202523469925, 0.045190490782260895, 0.047210775315761566, 0.049231063574552536, 0.051251351833343506]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 17.0, 26.0, 38.0, 87.0, 1411.0, 4188004.0, 4218.0, 289.0, 76.0, 40.0, 16.0, 12.0, 14.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.787109375, -0.7488250732421875, -0.710540771484375, -0.6722564697265625, -0.63397216796875, -0.5956878662109375, -0.557403564453125, -0.5191192626953125, -0.4808349609375, -0.4425506591796875, -0.404266357421875, -0.3659820556640625, -0.32769775390625, -0.2894134521484375, -0.251129150390625, -0.2128448486328125, -0.174560546875, -0.1362762451171875, -0.097991943359375, -0.0597076416015625, -0.02142333984375, 0.0168609619140625, 0.055145263671875, 0.0934295654296875, 0.1317138671875, 0.1699981689453125, 0.208282470703125, 0.2465667724609375, 0.28485107421875, 0.3231353759765625, 0.361419677734375, 0.3997039794921875, 0.43798828125, 0.4762725830078125, 0.514556884765625, 0.5528411865234375, 0.59112548828125, 0.6294097900390625, 0.667694091796875, 0.7059783935546875, 0.7442626953125, 0.7825469970703125, 0.820831298828125, 0.8591156005859375, 0.89739990234375, 0.9356842041015625, 0.973968505859375, 1.0122528076171875, 1.050537109375, 1.0888214111328125, 1.127105712890625, 1.1653900146484375, 1.20367431640625, 1.2419586181640625, 1.280242919921875, 1.3185272216796875, 1.3568115234375, 1.3950958251953125, 1.433380126953125, 1.4716644287109375, 1.50994873046875, 1.5482330322265625, 1.586517333984375, 1.6248016357421875, 1.6630859375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 6.0, 4.0, 7.0, 4.0, 5.0, 14.0, 16.0, 37.0, 117.0, 200.0, 262.0, 165.0, 77.0, 27.0, 20.0, 11.0, 7.0, 6.0, 5.0, 3.0, 1.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005469322204589844, -0.0005212798714637756, -0.0004956275224685669, -0.00046997517347335815, -0.0004443228244781494, -0.0004186704754829407, -0.00039301812648773193, -0.0003673657774925232, -0.00034171342849731445, -0.0003160610795021057, -0.00029040873050689697, -0.00026475638151168823, -0.0002391040325164795, -0.00021345168352127075, -0.000187799334526062, -0.00016214698553085327, -0.00013649463653564453, -0.00011084228754043579, -8.518993854522705e-05, -5.953758955001831e-05, -3.388524055480957e-05, -8.23289155960083e-06, 1.741945743560791e-05, 4.307180643081665e-05, 6.872415542602539e-05, 9.437650442123413e-05, 0.00012002885341644287, 0.0001456812024116516, 0.00017133355140686035, 0.0001969859004020691, 0.00022263824939727783, 0.00024829059839248657, 0.0002739429473876953, 0.00029959529638290405, 0.0003252476453781128, 0.00035089999437332153, 0.0003765523433685303, 0.000402204692363739, 0.00042785704135894775, 0.0004535093903541565, 0.00047916173934936523, 0.000504814088344574, 0.0005304664373397827, 0.0005561187863349915, 0.0005817711353302002, 0.0006074234843254089, 0.0006330758333206177, 0.0006587281823158264, 0.0006843805313110352, 0.0007100328803062439, 0.0007356852293014526, 0.0007613375782966614, 0.0007869899272918701, 0.0008126422762870789, 0.0008382946252822876, 0.0008639469742774963, 0.0008895993232727051, 0.0009152516722679138, 0.0009409040212631226, 0.0009665563702583313, 0.00099220871925354, 0.0010178610682487488, 0.0010435134172439575, 0.0010691657662391663, 0.001094818115234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 15.0, 21.0, 39.0, 98.0, 179.0, 329.0, 622.0, 4161432.0, 31236.0, 224.0, 60.0, 20.0, 8.0, 1.0], "bins": [-1.0810546875, -1.062387466430664, -1.0437202453613281, -1.0250530242919922, -1.0063858032226562, -0.9877185821533203, -0.9690513610839844, -0.9503841400146484, -0.9317169189453125, -0.9130496978759766, -0.8943824768066406, -0.8757152557373047, -0.8570480346679688, -0.8383808135986328, -0.8197135925292969, -0.8010463714599609, -0.782379150390625, -0.7637119293212891, -0.7450447082519531, -0.7263774871826172, -0.7077102661132812, -0.6890430450439453, -0.6703758239746094, -0.6517086029052734, -0.6330413818359375, -0.6143741607666016, -0.5957069396972656, -0.5770397186279297, -0.5583724975585938, -0.5397052764892578, -0.5210380554199219, -0.5023708343505859, -0.48370361328125, -0.46503639221191406, -0.4463691711425781, -0.4277019500732422, -0.40903472900390625, -0.3903675079345703, -0.3717002868652344, -0.35303306579589844, -0.3343658447265625, -0.31569862365722656, -0.2970314025878906, -0.2783641815185547, -0.25969696044921875, -0.2410297393798828, -0.22236251831054688, -0.20369529724121094, -0.185028076171875, -0.16636085510253906, -0.14769363403320312, -0.1290264129638672, -0.11035919189453125, -0.09169197082519531, -0.07302474975585938, -0.05435752868652344, -0.0356903076171875, -0.017023086547851562, 0.001644134521484375, 0.020311355590820312, 0.03897857666015625, 0.05764579772949219, 0.07631301879882812, 0.09498023986816406, 0.1136474609375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 8.0, 3.0, 17.0, 19.0, 45.0, 86.0, 141.0, 219.0, 355.0, 595.0, 1895.0, 460.0, 151.0, 56.0, 25.0, 8.0, 2.0], "bins": [-0.0079345703125, -0.00779646635055542, -0.00765836238861084, -0.00752025842666626, -0.00738215446472168, -0.0072440505027771, -0.0071059465408325195, -0.0069678425788879395, -0.006829738616943359, -0.006691634654998779, -0.006553530693054199, -0.006415426731109619, -0.006277322769165039, -0.006139218807220459, -0.006001114845275879, -0.005863010883331299, -0.005724906921386719, -0.005586802959442139, -0.005448698997497559, -0.0053105950355529785, -0.0051724910736083984, -0.005034387111663818, -0.004896283149719238, -0.004758179187774658, -0.004620075225830078, -0.004481971263885498, -0.004343867301940918, -0.004205763339996338, -0.004067659378051758, -0.003929555416107178, -0.0037914514541625977, -0.0036533474922180176, -0.0035152435302734375, -0.0033771395683288574, -0.0032390356063842773, -0.0031009316444396973, -0.002962827682495117, -0.002824723720550537, -0.002686619758605957, -0.002548515796661377, -0.002410411834716797, -0.002272307872772217, -0.0021342039108276367, -0.0019960999488830566, -0.0018579959869384766, -0.0017198920249938965, -0.0015817880630493164, -0.0014436841011047363, -0.0013055801391601562, -0.0011674761772155762, -0.001029372215270996, -0.000891268253326416, -0.0007531642913818359, -0.0006150603294372559, -0.0004769563674926758, -0.0003388524055480957, -0.00020074844360351562, -6.264448165893555e-05, 7.545948028564453e-05, 0.0002135634422302246, 0.0003516674041748047, 0.0004897713661193848, 0.0006278753280639648, 0.0007659792900085449, 0.000904083251953125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 17.0, 918.0, 85.0], "bins": [-4.433717727661133, -4.363304615020752, -4.292891502380371, -4.22247838973999, -4.152065753936768, -4.081652641296387, -4.011239528656006, -3.940826416015625, -3.870413303375244, -3.8000001907348633, -3.7295873165130615, -3.6591742038726807, -3.5887610912323, -3.518348217010498, -3.447935104370117, -3.3775219917297363, -3.3071091175079346, -3.2366960048675537, -3.166283130645752, -3.095870018005371, -3.0254569053649902, -2.9550437927246094, -2.8846309185028076, -2.8142178058624268, -2.743804931640625, -2.673391819000244, -2.6029789447784424, -2.5325658321380615, -2.4621527194976807, -2.391739845275879, -2.321326732635498, -2.250913619995117, -2.1805005073547363, -2.1100873947143555, -2.0396745204925537, -1.9692614078521729, -1.898848295211792, -1.8284353017807007, -1.7580223083496094, -1.6876091957092285, -1.6171960830688477, -1.5467830896377563, -1.4763699769973755, -1.4059569835662842, -1.3355438709259033, -1.265130877494812, -1.1947178840637207, -1.1243047714233398, -1.0538917779922485, -0.9834787249565125, -0.9130656719207764, -0.8426526784896851, -0.772239625453949, -0.7018265724182129, -0.6314135789871216, -0.5610005259513855, -0.4905874729156494, -0.42017441987991333, -0.34976139664649963, -0.27934837341308594, -0.20893532037734985, -0.13852226734161377, -0.06810924410820007, 0.002303779125213623, 0.07271682471036911]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 11.0, 23.0, 29.0, 75.0, 120.0, 156.0, 188.0, 140.0, 113.0, 64.0, 44.0, 20.0, 13.0, 6.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.27601486444473267, -0.270718514919281, -0.26542216539382935, -0.2601258456707001, -0.2548294961452484, -0.24953314661979675, -0.2442367970943451, -0.23894046247005463, -0.23364412784576416, -0.2283477783203125, -0.22305144369602203, -0.21775509417057037, -0.2124587595462799, -0.20716241002082825, -0.2018660604953766, -0.19656972587108612, -0.19127337634563446, -0.1859770268201828, -0.18068069219589233, -0.17538434267044067, -0.1700880080461502, -0.16479165852069855, -0.15949532389640808, -0.15419897437095642, -0.14890262484550476, -0.1436062753200531, -0.13830994069576263, -0.13301359117031097, -0.1277172565460205, -0.12242090702056885, -0.11712456494569778, -0.11182822287082672, -0.10653188824653625, -0.10123554617166519, -0.09593920409679413, -0.09064285457134247, -0.085346519947052, -0.08005017042160034, -0.07475382834672928, -0.06945748627185822, -0.06416114419698715, -0.05886480212211609, -0.053568460047245026, -0.048272114247083664, -0.0429757721722126, -0.03767943009734154, -0.032383084297180176, -0.027086742222309113, -0.02179040014743805, -0.016494058072566986, -0.011197714135050774, -0.005901370197534561, -0.0006050281226634979, 0.004691313952207565, 0.009987659752368927, 0.01528400182723999, 0.020580343902111053, 0.025876685976982117, 0.03117302991449833, 0.03646937385201454, 0.041765715926885605, 0.04706205800175667, 0.05235840380191803, 0.05765474587678909, 0.06295108795166016]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 6.0, 7.0, 10.0, 4.0, 11.0, 14.0, 12.0, 11.0, 16.0, 20.0, 27.0, 27.0, 25.0, 28.0, 48.0, 89.0, 278.0, 863.0, 3254.0, 18588.0, 911099.0, 104441.0, 7107.0, 1676.0, 444.0, 146.0, 62.0, 37.0, 30.0, 20.0, 26.0, 15.0, 19.0, 10.0, 8.0, 14.0, 13.0, 7.0, 3.0, 8.0, 6.0, 6.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.035888671875, -0.034758567810058594, -0.03362846374511719, -0.03249835968017578, -0.031368255615234375, -0.03023815155029297, -0.029108047485351562, -0.027977943420410156, -0.02684783935546875, -0.025717735290527344, -0.024587631225585938, -0.02345752716064453, -0.022327423095703125, -0.02119731903076172, -0.020067214965820312, -0.018937110900878906, -0.0178070068359375, -0.016676902770996094, -0.015546798706054688, -0.014416694641113281, -0.013286590576171875, -0.012156486511230469, -0.011026382446289062, -0.009896278381347656, -0.00876617431640625, -0.007636070251464844, -0.0065059661865234375, -0.005375862121582031, -0.004245758056640625, -0.0031156539916992188, -0.0019855499267578125, -0.0008554458618164062, 0.000274658203125, 0.0014047622680664062, 0.0025348663330078125, 0.0036649703979492188, 0.004795074462890625, 0.005925178527832031, 0.0070552825927734375, 0.008185386657714844, 0.00931549072265625, 0.010445594787597656, 0.011575698852539062, 0.012705802917480469, 0.013835906982421875, 0.014966011047363281, 0.016096115112304688, 0.017226219177246094, 0.0183563232421875, 0.019486427307128906, 0.020616531372070312, 0.02174663543701172, 0.022876739501953125, 0.02400684356689453, 0.025136947631835938, 0.026267051696777344, 0.02739715576171875, 0.028527259826660156, 0.029657363891601562, 0.03078746795654297, 0.031917572021484375, 0.03304767608642578, 0.03417778015136719, 0.035307884216308594, 0.03643798828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 10.0, 5.0, 13.0, 23.0, 85.0, 260.0, 309.0, 185.0, 63.0, 21.0, 8.0, 9.0, 5.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005478858947753906, -0.0005037412047386169, -0.00045959651470184326, -0.0004154518246650696, -0.0003713071346282959, -0.0003271624445915222, -0.00028301775455474854, -0.00023887306451797485, -0.00019472837448120117, -0.0001505836844444275, -0.00010643899440765381, -6.229430437088013e-05, -1.8149614334106445e-05, 2.5995075702667236e-05, 7.013976573944092e-05, 0.0001142844557762146, 0.00015842914581298828, 0.00020257383584976196, 0.00024671852588653564, 0.0002908632159233093, 0.000335007905960083, 0.0003791525959968567, 0.00042329728603363037, 0.00046744197607040405, 0.0005115866661071777, 0.0005557313561439514, 0.0005998760461807251, 0.0006440207362174988, 0.0006881654262542725, 0.0007323101162910461, 0.0007764548063278198, 0.0008205994963645935, 0.0008647441864013672, 0.0009088888764381409, 0.0009530335664749146, 0.0009971782565116882, 0.001041322946548462, 0.0010854676365852356, 0.0011296123266220093, 0.001173757016658783, 0.0012179017066955566, 0.0012620463967323303, 0.001306191086769104, 0.0013503357768058777, 0.0013944804668426514, 0.001438625156879425, 0.0014827698469161987, 0.0015269145369529724, 0.001571059226989746, 0.0016152039170265198, 0.0016593486070632935, 0.0017034932971000671, 0.0017476379871368408, 0.0017917826771736145, 0.0018359273672103882, 0.0018800720572471619, 0.0019242167472839355, 0.0019683614373207092, 0.002012506127357483, 0.0020566508173942566, 0.0021007955074310303, 0.002144940197467804, 0.0021890848875045776, 0.0022332295775413513, 0.002277374267578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 8.0, 4.0, 10.0, 13.0, 14.0, 16.0, 29.0, 21.0, 31.0, 27.0, 42.0, 53.0, 129.0, 818.0, 13902.0, 1013355.0, 18465.0, 1086.0, 192.0, 59.0, 54.0, 32.0, 28.0, 27.0, 29.0, 11.0, 12.0, 15.0, 9.0, 13.0, 7.0, 13.0, 9.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.04315185546875, -0.041864871978759766, -0.04057788848876953, -0.0392909049987793, -0.03800392150878906, -0.03671693801879883, -0.035429954528808594, -0.03414297103881836, -0.032855987548828125, -0.03156900405883789, -0.030282020568847656, -0.028995037078857422, -0.027708053588867188, -0.026421070098876953, -0.02513408660888672, -0.023847103118896484, -0.02256011962890625, -0.021273136138916016, -0.01998615264892578, -0.018699169158935547, -0.017412185668945312, -0.016125202178955078, -0.014838218688964844, -0.01355123519897461, -0.012264251708984375, -0.01097726821899414, -0.009690284729003906, -0.008403301239013672, -0.0071163177490234375, -0.005829334259033203, -0.004542350769042969, -0.0032553672790527344, -0.0019683837890625, -0.0006814002990722656, 0.0006055831909179688, 0.0018925666809082031, 0.0031795501708984375, 0.004466533660888672, 0.005753517150878906, 0.007040500640869141, 0.008327484130859375, 0.00961446762084961, 0.010901451110839844, 0.012188434600830078, 0.013475418090820312, 0.014762401580810547, 0.01604938507080078, 0.017336368560791016, 0.01862335205078125, 0.019910335540771484, 0.02119731903076172, 0.022484302520751953, 0.023771286010742188, 0.025058269500732422, 0.026345252990722656, 0.02763223648071289, 0.028919219970703125, 0.03020620346069336, 0.031493186950683594, 0.03278017044067383, 0.03406715393066406, 0.0353541374206543, 0.03664112091064453, 0.037928104400634766, 0.039215087890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 3.0, 6.0, 5.0, 8.0, 6.0, 15.0, 9.0, 17.0, 21.0, 22.0, 28.0, 24.0, 36.0, 41.0, 37.0, 29.0, 34.0, 49.0, 48.0, 44.0, 45.0, 50.0, 29.0, 44.0, 50.0, 44.0, 32.0, 32.0, 29.0, 22.0, 16.0, 20.0, 16.0, 18.0, 12.0, 18.0, 11.0, 6.0, 7.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00218963623046875, -0.0021223723888397217, -0.0020551085472106934, -0.001987844705581665, -0.0019205808639526367, -0.0018533170223236084, -0.00178605318069458, -0.0017187893390655518, -0.0016515254974365234, -0.0015842616558074951, -0.0015169978141784668, -0.0014497339725494385, -0.0013824701309204102, -0.0013152062892913818, -0.0012479424476623535, -0.0011806786060333252, -0.0011134147644042969, -0.0010461509227752686, -0.0009788870811462402, -0.0009116232395172119, -0.0008443593978881836, -0.0007770955562591553, -0.000709831714630127, -0.0006425678730010986, -0.0005753040313720703, -0.000508040189743042, -0.00044077634811401367, -0.00037351250648498535, -0.00030624866485595703, -0.0002389848232269287, -0.0001717209815979004, -0.00010445713996887207, -3.719329833984375e-05, 3.007054328918457e-05, 9.733438491821289e-05, 0.0001645982265472412, 0.00023186206817626953, 0.00029912590980529785, 0.00036638975143432617, 0.0004336535930633545, 0.0005009174346923828, 0.0005681812763214111, 0.0006354451179504395, 0.0007027089595794678, 0.0007699728012084961, 0.0008372366428375244, 0.0009045004844665527, 0.0009717643260955811, 0.0010390281677246094, 0.0011062920093536377, 0.001173555850982666, 0.0012408196926116943, 0.0013080835342407227, 0.001375347375869751, 0.0014426112174987793, 0.0015098750591278076, 0.001577138900756836, 0.0016444027423858643, 0.0017116665840148926, 0.001778930425643921, 0.0018461942672729492, 0.0019134581089019775, 0.001980721950531006, 0.002047985792160034, 0.0021152496337890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 20.0, 27.0, 139.0, 1358.0, 1040513.0, 6052.0, 331.0, 58.0, 18.0, 13.0, 3.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.54296875, -0.5302543640136719, -0.5175399780273438, -0.5048255920410156, -0.4921112060546875, -0.4793968200683594, -0.46668243408203125, -0.4539680480957031, -0.441253662109375, -0.4285392761230469, -0.41582489013671875, -0.4031105041503906, -0.3903961181640625, -0.3776817321777344, -0.36496734619140625, -0.3522529602050781, -0.33953857421875, -0.3268241882324219, -0.31410980224609375, -0.3013954162597656, -0.2886810302734375, -0.2759666442871094, -0.26325225830078125, -0.2505378723144531, -0.237823486328125, -0.22510910034179688, -0.21239471435546875, -0.19968032836914062, -0.1869659423828125, -0.17425155639648438, -0.16153717041015625, -0.14882278442382812, -0.1361083984375, -0.12339401245117188, -0.11067962646484375, -0.09796524047851562, -0.0852508544921875, -0.07253646850585938, -0.05982208251953125, -0.047107696533203125, -0.034393310546875, -0.021678924560546875, -0.00896453857421875, 0.003749847412109375, 0.0164642333984375, 0.029178619384765625, 0.04189300537109375, 0.054607391357421875, 0.06732177734375, 0.08003616333007812, 0.09275054931640625, 0.10546493530273438, 0.1181793212890625, 0.13089370727539062, 0.14360809326171875, 0.15632247924804688, 0.169036865234375, 0.18175125122070312, 0.19446563720703125, 0.20718002319335938, 0.2198944091796875, 0.23260879516601562, 0.24532318115234375, 0.2580375671386719, 0.270751953125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 15.0, 66.0, 147.0, 487.0, 170.0, 40.0, 22.0, 11.0, 6.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011577606201171875, -0.001113981008529663, -0.0010702013969421387, -0.0010264217853546143, -0.0009826421737670898, -0.0009388625621795654, -0.000895082950592041, -0.0008513033390045166, -0.0008075237274169922, -0.0007637441158294678, -0.0007199645042419434, -0.0006761848926544189, -0.0006324052810668945, -0.0005886256694793701, -0.0005448460578918457, -0.0005010664463043213, -0.0004572868347167969, -0.00041350722312927246, -0.00036972761154174805, -0.00032594799995422363, -0.0002821683883666992, -0.0002383887767791748, -0.0001946091651916504, -0.00015082955360412598, -0.00010704994201660156, -6.327033042907715e-05, -1.9490718841552734e-05, 2.428889274597168e-05, 6.80685043334961e-05, 0.00011184811592102051, 0.00015562772750854492, 0.00019940733909606934, 0.00024318695068359375, 0.00028696656227111816, 0.0003307461738586426, 0.000374525785446167, 0.0004183053970336914, 0.0004620850086212158, 0.0005058646202087402, 0.0005496442317962646, 0.0005934238433837891, 0.0006372034549713135, 0.0006809830665588379, 0.0007247626781463623, 0.0007685422897338867, 0.0008123219013214111, 0.0008561015129089355, 0.00089988112449646, 0.0009436607360839844, 0.0009874403476715088, 0.0010312199592590332, 0.0010749995708465576, 0.001118779182434082, 0.0011625587940216064, 0.0012063384056091309, 0.0012501180171966553, 0.0012938976287841797, 0.001337677240371704, 0.0013814568519592285, 0.001425236463546753, 0.0014690160751342773, 0.0015127956867218018, 0.0015565752983093262, 0.0016003549098968506, 0.001644134521484375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 2.0, 2.0, 3.0, 8.0, 6.0, 16.0, 45.0, 166.0, 1338.0, 230587.0, 814675.0, 1445.0, 186.0, 39.0, 15.0, 8.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1138916015625, -0.10933876037597656, -0.10478591918945312, -0.10023307800292969, -0.09568023681640625, -0.09112739562988281, -0.08657455444335938, -0.08202171325683594, -0.0774688720703125, -0.07291603088378906, -0.06836318969726562, -0.06381034851074219, -0.05925750732421875, -0.05470466613769531, -0.050151824951171875, -0.04559898376464844, -0.041046142578125, -0.03649330139160156, -0.031940460205078125, -0.027387619018554688, -0.02283477783203125, -0.018281936645507812, -0.013729095458984375, -0.009176254272460938, -0.0046234130859375, -7.05718994140625e-05, 0.004482269287109375, 0.009035110473632812, 0.01358795166015625, 0.018140792846679688, 0.022693634033203125, 0.027246475219726562, 0.03179931640625, 0.03635215759277344, 0.040904998779296875, 0.04545783996582031, 0.05001068115234375, 0.05456352233886719, 0.059116363525390625, 0.06366920471191406, 0.0682220458984375, 0.07277488708496094, 0.07732772827148438, 0.08188056945800781, 0.08643341064453125, 0.09098625183105469, 0.09553909301757812, 0.10009193420410156, 0.104644775390625, 0.10919761657714844, 0.11375045776367188, 0.11830329895019531, 0.12285614013671875, 0.1274089813232422, 0.13196182250976562, 0.13651466369628906, 0.1410675048828125, 0.14562034606933594, 0.15017318725585938, 0.1547260284423828, 0.15927886962890625, 0.1638317108154297, 0.16838455200195312, 0.17293739318847656, 0.177490234375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 13.0, 8.0, 11.0, 15.0, 19.0, 23.0, 28.0, 30.0, 89.0, 457.0, 145.0, 36.0, 26.0, 20.0, 24.0, 11.0, 5.0, 3.0, 5.0, 7.0, 0.0, 8.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01065826416015625, -0.010286092758178711, -0.009913921356201172, -0.009541749954223633, -0.009169578552246094, -0.008797407150268555, -0.008425235748291016, -0.008053064346313477, -0.0076808929443359375, -0.0073087215423583984, -0.006936550140380859, -0.00656437873840332, -0.006192207336425781, -0.005820035934448242, -0.005447864532470703, -0.005075693130493164, -0.004703521728515625, -0.004331350326538086, -0.003959178924560547, -0.003587007522583008, -0.0032148361206054688, -0.0028426647186279297, -0.0024704933166503906, -0.0020983219146728516, -0.0017261505126953125, -0.0013539791107177734, -0.0009818077087402344, -0.0006096363067626953, -0.00023746490478515625, 0.0001347064971923828, 0.0005068778991699219, 0.0008790493011474609, 0.001251220703125, 0.001623392105102539, 0.001995563507080078, 0.002367734909057617, 0.0027399063110351562, 0.0031120777130126953, 0.0034842491149902344, 0.0038564205169677734, 0.0042285919189453125, 0.0046007633209228516, 0.004972934722900391, 0.00534510612487793, 0.005717277526855469, 0.006089448928833008, 0.006461620330810547, 0.006833791732788086, 0.007205963134765625, 0.007578134536743164, 0.007950305938720703, 0.008322477340698242, 0.008694648742675781, 0.00906682014465332, 0.00943899154663086, 0.009811162948608398, 0.010183334350585938, 0.010555505752563477, 0.010927677154541016, 0.011299848556518555, 0.011672019958496094, 0.012044191360473633, 0.012416362762451172, 0.012788534164428711, 0.01316070556640625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 32.0, 721.0, 247.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5680237412452698, -0.5553622841835022, -0.5427008271217346, -0.530039370059967, -0.5173779129981995, -0.5047164559364319, -0.4920549988746643, -0.4793935716152191, -0.46673211455345154, -0.45407065749168396, -0.4414092004299164, -0.4287477433681488, -0.4160862863063812, -0.40342485904693604, -0.39076340198516846, -0.3781019449234009, -0.3654404878616333, -0.3527790307998657, -0.34011757373809814, -0.32745611667633057, -0.314794659614563, -0.3021332025527954, -0.28947174549102783, -0.27681031823158264, -0.2641488313674927, -0.2514873743057251, -0.23882591724395752, -0.22616446018218994, -0.21350301802158356, -0.20084156095981598, -0.1881801038980484, -0.17551866173744202, -0.16285720467567444, -0.15019574761390686, -0.13753429055213928, -0.1248728409409523, -0.11221139132976532, -0.09954993426799774, -0.08688847720623016, -0.07422702759504318, -0.061565570533275604, -0.048904117196798325, -0.036242663860321045, -0.023581206798553467, -0.010919753462076187, 0.0017416998744010925, 0.01440315693616867, 0.027064606547355652, 0.03972606360912323, 0.05238751694560051, 0.06504897028207779, 0.07771042734384537, 0.09037187695503235, 0.10303333401679993, 0.1156947910785675, 0.12835624814033508, 0.14101770520210266, 0.15367916226387024, 0.16634061932563782, 0.1790020763874054, 0.19166351854801178, 0.20432497560977936, 0.21698643267154694, 0.22964787483215332, 0.2423093318939209]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 8.0, 9.0, 13.0, 15.0, 16.0, 25.0, 26.0, 35.0, 39.0, 53.0, 51.0, 59.0, 72.0, 55.0, 61.0, 83.0, 60.0, 54.0, 52.0, 43.0, 37.0, 23.0, 26.0, 28.0, 12.0, 17.0, 3.0, 9.0, 8.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02806776762008667, -0.027309512719511986, -0.0265512578189373, -0.025793002918362617, -0.025034748017787933, -0.02427649311721325, -0.023518238216638565, -0.02275998331606388, -0.022001728415489197, -0.021243473514914513, -0.02048521861433983, -0.019726963713765144, -0.01896870881319046, -0.018210453912615776, -0.017452199012041092, -0.016693944111466408, -0.015935689210891724, -0.01517743431031704, -0.014419179409742355, -0.013660924509167671, -0.012902669608592987, -0.012144414708018303, -0.011386159807443619, -0.010627904906868935, -0.00986965000629425, -0.009111395105719566, -0.008353140205144882, -0.007594885304570198, -0.006836630403995514, -0.00607837550342083, -0.005320120602846146, -0.0045618657022714615, -0.0038036108016967773, -0.003045355901122093, -0.002287101000547409, -0.001528846099972725, -0.0007705911993980408, -1.2336298823356628e-05, 0.0007459186017513275, 0.0015041735023260117, 0.002262428402900696, 0.00302068330347538, 0.003778938204050064, 0.004537193104624748, 0.005295448005199432, 0.0060537029057741165, 0.006811957806348801, 0.007570212706923485, 0.008328467607498169, 0.009086722508072853, 0.009844977408647537, 0.010603232309222221, 0.011361487209796906, 0.01211974211037159, 0.012877997010946274, 0.013636251911520958, 0.014394506812095642, 0.015152761712670326, 0.01591101661324501, 0.016669271513819695, 0.01742752641439438, 0.018185781314969063, 0.018944036215543747, 0.01970229111611843, 0.020460546016693115]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 2.0, 10.0, 10.0, 14.0, 6.0, 10.0, 4.0, 14.0, 10.0, 12.0, 26.0, 40.0, 48.0, 86.0, 4188558.0, 5050.0, 174.0, 42.0, 16.0, 20.0, 10.0, 16.0, 20.0, 14.0, 10.0, 6.0, 0.0, 4.0, 4.0, 8.0, 2.0, 6.0, 8.0, 2.0, 6.0, 6.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.83203125, -0.8074722290039062, -0.7829132080078125, -0.7583541870117188, -0.733795166015625, -0.7092361450195312, -0.6846771240234375, -0.6601181030273438, -0.63555908203125, -0.6110000610351562, -0.5864410400390625, -0.5618820190429688, -0.537322998046875, -0.5127639770507812, -0.4882049560546875, -0.46364593505859375, -0.4390869140625, -0.41452789306640625, -0.3899688720703125, -0.36540985107421875, -0.340850830078125, -0.31629180908203125, -0.2917327880859375, -0.26717376708984375, -0.24261474609375, -0.21805572509765625, -0.1934967041015625, -0.16893768310546875, -0.144378662109375, -0.11981964111328125, -0.0952606201171875, -0.07070159912109375, -0.046142578125, -0.02158355712890625, 0.0029754638671875, 0.02753448486328125, 0.052093505859375, 0.07665252685546875, 0.1012115478515625, 0.12577056884765625, 0.15032958984375, 0.17488861083984375, 0.1994476318359375, 0.22400665283203125, 0.248565673828125, 0.27312469482421875, 0.2976837158203125, 0.32224273681640625, 0.3468017578125, 0.37136077880859375, 0.3959197998046875, 0.42047882080078125, 0.445037841796875, 0.46959686279296875, 0.4941558837890625, 0.5187149047851562, 0.54327392578125, 0.5678329467773438, 0.5923919677734375, 0.6169509887695312, 0.641510009765625, 0.6660690307617188, 0.6906280517578125, 0.7151870727539062, 0.73974609375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 8.0, 10.0, 10.0, 34.0, 104.0, 184.0, 254.0, 236.0, 102.0, 30.0, 21.0, 11.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004057884216308594, -0.00035259872674942017, -0.00029940903186798096, -0.00024621933698654175, -0.00019302964210510254, -0.00013983994722366333, -8.665025234222412e-05, -3.346055746078491e-05, 1.9729137420654297e-05, 7.29188323020935e-05, 0.00012610852718353271, 0.00017929822206497192, 0.00023248791694641113, 0.00028567761182785034, 0.00033886730670928955, 0.00039205700159072876, 0.00044524669647216797, 0.0004984363913536072, 0.0005516260862350464, 0.0006048157811164856, 0.0006580054759979248, 0.000711195170879364, 0.0007643848657608032, 0.0008175745606422424, 0.0008707642555236816, 0.0009239539504051208, 0.00097714364528656, 0.0010303333401679993, 0.0010835230350494385, 0.0011367127299308777, 0.001189902424812317, 0.001243092119693756, 0.0012962818145751953, 0.0013494715094566345, 0.0014026612043380737, 0.001455850899219513, 0.0015090405941009521, 0.0015622302889823914, 0.0016154199838638306, 0.0016686096787452698, 0.001721799373626709, 0.0017749890685081482, 0.0018281787633895874, 0.0018813684582710266, 0.0019345581531524658, 0.001987747848033905, 0.0020409375429153442, 0.0020941272377967834, 0.0021473169326782227, 0.002200506627559662, 0.002253696322441101, 0.0023068860173225403, 0.0023600757122039795, 0.0024132654070854187, 0.002466455101966858, 0.002519644796848297, 0.0025728344917297363, 0.0026260241866111755, 0.0026792138814926147, 0.002732403576374054, 0.002785593271255493, 0.0028387829661369324, 0.0028919726610183716, 0.002945162355899811, 0.00299835205078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 60.0, 556.0, 4192556.0, 955.0, 142.0, 19.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2099609375, -0.1637725830078125, -0.117584228515625, -0.0713958740234375, -0.02520751953125, 0.0209808349609375, 0.067169189453125, 0.1133575439453125, 0.1595458984375, 0.2057342529296875, 0.251922607421875, 0.2981109619140625, 0.34429931640625, 0.3904876708984375, 0.436676025390625, 0.4828643798828125, 0.529052734375, 0.5752410888671875, 0.621429443359375, 0.6676177978515625, 0.71380615234375, 0.7599945068359375, 0.806182861328125, 0.8523712158203125, 0.8985595703125, 0.9447479248046875, 0.990936279296875, 1.0371246337890625, 1.08331298828125, 1.1295013427734375, 1.175689697265625, 1.2218780517578125, 1.26806640625, 1.3142547607421875, 1.360443115234375, 1.4066314697265625, 1.45281982421875, 1.4990081787109375, 1.545196533203125, 1.5913848876953125, 1.6375732421875, 1.6837615966796875, 1.729949951171875, 1.7761383056640625, 1.82232666015625, 1.8685150146484375, 1.914703369140625, 1.9608917236328125, 2.007080078125, 2.0532684326171875, 2.099456787109375, 2.1456451416015625, 2.19183349609375, 2.2380218505859375, 2.284210205078125, 2.3303985595703125, 2.3765869140625, 2.4227752685546875, 2.468963623046875, 2.5151519775390625, 2.56134033203125, 2.6075286865234375, 2.653717041015625, 2.6999053955078125, 2.74609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 8.0, 46.0, 590.0, 3326.0, 104.0, 15.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0032711029052734375, -0.0027362406253814697, -0.002201378345489502, -0.0016665160655975342, -0.0011316537857055664, -0.0005967915058135986, -6.192922592163086e-05, 0.0004729330539703369, 0.0010077953338623047, 0.0015426576137542725, 0.0020775198936462402, 0.002612382173538208, 0.0031472444534301758, 0.0036821067333221436, 0.004216969013214111, 0.004751831293106079, 0.005286693572998047, 0.005821555852890015, 0.006356418132781982, 0.00689128041267395, 0.007426142692565918, 0.007961004972457886, 0.008495867252349854, 0.009030729532241821, 0.009565591812133789, 0.010100454092025757, 0.010635316371917725, 0.011170178651809692, 0.01170504093170166, 0.012239903211593628, 0.012774765491485596, 0.013309627771377563, 0.013844490051269531, 0.014379352331161499, 0.014914214611053467, 0.015449076890945435, 0.015983939170837402, 0.01651880145072937, 0.017053663730621338, 0.017588526010513306, 0.018123388290405273, 0.01865825057029724, 0.01919311285018921, 0.019727975130081177, 0.020262837409973145, 0.020797699689865112, 0.02133256196975708, 0.021867424249649048, 0.022402286529541016, 0.022937148809432983, 0.02347201108932495, 0.02400687336921692, 0.024541735649108887, 0.025076597929000854, 0.025611460208892822, 0.02614632248878479, 0.026681184768676758, 0.027216047048568726, 0.027750909328460693, 0.02828577160835266, 0.02882063388824463, 0.029355496168136597, 0.029890358448028564, 0.030425220727920532, 0.0309600830078125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [57.0, 962.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1321904957294464, -0.02535158395767212, 0.08148732781410217, 0.18832623958587646, 0.29516515135765076, 0.40200409293174744, 0.508842945098877, 0.6156818866729736, 0.7225208282470703, 0.829359769821167, 0.9361986517906189, 1.0430375337600708, 1.1498764753341675, 1.2567154169082642, 1.3635542392730713, 1.470393180847168, 1.5772321224212646, 1.6840710639953613, 1.790910005569458, 1.8977488279342651, 2.0045876502990723, 2.111426830291748, 2.2182655334472656, 2.3251044750213623, 2.431943416595459, 2.5387823581695557, 2.6456212997436523, 2.752460241317749, 2.8592991828918457, 2.9661378860473633, 3.07297682762146, 3.1798157691955566, 3.286654472351074, 3.393493413925171, 3.5003323554992676, 3.6071712970733643, 3.714010238647461, 3.8208489418029785, 3.927687883377075, 4.034526824951172, 4.141366004943848, 4.248204708099365, 4.355043888092041, 4.461882591247559, 4.568721771240234, 4.675560474395752, 4.782399654388428, 4.889238357543945, 4.996077060699463, 5.1029157638549805, 5.209754943847656, 5.316593647003174, 5.42343282699585, 5.530271530151367, 5.637110710144043, 5.7439494132995605, 5.850788116455078, 5.957626819610596, 6.0644659996032715, 6.171304702758789, 6.278143882751465, 6.384982585906982, 6.491821765899658, 6.598660469055176, 6.705499649047852]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 10.0, 29.0, 51.0, 127.0, 192.0, 262.0, 184.0, 94.0, 42.0, 14.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15993249416351318, -0.14729642868041992, -0.13466037809848785, -0.12202431261539459, -0.10938825458288193, -0.09675219655036926, -0.084116131067276, -0.07148007303476334, -0.05884401500225067, -0.04620795696973801, -0.03357189521193504, -0.02093583345413208, -0.008299775421619415, 0.0043362826108932495, 0.01697234809398651, 0.029608406126499176, 0.04224446415901184, 0.054880522191524506, 0.06751658022403717, 0.08015264570713043, 0.0927887037396431, 0.10542476177215576, 0.11806082725524902, 0.13069689273834229, 0.14333294332027435, 0.15596900880336761, 0.16860505938529968, 0.18124112486839294, 0.1938771903514862, 0.20651324093341827, 0.21914930641651154, 0.2317853569984436, 0.24442142248153687, 0.2570574879646301, 0.2696935534477234, 0.28232961893081665, 0.2949656546115875, 0.3076017200946808, 0.32023778557777405, 0.3328738510608673, 0.3455098867416382, 0.35814595222473145, 0.3707820177078247, 0.38341808319091797, 0.39605411887168884, 0.4086901843547821, 0.42132624983787537, 0.43396231532096863, 0.4465983808040619, 0.45923444628715515, 0.4718705117702484, 0.4845065474510193, 0.49714261293411255, 0.5097786784172058, 0.5224147439002991, 0.5350508093833923, 0.5476868748664856, 0.5603229403495789, 0.5729590058326721, 0.5855950713157654, 0.5982311367988586, 0.6108671426773071, 0.6235032081604004, 0.6361392736434937, 0.6487753391265869]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 5.0, 5.0, 11.0, 9.0, 15.0, 30.0, 27.0, 26.0, 25.0, 30.0, 37.0, 44.0, 51.0, 34.0, 60.0, 147.0, 1019672.0, 27863.0, 69.0, 42.0, 48.0, 45.0, 42.0, 44.0, 30.0, 29.0, 20.0, 17.0, 17.0, 4.0, 17.0, 3.0, 7.0, 7.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2880859375, -1.250030517578125, -1.21197509765625, -1.173919677734375, -1.1358642578125, -1.097808837890625, -1.05975341796875, -1.021697998046875, -0.983642578125, -0.945587158203125, -0.90753173828125, -0.869476318359375, -0.8314208984375, -0.793365478515625, -0.75531005859375, -0.717254638671875, -0.67919921875, -0.641143798828125, -0.60308837890625, -0.565032958984375, -0.5269775390625, -0.488922119140625, -0.45086669921875, -0.412811279296875, -0.374755859375, -0.336700439453125, -0.29864501953125, -0.260589599609375, -0.2225341796875, -0.184478759765625, -0.14642333984375, -0.108367919921875, -0.0703125, -0.032257080078125, 0.00579833984375, 0.043853759765625, 0.0819091796875, 0.119964599609375, 0.15802001953125, 0.196075439453125, 0.234130859375, 0.272186279296875, 0.31024169921875, 0.348297119140625, 0.3863525390625, 0.424407958984375, 0.46246337890625, 0.500518798828125, 0.53857421875, 0.576629638671875, 0.61468505859375, 0.652740478515625, 0.6907958984375, 0.728851318359375, 0.76690673828125, 0.804962158203125, 0.843017578125, 0.881072998046875, 0.91912841796875, 0.957183837890625, 0.9952392578125, 1.033294677734375, 1.07135009765625, 1.109405517578125, 1.1474609375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 10.0, 172.0, 594.0, 233.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0078582763671875, -0.00568699836730957, -0.0035157203674316406, -0.001344442367553711, 0.0008268356323242188, 0.0029981136322021484, 0.005169391632080078, 0.007340669631958008, 0.009511947631835938, 0.011683225631713867, 0.013854503631591797, 0.016025781631469727, 0.018197059631347656, 0.020368337631225586, 0.022539615631103516, 0.024710893630981445, 0.026882171630859375, 0.029053449630737305, 0.031224727630615234, 0.033396005630493164, 0.035567283630371094, 0.03773856163024902, 0.03990983963012695, 0.04208111763000488, 0.04425239562988281, 0.04642367362976074, 0.04859495162963867, 0.0507662296295166, 0.05293750762939453, 0.05510878562927246, 0.05728006362915039, 0.05945134162902832, 0.06162261962890625, 0.06379389762878418, 0.06596517562866211, 0.06813645362854004, 0.07030773162841797, 0.0724790096282959, 0.07465028762817383, 0.07682156562805176, 0.07899284362792969, 0.08116412162780762, 0.08333539962768555, 0.08550667762756348, 0.0876779556274414, 0.08984923362731934, 0.09202051162719727, 0.0941917896270752, 0.09636306762695312, 0.09853434562683105, 0.10070562362670898, 0.10287690162658691, 0.10504817962646484, 0.10721945762634277, 0.1093907356262207, 0.11156201362609863, 0.11373329162597656, 0.11590456962585449, 0.11807584762573242, 0.12024712562561035, 0.12241840362548828, 0.12458968162536621, 0.12676095962524414, 0.12893223762512207, 0.131103515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 8.0, 3.0, 10.0, 11.0, 14.0, 28.0, 37.0, 50.0, 91.0, 180.0, 293.0, 793.0, 2545.0, 10277.0, 76243.0, 820572.0, 118656.0, 13827.0, 3085.0, 997.0, 382.0, 182.0, 95.0, 71.0, 32.0, 21.0, 18.0, 11.0, 5.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.457763671875, -0.44525146484375, -0.4327392578125, -0.42022705078125, -0.40771484375, -0.39520263671875, -0.3826904296875, -0.37017822265625, -0.357666015625, -0.34515380859375, -0.3326416015625, -0.32012939453125, -0.3076171875, -0.29510498046875, -0.2825927734375, -0.27008056640625, -0.257568359375, -0.24505615234375, -0.2325439453125, -0.22003173828125, -0.20751953125, -0.19500732421875, -0.1824951171875, -0.16998291015625, -0.157470703125, -0.14495849609375, -0.1324462890625, -0.11993408203125, -0.107421875, -0.09490966796875, -0.0823974609375, -0.06988525390625, -0.057373046875, -0.04486083984375, -0.0323486328125, -0.01983642578125, -0.00732421875, 0.00518798828125, 0.0177001953125, 0.03021240234375, 0.042724609375, 0.05523681640625, 0.0677490234375, 0.08026123046875, 0.0927734375, 0.10528564453125, 0.1177978515625, 0.13031005859375, 0.142822265625, 0.15533447265625, 0.1678466796875, 0.18035888671875, 0.19287109375, 0.20538330078125, 0.2178955078125, 0.23040771484375, 0.242919921875, 0.25543212890625, 0.2679443359375, 0.28045654296875, 0.29296875, 0.30548095703125, 0.3179931640625, 0.33050537109375, 0.343017578125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 1.0, 8.0, 3.0, 3.0, 9.0, 6.0, 15.0, 30.0, 20.0, 32.0, 32.0, 21.0, 41.0, 55.0, 60.0, 57.0, 46.0, 62.0, 68.0, 62.0, 71.0, 55.0, 41.0, 29.0, 33.0, 29.0, 22.0, 18.0, 17.0, 10.0, 6.0, 7.0, 7.0, 4.0, 8.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11004638671875, -0.1068735122680664, -0.10370063781738281, -0.10052776336669922, -0.09735488891601562, -0.09418201446533203, -0.09100914001464844, -0.08783626556396484, -0.08466339111328125, -0.08149051666259766, -0.07831764221191406, -0.07514476776123047, -0.07197189331054688, -0.06879901885986328, -0.06562614440917969, -0.062453269958496094, -0.0592803955078125, -0.056107521057128906, -0.05293464660644531, -0.04976177215576172, -0.046588897705078125, -0.04341602325439453, -0.04024314880371094, -0.037070274353027344, -0.03389739990234375, -0.030724525451660156, -0.027551651000976562, -0.02437877655029297, -0.021205902099609375, -0.01803302764892578, -0.014860153198242188, -0.011687278747558594, -0.008514404296875, -0.005341529846191406, -0.0021686553955078125, 0.0010042190551757812, 0.004177093505859375, 0.007349967956542969, 0.010522842407226562, 0.013695716857910156, 0.01686859130859375, 0.020041465759277344, 0.023214340209960938, 0.02638721466064453, 0.029560089111328125, 0.03273296356201172, 0.03590583801269531, 0.039078712463378906, 0.0422515869140625, 0.045424461364746094, 0.04859733581542969, 0.05177021026611328, 0.054943084716796875, 0.05811595916748047, 0.06128883361816406, 0.06446170806884766, 0.06763458251953125, 0.07080745697021484, 0.07398033142089844, 0.07715320587158203, 0.08032608032226562, 0.08349895477294922, 0.08667182922363281, 0.0898447036743164, 0.093017578125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 9.0, 10.0, 19.0, 16.0, 41.0, 56.0, 89.0, 142.0, 297.0, 634.0, 1969.0, 7143.0, 39302.0, 801209.0, 175881.0, 15869.0, 3748.0, 1133.0, 469.0, 198.0, 112.0, 61.0, 37.0, 29.0, 19.0, 12.0, 16.0, 9.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2427978515625, -0.2340526580810547, -0.22530746459960938, -0.21656227111816406, -0.20781707763671875, -0.19907188415527344, -0.19032669067382812, -0.1815814971923828, -0.1728363037109375, -0.1640911102294922, -0.15534591674804688, -0.14660072326660156, -0.13785552978515625, -0.12911033630371094, -0.12036514282226562, -0.11161994934082031, -0.102874755859375, -0.09412956237792969, -0.08538436889648438, -0.07663917541503906, -0.06789398193359375, -0.05914878845214844, -0.050403594970703125, -0.04165840148925781, -0.0329132080078125, -0.024168014526367188, -0.015422821044921875, -0.0066776275634765625, 0.00206756591796875, 0.010812759399414062, 0.019557952880859375, 0.028303146362304688, 0.03704833984375, 0.04579353332519531, 0.054538726806640625, 0.06328392028808594, 0.07202911376953125, 0.08077430725097656, 0.08951950073242188, 0.09826469421386719, 0.1070098876953125, 0.11575508117675781, 0.12450027465820312, 0.13324546813964844, 0.14199066162109375, 0.15073585510253906, 0.15948104858398438, 0.1682262420654297, 0.176971435546875, 0.1857166290283203, 0.19446182250976562, 0.20320701599121094, 0.21195220947265625, 0.22069740295410156, 0.22944259643554688, 0.2381877899169922, 0.2469329833984375, 0.2556781768798828, 0.2644233703613281, 0.27316856384277344, 0.28191375732421875, 0.29065895080566406, 0.2994041442871094, 0.3081493377685547, 0.31689453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 5.0, 9.0, 6.0, 17.0, 7.0, 17.0, 17.0, 34.0, 35.0, 43.0, 63.0, 97.0, 130.0, 130.0, 94.0, 62.0, 40.0, 39.0, 21.0, 24.0, 23.0, 21.0, 12.0, 7.0, 7.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006952285766601562, -0.0006694570183753967, -0.0006436854600906372, -0.0006179139018058777, -0.0005921423435211182, -0.0005663707852363586, -0.0005405992269515991, -0.0005148276686668396, -0.0004890561103820801, -0.00046328455209732056, -0.00043751299381256104, -0.0004117414355278015, -0.000385969877243042, -0.00036019831895828247, -0.00033442676067352295, -0.00030865520238876343, -0.0002828836441040039, -0.0002571120858192444, -0.00023134052753448486, -0.00020556896924972534, -0.00017979741096496582, -0.0001540258526802063, -0.00012825429439544678, -0.00010248273611068726, -7.671117782592773e-05, -5.093961954116821e-05, -2.516806125640869e-05, 6.034970283508301e-07, 2.637505531311035e-05, 5.214661359786987e-05, 7.79181718826294e-05, 0.00010368973016738892, 0.00012946128845214844, 0.00015523284673690796, 0.00018100440502166748, 0.000206775963306427, 0.00023254752159118652, 0.00025831907987594604, 0.00028409063816070557, 0.0003098621964454651, 0.0003356337547302246, 0.00036140531301498413, 0.00038717687129974365, 0.0004129484295845032, 0.0004387199878692627, 0.0004644915461540222, 0.0004902631044387817, 0.0005160346627235413, 0.0005418062210083008, 0.0005675777792930603, 0.0005933493375778198, 0.0006191208958625793, 0.0006448924541473389, 0.0006706640124320984, 0.0006964355707168579, 0.0007222071290016174, 0.000747978687286377, 0.0007737502455711365, 0.000799521803855896, 0.0008252933621406555, 0.000851064920425415, 0.0008768364787101746, 0.0009026080369949341, 0.0009283795952796936, 0.0009541511535644531]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 13.0, 14.0, 16.0, 37.0, 53.0, 79.0, 127.0, 269.0, 630.0, 1543.0, 5006.0, 28842.0, 851520.0, 144929.0, 11062.0, 2595.0, 953.0, 396.0, 201.0, 114.0, 50.0, 38.0, 19.0, 11.0, 10.0, 6.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294677734375, -0.285400390625, -0.276123046875, -0.266845703125, -0.257568359375, -0.248291015625, -0.239013671875, -0.229736328125, -0.220458984375, -0.211181640625, -0.201904296875, -0.192626953125, -0.183349609375, -0.174072265625, -0.164794921875, -0.155517578125, -0.146240234375, -0.136962890625, -0.127685546875, -0.118408203125, -0.109130859375, -0.099853515625, -0.090576171875, -0.081298828125, -0.072021484375, -0.062744140625, -0.053466796875, -0.044189453125, -0.034912109375, -0.025634765625, -0.016357421875, -0.007080078125, 0.002197265625, 0.011474609375, 0.020751953125, 0.030029296875, 0.039306640625, 0.048583984375, 0.057861328125, 0.067138671875, 0.076416015625, 0.085693359375, 0.094970703125, 0.104248046875, 0.113525390625, 0.122802734375, 0.132080078125, 0.141357421875, 0.150634765625, 0.159912109375, 0.169189453125, 0.178466796875, 0.187744140625, 0.197021484375, 0.206298828125, 0.215576171875, 0.224853515625, 0.234130859375, 0.243408203125, 0.252685546875, 0.261962890625, 0.271240234375, 0.280517578125, 0.289794921875, 0.299072265625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 11.0, 3.0, 16.0, 15.0, 25.0, 40.0, 52.0, 76.0, 84.0, 114.0, 140.0, 122.0, 86.0, 54.0, 37.0, 31.0, 21.0, 20.0, 10.0, 7.0, 6.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.083984375, -0.08167171478271484, -0.07935905456542969, -0.07704639434814453, -0.07473373413085938, -0.07242107391357422, -0.07010841369628906, -0.0677957534790039, -0.06548309326171875, -0.0631704330444336, -0.06085777282714844, -0.05854511260986328, -0.056232452392578125, -0.05391979217529297, -0.05160713195800781, -0.049294471740722656, -0.0469818115234375, -0.044669151306152344, -0.04235649108886719, -0.04004383087158203, -0.037731170654296875, -0.03541851043701172, -0.03310585021972656, -0.030793190002441406, -0.02848052978515625, -0.026167869567871094, -0.023855209350585938, -0.02154254913330078, -0.019229888916015625, -0.01691722869873047, -0.014604568481445312, -0.012291908264160156, -0.009979248046875, -0.007666587829589844, -0.0053539276123046875, -0.0030412673950195312, -0.000728607177734375, 0.0015840530395507812, 0.0038967132568359375, 0.006209373474121094, 0.00852203369140625, 0.010834693908691406, 0.013147354125976562, 0.015460014343261719, 0.017772674560546875, 0.02008533477783203, 0.022397994995117188, 0.024710655212402344, 0.0270233154296875, 0.029335975646972656, 0.03164863586425781, 0.03396129608154297, 0.036273956298828125, 0.03858661651611328, 0.04089927673339844, 0.043211936950683594, 0.04552459716796875, 0.047837257385253906, 0.05014991760253906, 0.05246257781982422, 0.054775238037109375, 0.05708789825439453, 0.05940055847167969, 0.061713218688964844, 0.06402587890625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 42.0, 579.0, 378.0, 10.0], "bins": [-13.244521141052246, -13.030671119689941, -12.81682014465332, -12.602970123291016, -12.389119148254395, -12.17526912689209, -11.961418151855469, -11.747568130493164, -11.533717155456543, -11.319867134094238, -11.106016159057617, -10.892166137695312, -10.678315162658691, -10.464465141296387, -10.250614166259766, -10.036764144897461, -9.82291316986084, -9.609063148498535, -9.395212173461914, -9.18136215209961, -8.967511177062988, -8.753661155700684, -8.539810180664062, -8.325960159301758, -8.112109184265137, -7.898258686065674, -7.684408187866211, -7.470557689666748, -7.256707191467285, -7.042856693267822, -6.829006195068359, -6.6151556968688965, -6.401305198669434, -6.187454700469971, -5.973604202270508, -5.759753704071045, -5.545903205871582, -5.332052707672119, -5.118202209472656, -4.904351711273193, -4.6905012130737305, -4.476650714874268, -4.262800216674805, -4.048949718475342, -3.835099220275879, -3.621248722076416, -3.407398223876953, -3.1935477256774902, -2.9796977043151855, -2.7658472061157227, -2.5519967079162598, -2.338146209716797, -2.124295711517334, -1.9104453325271606, -1.6965948343276978, -1.4827443361282349, -1.2688937187194824, -1.0550432205200195, -0.8411927223205566, -0.6273422837257385, -0.41349178552627563, -0.19964134693145752, 0.014209151268005371, 0.22805964946746826, 0.44191014766693115]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 11.0, 17.0, 18.0, 23.0, 29.0, 31.0, 43.0, 46.0, 60.0, 61.0, 56.0, 68.0, 65.0, 66.0, 68.0, 62.0, 52.0, 42.0, 30.0, 47.0, 18.0, 22.0, 14.0, 11.0, 11.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5875391960144043, -0.5657150745391846, -0.5438908934593201, -0.5220667719841003, -0.5002425909042358, -0.4784184694290161, -0.456594318151474, -0.4347701668739319, -0.41294601559638977, -0.39112186431884766, -0.36929771304130554, -0.3474735617637634, -0.3256494402885437, -0.3038252592086792, -0.2820011377334595, -0.26017698645591736, -0.23835283517837524, -0.21652868390083313, -0.19470453262329102, -0.1728803962469101, -0.15105624496936798, -0.12923209369182587, -0.10740795731544495, -0.08558380603790283, -0.06375965476036072, -0.0419355072081089, -0.020111359655857086, 0.0017127841711044312, 0.023536935448646545, 0.04536108672618866, 0.06718522310256958, 0.0890093743801117, 0.11083346605300903, 0.13265761733055115, 0.15448176860809326, 0.17630590498447418, 0.1981300562620163, 0.2199542075395584, 0.24177834391593933, 0.26360249519348145, 0.28542664647102356, 0.3072507977485657, 0.3290749490261078, 0.3508991003036499, 0.37272322177886963, 0.39454740285873413, 0.41637152433395386, 0.43819567561149597, 0.4600198268890381, 0.4818439781665802, 0.5036681294441223, 0.525492250919342, 0.5473164319992065, 0.5691405534744263, 0.590964674949646, 0.6127888560295105, 0.634613037109375, 0.6564371585845947, 0.6782613396644592, 0.700085461139679, 0.7219096422195435, 0.7437337636947632, 0.7655578851699829, 0.7873820662498474, 0.8092061877250671]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [11.0, 35.0, 233.0, 8672.0, 4184130.0, 722.0, 128.0, 78.0, 44.0, 53.0, 48.0, 32.0, 33.0, 28.0, 19.0, 17.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3974609375, -0.3046417236328125, -0.211822509765625, -0.1190032958984375, -0.02618408203125, 0.0666351318359375, 0.159454345703125, 0.2522735595703125, 0.3450927734375, 0.4379119873046875, 0.530731201171875, 0.6235504150390625, 0.71636962890625, 0.8091888427734375, 0.902008056640625, 0.9948272705078125, 1.087646484375, 1.1804656982421875, 1.273284912109375, 1.3661041259765625, 1.45892333984375, 1.5517425537109375, 1.644561767578125, 1.7373809814453125, 1.8302001953125, 1.9230194091796875, 2.015838623046875, 2.1086578369140625, 2.20147705078125, 2.2942962646484375, 2.387115478515625, 2.4799346923828125, 2.57275390625, 2.6655731201171875, 2.758392333984375, 2.8512115478515625, 2.94403076171875, 3.0368499755859375, 3.129669189453125, 3.2224884033203125, 3.3153076171875, 3.4081268310546875, 3.500946044921875, 3.5937652587890625, 3.68658447265625, 3.7794036865234375, 3.872222900390625, 3.9650421142578125, 4.057861328125, 4.1506805419921875, 4.243499755859375, 4.3363189697265625, 4.42913818359375, 4.5219573974609375, 4.614776611328125, 4.7075958251953125, 4.8004150390625, 4.8932342529296875, 4.986053466796875, 5.0788726806640625, 5.17169189453125, 5.2645111083984375, 5.357330322265625, 5.4501495361328125, 5.54296875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 7.0, 45.0, 145.0, 309.0, 325.0, 146.0, 30.0, 10.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01165008544921875, -0.009337544441223145, -0.007025003433227539, -0.004712462425231934, -0.002399921417236328, -8.738040924072266e-05, 0.002225160598754883, 0.004537701606750488, 0.006850242614746094, 0.0091627836227417, 0.011475324630737305, 0.01378786563873291, 0.016100406646728516, 0.01841294765472412, 0.020725488662719727, 0.023038029670715332, 0.025350570678710938, 0.027663111686706543, 0.02997565269470215, 0.032288193702697754, 0.03460073471069336, 0.036913275718688965, 0.03922581672668457, 0.041538357734680176, 0.04385089874267578, 0.04616343975067139, 0.04847598075866699, 0.0507885217666626, 0.0531010627746582, 0.05541360378265381, 0.057726144790649414, 0.06003868579864502, 0.062351226806640625, 0.06466376781463623, 0.06697630882263184, 0.06928884983062744, 0.07160139083862305, 0.07391393184661865, 0.07622647285461426, 0.07853901386260986, 0.08085155487060547, 0.08316409587860107, 0.08547663688659668, 0.08778917789459229, 0.09010171890258789, 0.0924142599105835, 0.0947268009185791, 0.09703934192657471, 0.09935188293457031, 0.10166442394256592, 0.10397696495056152, 0.10628950595855713, 0.10860204696655273, 0.11091458797454834, 0.11322712898254395, 0.11553966999053955, 0.11785221099853516, 0.12016475200653076, 0.12247729301452637, 0.12478983402252197, 0.12710237503051758, 0.12941491603851318, 0.1317274570465088, 0.1340399980545044, 0.1363525390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 12.0, 29.0, 69.0, 190.0, 471.0, 7470.0, 4178625.0, 6511.0, 536.0, 210.0, 92.0, 48.0, 15.0, 9.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2421875, -1.14276123046875, -1.0433349609375, -0.94390869140625, -0.844482421875, -0.74505615234375, -0.6456298828125, -0.54620361328125, -0.44677734375, -0.34735107421875, -0.2479248046875, -0.14849853515625, -0.049072265625, 0.05035400390625, 0.1497802734375, 0.24920654296875, 0.3486328125, 0.44805908203125, 0.5474853515625, 0.64691162109375, 0.746337890625, 0.84576416015625, 0.9451904296875, 1.04461669921875, 1.14404296875, 1.24346923828125, 1.3428955078125, 1.44232177734375, 1.541748046875, 1.64117431640625, 1.7406005859375, 1.84002685546875, 1.939453125, 2.03887939453125, 2.1383056640625, 2.23773193359375, 2.337158203125, 2.43658447265625, 2.5360107421875, 2.63543701171875, 2.73486328125, 2.83428955078125, 2.9337158203125, 3.03314208984375, 3.132568359375, 3.23199462890625, 3.3314208984375, 3.43084716796875, 3.5302734375, 3.62969970703125, 3.7291259765625, 3.82855224609375, 3.927978515625, 4.02740478515625, 4.1268310546875, 4.22625732421875, 4.32568359375, 4.42510986328125, 4.5245361328125, 4.62396240234375, 4.723388671875, 4.82281494140625, 4.9222412109375, 5.02166748046875, 5.12109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 10.0, 5.0, 33.0, 89.0, 278.0, 3398.0, 160.0, 68.0, 23.0, 10.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12030029296875, -0.1133584976196289, -0.10641670227050781, -0.09947490692138672, -0.09253311157226562, -0.08559131622314453, -0.07864952087402344, -0.07170772552490234, -0.06476593017578125, -0.057824134826660156, -0.05088233947753906, -0.04394054412841797, -0.036998748779296875, -0.03005695343017578, -0.023115158081054688, -0.016173362731933594, -0.0092315673828125, -0.0022897720336914062, 0.0046520233154296875, 0.011593818664550781, 0.018535614013671875, 0.02547740936279297, 0.03241920471191406, 0.039361000061035156, 0.04630279541015625, 0.053244590759277344, 0.06018638610839844, 0.06712818145751953, 0.07406997680664062, 0.08101177215576172, 0.08795356750488281, 0.0948953628540039, 0.101837158203125, 0.1087789535522461, 0.11572074890136719, 0.12266254425048828, 0.12960433959960938, 0.13654613494873047, 0.14348793029785156, 0.15042972564697266, 0.15737152099609375, 0.16431331634521484, 0.17125511169433594, 0.17819690704345703, 0.18513870239257812, 0.19208049774169922, 0.1990222930908203, 0.2059640884399414, 0.2129058837890625, 0.2198476791381836, 0.2267894744873047, 0.23373126983642578, 0.24067306518554688, 0.24761486053466797, 0.25455665588378906, 0.26149845123291016, 0.26844024658203125, 0.27538204193115234, 0.28232383728027344, 0.28926563262939453, 0.2962074279785156, 0.3031492233276367, 0.3100910186767578, 0.3170328140258789, 0.323974609375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 17.0, 103.0, 678.0, 185.0, 19.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7803741693496704, -0.6772595047950745, -0.5741447806358337, -0.4710301160812378, -0.36791542172431946, -0.2648007273674011, -0.16168606281280518, -0.05857133865356445, 0.044543325901031494, 0.14765802025794983, 0.25077271461486816, 0.3538873791694641, 0.45700207352638245, 0.5601167678833008, 0.6632314324378967, 0.7663461565971375, 0.8694608211517334, 0.9725754857063293, 1.0756901502609253, 1.178804874420166, 1.2819195985794067, 1.3850343227386475, 1.4881489276885986, 1.5912636518478394, 1.69437837600708, 1.7974931001663208, 1.900607705116272, 2.0037224292755127, 2.106837034225464, 2.209951877593994, 2.3130664825439453, 2.4161810874938965, 2.5192959308624268, 2.622410535812378, 2.725525379180908, 2.8286399841308594, 2.9317545890808105, 3.034869432449341, 3.137984037399292, 3.2410988807678223, 3.3442134857177734, 3.4473280906677246, 3.550442934036255, 3.653557538986206, 3.7566721439361572, 3.8597869873046875, 3.9629015922546387, 4.06601619720459, 4.169130802154541, 4.272245407104492, 4.375360012054443, 4.4784746170043945, 4.581589698791504, 4.684704303741455, 4.787818908691406, 4.890933513641357, 4.994048595428467, 5.097163200378418, 5.200277805328369, 5.30339241027832, 5.40650749206543, 5.509622097015381, 5.612736701965332, 5.715851306915283, 5.818965911865234]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 12.0, 16.0, 25.0, 50.0, 77.0, 93.0, 131.0, 136.0, 135.0, 120.0, 78.0, 55.0, 30.0, 20.0, 9.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0807788372039795, -1.0531522035598755, -1.025525450706482, -0.9978988170623779, -0.9702721834182739, -0.9426454901695251, -0.9150188565254211, -0.8873921632766724, -0.8597655296325684, -0.8321388363838196, -0.8045122027397156, -0.7768855094909668, -0.7492588758468628, -0.721632182598114, -0.69400554895401, -0.6663788557052612, -0.6387522220611572, -0.6111255288124084, -0.5834988951683044, -0.5558722019195557, -0.5282455682754517, -0.5006188750267029, -0.4729922413825989, -0.4453655481338501, -0.4177388548851013, -0.3901121914386749, -0.36248552799224854, -0.33485886454582214, -0.30723220109939575, -0.279605507850647, -0.25197887420654297, -0.22435219585895538, -0.19672554731369019, -0.1690988838672638, -0.1414722204208374, -0.11384554952383041, -0.08621888607740402, -0.058592215180397034, -0.030965551733970642, -0.0033388882875442505, 0.02428777515888214, 0.05191443860530853, 0.07954110205173492, 0.10716777294874191, 0.1347944438457489, 0.1624211072921753, 0.19004777073860168, 0.21767443418502808, 0.24530109763145447, 0.27292776107788086, 0.30055442452430725, 0.32818108797073364, 0.35580775141716003, 0.3834344148635864, 0.4110611081123352, 0.4386877417564392, 0.466314435005188, 0.4939410984516144, 0.5215677618980408, 0.5491944551467896, 0.5768210887908936, 0.6044477820396423, 0.6320744156837463, 0.6597011089324951, 0.6873277425765991]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 3.0, 6.0, 6.0, 5.0, 9.0, 5.0, 3.0, 12.0, 14.0, 15.0, 20.0, 27.0, 21.0, 24.0, 33.0, 33.0, 51.0, 111.0, 288.0, 1431.0, 23842.0, 952294.0, 66897.0, 2563.0, 420.0, 114.0, 67.0, 35.0, 28.0, 30.0, 32.0, 27.0, 12.0, 22.0, 13.0, 11.0, 8.0, 7.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.2392578125, -1.2071685791015625, -1.175079345703125, -1.1429901123046875, -1.11090087890625, -1.0788116455078125, -1.046722412109375, -1.0146331787109375, -0.9825439453125, -0.9504547119140625, -0.918365478515625, -0.8862762451171875, -0.85418701171875, -0.8220977783203125, -0.790008544921875, -0.7579193115234375, -0.725830078125, -0.6937408447265625, -0.661651611328125, -0.6295623779296875, -0.59747314453125, -0.5653839111328125, -0.533294677734375, -0.5012054443359375, -0.4691162109375, -0.4370269775390625, -0.404937744140625, -0.3728485107421875, -0.34075927734375, -0.3086700439453125, -0.276580810546875, -0.2444915771484375, -0.21240234375, -0.1803131103515625, -0.148223876953125, -0.1161346435546875, -0.08404541015625, -0.0519561767578125, -0.019866943359375, 0.0122222900390625, 0.0443115234375, 0.0764007568359375, 0.108489990234375, 0.1405792236328125, 0.17266845703125, 0.2047576904296875, 0.236846923828125, 0.2689361572265625, 0.301025390625, 0.3331146240234375, 0.365203857421875, 0.3972930908203125, 0.42938232421875, 0.4614715576171875, 0.493560791015625, 0.5256500244140625, 0.5577392578125, 0.5898284912109375, 0.621917724609375, 0.6540069580078125, 0.68609619140625, 0.7181854248046875, 0.750274658203125, 0.7823638916015625, 0.814453125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 9.0, 25.0, 69.0, 150.0, 231.0, 246.0, 179.0, 59.0, 29.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032684326171875, -0.029972553253173828, -0.027260780334472656, -0.024549007415771484, -0.021837234497070312, -0.01912546157836914, -0.01641368865966797, -0.013701915740966797, -0.010990142822265625, -0.008278369903564453, -0.005566596984863281, -0.0028548240661621094, -0.0001430511474609375, 0.0025687217712402344, 0.005280494689941406, 0.007992267608642578, 0.01070404052734375, 0.013415813446044922, 0.016127586364746094, 0.018839359283447266, 0.021551132202148438, 0.02426290512084961, 0.02697467803955078, 0.029686450958251953, 0.032398223876953125, 0.0351099967956543, 0.03782176971435547, 0.04053354263305664, 0.04324531555175781, 0.045957088470458984, 0.048668861389160156, 0.05138063430786133, 0.0540924072265625, 0.05680418014526367, 0.059515953063964844, 0.062227725982666016, 0.06493949890136719, 0.06765127182006836, 0.07036304473876953, 0.0730748176574707, 0.07578659057617188, 0.07849836349487305, 0.08121013641357422, 0.08392190933227539, 0.08663368225097656, 0.08934545516967773, 0.0920572280883789, 0.09476900100708008, 0.09748077392578125, 0.10019254684448242, 0.1029043197631836, 0.10561609268188477, 0.10832786560058594, 0.11103963851928711, 0.11375141143798828, 0.11646318435668945, 0.11917495727539062, 0.1218867301940918, 0.12459850311279297, 0.12731027603149414, 0.1300220489501953, 0.13273382186889648, 0.13544559478759766, 0.13815736770629883, 0.140869140625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 3.0, 4.0, 10.0, 17.0, 22.0, 26.0, 37.0, 45.0, 106.0, 210.0, 522.0, 1485.0, 6605.0, 58334.0, 788235.0, 176035.0, 13063.0, 2416.0, 711.0, 297.0, 128.0, 75.0, 44.0, 35.0, 19.0, 16.0, 23.0, 7.0, 7.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3603515625, -0.34632110595703125, -0.3322906494140625, -0.31826019287109375, -0.304229736328125, -0.29019927978515625, -0.2761688232421875, -0.26213836669921875, -0.24810791015625, -0.23407745361328125, -0.2200469970703125, -0.20601654052734375, -0.191986083984375, -0.17795562744140625, -0.1639251708984375, -0.14989471435546875, -0.1358642578125, -0.12183380126953125, -0.1078033447265625, -0.09377288818359375, -0.079742431640625, -0.06571197509765625, -0.0516815185546875, -0.03765106201171875, -0.02362060546875, -0.00959014892578125, 0.0044403076171875, 0.01847076416015625, 0.032501220703125, 0.04653167724609375, 0.0605621337890625, 0.07459259033203125, 0.088623046875, 0.10265350341796875, 0.1166839599609375, 0.13071441650390625, 0.144744873046875, 0.15877532958984375, 0.1728057861328125, 0.18683624267578125, 0.20086669921875, 0.21489715576171875, 0.2289276123046875, 0.24295806884765625, 0.256988525390625, 0.27101898193359375, 0.2850494384765625, 0.29907989501953125, 0.3131103515625, 0.32714080810546875, 0.3411712646484375, 0.35520172119140625, 0.369232177734375, 0.38326263427734375, 0.3972930908203125, 0.41132354736328125, 0.42535400390625, 0.43938446044921875, 0.4534149169921875, 0.46744537353515625, 0.481475830078125, 0.49550628662109375, 0.5095367431640625, 0.5235671997070312, 0.53759765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 6.0, 6.0, 5.0, 9.0, 19.0, 24.0, 23.0, 24.0, 32.0, 32.0, 44.0, 58.0, 49.0, 73.0, 75.0, 68.0, 56.0, 56.0, 67.0, 49.0, 39.0, 37.0, 26.0, 25.0, 11.0, 17.0, 22.0, 8.0, 12.0, 10.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09844970703125, -0.09438610076904297, -0.09032249450683594, -0.0862588882446289, -0.08219528198242188, -0.07813167572021484, -0.07406806945800781, -0.07000446319580078, -0.06594085693359375, -0.06187725067138672, -0.05781364440917969, -0.053750038146972656, -0.049686431884765625, -0.045622825622558594, -0.04155921936035156, -0.03749561309814453, -0.0334320068359375, -0.02936840057373047, -0.025304794311523438, -0.021241188049316406, -0.017177581787109375, -0.013113975524902344, -0.009050369262695312, -0.004986763000488281, -0.00092315673828125, 0.0031404495239257812, 0.0072040557861328125, 0.011267662048339844, 0.015331268310546875, 0.019394874572753906, 0.023458480834960938, 0.02752208709716797, 0.031585693359375, 0.03564929962158203, 0.03971290588378906, 0.043776512145996094, 0.047840118408203125, 0.051903724670410156, 0.05596733093261719, 0.06003093719482422, 0.06409454345703125, 0.06815814971923828, 0.07222175598144531, 0.07628536224365234, 0.08034896850585938, 0.0844125747680664, 0.08847618103027344, 0.09253978729248047, 0.0966033935546875, 0.10066699981689453, 0.10473060607910156, 0.1087942123413086, 0.11285781860351562, 0.11692142486572266, 0.12098503112792969, 0.12504863739013672, 0.12911224365234375, 0.13317584991455078, 0.1372394561767578, 0.14130306243896484, 0.14536666870117188, 0.1494302749633789, 0.15349388122558594, 0.15755748748779297, 0.16162109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 5.0, 12.0, 8.0, 20.0, 26.0, 34.0, 65.0, 95.0, 127.0, 232.0, 453.0, 775.0, 1695.0, 4595.0, 16026.0, 96081.0, 779544.0, 121739.0, 17976.0, 5111.0, 1893.0, 854.0, 433.0, 260.0, 157.0, 117.0, 49.0, 55.0, 29.0, 22.0, 12.0, 10.0, 9.0, 7.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2103271484375, -0.20344161987304688, -0.19655609130859375, -0.18967056274414062, -0.1827850341796875, -0.17589950561523438, -0.16901397705078125, -0.16212844848632812, -0.155242919921875, -0.14835739135742188, -0.14147186279296875, -0.13458633422851562, -0.1277008056640625, -0.12081527709960938, -0.11392974853515625, -0.10704421997070312, -0.10015869140625, -0.09327316284179688, -0.08638763427734375, -0.07950210571289062, -0.0726165771484375, -0.06573104858398438, -0.05884552001953125, -0.051959991455078125, -0.045074462890625, -0.038188934326171875, -0.03130340576171875, -0.024417877197265625, -0.0175323486328125, -0.010646820068359375, -0.00376129150390625, 0.003124237060546875, 0.010009765625, 0.016895294189453125, 0.02378082275390625, 0.030666351318359375, 0.0375518798828125, 0.044437408447265625, 0.05132293701171875, 0.058208465576171875, 0.065093994140625, 0.07197952270507812, 0.07886505126953125, 0.08575057983398438, 0.0926361083984375, 0.09952163696289062, 0.10640716552734375, 0.11329269409179688, 0.12017822265625, 0.12706375122070312, 0.13394927978515625, 0.14083480834960938, 0.1477203369140625, 0.15460586547851562, 0.16149139404296875, 0.16837692260742188, 0.175262451171875, 0.18214797973632812, 0.18903350830078125, 0.19591903686523438, 0.2028045654296875, 0.20969009399414062, 0.21657562255859375, 0.22346115112304688, 0.2303466796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 5.0, 4.0, 4.0, 2.0, 4.0, 5.0, 7.0, 5.0, 7.0, 8.0, 6.0, 10.0, 12.0, 12.0, 12.0, 18.0, 19.0, 20.0, 35.0, 30.0, 45.0, 57.0, 63.0, 81.0, 77.0, 77.0, 55.0, 46.0, 45.0, 33.0, 31.0, 25.0, 23.0, 23.0, 16.0, 10.0, 12.0, 11.0, 6.0, 10.0, 7.0, 5.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0006203651428222656, -0.0006022229790687561, -0.0005840808153152466, -0.0005659386515617371, -0.0005477964878082275, -0.000529654324054718, -0.0005115121603012085, -0.000493369996547699, -0.00047522783279418945, -0.00045708566904067993, -0.0004389435052871704, -0.0004208013415336609, -0.00040265917778015137, -0.00038451701402664185, -0.0003663748502731323, -0.0003482326865196228, -0.0003300905227661133, -0.00031194835901260376, -0.00029380619525909424, -0.0002756640315055847, -0.0002575218677520752, -0.00023937970399856567, -0.00022123754024505615, -0.00020309537649154663, -0.0001849532127380371, -0.0001668110489845276, -0.00014866888523101807, -0.00013052672147750854, -0.00011238455772399902, -9.42423939704895e-05, -7.610023021697998e-05, -5.795806646347046e-05, -3.981590270996094e-05, -2.1673738956451416e-05, -3.5315752029418945e-06, 1.4610588550567627e-05, 3.275275230407715e-05, 5.089491605758667e-05, 6.903707981109619e-05, 8.717924356460571e-05, 0.00010532140731811523, 0.00012346357107162476, 0.00014160573482513428, 0.0001597478985786438, 0.00017789006233215332, 0.00019603222608566284, 0.00021417438983917236, 0.00023231655359268188, 0.0002504587173461914, 0.00026860088109970093, 0.00028674304485321045, 0.00030488520860671997, 0.0003230273723602295, 0.000341169536113739, 0.00035931169986724854, 0.00037745386362075806, 0.0003955960273742676, 0.0004137381911277771, 0.0004318803548812866, 0.00045002251863479614, 0.00046816468238830566, 0.0004863068461418152, 0.0005044490098953247, 0.0005225911736488342, 0.0005407333374023438]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 6.0, 15.0, 25.0, 70.0, 156.0, 500.0, 2314.0, 69135.0, 965409.0, 9436.0, 980.0, 283.0, 110.0, 57.0, 24.0, 15.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.351318359375, -0.3320808410644531, -0.31284332275390625, -0.2936058044433594, -0.2743682861328125, -0.2551307678222656, -0.23589324951171875, -0.21665573120117188, -0.197418212890625, -0.17818069458007812, -0.15894317626953125, -0.13970565795898438, -0.1204681396484375, -0.10123062133789062, -0.08199310302734375, -0.06275558471679688, -0.04351806640625, -0.024280548095703125, -0.00504302978515625, 0.014194488525390625, 0.0334320068359375, 0.052669525146484375, 0.07190704345703125, 0.09114456176757812, 0.110382080078125, 0.12961959838867188, 0.14885711669921875, 0.16809463500976562, 0.1873321533203125, 0.20656967163085938, 0.22580718994140625, 0.24504470825195312, 0.2642822265625, 0.2835197448730469, 0.30275726318359375, 0.3219947814941406, 0.3412322998046875, 0.3604698181152344, 0.37970733642578125, 0.3989448547363281, 0.418182373046875, 0.4374198913574219, 0.45665740966796875, 0.4758949279785156, 0.4951324462890625, 0.5143699645996094, 0.5336074829101562, 0.5528450012207031, 0.57208251953125, 0.5913200378417969, 0.6105575561523438, 0.6297950744628906, 0.6490325927734375, 0.6682701110839844, 0.6875076293945312, 0.7067451477050781, 0.725982666015625, 0.7452201843261719, 0.7644577026367188, 0.7836952209472656, 0.8029327392578125, 0.8221702575683594, 0.8414077758789062, 0.8606452941894531, 0.8798828125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 12.0, 18.0, 19.0, 42.0, 87.0, 198.0, 235.0, 180.0, 105.0, 44.0, 18.0, 14.0, 13.0, 4.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1298828125, -0.12382888793945312, -0.11777496337890625, -0.11172103881835938, -0.1056671142578125, -0.09961318969726562, -0.09355926513671875, -0.08750534057617188, -0.081451416015625, -0.07539749145507812, -0.06934356689453125, -0.06328964233398438, -0.0572357177734375, -0.051181793212890625, -0.04512786865234375, -0.039073944091796875, -0.03302001953125, -0.026966094970703125, -0.02091217041015625, -0.014858245849609375, -0.0088043212890625, -0.002750396728515625, 0.00330352783203125, 0.009357452392578125, 0.015411376953125, 0.021465301513671875, 0.02751922607421875, 0.033573150634765625, 0.0396270751953125, 0.045680999755859375, 0.05173492431640625, 0.057788848876953125, 0.0638427734375, 0.06989669799804688, 0.07595062255859375, 0.08200454711914062, 0.0880584716796875, 0.09411239624023438, 0.10016632080078125, 0.10622024536132812, 0.112274169921875, 0.11832809448242188, 0.12438201904296875, 0.13043594360351562, 0.1364898681640625, 0.14254379272460938, 0.14859771728515625, 0.15465164184570312, 0.16070556640625, 0.16675949096679688, 0.17281341552734375, 0.17886734008789062, 0.1849212646484375, 0.19097518920898438, 0.19702911376953125, 0.20308303833007812, 0.209136962890625, 0.21519088745117188, 0.22124481201171875, 0.22729873657226562, 0.2333526611328125, 0.23940658569335938, 0.24546051025390625, 0.2515144348144531, 0.257568359375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 42.0, 880.0, 85.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.141572952270508, -18.791067123413086, -18.440561294555664, -18.090057373046875, -17.739551544189453, -17.38904571533203, -17.03853988647461, -16.688034057617188, -16.3375301361084, -15.987024307250977, -15.636519432067871, -15.28601360321045, -14.935508728027344, -14.585002899169922, -14.2344970703125, -13.883992195129395, -13.533486366271973, -13.18298053741455, -12.832475662231445, -12.481969833374023, -12.131464958190918, -11.780959129333496, -11.43045425415039, -11.079948425292969, -10.729442596435547, -10.378936767578125, -10.02843189239502, -9.677926063537598, -9.327421188354492, -8.97691535949707, -8.626409530639648, -8.275904655456543, -7.9253997802734375, -7.574894428253174, -7.22438907623291, -6.873883247375488, -6.523378372192383, -6.172872543334961, -5.822367191314697, -5.471861839294434, -5.121356010437012, -4.770850658416748, -4.420345306396484, -4.0698394775390625, -3.719334363937378, -3.3688290119171143, -3.0183234214782715, -2.667818069458008, -2.3173129558563232, -1.9668076038360596, -1.6163021326065063, -1.2657966613769531, -0.9152913093566895, -0.5647859573364258, -0.214280366897583, 0.13622498512268066, 0.48673033714294434, 0.8372357487678528, 1.1877411603927612, 1.5382466316223145, 1.8887519836425781, 2.239257335662842, 2.5897629261016846, 2.9402682781219482, 3.290773630142212]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 13.0, 23.0, 31.0, 30.0, 48.0, 53.0, 58.0, 54.0, 67.0, 51.0, 87.0, 76.0, 80.0, 50.0, 60.0, 61.0, 32.0, 38.0, 25.0, 28.0, 9.0, 12.0, 7.0, 3.0, 2.0, 4.0, 3.0], "bins": [-1.6099014282226562, -1.5777150392532349, -1.545528769493103, -1.5133423805236816, -1.4811561107635498, -1.4489697217941284, -1.416783332824707, -1.3845970630645752, -1.3524106740951538, -1.3202242851257324, -1.2880380153656006, -1.2558516263961792, -1.2236652374267578, -1.191478967666626, -1.1592925786972046, -1.1271063089370728, -1.0949199199676514, -1.06273353099823, -1.0305472612380981, -0.9983608722686768, -0.9661745429039001, -0.9339882135391235, -0.9018018245697021, -0.8696154952049255, -0.8374291658401489, -0.8052428364753723, -0.7730565071105957, -0.7408701181411743, -0.7086837887763977, -0.6764974594116211, -0.6443110704421997, -0.6121247410774231, -0.5799384713172913, -0.5477521419525146, -0.5155657529830933, -0.48337942361831665, -0.45119309425354004, -0.4190067648887634, -0.38682040572166443, -0.35463404655456543, -0.3224477171897888, -0.2902613878250122, -0.2580750286579132, -0.2258886843919754, -0.1937023401260376, -0.1615159958600998, -0.129329651594162, -0.09714330732822418, -0.06495696306228638, -0.03277061879634857, -0.0005842745304107666, 0.03160206973552704, 0.06378841400146484, 0.09597475826740265, 0.12816110253334045, 0.16034744679927826, 0.19253379106521606, 0.22472013533115387, 0.2569064795970917, 0.2890928387641907, 0.3212791681289673, 0.3534654974937439, 0.3856518566608429, 0.4178382158279419, 0.4500245451927185]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 3.0, 10.0, 26.0, 45.0, 77.0, 167.0, 516.0, 2593.0, 23338.0, 3900619.0, 253818.0, 10556.0, 1493.0, 357.0, 172.0, 114.0, 76.0, 48.0, 27.0, 19.0, 27.0, 18.0, 18.0, 11.0, 14.0, 12.0, 9.0, 7.0, 11.0, 6.0, 8.0, 10.0, 9.0, 5.0, 6.0, 3.0, 6.0, 4.0, 2.0, 5.0, 4.0, 1.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.309814453125, -0.2857017517089844, -0.26158905029296875, -0.23747634887695312, -0.2133636474609375, -0.18925094604492188, -0.16513824462890625, -0.14102554321289062, -0.116912841796875, -0.09280014038085938, -0.06868743896484375, -0.044574737548828125, -0.0204620361328125, 0.003650665283203125, 0.02776336669921875, 0.051876068115234375, 0.07598876953125, 0.10010147094726562, 0.12421417236328125, 0.14832687377929688, 0.1724395751953125, 0.19655227661132812, 0.22066497802734375, 0.24477767944335938, 0.268890380859375, 0.2930030822753906, 0.31711578369140625, 0.3412284851074219, 0.3653411865234375, 0.3894538879394531, 0.41356658935546875, 0.4376792907714844, 0.4617919921875, 0.4859046936035156, 0.5100173950195312, 0.5341300964355469, 0.5582427978515625, 0.5823554992675781, 0.6064682006835938, 0.6305809020996094, 0.654693603515625, 0.6788063049316406, 0.7029190063476562, 0.7270317077636719, 0.7511444091796875, 0.7752571105957031, 0.7993698120117188, 0.8234825134277344, 0.84759521484375, 0.8717079162597656, 0.8958206176757812, 0.9199333190917969, 0.9440460205078125, 0.9681587219238281, 0.9922714233398438, 1.0163841247558594, 1.040496826171875, 1.0646095275878906, 1.0887222290039062, 1.1128349304199219, 1.1369476318359375, 1.1610603332519531, 1.1851730346679688, 1.2092857360839844, 1.2333984375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 15.0, 21.0, 64.0, 107.0, 161.0, 224.0, 175.0, 126.0, 71.0, 34.0, 10.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0235595703125, -0.021121978759765625, -0.01868438720703125, -0.016246795654296875, -0.0138092041015625, -0.011371612548828125, -0.00893402099609375, -0.006496429443359375, -0.004058837890625, -0.001621246337890625, 0.00081634521484375, 0.003253936767578125, 0.0056915283203125, 0.008129119873046875, 0.01056671142578125, 0.013004302978515625, 0.01544189453125, 0.017879486083984375, 0.02031707763671875, 0.022754669189453125, 0.0251922607421875, 0.027629852294921875, 0.03006744384765625, 0.032505035400390625, 0.034942626953125, 0.037380218505859375, 0.03981781005859375, 0.042255401611328125, 0.0446929931640625, 0.047130584716796875, 0.04956817626953125, 0.052005767822265625, 0.054443359375, 0.056880950927734375, 0.05931854248046875, 0.061756134033203125, 0.0641937255859375, 0.06663131713867188, 0.06906890869140625, 0.07150650024414062, 0.073944091796875, 0.07638168334960938, 0.07881927490234375, 0.08125686645507812, 0.0836944580078125, 0.08613204956054688, 0.08856964111328125, 0.09100723266601562, 0.09344482421875, 0.09588241577148438, 0.09832000732421875, 0.10075759887695312, 0.1031951904296875, 0.10563278198242188, 0.10807037353515625, 0.11050796508789062, 0.112945556640625, 0.11538314819335938, 0.11782073974609375, 0.12025833129882812, 0.1226959228515625, 0.12513351440429688, 0.12757110595703125, 0.13000869750976562, 0.1324462890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 12.0, 19.0, 38.0, 43.0, 80.0, 148.0, 337.0, 776.0, 3744.0, 304862.0, 3876629.0, 5456.0, 1106.0, 492.0, 235.0, 132.0, 67.0, 36.0, 24.0, 10.0, 11.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79443359375, -0.7504959106445312, -0.7065582275390625, -0.6626205444335938, -0.618682861328125, -0.5747451782226562, -0.5308074951171875, -0.48686981201171875, -0.44293212890625, -0.39899444580078125, -0.3550567626953125, -0.31111907958984375, -0.267181396484375, -0.22324371337890625, -0.1793060302734375, -0.13536834716796875, -0.0914306640625, -0.04749298095703125, -0.0035552978515625, 0.04038238525390625, 0.084320068359375, 0.12825775146484375, 0.1721954345703125, 0.21613311767578125, 0.26007080078125, 0.30400848388671875, 0.3479461669921875, 0.39188385009765625, 0.435821533203125, 0.47975921630859375, 0.5236968994140625, 0.5676345825195312, 0.611572265625, 0.6555099487304688, 0.6994476318359375, 0.7433853149414062, 0.787322998046875, 0.8312606811523438, 0.8751983642578125, 0.9191360473632812, 0.96307373046875, 1.0070114135742188, 1.0509490966796875, 1.0948867797851562, 1.138824462890625, 1.1827621459960938, 1.2266998291015625, 1.2706375122070312, 1.3145751953125, 1.3585128784179688, 1.4024505615234375, 1.4463882446289062, 1.490325927734375, 1.5342636108398438, 1.5782012939453125, 1.6221389770507812, 1.66607666015625, 1.7100143432617188, 1.7539520263671875, 1.7978897094726562, 1.841827392578125, 1.8857650756835938, 1.9297027587890625, 1.9736404418945312, 2.017578125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 8.0, 7.0, 16.0, 17.0, 23.0, 45.0, 76.0, 168.0, 679.0, 2485.0, 319.0, 90.0, 67.0, 32.0, 18.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056396484375, -0.052928924560546875, -0.04946136474609375, -0.045993804931640625, -0.0425262451171875, -0.039058685302734375, -0.03559112548828125, -0.032123565673828125, -0.028656005859375, -0.025188446044921875, -0.02172088623046875, -0.018253326416015625, -0.0147857666015625, -0.011318206787109375, -0.00785064697265625, -0.004383087158203125, -0.00091552734375, 0.002552032470703125, 0.00601959228515625, 0.009487152099609375, 0.0129547119140625, 0.016422271728515625, 0.01988983154296875, 0.023357391357421875, 0.026824951171875, 0.030292510986328125, 0.03376007080078125, 0.037227630615234375, 0.0406951904296875, 0.044162750244140625, 0.04763031005859375, 0.051097869873046875, 0.0545654296875, 0.058032989501953125, 0.06150054931640625, 0.06496810913085938, 0.0684356689453125, 0.07190322875976562, 0.07537078857421875, 0.07883834838867188, 0.082305908203125, 0.08577346801757812, 0.08924102783203125, 0.09270858764648438, 0.0961761474609375, 0.09964370727539062, 0.10311126708984375, 0.10657882690429688, 0.11004638671875, 0.11351394653320312, 0.11698150634765625, 0.12044906616210938, 0.1239166259765625, 0.12738418579101562, 0.13085174560546875, 0.13431930541992188, 0.137786865234375, 0.14125442504882812, 0.14472198486328125, 0.14818954467773438, 0.1516571044921875, 0.15512466430664062, 0.15859222412109375, 0.16205978393554688, 0.16552734375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 61.0, 678.0, 223.0, 28.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.192574977874756, -5.088194370269775, -4.983813762664795, -4.879433631896973, -4.775053024291992, -4.670672416687012, -4.566291809082031, -4.461911201477051, -4.3575310707092285, -4.253150463104248, -4.148769855499268, -4.044389724731445, -3.940009117126465, -3.8356285095214844, -3.731247901916504, -3.6268675327301025, -3.522486925125122, -3.4181063175201416, -3.3137259483337402, -3.2093453407287598, -3.1049649715423584, -3.000584363937378, -2.8962039947509766, -2.791823387145996, -2.6874427795410156, -2.583062171936035, -2.478681802749634, -2.3743011951446533, -2.269920825958252, -2.1655402183532715, -2.061159610748291, -1.9567792415618896, -1.8523986339569092, -1.7480181455612183, -1.6436376571655273, -1.5392570495605469, -1.4348766803741455, -1.330496072769165, -1.2261155843734741, -1.1217350959777832, -1.0173546075820923, -0.9129741191864014, -0.8085936307907104, -0.7042130827903748, -0.5998325943946838, -0.4954521059989929, -0.3910715579986572, -0.2866910696029663, -0.1823105812072754, -0.07793007791042328, 0.026450425386428833, 0.13083094358444214, 0.23521143198013306, 0.339591920375824, 0.44397246837615967, 0.5483529567718506, 0.6527334451675415, 0.7571139335632324, 0.8614944219589233, 0.965874969959259, 1.0702555179595947, 1.174635887145996, 1.2790164947509766, 1.3833969831466675, 1.4877774715423584]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 6.0, 4.0, 5.0, 12.0, 24.0, 37.0, 53.0, 67.0, 98.0, 104.0, 100.0, 125.0, 102.0, 93.0, 62.0, 52.0, 25.0, 20.0, 5.0, 12.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6837261319160461, -0.6633762717247009, -0.6430264711380005, -0.6226766109466553, -0.6023267507553101, -0.5819769501686096, -0.5616270899772644, -0.541277289390564, -0.5209274291992188, -0.5005775690078735, -0.4802277684211731, -0.4598779082298279, -0.43952807784080505, -0.4191782474517822, -0.398828387260437, -0.3784785568714142, -0.35812872648239136, -0.33777889609336853, -0.3174290657043457, -0.2970792055130005, -0.27672937512397766, -0.25637954473495483, -0.2360296994447708, -0.2156798541545868, -0.19533002376556396, -0.17498019337654114, -0.15463034808635712, -0.1342805027961731, -0.11393067240715027, -0.09358083456754684, -0.07323099672794342, -0.0528811514377594, -0.03253132104873657, -0.012181483209133148, 0.008168354630470276, 0.0285181924700737, 0.048868030309677124, 0.06921786814928055, 0.08956770598888397, 0.109917551279068, 0.13026738166809082, 0.15061721205711365, 0.17096705734729767, 0.1913169026374817, 0.21166673302650452, 0.23201656341552734, 0.25236642360687256, 0.2727162539958954, 0.2930660843849182, 0.31341591477394104, 0.33376574516296387, 0.3541156053543091, 0.3744654357433319, 0.39481526613235474, 0.41516512632369995, 0.4355149567127228, 0.4558647871017456, 0.47621461749076843, 0.49656444787979126, 0.5169143080711365, 0.5372641086578369, 0.5576139688491821, 0.5779638290405273, 0.5983136892318726, 0.618663489818573]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 6.0, 11.0, 7.0, 11.0, 22.0, 20.0, 32.0, 30.0, 35.0, 49.0, 69.0, 126.0, 201.0, 396.0, 1172.0, 7409.0, 110899.0, 843317.0, 77114.0, 5691.0, 961.0, 381.0, 181.0, 105.0, 81.0, 43.0, 32.0, 23.0, 15.0, 15.0, 19.0, 16.0, 7.0, 11.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58642578125, -0.5650558471679688, -0.5436859130859375, -0.5223159790039062, -0.500946044921875, -0.47957611083984375, -0.4582061767578125, -0.43683624267578125, -0.41546630859375, -0.39409637451171875, -0.3727264404296875, -0.35135650634765625, -0.329986572265625, -0.30861663818359375, -0.2872467041015625, -0.26587677001953125, -0.2445068359375, -0.22313690185546875, -0.2017669677734375, -0.18039703369140625, -0.159027099609375, -0.13765716552734375, -0.1162872314453125, -0.09491729736328125, -0.07354736328125, -0.05217742919921875, -0.0308074951171875, -0.00943756103515625, 0.011932373046875, 0.03330230712890625, 0.0546722412109375, 0.07604217529296875, 0.097412109375, 0.11878204345703125, 0.1401519775390625, 0.16152191162109375, 0.182891845703125, 0.20426177978515625, 0.2256317138671875, 0.24700164794921875, 0.26837158203125, 0.28974151611328125, 0.3111114501953125, 0.33248138427734375, 0.353851318359375, 0.37522125244140625, 0.3965911865234375, 0.41796112060546875, 0.4393310546875, 0.46070098876953125, 0.4820709228515625, 0.5034408569335938, 0.524810791015625, 0.5461807250976562, 0.5675506591796875, 0.5889205932617188, 0.61029052734375, 0.6316604614257812, 0.6530303955078125, 0.6744003295898438, 0.695770263671875, 0.7171401977539062, 0.7385101318359375, 0.7598800659179688, 0.78125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 11.0, 28.0, 58.0, 101.0, 162.0, 185.0, 194.0, 126.0, 70.0, 45.0, 17.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0577392578125, -0.05465888977050781, -0.051578521728515625, -0.04849815368652344, -0.04541778564453125, -0.04233741760253906, -0.039257049560546875, -0.03617668151855469, -0.0330963134765625, -0.030015945434570312, -0.026935577392578125, -0.023855209350585938, -0.02077484130859375, -0.017694473266601562, -0.014614105224609375, -0.011533737182617188, -0.008453369140625, -0.0053730010986328125, -0.002292633056640625, 0.0007877349853515625, 0.00386810302734375, 0.0069484710693359375, 0.010028839111328125, 0.013109207153320312, 0.0161895751953125, 0.019269943237304688, 0.022350311279296875, 0.025430679321289062, 0.02851104736328125, 0.03159141540527344, 0.034671783447265625, 0.03775215148925781, 0.04083251953125, 0.04391288757324219, 0.046993255615234375, 0.05007362365722656, 0.05315399169921875, 0.05623435974121094, 0.059314727783203125, 0.06239509582519531, 0.0654754638671875, 0.06855583190917969, 0.07163619995117188, 0.07471656799316406, 0.07779693603515625, 0.08087730407714844, 0.08395767211914062, 0.08703804016113281, 0.090118408203125, 0.09319877624511719, 0.09627914428710938, 0.09935951232910156, 0.10243988037109375, 0.10552024841308594, 0.10860061645507812, 0.11168098449707031, 0.1147613525390625, 0.11784172058105469, 0.12092208862304688, 0.12400245666503906, 0.12708282470703125, 0.13016319274902344, 0.13324356079101562, 0.1363239288330078, 0.139404296875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 5.0, 6.0, 11.0, 9.0, 16.0, 27.0, 26.0, 54.0, 67.0, 104.0, 156.0, 246.0, 463.0, 822.0, 1725.0, 3883.0, 10118.0, 33316.0, 138842.0, 515198.0, 259315.0, 57755.0, 15793.0, 5592.0, 2423.0, 1136.0, 536.0, 319.0, 188.0, 126.0, 80.0, 45.0, 33.0, 28.0, 27.0, 10.0, 13.0, 10.0, 5.0, 8.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.270751953125, -0.2631683349609375, -0.255584716796875, -0.2480010986328125, -0.24041748046875, -0.2328338623046875, -0.225250244140625, -0.2176666259765625, -0.2100830078125, -0.2024993896484375, -0.194915771484375, -0.1873321533203125, -0.17974853515625, -0.1721649169921875, -0.164581298828125, -0.1569976806640625, -0.1494140625, -0.1418304443359375, -0.134246826171875, -0.1266632080078125, -0.11907958984375, -0.1114959716796875, -0.103912353515625, -0.0963287353515625, -0.0887451171875, -0.0811614990234375, -0.073577880859375, -0.0659942626953125, -0.05841064453125, -0.0508270263671875, -0.043243408203125, -0.0356597900390625, -0.028076171875, -0.0204925537109375, -0.012908935546875, -0.0053253173828125, 0.00225830078125, 0.0098419189453125, 0.017425537109375, 0.0250091552734375, 0.0325927734375, 0.0401763916015625, 0.047760009765625, 0.0553436279296875, 0.06292724609375, 0.0705108642578125, 0.078094482421875, 0.0856781005859375, 0.09326171875, 0.1008453369140625, 0.108428955078125, 0.1160125732421875, 0.12359619140625, 0.1311798095703125, 0.138763427734375, 0.1463470458984375, 0.1539306640625, 0.1615142822265625, 0.169097900390625, 0.1766815185546875, 0.18426513671875, 0.1918487548828125, 0.199432373046875, 0.2070159912109375, 0.214599609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 6.0, 4.0, 9.0, 21.0, 13.0, 27.0, 24.0, 31.0, 35.0, 49.0, 50.0, 47.0, 54.0, 48.0, 50.0, 53.0, 47.0, 36.0, 57.0, 41.0, 49.0, 36.0, 32.0, 27.0, 28.0, 30.0, 20.0, 11.0, 17.0, 10.0, 11.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159423828125, -0.15469741821289062, -0.14997100830078125, -0.14524459838867188, -0.1405181884765625, -0.13579177856445312, -0.13106536865234375, -0.12633895874023438, -0.121612548828125, -0.11688613891601562, -0.11215972900390625, -0.10743331909179688, -0.1027069091796875, -0.09798049926757812, -0.09325408935546875, -0.08852767944335938, -0.08380126953125, -0.07907485961914062, -0.07434844970703125, -0.06962203979492188, -0.0648956298828125, -0.060169219970703125, -0.05544281005859375, -0.050716400146484375, -0.045989990234375, -0.041263580322265625, -0.03653717041015625, -0.031810760498046875, -0.0270843505859375, -0.022357940673828125, -0.01763153076171875, -0.012905120849609375, -0.0081787109375, -0.003452301025390625, 0.00127410888671875, 0.006000518798828125, 0.0107269287109375, 0.015453338623046875, 0.02017974853515625, 0.024906158447265625, 0.029632568359375, 0.034358978271484375, 0.03908538818359375, 0.043811798095703125, 0.0485382080078125, 0.053264617919921875, 0.05799102783203125, 0.06271743774414062, 0.06744384765625, 0.07217025756835938, 0.07689666748046875, 0.08162307739257812, 0.0863494873046875, 0.09107589721679688, 0.09580230712890625, 0.10052871704101562, 0.105255126953125, 0.10998153686523438, 0.11470794677734375, 0.11943435668945312, 0.1241607666015625, 0.12888717651367188, 0.13361358642578125, 0.13833999633789062, 0.14306640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 9.0, 8.0, 15.0, 16.0, 18.0, 38.0, 54.0, 93.0, 169.0, 313.0, 511.0, 1057.0, 2187.0, 5646.0, 18203.0, 108529.0, 747217.0, 133243.0, 20146.0, 6270.0, 2406.0, 1118.0, 568.0, 308.0, 158.0, 99.0, 52.0, 30.0, 26.0, 15.0, 9.0, 9.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1397705078125, -0.1345043182373047, -0.12923812866210938, -0.12397193908691406, -0.11870574951171875, -0.11343955993652344, -0.10817337036132812, -0.10290718078613281, -0.0976409912109375, -0.09237480163574219, -0.08710861206054688, -0.08184242248535156, -0.07657623291015625, -0.07131004333496094, -0.06604385375976562, -0.06077766418457031, -0.055511474609375, -0.05024528503417969, -0.044979095458984375, -0.03971290588378906, -0.03444671630859375, -0.029180526733398438, -0.023914337158203125, -0.018648147583007812, -0.0133819580078125, -0.008115768432617188, -0.002849578857421875, 0.0024166107177734375, 0.00768280029296875, 0.012948989868164062, 0.018215179443359375, 0.023481369018554688, 0.02874755859375, 0.03401374816894531, 0.039279937744140625, 0.04454612731933594, 0.04981231689453125, 0.05507850646972656, 0.060344696044921875, 0.06561088562011719, 0.0708770751953125, 0.07614326477050781, 0.08140945434570312, 0.08667564392089844, 0.09194183349609375, 0.09720802307128906, 0.10247421264648438, 0.10774040222167969, 0.113006591796875, 0.11827278137207031, 0.12353897094726562, 0.12880516052246094, 0.13407135009765625, 0.13933753967285156, 0.14460372924804688, 0.1498699188232422, 0.1551361083984375, 0.1604022979736328, 0.16566848754882812, 0.17093467712402344, 0.17620086669921875, 0.18146705627441406, 0.18673324584960938, 0.1919994354248047, 0.197265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 0.0, 5.0, 6.0, 9.0, 8.0, 7.0, 13.0, 17.0, 25.0, 42.0, 52.0, 69.0, 97.0, 122.0, 128.0, 96.0, 89.0, 48.0, 43.0, 25.0, 21.0, 24.0, 11.0, 7.0, 6.0, 6.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003757476806640625, -0.0003628730773925781, -0.00034999847412109375, -0.0003371238708496094, -0.000324249267578125, -0.0003113746643066406, -0.00029850006103515625, -0.0002856254577636719, -0.0002727508544921875, -0.0002598762512207031, -0.00024700164794921875, -0.00023412704467773438, -0.00022125244140625, -0.00020837783813476562, -0.00019550323486328125, -0.00018262863159179688, -0.0001697540283203125, -0.00015687942504882812, -0.00014400482177734375, -0.00013113021850585938, -0.000118255615234375, -0.00010538101196289062, -9.250640869140625e-05, -7.963180541992188e-05, -6.67572021484375e-05, -5.3882598876953125e-05, -4.100799560546875e-05, -2.8133392333984375e-05, -1.52587890625e-05, -2.384185791015625e-06, 1.049041748046875e-05, 2.3365020751953125e-05, 3.62396240234375e-05, 4.9114227294921875e-05, 6.198883056640625e-05, 7.486343383789062e-05, 8.7738037109375e-05, 0.00010061264038085938, 0.00011348724365234375, 0.00012636184692382812, 0.0001392364501953125, 0.00015211105346679688, 0.00016498565673828125, 0.00017786026000976562, 0.00019073486328125, 0.00020360946655273438, 0.00021648406982421875, 0.00022935867309570312, 0.0002422332763671875, 0.0002551078796386719, 0.00026798248291015625, 0.0002808570861816406, 0.000293731689453125, 0.0003066062927246094, 0.00031948089599609375, 0.0003323554992675781, 0.0003452301025390625, 0.0003581047058105469, 0.00037097930908203125, 0.0003838539123535156, 0.000396728515625, 0.0004096031188964844, 0.00042247772216796875, 0.0004353523254394531, 0.0004482269287109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 7.0, 2.0, 7.0, 9.0, 13.0, 19.0, 21.0, 33.0, 34.0, 64.0, 98.0, 138.0, 247.0, 462.0, 862.0, 1839.0, 4801.0, 15547.0, 86571.0, 689617.0, 209816.0, 26303.0, 7039.0, 2563.0, 1089.0, 550.0, 331.0, 157.0, 113.0, 63.0, 38.0, 33.0, 19.0, 14.0, 13.0, 4.0, 3.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.138916015625, -0.13438796997070312, -0.12985992431640625, -0.12533187866210938, -0.1208038330078125, -0.11627578735351562, -0.11174774169921875, -0.10721969604492188, -0.102691650390625, -0.09816360473632812, -0.09363555908203125, -0.08910751342773438, -0.0845794677734375, -0.08005142211914062, -0.07552337646484375, -0.07099533081054688, -0.06646728515625, -0.061939239501953125, -0.05741119384765625, -0.052883148193359375, -0.0483551025390625, -0.043827056884765625, -0.03929901123046875, -0.034770965576171875, -0.030242919921875, -0.025714874267578125, -0.02118682861328125, -0.016658782958984375, -0.0121307373046875, -0.007602691650390625, -0.00307464599609375, 0.001453399658203125, 0.0059814453125, 0.010509490966796875, 0.01503753662109375, 0.019565582275390625, 0.0240936279296875, 0.028621673583984375, 0.03314971923828125, 0.037677764892578125, 0.042205810546875, 0.046733856201171875, 0.05126190185546875, 0.055789947509765625, 0.0603179931640625, 0.06484603881835938, 0.06937408447265625, 0.07390213012695312, 0.07843017578125, 0.08295822143554688, 0.08748626708984375, 0.09201431274414062, 0.0965423583984375, 0.10107040405273438, 0.10559844970703125, 0.11012649536132812, 0.114654541015625, 0.11918258666992188, 0.12371063232421875, 0.12823867797851562, 0.1327667236328125, 0.13729476928710938, 0.14182281494140625, 0.14635086059570312, 0.15087890625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 1.0, 2.0, 3.0, 10.0, 4.0, 8.0, 6.0, 11.0, 19.0, 25.0, 46.0, 54.0, 77.0, 91.0, 116.0, 100.0, 98.0, 87.0, 70.0, 58.0, 36.0, 21.0, 22.0, 8.0, 8.0, 8.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0916748046875, -0.08893013000488281, -0.08618545532226562, -0.08344078063964844, -0.08069610595703125, -0.07795143127441406, -0.07520675659179688, -0.07246208190917969, -0.0697174072265625, -0.06697273254394531, -0.06422805786132812, -0.06148338317871094, -0.05873870849609375, -0.05599403381347656, -0.053249359130859375, -0.05050468444824219, -0.047760009765625, -0.04501533508300781, -0.042270660400390625, -0.03952598571777344, -0.03678131103515625, -0.03403663635253906, -0.031291961669921875, -0.028547286987304688, -0.0258026123046875, -0.023057937622070312, -0.020313262939453125, -0.017568588256835938, -0.01482391357421875, -0.012079238891601562, -0.009334564208984375, -0.0065898895263671875, -0.00384521484375, -0.0011005401611328125, 0.001644134521484375, 0.0043888092041015625, 0.00713348388671875, 0.009878158569335938, 0.012622833251953125, 0.015367507934570312, 0.0181121826171875, 0.020856857299804688, 0.023601531982421875, 0.026346206665039062, 0.02909088134765625, 0.03183555603027344, 0.034580230712890625, 0.03732490539550781, 0.040069580078125, 0.04281425476074219, 0.045558929443359375, 0.04830360412597656, 0.05104827880859375, 0.05379295349121094, 0.056537628173828125, 0.05928230285644531, 0.0620269775390625, 0.06477165222167969, 0.06751632690429688, 0.07026100158691406, 0.07300567626953125, 0.07575035095214844, 0.07849502563476562, 0.08123970031738281, 0.083984375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 7.0, 5.0, 13.0, 19.0, 33.0, 69.0, 107.0, 139.0, 193.0, 152.0, 104.0, 76.0, 37.0, 16.0, 9.0, 10.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5146430730819702, -1.4654897451400757, -1.4163364171981812, -1.3671832084655762, -1.3180298805236816, -1.268876552581787, -1.2197232246398926, -1.170569896697998, -1.1214165687561035, -1.072263240814209, -1.0231099128723145, -0.9739566445350647, -0.9248033761978149, -0.8756500482559204, -0.8264967203140259, -0.7773433923721313, -0.7281901836395264, -0.6790368556976318, -0.6298835873603821, -0.5807302594184875, -0.5315769910812378, -0.48242366313934326, -0.43327033519744873, -0.3841170370578766, -0.33496373891830444, -0.2858104407787323, -0.23665712773799896, -0.18750381469726562, -0.13835051655769348, -0.08919721841812134, -0.04004389047622681, 0.009109407663345337, 0.05826258659362793, 0.10741589218378067, 0.1565691977739334, 0.20572251081466675, 0.2548758089542389, 0.30402910709381104, 0.35318243503570557, 0.4023357331752777, 0.45148903131484985, 0.5006423592567444, 0.5497956275939941, 0.5989489555358887, 0.6481022834777832, 0.697255551815033, 0.7464088797569275, 0.7955621480941772, 0.8447154760360718, 0.8938688039779663, 0.9430220723152161, 0.9921754002571106, 1.0413286685943604, 1.0904819965362549, 1.1396353244781494, 1.188788652420044, 1.2379419803619385, 1.287095308303833, 1.3362486362457275, 1.385401964187622, 1.434555172920227, 1.4837085008621216, 1.5328618288040161, 1.5820151567459106, 1.6311683654785156]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 9.0, 4.0, 10.0, 12.0, 16.0, 29.0, 35.0, 25.0, 44.0, 40.0, 50.0, 68.0, 53.0, 53.0, 81.0, 53.0, 67.0, 53.0, 63.0, 53.0, 45.0, 35.0, 27.0, 20.0, 15.0, 15.0, 7.0, 7.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2122056484222412, -1.1768276691436768, -1.1414495706558228, -1.1060715913772583, -1.0706934928894043, -1.0353155136108398, -0.9999374747276306, -0.9645594358444214, -0.9291813969612122, -0.8938033580780029, -0.8584253191947937, -0.8230472803115845, -0.78766930103302, -0.752291202545166, -0.7169132232666016, -0.6815351843833923, -0.6461571455001831, -0.6107791066169739, -0.5754010677337646, -0.5400230288505554, -0.5046449899673462, -0.46926698088645935, -0.4338889718055725, -0.3985109329223633, -0.36313289403915405, -0.3277548551559448, -0.2923768162727356, -0.25699880719184875, -0.22162076830863953, -0.1862427294254303, -0.15086470544338226, -0.11548668146133423, -0.080108642578125, -0.04473061114549637, -0.009352579712867737, 0.026025451719760895, 0.061403483152389526, 0.09678152203559875, 0.1321595460176468, 0.16753756999969482, 0.20291560888290405, 0.23829364776611328, 0.2736716866493225, 0.30904969573020935, 0.3444277346134186, 0.3798057734966278, 0.41518378257751465, 0.4505618214607239, 0.4859398603439331, 0.5213178992271423, 0.5566959381103516, 0.5920739769935608, 0.62745201587677, 0.6628299951553345, 0.6982080340385437, 0.7335860729217529, 0.7689641118049622, 0.8043421506881714, 0.8397201895713806, 0.8750982284545898, 0.9104762077331543, 0.9458543062210083, 0.9812322854995728, 1.0166103839874268, 1.0519883632659912]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 24.0, 20.0, 67.0, 136.0, 342.0, 1403.0, 9109.0, 3704037.0, 471052.0, 6385.0, 1040.0, 283.0, 123.0, 74.0, 42.0, 15.0, 15.0, 18.0, 14.0, 14.0, 8.0, 11.0, 5.0, 5.0, 4.0, 8.0, 0.0, 3.0, 3.0, 0.0, 6.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.70654296875, -0.6757431030273438, -0.6449432373046875, -0.6141433715820312, -0.583343505859375, -0.5525436401367188, -0.5217437744140625, -0.49094390869140625, -0.46014404296875, -0.42934417724609375, -0.3985443115234375, -0.36774444580078125, -0.336944580078125, -0.30614471435546875, -0.2753448486328125, -0.24454498291015625, -0.2137451171875, -0.18294525146484375, -0.1521453857421875, -0.12134552001953125, -0.090545654296875, -0.05974578857421875, -0.0289459228515625, 0.00185394287109375, 0.03265380859375, 0.06345367431640625, 0.0942535400390625, 0.12505340576171875, 0.155853271484375, 0.18665313720703125, 0.2174530029296875, 0.24825286865234375, 0.279052734375, 0.30985260009765625, 0.3406524658203125, 0.37145233154296875, 0.402252197265625, 0.43305206298828125, 0.4638519287109375, 0.49465179443359375, 0.52545166015625, 0.5562515258789062, 0.5870513916015625, 0.6178512573242188, 0.648651123046875, 0.6794509887695312, 0.7102508544921875, 0.7410507202148438, 0.7718505859375, 0.8026504516601562, 0.8334503173828125, 0.8642501831054688, 0.895050048828125, 0.9258499145507812, 0.9566497802734375, 0.9874496459960938, 1.01824951171875, 1.0490493774414062, 1.0798492431640625, 1.1106491088867188, 1.141448974609375, 1.1722488403320312, 1.2030487060546875, 1.2338485717773438, 1.2646484375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 14.0, 21.0, 55.0, 90.0, 141.0, 177.0, 190.0, 158.0, 86.0, 47.0, 17.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060028076171875, -0.05686235427856445, -0.053696632385253906, -0.05053091049194336, -0.04736518859863281, -0.044199466705322266, -0.04103374481201172, -0.03786802291870117, -0.034702301025390625, -0.03153657913208008, -0.02837085723876953, -0.025205135345458984, -0.022039413452148438, -0.01887369155883789, -0.015707969665527344, -0.012542247772216797, -0.00937652587890625, -0.006210803985595703, -0.0030450820922851562, 0.00012063980102539062, 0.0032863616943359375, 0.006452083587646484, 0.009617805480957031, 0.012783527374267578, 0.015949249267578125, 0.019114971160888672, 0.02228069305419922, 0.025446414947509766, 0.028612136840820312, 0.03177785873413086, 0.034943580627441406, 0.03810930252075195, 0.0412750244140625, 0.04444074630737305, 0.047606468200683594, 0.05077219009399414, 0.05393791198730469, 0.057103633880615234, 0.06026935577392578, 0.06343507766723633, 0.06660079956054688, 0.06976652145385742, 0.07293224334716797, 0.07609796524047852, 0.07926368713378906, 0.08242940902709961, 0.08559513092041016, 0.0887608528137207, 0.09192657470703125, 0.0950922966003418, 0.09825801849365234, 0.10142374038696289, 0.10458946228027344, 0.10775518417358398, 0.11092090606689453, 0.11408662796020508, 0.11725234985351562, 0.12041807174682617, 0.12358379364013672, 0.12674951553344727, 0.1299152374267578, 0.13308095932006836, 0.1362466812133789, 0.13941240310668945, 0.142578125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 16.0, 35.0, 33.0, 57.0, 79.0, 135.0, 320.0, 706.0, 2110.0, 20319.0, 4138866.0, 27204.0, 2535.0, 969.0, 435.0, 228.0, 91.0, 58.0, 28.0, 17.0, 18.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3583984375, -1.3201751708984375, -1.281951904296875, -1.2437286376953125, -1.20550537109375, -1.1672821044921875, -1.129058837890625, -1.0908355712890625, -1.0526123046875, -1.0143890380859375, -0.976165771484375, -0.9379425048828125, -0.89971923828125, -0.8614959716796875, -0.823272705078125, -0.7850494384765625, -0.746826171875, -0.7086029052734375, -0.670379638671875, -0.6321563720703125, -0.59393310546875, -0.5557098388671875, -0.517486572265625, -0.4792633056640625, -0.4410400390625, -0.4028167724609375, -0.364593505859375, -0.3263702392578125, -0.28814697265625, -0.2499237060546875, -0.211700439453125, -0.1734771728515625, -0.13525390625, -0.0970306396484375, -0.058807373046875, -0.0205841064453125, 0.01763916015625, 0.0558624267578125, 0.094085693359375, 0.1323089599609375, 0.1705322265625, 0.2087554931640625, 0.246978759765625, 0.2852020263671875, 0.32342529296875, 0.3616485595703125, 0.399871826171875, 0.4380950927734375, 0.476318359375, 0.5145416259765625, 0.552764892578125, 0.5909881591796875, 0.62921142578125, 0.6674346923828125, 0.705657958984375, 0.7438812255859375, 0.7821044921875, 0.8203277587890625, 0.858551025390625, 0.8967742919921875, 0.93499755859375, 0.9732208251953125, 1.011444091796875, 1.0496673583984375, 1.087890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 19.0, 32.0, 96.0, 308.0, 2818.0, 596.0, 111.0, 39.0, 21.0, 12.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189208984375, -0.18341064453125, -0.1776123046875, -0.17181396484375, -0.166015625, -0.16021728515625, -0.1544189453125, -0.14862060546875, -0.142822265625, -0.13702392578125, -0.1312255859375, -0.12542724609375, -0.11962890625, -0.11383056640625, -0.1080322265625, -0.10223388671875, -0.096435546875, -0.09063720703125, -0.0848388671875, -0.07904052734375, -0.0732421875, -0.06744384765625, -0.0616455078125, -0.05584716796875, -0.050048828125, -0.04425048828125, -0.0384521484375, -0.03265380859375, -0.02685546875, -0.02105712890625, -0.0152587890625, -0.00946044921875, -0.003662109375, 0.00213623046875, 0.0079345703125, 0.01373291015625, 0.01953125, 0.02532958984375, 0.0311279296875, 0.03692626953125, 0.042724609375, 0.04852294921875, 0.0543212890625, 0.06011962890625, 0.06591796875, 0.07171630859375, 0.0775146484375, 0.08331298828125, 0.089111328125, 0.09490966796875, 0.1007080078125, 0.10650634765625, 0.1123046875, 0.11810302734375, 0.1239013671875, 0.12969970703125, 0.135498046875, 0.14129638671875, 0.1470947265625, 0.15289306640625, 0.15869140625, 0.16448974609375, 0.1702880859375, 0.17608642578125, 0.181884765625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 64.0, 452.0, 412.0, 56.0, 13.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8740477561950684, -1.7887136936187744, -1.703379511833191, -1.618045449256897, -1.532711386680603, -1.4473772048950195, -1.3620431423187256, -1.2767090797424316, -1.1913750171661377, -1.1060409545898438, -1.0207067728042603, -0.9353727102279663, -0.8500386476516724, -0.7647045254707336, -0.6793704032897949, -0.594036340713501, -0.5087021589279175, -0.42336806654930115, -0.3380339741706848, -0.2526998519897461, -0.16736575961112976, -0.08203166723251343, 0.003302454948425293, 0.08863651752471924, 0.17397063970565796, 0.2593047320842743, 0.3446388244628906, 0.42997294664382935, 0.5153070688247681, 0.600641131401062, 0.6859752535820007, 0.7713093161582947, 0.8566434383392334, 0.9419775605201721, 1.0273116827011108, 1.1126457452774048, 1.1979798078536987, 1.2833139896392822, 1.3686480522155762, 1.4539821147918701, 1.539316177368164, 1.624650239944458, 1.7099844217300415, 1.7953184843063354, 1.8806525468826294, 1.965986728668213, 2.051320791244507, 2.136654853820801, 2.221989154815674, 2.3073232173919678, 2.3926572799682617, 2.4779915809631348, 2.5633256435394287, 2.6486597061157227, 2.7339937686920166, 2.8193278312683105, 2.9046618938446045, 2.9899959564208984, 3.0753300189971924, 3.1606640815734863, 3.2459983825683594, 3.3313324451446533, 3.4166665077209473, 3.502000570297241, 3.587334632873535]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 9.0, 13.0, 27.0, 19.0, 25.0, 33.0, 44.0, 53.0, 57.0, 57.0, 54.0, 64.0, 78.0, 76.0, 54.0, 56.0, 50.0, 46.0, 35.0, 37.0, 25.0, 26.0, 18.0, 9.0, 4.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31181126832962036, -0.2996055781841278, -0.28739985823631287, -0.2751941680908203, -0.26298844814300537, -0.2507827579975128, -0.23857705295085907, -0.22637134790420532, -0.21416565775871277, -0.20195995271205902, -0.18975424766540527, -0.17754855751991272, -0.16534285247325897, -0.15313714742660522, -0.14093144237995148, -0.12872573733329773, -0.11652003228664398, -0.10431432723999023, -0.09210862964391708, -0.07990292459726334, -0.06769722700119019, -0.05549152195453644, -0.04328581690788269, -0.03108011931180954, -0.018874414265155792, -0.0066687120124697685, 0.005536990240216255, 0.017742693424224854, 0.029948394745588303, 0.04215409606695175, 0.0543598011136055, 0.06656549870967865, 0.0787712037563324, 0.09097690880298615, 0.1031826063990593, 0.11538831144571304, 0.1275940090417862, 0.13979971408843994, 0.1520054191350937, 0.16421112418174744, 0.17641681432724, 0.18862251937389374, 0.20082822442054749, 0.21303391456604004, 0.2252396196126938, 0.23744532465934753, 0.24965102970600128, 0.26185673475265503, 0.27406245470046997, 0.2862681448459625, 0.29847386479377747, 0.31067955493927, 0.32288527488708496, 0.3350909650325775, 0.34729665517807007, 0.359502375125885, 0.37170806527137756, 0.3839137554168701, 0.39611947536468506, 0.4083251655101776, 0.42053088545799255, 0.4327365756034851, 0.44494229555130005, 0.4571479856967926, 0.46935367584228516]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 5.0, 9.0, 8.0, 13.0, 15.0, 15.0, 19.0, 24.0, 41.0, 59.0, 94.0, 170.0, 322.0, 882.0, 3984.0, 44308.0, 814797.0, 171313.0, 9810.0, 1582.0, 483.0, 217.0, 124.0, 76.0, 51.0, 37.0, 16.0, 17.0, 8.0, 14.0, 6.0, 15.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9140625, -0.8884658813476562, -0.8628692626953125, -0.8372726440429688, -0.811676025390625, -0.7860794067382812, -0.7604827880859375, -0.7348861694335938, -0.70928955078125, -0.6836929321289062, -0.6580963134765625, -0.6324996948242188, -0.606903076171875, -0.5813064575195312, -0.5557098388671875, -0.5301132202148438, -0.5045166015625, -0.47891998291015625, -0.4533233642578125, -0.42772674560546875, -0.402130126953125, -0.37653350830078125, -0.3509368896484375, -0.32534027099609375, -0.29974365234375, -0.27414703369140625, -0.2485504150390625, -0.22295379638671875, -0.197357177734375, -0.17176055908203125, -0.1461639404296875, -0.12056732177734375, -0.094970703125, -0.06937408447265625, -0.0437774658203125, -0.01818084716796875, 0.007415771484375, 0.03301239013671875, 0.0586090087890625, 0.08420562744140625, 0.10980224609375, 0.13539886474609375, 0.1609954833984375, 0.18659210205078125, 0.212188720703125, 0.23778533935546875, 0.2633819580078125, 0.28897857666015625, 0.3145751953125, 0.34017181396484375, 0.3657684326171875, 0.39136505126953125, 0.416961669921875, 0.44255828857421875, 0.4681549072265625, 0.49375152587890625, 0.51934814453125, 0.5449447631835938, 0.5705413818359375, 0.5961380004882812, 0.621734619140625, 0.6473312377929688, 0.6729278564453125, 0.6985244750976562, 0.72412109375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 3.0, 14.0, 27.0, 62.0, 71.0, 97.0, 114.0, 137.0, 149.0, 118.0, 77.0, 59.0, 42.0, 16.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039276123046875, -0.03661775588989258, -0.033959388732910156, -0.031301021575927734, -0.028642654418945312, -0.02598428726196289, -0.02332592010498047, -0.020667552947998047, -0.018009185791015625, -0.015350818634033203, -0.012692451477050781, -0.01003408432006836, -0.0073757171630859375, -0.004717350006103516, -0.0020589828491210938, 0.0005993843078613281, 0.00325775146484375, 0.005916118621826172, 0.008574485778808594, 0.011232852935791016, 0.013891220092773438, 0.01654958724975586, 0.01920795440673828, 0.021866321563720703, 0.024524688720703125, 0.027183055877685547, 0.02984142303466797, 0.03249979019165039, 0.03515815734863281, 0.037816524505615234, 0.040474891662597656, 0.04313325881958008, 0.0457916259765625, 0.04844999313354492, 0.051108360290527344, 0.053766727447509766, 0.05642509460449219, 0.05908346176147461, 0.06174182891845703, 0.06440019607543945, 0.06705856323242188, 0.0697169303894043, 0.07237529754638672, 0.07503366470336914, 0.07769203186035156, 0.08035039901733398, 0.0830087661743164, 0.08566713333129883, 0.08832550048828125, 0.09098386764526367, 0.0936422348022461, 0.09630060195922852, 0.09895896911621094, 0.10161733627319336, 0.10427570343017578, 0.1069340705871582, 0.10959243774414062, 0.11225080490112305, 0.11490917205810547, 0.11756753921508789, 0.12022590637207031, 0.12288427352905273, 0.12554264068603516, 0.12820100784301758, 0.130859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 8.0, 11.0, 22.0, 29.0, 43.0, 64.0, 96.0, 156.0, 252.0, 470.0, 809.0, 1520.0, 3277.0, 7932.0, 23286.0, 92887.0, 476244.0, 346150.0, 65227.0, 17889.0, 6359.0, 2780.0, 1305.0, 676.0, 408.0, 223.0, 155.0, 101.0, 49.0, 39.0, 30.0, 9.0, 8.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.25146484375, -0.2424468994140625, -0.233428955078125, -0.2244110107421875, -0.21539306640625, -0.2063751220703125, -0.197357177734375, -0.1883392333984375, -0.1793212890625, -0.1703033447265625, -0.161285400390625, -0.1522674560546875, -0.14324951171875, -0.1342315673828125, -0.125213623046875, -0.1161956787109375, -0.107177734375, -0.0981597900390625, -0.089141845703125, -0.0801239013671875, -0.07110595703125, -0.0620880126953125, -0.053070068359375, -0.0440521240234375, -0.0350341796875, -0.0260162353515625, -0.016998291015625, -0.0079803466796875, 0.00103759765625, 0.0100555419921875, 0.019073486328125, 0.0280914306640625, 0.037109375, 0.0461273193359375, 0.055145263671875, 0.0641632080078125, 0.07318115234375, 0.0821990966796875, 0.091217041015625, 0.1002349853515625, 0.1092529296875, 0.1182708740234375, 0.127288818359375, 0.1363067626953125, 0.14532470703125, 0.1543426513671875, 0.163360595703125, 0.1723785400390625, 0.181396484375, 0.1904144287109375, 0.199432373046875, 0.2084503173828125, 0.21746826171875, 0.2264862060546875, 0.235504150390625, 0.2445220947265625, 0.2535400390625, 0.2625579833984375, 0.271575927734375, 0.2805938720703125, 0.28961181640625, 0.2986297607421875, 0.307647705078125, 0.3166656494140625, 0.32568359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 2.0, 12.0, 9.0, 9.0, 17.0, 22.0, 27.0, 29.0, 39.0, 49.0, 56.0, 55.0, 79.0, 68.0, 67.0, 76.0, 65.0, 59.0, 49.0, 50.0, 40.0, 33.0, 20.0, 17.0, 7.0, 13.0, 6.0, 10.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1767578125, -0.170013427734375, -0.16326904296875, -0.156524658203125, -0.1497802734375, -0.143035888671875, -0.13629150390625, -0.129547119140625, -0.122802734375, -0.116058349609375, -0.10931396484375, -0.102569580078125, -0.0958251953125, -0.089080810546875, -0.08233642578125, -0.075592041015625, -0.06884765625, -0.062103271484375, -0.05535888671875, -0.048614501953125, -0.0418701171875, -0.035125732421875, -0.02838134765625, -0.021636962890625, -0.014892578125, -0.008148193359375, -0.00140380859375, 0.005340576171875, 0.0120849609375, 0.018829345703125, 0.02557373046875, 0.032318115234375, 0.0390625, 0.045806884765625, 0.05255126953125, 0.059295654296875, 0.0660400390625, 0.072784423828125, 0.07952880859375, 0.086273193359375, 0.093017578125, 0.099761962890625, 0.10650634765625, 0.113250732421875, 0.1199951171875, 0.126739501953125, 0.13348388671875, 0.140228271484375, 0.14697265625, 0.153717041015625, 0.16046142578125, 0.167205810546875, 0.1739501953125, 0.180694580078125, 0.18743896484375, 0.194183349609375, 0.200927734375, 0.207672119140625, 0.21441650390625, 0.221160888671875, 0.2279052734375, 0.234649658203125, 0.24139404296875, 0.248138427734375, 0.2548828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 7.0, 5.0, 11.0, 9.0, 23.0, 30.0, 26.0, 67.0, 86.0, 152.0, 279.0, 455.0, 978.0, 2245.0, 6494.0, 27575.0, 280003.0, 651539.0, 61364.0, 11014.0, 3384.0, 1330.0, 643.0, 357.0, 178.0, 101.0, 54.0, 36.0, 39.0, 19.0, 15.0, 7.0, 11.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.18505859375, -0.1799468994140625, -0.174835205078125, -0.1697235107421875, -0.16461181640625, -0.1595001220703125, -0.154388427734375, -0.1492767333984375, -0.1441650390625, -0.1390533447265625, -0.133941650390625, -0.1288299560546875, -0.12371826171875, -0.1186065673828125, -0.113494873046875, -0.1083831787109375, -0.103271484375, -0.0981597900390625, -0.093048095703125, -0.0879364013671875, -0.08282470703125, -0.0777130126953125, -0.072601318359375, -0.0674896240234375, -0.0623779296875, -0.0572662353515625, -0.052154541015625, -0.0470428466796875, -0.04193115234375, -0.0368194580078125, -0.031707763671875, -0.0265960693359375, -0.021484375, -0.0163726806640625, -0.011260986328125, -0.0061492919921875, -0.00103759765625, 0.0040740966796875, 0.009185791015625, 0.0142974853515625, 0.0194091796875, 0.0245208740234375, 0.029632568359375, 0.0347442626953125, 0.03985595703125, 0.0449676513671875, 0.050079345703125, 0.0551910400390625, 0.060302734375, 0.0654144287109375, 0.070526123046875, 0.0756378173828125, 0.08074951171875, 0.0858612060546875, 0.090972900390625, 0.0960845947265625, 0.1011962890625, 0.1063079833984375, 0.111419677734375, 0.1165313720703125, 0.12164306640625, 0.1267547607421875, 0.131866455078125, 0.1369781494140625, 0.14208984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 14.0, 3.0, 6.0, 15.0, 19.0, 25.0, 33.0, 31.0, 56.0, 72.0, 71.0, 81.0, 103.0, 102.0, 94.0, 67.0, 43.0, 29.0, 28.0, 19.0, 22.0, 16.0, 11.0, 15.0, 9.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00015020370483398438, -0.00014493241906166077, -0.00013966113328933716, -0.00013438984751701355, -0.00012911856174468994, -0.00012384727597236633, -0.00011857599020004272, -0.00011330470442771912, -0.00010803341865539551, -0.0001027621328830719, -9.749084711074829e-05, -9.221956133842468e-05, -8.694827556610107e-05, -8.167698979377747e-05, -7.640570402145386e-05, -7.113441824913025e-05, -6.586313247680664e-05, -6.059184670448303e-05, -5.5320560932159424e-05, -5.0049275159835815e-05, -4.477798938751221e-05, -3.95067036151886e-05, -3.423541784286499e-05, -2.8964132070541382e-05, -2.3692846298217773e-05, -1.8421560525894165e-05, -1.3150274753570557e-05, -7.878988981246948e-06, -2.60770320892334e-06, 2.6635825634002686e-06, 7.934868335723877e-06, 1.3206154108047485e-05, 1.8477439880371094e-05, 2.3748725652694702e-05, 2.902001142501831e-05, 3.429129719734192e-05, 3.956258296966553e-05, 4.4833868741989136e-05, 5.0105154514312744e-05, 5.537644028663635e-05, 6.064772605895996e-05, 6.591901183128357e-05, 7.119029760360718e-05, 7.646158337593079e-05, 8.17328691482544e-05, 8.7004154920578e-05, 9.227544069290161e-05, 9.754672646522522e-05, 0.00010281801223754883, 0.00010808929800987244, 0.00011336058378219604, 0.00011863186955451965, 0.00012390315532684326, 0.00012917444109916687, 0.00013444572687149048, 0.0001397170126438141, 0.0001449882984161377, 0.0001502595841884613, 0.0001555308699607849, 0.00016080215573310852, 0.00016607344150543213, 0.00017134472727775574, 0.00017661601305007935, 0.00018188729882240295, 0.00018715858459472656]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 6.0, 15.0, 15.0, 41.0, 37.0, 71.0, 112.0, 199.0, 401.0, 701.0, 1605.0, 4064.0, 14189.0, 114304.0, 797401.0, 95615.0, 12912.0, 3773.0, 1498.0, 695.0, 356.0, 208.0, 108.0, 73.0, 45.0, 27.0, 26.0, 14.0, 7.0, 2.0, 5.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1768798828125, -0.17125892639160156, -0.16563796997070312, -0.1600170135498047, -0.15439605712890625, -0.1487751007080078, -0.14315414428710938, -0.13753318786621094, -0.1319122314453125, -0.12629127502441406, -0.12067031860351562, -0.11504936218261719, -0.10942840576171875, -0.10380744934082031, -0.09818649291992188, -0.09256553649902344, -0.086944580078125, -0.08132362365722656, -0.07570266723632812, -0.07008171081542969, -0.06446075439453125, -0.05883979797363281, -0.053218841552734375, -0.04759788513183594, -0.0419769287109375, -0.03635597229003906, -0.030735015869140625, -0.025114059448242188, -0.01949310302734375, -0.013872146606445312, -0.008251190185546875, -0.0026302337646484375, 0.00299072265625, 0.008611679077148438, 0.014232635498046875, 0.019853591918945312, 0.02547454833984375, 0.031095504760742188, 0.036716461181640625, 0.04233741760253906, 0.0479583740234375, 0.05357933044433594, 0.059200286865234375, 0.06482124328613281, 0.07044219970703125, 0.07606315612792969, 0.08168411254882812, 0.08730506896972656, 0.092926025390625, 0.09854698181152344, 0.10416793823242188, 0.10978889465332031, 0.11540985107421875, 0.12103080749511719, 0.12665176391601562, 0.13227272033691406, 0.1378936767578125, 0.14351463317871094, 0.14913558959960938, 0.1547565460205078, 0.16037750244140625, 0.1659984588623047, 0.17161941528320312, 0.17724037170410156, 0.182861328125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 14.0, 10.0, 14.0, 26.0, 23.0, 44.0, 60.0, 86.0, 100.0, 128.0, 116.0, 94.0, 71.0, 63.0, 38.0, 24.0, 18.0, 14.0, 11.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08184814453125, -0.0791168212890625, -0.076385498046875, -0.0736541748046875, -0.0709228515625, -0.0681915283203125, -0.065460205078125, -0.0627288818359375, -0.05999755859375, -0.0572662353515625, -0.054534912109375, -0.0518035888671875, -0.049072265625, -0.0463409423828125, -0.043609619140625, -0.0408782958984375, -0.03814697265625, -0.0354156494140625, -0.032684326171875, -0.0299530029296875, -0.0272216796875, -0.0244903564453125, -0.021759033203125, -0.0190277099609375, -0.01629638671875, -0.0135650634765625, -0.010833740234375, -0.0081024169921875, -0.00537109375, -0.0026397705078125, 9.1552734375e-05, 0.0028228759765625, 0.00555419921875, 0.0082855224609375, 0.011016845703125, 0.0137481689453125, 0.0164794921875, 0.0192108154296875, 0.021942138671875, 0.0246734619140625, 0.02740478515625, 0.0301361083984375, 0.032867431640625, 0.0355987548828125, 0.038330078125, 0.0410614013671875, 0.043792724609375, 0.0465240478515625, 0.04925537109375, 0.0519866943359375, 0.054718017578125, 0.0574493408203125, 0.0601806640625, 0.0629119873046875, 0.065643310546875, 0.0683746337890625, 0.07110595703125, 0.0738372802734375, 0.076568603515625, 0.0792999267578125, 0.08203125, 0.0847625732421875, 0.087493896484375, 0.0902252197265625, 0.09295654296875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 11.0, 23.0, 17.0, 31.0, 49.0, 87.0, 156.0, 182.0, 162.0, 116.0, 57.0, 40.0, 35.0, 9.0, 4.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8722143173217773, -1.8132679462432861, -1.7543216943740845, -1.6953753232955933, -1.636428952217102, -1.5774827003479004, -1.5185363292694092, -1.459589958190918, -1.4006435871124268, -1.3416972160339355, -1.2827509641647339, -1.2238045930862427, -1.1648582220077515, -1.1059119701385498, -1.0469655990600586, -0.9880192279815674, -0.929072916507721, -0.8701266050338745, -0.8111802339553833, -0.7522339224815369, -0.6932875514030457, -0.6343412399291992, -0.575394868850708, -0.5164485573768616, -0.45750221610069275, -0.3985558748245239, -0.3396095335483551, -0.2806631922721863, -0.22171686589717865, -0.16277053952217102, -0.1038241982460022, -0.044877856969833374, 0.01406848430633545, 0.07301482558250427, 0.1319611668586731, 0.19090749323368073, 0.24985383450984955, 0.3088001608848572, 0.367746502161026, 0.4266928434371948, 0.48563918471336365, 0.5445855259895325, 0.6035318374633789, 0.6624782085418701, 0.7214245200157166, 0.780370831489563, 0.8393172025680542, 0.8982635736465454, 0.9572098851203918, 1.0161561965942383, 1.0751025676727295, 1.1340489387512207, 1.1929951906204224, 1.2519415616989136, 1.3108879327774048, 1.3698341846466064, 1.4287805557250977, 1.4877269268035889, 1.5466731786727905, 1.6056195497512817, 1.664565920829773, 1.7235121726989746, 1.7824585437774658, 1.841404914855957, 1.9003512859344482]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 13.0, 10.0, 11.0, 25.0, 24.0, 19.0, 34.0, 29.0, 35.0, 39.0, 47.0, 54.0, 53.0, 66.0, 57.0, 71.0, 41.0, 51.0, 50.0, 35.0, 43.0, 33.0, 32.0, 24.0, 20.0, 16.0, 15.0, 9.0, 16.0, 7.0, 6.0, 6.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0742924213409424, -1.041581630706787, -1.0088709592819214, -0.9761602282524109, -0.9434494972229004, -0.9107387661933899, -0.8780280351638794, -0.8453173041343689, -0.8126065731048584, -0.7798958420753479, -0.7471851110458374, -0.7144743800163269, -0.6817636489868164, -0.6490529179573059, -0.6163421869277954, -0.5836314558982849, -0.5509207248687744, -0.5182099938392639, -0.4854992628097534, -0.4527885317802429, -0.4200778007507324, -0.3873670697212219, -0.3546563386917114, -0.3219456076622009, -0.28923487663269043, -0.25652414560317993, -0.22381341457366943, -0.19110268354415894, -0.15839195251464844, -0.12568122148513794, -0.09297049045562744, -0.06025975942611694, -0.027549028396606445, 0.005161702632904053, 0.03787243366241455, 0.07058316469192505, 0.10329389572143555, 0.13600462675094604, 0.16871535778045654, 0.20142608880996704, 0.23413681983947754, 0.26684755086898804, 0.29955828189849854, 0.33226901292800903, 0.36497974395751953, 0.39769047498703003, 0.4304012060165405, 0.463111937046051, 0.4958226680755615, 0.528533399105072, 0.5612441301345825, 0.593954861164093, 0.6266655921936035, 0.659376323223114, 0.6920870542526245, 0.724797785282135, 0.7575085163116455, 0.790219247341156, 0.8229299783706665, 0.855640709400177, 0.8883514404296875, 0.921062171459198, 0.9537729024887085, 0.986483633518219, 1.0191943645477295]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 12.0, 18.0, 51.0, 120.0, 377.0, 1721.0, 25784.0, 4125254.0, 37501.0, 2310.0, 544.0, 238.0, 111.0, 53.0, 33.0, 39.0, 27.0, 16.0, 22.0, 11.0, 11.0, 11.0, 3.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74609375, -0.7035980224609375, -0.661102294921875, -0.6186065673828125, -0.57611083984375, -0.5336151123046875, -0.491119384765625, -0.4486236572265625, -0.4061279296875, -0.3636322021484375, -0.321136474609375, -0.2786407470703125, -0.23614501953125, -0.1936492919921875, -0.151153564453125, -0.1086578369140625, -0.066162109375, -0.0236663818359375, 0.018829345703125, 0.0613250732421875, 0.10382080078125, 0.1463165283203125, 0.188812255859375, 0.2313079833984375, 0.2738037109375, 0.3162994384765625, 0.358795166015625, 0.4012908935546875, 0.44378662109375, 0.4862823486328125, 0.528778076171875, 0.5712738037109375, 0.61376953125, 0.6562652587890625, 0.698760986328125, 0.7412567138671875, 0.78375244140625, 0.8262481689453125, 0.868743896484375, 0.9112396240234375, 0.9537353515625, 0.9962310791015625, 1.038726806640625, 1.0812225341796875, 1.12371826171875, 1.1662139892578125, 1.208709716796875, 1.2512054443359375, 1.293701171875, 1.3361968994140625, 1.378692626953125, 1.4211883544921875, 1.46368408203125, 1.5061798095703125, 1.548675537109375, 1.5911712646484375, 1.6336669921875, 1.6761627197265625, 1.718658447265625, 1.7611541748046875, 1.80364990234375, 1.8461456298828125, 1.888641357421875, 1.9311370849609375, 1.9736328125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 5.0, 20.0, 22.0, 45.0, 68.0, 114.0, 124.0, 128.0, 139.0, 103.0, 95.0, 61.0, 40.0, 32.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027557373046875, -0.025026798248291016, -0.02249622344970703, -0.019965648651123047, -0.017435073852539062, -0.014904499053955078, -0.012373924255371094, -0.00984334945678711, -0.007312774658203125, -0.004782199859619141, -0.0022516250610351562, 0.0002789497375488281, 0.0028095245361328125, 0.005340099334716797, 0.007870674133300781, 0.010401248931884766, 0.01293182373046875, 0.015462398529052734, 0.01799297332763672, 0.020523548126220703, 0.023054122924804688, 0.025584697723388672, 0.028115272521972656, 0.03064584732055664, 0.033176422119140625, 0.03570699691772461, 0.038237571716308594, 0.04076814651489258, 0.04329872131347656, 0.04582929611206055, 0.04835987091064453, 0.050890445709228516, 0.0534210205078125, 0.055951595306396484, 0.05848217010498047, 0.06101274490356445, 0.06354331970214844, 0.06607389450073242, 0.0686044692993164, 0.07113504409790039, 0.07366561889648438, 0.07619619369506836, 0.07872676849365234, 0.08125734329223633, 0.08378791809082031, 0.0863184928894043, 0.08884906768798828, 0.09137964248657227, 0.09391021728515625, 0.09644079208374023, 0.09897136688232422, 0.1015019416809082, 0.10403251647949219, 0.10656309127807617, 0.10909366607666016, 0.11162424087524414, 0.11415481567382812, 0.11668539047241211, 0.1192159652709961, 0.12174654006958008, 0.12427711486816406, 0.12680768966674805, 0.12933826446533203, 0.13186883926391602, 0.1343994140625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 3.0, 6.0, 19.0, 11.0, 24.0, 23.0, 56.0, 83.0, 170.0, 441.0, 1486.0, 8518.0, 4030382.0, 146173.0, 4983.0, 1101.0, 357.0, 171.0, 76.0, 59.0, 42.0, 34.0, 21.0, 9.0, 9.0, 14.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1318359375, -1.0748138427734375, -1.017791748046875, -0.9607696533203125, -0.90374755859375, -0.8467254638671875, -0.789703369140625, -0.7326812744140625, -0.6756591796875, -0.6186370849609375, -0.561614990234375, -0.5045928955078125, -0.44757080078125, -0.3905487060546875, -0.333526611328125, -0.2765045166015625, -0.219482421875, -0.1624603271484375, -0.105438232421875, -0.0484161376953125, 0.00860595703125, 0.0656280517578125, 0.122650146484375, 0.1796722412109375, 0.2366943359375, 0.2937164306640625, 0.350738525390625, 0.4077606201171875, 0.46478271484375, 0.5218048095703125, 0.578826904296875, 0.6358489990234375, 0.69287109375, 0.7498931884765625, 0.806915283203125, 0.8639373779296875, 0.92095947265625, 0.9779815673828125, 1.035003662109375, 1.0920257568359375, 1.1490478515625, 1.2060699462890625, 1.263092041015625, 1.3201141357421875, 1.37713623046875, 1.4341583251953125, 1.491180419921875, 1.5482025146484375, 1.605224609375, 1.6622467041015625, 1.719268798828125, 1.7762908935546875, 1.83331298828125, 1.8903350830078125, 1.947357177734375, 2.0043792724609375, 2.0614013671875, 2.1184234619140625, 2.175445556640625, 2.2324676513671875, 2.28948974609375, 2.3465118408203125, 2.403533935546875, 2.4605560302734375, 2.517578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 14.0, 48.0, 70.0, 301.0, 2917.0, 522.0, 117.0, 33.0, 17.0, 12.0, 8.0, 1.0, 2.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1778564453125, -0.16716575622558594, -0.15647506713867188, -0.1457843780517578, -0.13509368896484375, -0.12440299987792969, -0.11371231079101562, -0.10302162170410156, -0.0923309326171875, -0.08164024353027344, -0.07094955444335938, -0.06025886535644531, -0.04956817626953125, -0.03887748718261719, -0.028186798095703125, -0.017496109008789062, -0.006805419921875, 0.0038852691650390625, 0.014575958251953125, 0.025266647338867188, 0.03595733642578125, 0.04664802551269531, 0.057338714599609375, 0.06802940368652344, 0.0787200927734375, 0.08941078186035156, 0.10010147094726562, 0.11079216003417969, 0.12148284912109375, 0.1321735382080078, 0.14286422729492188, 0.15355491638183594, 0.16424560546875, 0.17493629455566406, 0.18562698364257812, 0.1963176727294922, 0.20700836181640625, 0.2176990509033203, 0.22838973999023438, 0.23908042907714844, 0.2497711181640625, 0.26046180725097656, 0.2711524963378906, 0.2818431854248047, 0.29253387451171875, 0.3032245635986328, 0.3139152526855469, 0.32460594177246094, 0.335296630859375, 0.34598731994628906, 0.3566780090332031, 0.3673686981201172, 0.37805938720703125, 0.3887500762939453, 0.3994407653808594, 0.41013145446777344, 0.4208221435546875, 0.43151283264160156, 0.4422035217285156, 0.4528942108154297, 0.46358489990234375, 0.4742755889892578, 0.4849662780761719, 0.49565696716308594, 0.50634765625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 15.0, 29.0, 122.0, 398.0, 315.0, 82.0, 25.0, 9.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0324134826660156, -2.9275970458984375, -2.8227808475494385, -2.7179644107818604, -2.6131482124328613, -2.508331775665283, -2.403515577316284, -2.298699140548706, -2.193882942199707, -2.089066505432129, -1.9842503070831299, -1.8794339895248413, -1.7746176719665527, -1.6698012351989746, -1.5649850368499756, -1.4601686000823975, -1.3553522825241089, -1.2505359649658203, -1.1457196474075317, -1.0409033298492432, -0.9360870122909546, -0.8312706351280212, -0.7264543175697327, -0.6216380000114441, -0.5168216824531555, -0.41200536489486694, -0.30718904733657837, -0.2023726999759674, -0.09755638241767883, 0.007259964942932129, 0.1120762825012207, 0.21689260005950928, 0.32170891761779785, 0.4265252351760864, 0.531341552734375, 0.6361578702926636, 0.7409741878509521, 0.8457905650138855, 0.9506068825721741, 1.0554232597351074, 1.1602394580841064, 1.265055775642395, 1.3698720932006836, 1.4746884107589722, 1.5795047283172607, 1.6843211650848389, 1.789137363433838, 1.893953800201416, 1.9987701177597046, 2.103586435317993, 2.2084028720855713, 2.3132190704345703, 2.4180355072021484, 2.5228517055511475, 2.6276681423187256, 2.7324843406677246, 2.8373007774353027, 2.942117214202881, 3.04693341255188, 3.151749849319458, 3.256566047668457, 3.361382484436035, 3.466198682785034, 3.5710151195526123, 3.6758313179016113]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 12.0, 13.0, 21.0, 23.0, 59.0, 65.0, 75.0, 109.0, 100.0, 105.0, 93.0, 97.0, 79.0, 70.0, 39.0, 19.0, 12.0, 11.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0166237354278564, -0.9833853840827942, -0.9501470327377319, -0.9169086813926697, -0.8836703300476074, -0.8504320383071899, -0.8171936869621277, -0.7839553356170654, -0.7507169842720032, -0.7174786329269409, -0.6842402815818787, -0.6510019302368164, -0.6177636384963989, -0.5845252275466919, -0.5512869358062744, -0.5180485844612122, -0.4848102331161499, -0.45157188177108765, -0.4183335304260254, -0.3850952088832855, -0.35185685753822327, -0.318618506193161, -0.28538018465042114, -0.2521418333053589, -0.21890348196029663, -0.18566513061523438, -0.1524267941713333, -0.11918845027685165, -0.08595010638237, -0.05271175503730774, -0.019473418593406677, 0.013764917850494385, 0.04700326919555664, 0.0802416130900383, 0.11347995698451996, 0.14671829342842102, 0.17995664477348328, 0.21319499611854553, 0.2464333325624466, 0.27967166900634766, 0.3129100203514099, 0.34614837169647217, 0.3793867230415344, 0.4126250445842743, 0.44586339592933655, 0.4791017472743988, 0.5123400688171387, 0.5455784201622009, 0.5788167715072632, 0.6120551228523254, 0.6452934741973877, 0.67853182554245, 0.7117701768875122, 0.7450084686279297, 0.7782468199729919, 0.8114851713180542, 0.8447235226631165, 0.8779618740081787, 0.911200225353241, 0.9444385766983032, 0.9776768684387207, 1.0109152793884277, 1.0441535711288452, 1.0773918628692627, 1.1106302738189697]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 4.0, 6.0, 5.0, 17.0, 19.0, 28.0, 43.0, 48.0, 76.0, 133.0, 222.0, 512.0, 1401.0, 9983.0, 553018.0, 471335.0, 9300.0, 1353.0, 466.0, 247.0, 111.0, 71.0, 53.0, 31.0, 28.0, 23.0, 10.0, 1.0, 9.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.25018310546875, -1.2122802734375, -1.17437744140625, -1.136474609375, -1.09857177734375, -1.0606689453125, -1.02276611328125, -0.98486328125, -0.94696044921875, -0.9090576171875, -0.87115478515625, -0.833251953125, -0.79534912109375, -0.7574462890625, -0.71954345703125, -0.681640625, -0.64373779296875, -0.6058349609375, -0.56793212890625, -0.530029296875, -0.49212646484375, -0.4542236328125, -0.41632080078125, -0.37841796875, -0.34051513671875, -0.3026123046875, -0.26470947265625, -0.226806640625, -0.18890380859375, -0.1510009765625, -0.11309814453125, -0.0751953125, -0.03729248046875, 0.0006103515625, 0.03851318359375, 0.076416015625, 0.11431884765625, 0.1522216796875, 0.19012451171875, 0.22802734375, 0.26593017578125, 0.3038330078125, 0.34173583984375, 0.379638671875, 0.41754150390625, 0.4554443359375, 0.49334716796875, 0.53125, 0.56915283203125, 0.6070556640625, 0.64495849609375, 0.682861328125, 0.72076416015625, 0.7586669921875, 0.79656982421875, 0.83447265625, 0.87237548828125, 0.9102783203125, 0.94818115234375, 0.986083984375, 1.02398681640625, 1.0618896484375, 1.09979248046875, 1.1376953125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 13.0, 21.0, 40.0, 81.0, 112.0, 150.0, 162.0, 148.0, 114.0, 76.0, 50.0, 25.0, 11.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0853271484375, -0.08233928680419922, -0.07935142517089844, -0.07636356353759766, -0.07337570190429688, -0.0703878402709961, -0.06739997863769531, -0.06441211700439453, -0.06142425537109375, -0.05843639373779297, -0.05544853210449219, -0.052460670471191406, -0.049472808837890625, -0.046484947204589844, -0.04349708557128906, -0.04050922393798828, -0.0375213623046875, -0.03453350067138672, -0.03154563903808594, -0.028557777404785156, -0.025569915771484375, -0.022582054138183594, -0.019594192504882812, -0.01660633087158203, -0.01361846923828125, -0.010630607604980469, -0.0076427459716796875, -0.004654884338378906, -0.001667022705078125, 0.0013208389282226562, 0.0043087005615234375, 0.007296562194824219, 0.010284423828125, 0.013272285461425781, 0.016260147094726562, 0.019248008728027344, 0.022235870361328125, 0.025223731994628906, 0.028211593627929688, 0.03119945526123047, 0.03418731689453125, 0.03717517852783203, 0.04016304016113281, 0.043150901794433594, 0.046138763427734375, 0.049126625061035156, 0.05211448669433594, 0.05510234832763672, 0.0580902099609375, 0.06107807159423828, 0.06406593322753906, 0.06705379486083984, 0.07004165649414062, 0.0730295181274414, 0.07601737976074219, 0.07900524139404297, 0.08199310302734375, 0.08498096466064453, 0.08796882629394531, 0.0909566879272461, 0.09394454956054688, 0.09693241119384766, 0.09992027282714844, 0.10290813446044922, 0.10589599609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 7.0, 15.0, 10.0, 33.0, 43.0, 70.0, 162.0, 283.0, 576.0, 1363.0, 3214.0, 8717.0, 26292.0, 93749.0, 410572.0, 379647.0, 85720.0, 24318.0, 8183.0, 3064.0, 1307.0, 575.0, 288.0, 141.0, 83.0, 61.0, 26.0, 15.0, 9.0, 5.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.250732421875, -0.24335098266601562, -0.23596954345703125, -0.22858810424804688, -0.2212066650390625, -0.21382522583007812, -0.20644378662109375, -0.19906234741210938, -0.191680908203125, -0.18429946899414062, -0.17691802978515625, -0.16953659057617188, -0.1621551513671875, -0.15477371215820312, -0.14739227294921875, -0.14001083374023438, -0.13262939453125, -0.12524795532226562, -0.11786651611328125, -0.11048507690429688, -0.1031036376953125, -0.09572219848632812, -0.08834075927734375, -0.08095932006835938, -0.073577880859375, -0.06619644165039062, -0.05881500244140625, -0.051433563232421875, -0.0440521240234375, -0.036670684814453125, -0.02928924560546875, -0.021907806396484375, -0.0145263671875, -0.007144927978515625, 0.00023651123046875, 0.007617950439453125, 0.0149993896484375, 0.022380828857421875, 0.02976226806640625, 0.037143707275390625, 0.044525146484375, 0.051906585693359375, 0.05928802490234375, 0.06666946411132812, 0.0740509033203125, 0.08143234252929688, 0.08881378173828125, 0.09619522094726562, 0.10357666015625, 0.11095809936523438, 0.11833953857421875, 0.12572097778320312, 0.1331024169921875, 0.14048385620117188, 0.14786529541015625, 0.15524673461914062, 0.162628173828125, 0.17000961303710938, 0.17739105224609375, 0.18477249145507812, 0.1921539306640625, 0.19953536987304688, 0.20691680908203125, 0.21429824829101562, 0.2216796875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 5.0, 6.0, 5.0, 7.0, 12.0, 7.0, 17.0, 12.0, 15.0, 17.0, 28.0, 35.0, 37.0, 44.0, 51.0, 58.0, 58.0, 47.0, 61.0, 53.0, 52.0, 48.0, 52.0, 39.0, 41.0, 30.0, 28.0, 29.0, 25.0, 19.0, 21.0, 14.0, 12.0, 6.0, 3.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1612548828125, -0.1566295623779297, -0.15200424194335938, -0.14737892150878906, -0.14275360107421875, -0.13812828063964844, -0.13350296020507812, -0.1288776397705078, -0.1242523193359375, -0.11962699890136719, -0.11500167846679688, -0.11037635803222656, -0.10575103759765625, -0.10112571716308594, -0.09650039672851562, -0.09187507629394531, -0.087249755859375, -0.08262443542480469, -0.07799911499023438, -0.07337379455566406, -0.06874847412109375, -0.06412315368652344, -0.059497833251953125, -0.05487251281738281, -0.0502471923828125, -0.04562187194824219, -0.040996551513671875, -0.03637123107910156, -0.03174591064453125, -0.027120590209960938, -0.022495269775390625, -0.017869949340820312, -0.01324462890625, -0.008619308471679688, -0.003993988037109375, 0.0006313323974609375, 0.00525665283203125, 0.009881973266601562, 0.014507293701171875, 0.019132614135742188, 0.0237579345703125, 0.028383255004882812, 0.033008575439453125, 0.03763389587402344, 0.04225921630859375, 0.04688453674316406, 0.051509857177734375, 0.05613517761230469, 0.060760498046875, 0.06538581848144531, 0.07001113891601562, 0.07463645935058594, 0.07926177978515625, 0.08388710021972656, 0.08851242065429688, 0.09313774108886719, 0.0977630615234375, 0.10238838195800781, 0.10701370239257812, 0.11163902282714844, 0.11626434326171875, 0.12088966369628906, 0.12551498413085938, 0.1301403045654297, 0.134765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 4.0, 10.0, 16.0, 36.0, 73.0, 119.0, 259.0, 551.0, 1349.0, 3880.0, 14379.0, 84369.0, 643276.0, 257950.0, 31253.0, 7261.0, 2202.0, 839.0, 368.0, 178.0, 91.0, 33.0, 25.0, 18.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.150634765625, -0.1462993621826172, -0.14196395874023438, -0.13762855529785156, -0.13329315185546875, -0.12895774841308594, -0.12462234497070312, -0.12028694152832031, -0.1159515380859375, -0.11161613464355469, -0.10728073120117188, -0.10294532775878906, -0.09860992431640625, -0.09427452087402344, -0.08993911743164062, -0.08560371398925781, -0.081268310546875, -0.07693290710449219, -0.07259750366210938, -0.06826210021972656, -0.06392669677734375, -0.05959129333496094, -0.055255889892578125, -0.05092048645019531, -0.0465850830078125, -0.04224967956542969, -0.037914276123046875, -0.03357887268066406, -0.02924346923828125, -0.024908065795898438, -0.020572662353515625, -0.016237258911132812, -0.01190185546875, -0.0075664520263671875, -0.003231048583984375, 0.0011043548583984375, 0.00543975830078125, 0.009775161743164062, 0.014110565185546875, 0.018445968627929688, 0.0227813720703125, 0.027116775512695312, 0.031452178955078125, 0.03578758239746094, 0.04012298583984375, 0.04445838928222656, 0.048793792724609375, 0.05312919616699219, 0.057464599609375, 0.06180000305175781, 0.06613540649414062, 0.07047080993652344, 0.07480621337890625, 0.07914161682128906, 0.08347702026367188, 0.08781242370605469, 0.0921478271484375, 0.09648323059082031, 0.10081863403320312, 0.10515403747558594, 0.10948944091796875, 0.11382484436035156, 0.11816024780273438, 0.12249565124511719, 0.1268310546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 14.0, 6.0, 11.0, 20.0, 13.0, 19.0, 26.0, 32.0, 48.0, 69.0, 96.0, 119.0, 139.0, 76.0, 88.0, 52.0, 36.0, 27.0, 25.0, 23.0, 11.0, 7.0, 13.0, 4.0, 7.0, 10.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001958608627319336, -0.0001884009689092636, -0.00018094107508659363, -0.00017348118126392365, -0.00016602128744125366, -0.00015856139361858368, -0.0001511014997959137, -0.0001436416059732437, -0.00013618171215057373, -0.00012872181832790375, -0.00012126192450523376, -0.00011380203068256378, -0.0001063421368598938, -9.888224303722382e-05, -9.142234921455383e-05, -8.396245539188385e-05, -7.650256156921387e-05, -6.904266774654388e-05, -6.15827739238739e-05, -5.412288010120392e-05, -4.6662986278533936e-05, -3.920309245586395e-05, -3.174319863319397e-05, -2.4283304810523987e-05, -1.6823410987854004e-05, -9.363517165184021e-06, -1.903623342514038e-06, 5.556270480155945e-06, 1.3016164302825928e-05, 2.047605812549591e-05, 2.7935951948165894e-05, 3.5395845770835876e-05, 4.285573959350586e-05, 5.031563341617584e-05, 5.7775527238845825e-05, 6.523542106151581e-05, 7.269531488418579e-05, 8.015520870685577e-05, 8.761510252952576e-05, 9.507499635219574e-05, 0.00010253489017486572, 0.0001099947839975357, 0.00011745467782020569, 0.00012491457164287567, 0.00013237446546554565, 0.00013983435928821564, 0.00014729425311088562, 0.0001547541469335556, 0.00016221404075622559, 0.00016967393457889557, 0.00017713382840156555, 0.00018459372222423553, 0.00019205361604690552, 0.0001995135098695755, 0.00020697340369224548, 0.00021443329751491547, 0.00022189319133758545, 0.00022935308516025543, 0.00023681297898292542, 0.0002442728728055954, 0.0002517327666282654, 0.00025919266045093536, 0.00026665255427360535, 0.00027411244809627533, 0.0002815723419189453]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 4.0, 0.0, 7.0, 10.0, 8.0, 20.0, 25.0, 33.0, 76.0, 137.0, 201.0, 346.0, 699.0, 1447.0, 3282.0, 8676.0, 25949.0, 97654.0, 414300.0, 372398.0, 86367.0, 23221.0, 7688.0, 3110.0, 1403.0, 678.0, 321.0, 201.0, 99.0, 75.0, 43.0, 17.0, 17.0, 13.0, 7.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.078369140625, -0.07566261291503906, -0.07295608520507812, -0.07024955749511719, -0.06754302978515625, -0.06483650207519531, -0.062129974365234375, -0.05942344665527344, -0.0567169189453125, -0.05401039123535156, -0.051303863525390625, -0.04859733581542969, -0.04589080810546875, -0.04318428039550781, -0.040477752685546875, -0.03777122497558594, -0.035064697265625, -0.03235816955566406, -0.029651641845703125, -0.026945114135742188, -0.02423858642578125, -0.021532058715820312, -0.018825531005859375, -0.016119003295898438, -0.0134124755859375, -0.010705947875976562, -0.007999420166015625, -0.0052928924560546875, -0.00258636474609375, 0.0001201629638671875, 0.002826690673828125, 0.0055332183837890625, 0.00823974609375, 0.010946273803710938, 0.013652801513671875, 0.016359329223632812, 0.01906585693359375, 0.021772384643554688, 0.024478912353515625, 0.027185440063476562, 0.0298919677734375, 0.03259849548339844, 0.035305023193359375, 0.03801155090332031, 0.04071807861328125, 0.04342460632324219, 0.046131134033203125, 0.04883766174316406, 0.051544189453125, 0.05425071716308594, 0.056957244873046875, 0.05966377258300781, 0.06237030029296875, 0.06507682800292969, 0.06778335571289062, 0.07048988342285156, 0.0731964111328125, 0.07590293884277344, 0.07860946655273438, 0.08131599426269531, 0.08402252197265625, 0.08672904968261719, 0.08943557739257812, 0.09214210510253906, 0.0948486328125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 2.0, 9.0, 6.0, 5.0, 4.0, 14.0, 9.0, 17.0, 13.0, 18.0, 30.0, 30.0, 33.0, 36.0, 46.0, 60.0, 59.0, 74.0, 58.0, 68.0, 53.0, 47.0, 53.0, 44.0, 37.0, 24.0, 25.0, 19.0, 18.0, 10.0, 17.0, 10.0, 12.0, 12.0, 5.0, 6.0, 1.0, 4.0, 5.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041259765625, -0.039856910705566406, -0.03845405578613281, -0.03705120086669922, -0.035648345947265625, -0.03424549102783203, -0.03284263610839844, -0.031439781188964844, -0.03003692626953125, -0.028634071350097656, -0.027231216430664062, -0.02582836151123047, -0.024425506591796875, -0.02302265167236328, -0.021619796752929688, -0.020216941833496094, -0.0188140869140625, -0.017411231994628906, -0.016008377075195312, -0.014605522155761719, -0.013202667236328125, -0.011799812316894531, -0.010396957397460938, -0.008994102478027344, -0.00759124755859375, -0.006188392639160156, -0.0047855377197265625, -0.0033826828002929688, -0.001979827880859375, -0.0005769729614257812, 0.0008258819580078125, 0.0022287368774414062, 0.003631591796875, 0.005034446716308594, 0.0064373016357421875, 0.007840156555175781, 0.009243011474609375, 0.010645866394042969, 0.012048721313476562, 0.013451576232910156, 0.01485443115234375, 0.016257286071777344, 0.017660140991210938, 0.01906299591064453, 0.020465850830078125, 0.02186870574951172, 0.023271560668945312, 0.024674415588378906, 0.0260772705078125, 0.027480125427246094, 0.028882980346679688, 0.03028583526611328, 0.031688690185546875, 0.03309154510498047, 0.03449440002441406, 0.035897254943847656, 0.03730010986328125, 0.038702964782714844, 0.04010581970214844, 0.04150867462158203, 0.042911529541015625, 0.04431438446044922, 0.04571723937988281, 0.047120094299316406, 0.04852294921875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 4.0, 10.0, 10.0, 21.0, 53.0, 57.0, 113.0, 171.0, 178.0, 154.0, 126.0, 52.0, 21.0, 20.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7017371654510498, -1.6440130472183228, -1.5862889289855957, -1.5285649299621582, -1.4708408117294312, -1.413116693496704, -1.3553926944732666, -1.2976685762405396, -1.2399444580078125, -1.1822203397750854, -1.1244962215423584, -1.066772222518921, -1.0090481042861938, -0.9513239860534668, -0.8935999274253845, -0.8358758687973022, -0.7781517505645752, -0.7204276323318481, -0.6627035737037659, -0.6049795150756836, -0.5472553968429565, -0.4895313084125519, -0.4318072199821472, -0.37408313155174255, -0.3163590431213379, -0.2586349546909332, -0.20091086626052856, -0.1431867778301239, -0.08546268939971924, -0.027738600969314575, 0.029985487461090088, 0.08770957589149475, 0.14543354511260986, 0.20315763354301453, 0.2608817219734192, 0.31860581040382385, 0.3763298988342285, 0.4340539872646332, 0.49177807569503784, 0.5495021343231201, 0.6072262525558472, 0.6649503707885742, 0.7226744294166565, 0.7803984880447388, 0.8381226062774658, 0.8958467245101929, 0.9535707831382751, 1.0112948417663574, 1.0690189599990845, 1.1267430782318115, 1.184467077255249, 1.242191195487976, 1.2999153137207031, 1.3576394319534302, 1.4153635501861572, 1.4730875492095947, 1.5308116674423218, 1.5885357856750488, 1.6462597846984863, 1.7039839029312134, 1.7617080211639404, 1.8194321393966675, 1.8771562576293945, 1.934880256652832, 1.992604374885559]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 15.0, 10.0, 7.0, 11.0, 17.0, 25.0, 23.0, 21.0, 31.0, 40.0, 43.0, 32.0, 43.0, 66.0, 49.0, 61.0, 46.0, 49.0, 45.0, 51.0, 40.0, 39.0, 37.0, 34.0, 29.0, 28.0, 23.0, 28.0, 12.0, 17.0, 10.0, 4.0, 5.0, 7.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8695508241653442, -0.8437083959579468, -0.8178660273551941, -0.7920236587524414, -0.766181230545044, -0.7403388023376465, -0.7144964337348938, -0.6886540651321411, -0.6628116369247437, -0.6369692087173462, -0.6111268401145935, -0.5852844715118408, -0.5594420433044434, -0.5335996150970459, -0.5077572464942932, -0.48191484808921814, -0.45607244968414307, -0.430230051279068, -0.4043876528739929, -0.37854525446891785, -0.3527028560638428, -0.3268604576587677, -0.3010180592536926, -0.27517566084861755, -0.24933326244354248, -0.2234908640384674, -0.19764846563339233, -0.17180606722831726, -0.1459636688232422, -0.12012127041816711, -0.09427887201309204, -0.06843647360801697, -0.04259401559829712, -0.016751617193222046, 0.009090781211853027, 0.0349331796169281, 0.060775578022003174, 0.08661797642707825, 0.11246037483215332, 0.1383027732372284, 0.16414517164230347, 0.18998757004737854, 0.2158299684524536, 0.2416723668575287, 0.26751476526260376, 0.29335716366767883, 0.3191995620727539, 0.345041960477829, 0.37088435888290405, 0.3967267572879791, 0.4225691556930542, 0.4484115540981293, 0.47425395250320435, 0.500096321105957, 0.5259387493133545, 0.551781177520752, 0.5776235461235046, 0.6034659147262573, 0.6293083429336548, 0.6551507711410522, 0.6809931397438049, 0.7068355083465576, 0.7326779365539551, 0.7585203647613525, 0.7843627333641052]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 10.0, 7.0, 5.0, 21.0, 30.0, 55.0, 161.0, 503.0, 2045.0, 97100.0, 4089576.0, 3500.0, 768.0, 239.0, 111.0, 48.0, 37.0, 23.0, 13.0, 9.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8876953125, -1.8250274658203125, -1.762359619140625, -1.6996917724609375, -1.63702392578125, -1.5743560791015625, -1.511688232421875, -1.4490203857421875, -1.3863525390625, -1.3236846923828125, -1.261016845703125, -1.1983489990234375, -1.13568115234375, -1.0730133056640625, -1.010345458984375, -0.9476776123046875, -0.885009765625, -0.8223419189453125, -0.759674072265625, -0.6970062255859375, -0.63433837890625, -0.5716705322265625, -0.509002685546875, -0.4463348388671875, -0.3836669921875, -0.3209991455078125, -0.258331298828125, -0.1956634521484375, -0.13299560546875, -0.0703277587890625, -0.007659912109375, 0.0550079345703125, 0.11767578125, 0.1803436279296875, 0.243011474609375, 0.3056793212890625, 0.36834716796875, 0.4310150146484375, 0.493682861328125, 0.5563507080078125, 0.6190185546875, 0.6816864013671875, 0.744354248046875, 0.8070220947265625, 0.86968994140625, 0.9323577880859375, 0.995025634765625, 1.0576934814453125, 1.120361328125, 1.1830291748046875, 1.245697021484375, 1.3083648681640625, 1.37103271484375, 1.4337005615234375, 1.496368408203125, 1.5590362548828125, 1.6217041015625, 1.6843719482421875, 1.747039794921875, 1.8097076416015625, 1.87237548828125, 1.9350433349609375, 1.997711181640625, 2.0603790283203125, 2.123046875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 17.0, 10.0, 39.0, 60.0, 85.0, 104.0, 124.0, 169.0, 140.0, 93.0, 74.0, 46.0, 30.0, 7.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.077392578125, -0.07455921173095703, -0.07172584533691406, -0.0688924789428711, -0.06605911254882812, -0.06322574615478516, -0.06039237976074219, -0.05755901336669922, -0.05472564697265625, -0.05189228057861328, -0.04905891418457031, -0.046225547790527344, -0.043392181396484375, -0.040558815002441406, -0.03772544860839844, -0.03489208221435547, -0.0320587158203125, -0.02922534942626953, -0.026391983032226562, -0.023558616638183594, -0.020725250244140625, -0.017891883850097656, -0.015058517456054688, -0.012225151062011719, -0.00939178466796875, -0.006558418273925781, -0.0037250518798828125, -0.0008916854858398438, 0.001941680908203125, 0.004775047302246094, 0.0076084136962890625, 0.010441780090332031, 0.013275146484375, 0.01610851287841797, 0.018941879272460938, 0.021775245666503906, 0.024608612060546875, 0.027441978454589844, 0.030275344848632812, 0.03310871124267578, 0.03594207763671875, 0.03877544403076172, 0.04160881042480469, 0.044442176818847656, 0.047275543212890625, 0.050108909606933594, 0.05294227600097656, 0.05577564239501953, 0.0586090087890625, 0.06144237518310547, 0.06427574157714844, 0.0671091079711914, 0.06994247436523438, 0.07277584075927734, 0.07560920715332031, 0.07844257354736328, 0.08127593994140625, 0.08410930633544922, 0.08694267272949219, 0.08977603912353516, 0.09260940551757812, 0.0954427719116211, 0.09827613830566406, 0.10110950469970703, 0.10394287109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 9.0, 5.0, 10.0, 18.0, 26.0, 53.0, 92.0, 175.0, 466.0, 1133.0, 3034.0, 9245.0, 48019.0, 3871320.0, 234392.0, 18511.0, 4708.0, 1658.0, 669.0, 355.0, 152.0, 100.0, 50.0, 39.0, 15.0, 10.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.394287109375, -0.3776893615722656, -0.36109161376953125, -0.3444938659667969, -0.3278961181640625, -0.3112983703613281, -0.29470062255859375, -0.2781028747558594, -0.261505126953125, -0.24490737915039062, -0.22830963134765625, -0.21171188354492188, -0.1951141357421875, -0.17851638793945312, -0.16191864013671875, -0.14532089233398438, -0.12872314453125, -0.11212539672851562, -0.09552764892578125, -0.07892990112304688, -0.0623321533203125, -0.045734405517578125, -0.02913665771484375, -0.012538909912109375, 0.004058837890625, 0.020656585693359375, 0.03725433349609375, 0.053852081298828125, 0.0704498291015625, 0.08704757690429688, 0.10364532470703125, 0.12024307250976562, 0.1368408203125, 0.15343856811523438, 0.17003631591796875, 0.18663406372070312, 0.2032318115234375, 0.21982955932617188, 0.23642730712890625, 0.2530250549316406, 0.269622802734375, 0.2862205505371094, 0.30281829833984375, 0.3194160461425781, 0.3360137939453125, 0.3526115417480469, 0.36920928955078125, 0.3858070373535156, 0.40240478515625, 0.4190025329589844, 0.43560028076171875, 0.4521980285644531, 0.4687957763671875, 0.4853935241699219, 0.5019912719726562, 0.5185890197753906, 0.535186767578125, 0.5517845153808594, 0.5683822631835938, 0.5849800109863281, 0.6015777587890625, 0.6181755065917969, 0.6347732543945312, 0.6513710021972656, 0.66796875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 1.0, 8.0, 10.0, 12.0, 18.0, 35.0, 40.0, 97.0, 293.0, 2457.0, 781.0, 160.0, 73.0, 35.0, 17.0, 20.0, 2.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09661865234375, -0.0911874771118164, -0.08575630187988281, -0.08032512664794922, -0.07489395141601562, -0.06946277618408203, -0.06403160095214844, -0.058600425720214844, -0.05316925048828125, -0.047738075256347656, -0.04230690002441406, -0.03687572479248047, -0.031444549560546875, -0.02601337432861328, -0.020582199096679688, -0.015151023864746094, -0.0097198486328125, -0.004288673400878906, 0.0011425018310546875, 0.006573677062988281, 0.012004852294921875, 0.01743602752685547, 0.022867202758789062, 0.028298377990722656, 0.03372955322265625, 0.039160728454589844, 0.04459190368652344, 0.05002307891845703, 0.055454254150390625, 0.06088542938232422, 0.06631660461425781, 0.0717477798461914, 0.077178955078125, 0.0826101303100586, 0.08804130554199219, 0.09347248077392578, 0.09890365600585938, 0.10433483123779297, 0.10976600646972656, 0.11519718170166016, 0.12062835693359375, 0.12605953216552734, 0.13149070739746094, 0.13692188262939453, 0.14235305786132812, 0.14778423309326172, 0.1532154083251953, 0.1586465835571289, 0.1640777587890625, 0.1695089340209961, 0.1749401092529297, 0.18037128448486328, 0.18580245971679688, 0.19123363494873047, 0.19666481018066406, 0.20209598541259766, 0.20752716064453125, 0.21295833587646484, 0.21838951110839844, 0.22382068634033203, 0.22925186157226562, 0.23468303680419922, 0.2401142120361328, 0.2455453872680664, 0.2509765625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 8.0, 11.0, 22.0, 26.0, 42.0, 121.0, 191.0, 298.0, 169.0, 68.0, 36.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.987760066986084, -1.9468356370925903, -1.9059113264083862, -1.8649868965148926, -1.8240625858306885, -1.7831381559371948, -1.7422138452529907, -1.701289415359497, -1.660365104675293, -1.6194406747817993, -1.5785163640975952, -1.5375919342041016, -1.4966676235198975, -1.4557431936264038, -1.4148188829421997, -1.373894453048706, -1.3329700231552124, -1.2920455932617188, -1.2511212825775146, -1.210196852684021, -1.169272541999817, -1.1283481121063232, -1.0874238014221191, -1.0464993715286255, -1.0055749416351318, -0.964650571346283, -0.9237262010574341, -0.8828018307685852, -0.8418774604797363, -0.8009530305862427, -0.7600286602973938, -0.7191042900085449, -0.6781799793243408, -0.6372556090354919, -0.5963312387466431, -0.5554068684577942, -0.5144824981689453, -0.47355809807777405, -0.4326336979866028, -0.3917093276977539, -0.35078495740890503, -0.30986058712005615, -0.2689362168312073, -0.228011816740036, -0.18708744645118713, -0.14616307616233826, -0.10523869097232819, -0.06431430578231812, -0.02338993549346924, 0.017534442245960236, 0.05845881998538971, 0.09938319772481918, 0.14030757546424866, 0.18123194575309753, 0.2221563309431076, 0.2630807161331177, 0.30400508642196655, 0.34492945671081543, 0.3858538269996643, 0.42677822709083557, 0.46770259737968445, 0.5086269378662109, 0.5495513677597046, 0.5904757380485535, 0.6314001083374023]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 8.0, 8.0, 11.0, 18.0, 12.0, 31.0, 20.0, 33.0, 34.0, 36.0, 36.0, 36.0, 47.0, 44.0, 49.0, 75.0, 65.0, 48.0, 55.0, 39.0, 37.0, 34.0, 31.0, 39.0, 31.0, 24.0, 20.0, 13.0, 13.0, 9.0, 12.0, 7.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.45119738578796387, -0.43792837858200073, -0.4246593713760376, -0.41139036417007446, -0.39812135696411133, -0.3848523497581482, -0.37158337235450745, -0.3583143651485443, -0.3450453579425812, -0.33177635073661804, -0.3185073435306549, -0.3052383363246918, -0.291969358921051, -0.2787003517150879, -0.26543134450912476, -0.2521623373031616, -0.2388933300971985, -0.22562432289123535, -0.21235531568527222, -0.19908632338047028, -0.18581731617450714, -0.172548308968544, -0.15927931666374207, -0.14601030945777893, -0.1327413022518158, -0.11947229504585266, -0.10620329529047012, -0.09293429553508759, -0.07966528832912445, -0.06639628112316132, -0.05312728136777878, -0.03985828161239624, -0.026589274406433105, -0.01332027092576027, -5.126744508743286e-05, 0.013217736035585403, 0.02648673951625824, 0.039755746722221375, 0.05302474647760391, 0.06629374623298645, 0.07956275343894958, 0.09283176064491272, 0.10610076040029526, 0.1193697601556778, 0.13263876736164093, 0.14590777456760406, 0.159176766872406, 0.17244577407836914, 0.18571478128433228, 0.1989837884902954, 0.21225279569625854, 0.22552178800106049, 0.23879079520702362, 0.25205981731414795, 0.2653287947177887, 0.27859780192375183, 0.29186680912971497, 0.3051358163356781, 0.31840482354164124, 0.33167383074760437, 0.3449428081512451, 0.35821181535720825, 0.3714808225631714, 0.3847498297691345, 0.39801883697509766]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 3.0, 6.0, 7.0, 8.0, 12.0, 19.0, 24.0, 44.0, 54.0, 88.0, 116.0, 192.0, 377.0, 829.0, 2602.0, 13528.0, 158294.0, 782399.0, 78157.0, 8403.0, 1869.0, 659.0, 296.0, 188.0, 133.0, 63.0, 46.0, 37.0, 28.0, 24.0, 12.0, 7.0, 6.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.6748046875, -0.653961181640625, -0.63311767578125, -0.612274169921875, -0.5914306640625, -0.570587158203125, -0.54974365234375, -0.528900146484375, -0.508056640625, -0.487213134765625, -0.46636962890625, -0.445526123046875, -0.4246826171875, -0.403839111328125, -0.38299560546875, -0.362152099609375, -0.34130859375, -0.320465087890625, -0.29962158203125, -0.278778076171875, -0.2579345703125, -0.237091064453125, -0.21624755859375, -0.195404052734375, -0.174560546875, -0.153717041015625, -0.13287353515625, -0.112030029296875, -0.0911865234375, -0.070343017578125, -0.04949951171875, -0.028656005859375, -0.0078125, 0.013031005859375, 0.03387451171875, 0.054718017578125, 0.0755615234375, 0.096405029296875, 0.11724853515625, 0.138092041015625, 0.158935546875, 0.179779052734375, 0.20062255859375, 0.221466064453125, 0.2423095703125, 0.263153076171875, 0.28399658203125, 0.304840087890625, 0.32568359375, 0.346527099609375, 0.36737060546875, 0.388214111328125, 0.4090576171875, 0.429901123046875, 0.45074462890625, 0.471588134765625, 0.492431640625, 0.513275146484375, 0.53411865234375, 0.554962158203125, 0.5758056640625, 0.596649169921875, 0.61749267578125, 0.638336181640625, 0.6591796875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 11.0, 9.0, 22.0, 32.0, 71.0, 100.0, 132.0, 119.0, 137.0, 126.0, 102.0, 50.0, 52.0, 27.0, 14.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0760498046875, -0.07301712036132812, -0.06998443603515625, -0.06695175170898438, -0.0639190673828125, -0.060886383056640625, -0.05785369873046875, -0.054821014404296875, -0.051788330078125, -0.048755645751953125, -0.04572296142578125, -0.042690277099609375, -0.0396575927734375, -0.036624908447265625, -0.03359222412109375, -0.030559539794921875, -0.02752685546875, -0.024494171142578125, -0.02146148681640625, -0.018428802490234375, -0.0153961181640625, -0.012363433837890625, -0.00933074951171875, -0.006298065185546875, -0.003265380859375, -0.000232696533203125, 0.00279998779296875, 0.005832672119140625, 0.0088653564453125, 0.011898040771484375, 0.01493072509765625, 0.017963409423828125, 0.02099609375, 0.024028778076171875, 0.02706146240234375, 0.030094146728515625, 0.0331268310546875, 0.036159515380859375, 0.03919219970703125, 0.042224884033203125, 0.045257568359375, 0.048290252685546875, 0.05132293701171875, 0.054355621337890625, 0.0573883056640625, 0.060420989990234375, 0.06345367431640625, 0.06648635864257812, 0.06951904296875, 0.07255172729492188, 0.07558441162109375, 0.07861709594726562, 0.0816497802734375, 0.08468246459960938, 0.08771514892578125, 0.09074783325195312, 0.093780517578125, 0.09681320190429688, 0.09984588623046875, 0.10287857055664062, 0.1059112548828125, 0.10894393920898438, 0.11197662353515625, 0.11500930786132812, 0.1180419921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 14.0, 8.0, 15.0, 20.0, 29.0, 38.0, 60.0, 78.0, 125.0, 228.0, 434.0, 820.0, 1728.0, 4358.0, 11944.0, 40976.0, 213336.0, 597279.0, 132831.0, 28795.0, 9049.0, 3266.0, 1415.0, 718.0, 370.0, 212.0, 124.0, 65.0, 50.0, 44.0, 28.0, 20.0, 19.0, 16.0, 5.0, 10.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0], "bins": [-0.388916015625, -0.37903785705566406, -0.3691596984863281, -0.3592815399169922, -0.34940338134765625, -0.3395252227783203, -0.3296470642089844, -0.31976890563964844, -0.3098907470703125, -0.30001258850097656, -0.2901344299316406, -0.2802562713623047, -0.27037811279296875, -0.2604999542236328, -0.2506217956542969, -0.24074363708496094, -0.230865478515625, -0.22098731994628906, -0.21110916137695312, -0.2012310028076172, -0.19135284423828125, -0.1814746856689453, -0.17159652709960938, -0.16171836853027344, -0.1518402099609375, -0.14196205139160156, -0.13208389282226562, -0.12220573425292969, -0.11232757568359375, -0.10244941711425781, -0.09257125854492188, -0.08269309997558594, -0.07281494140625, -0.06293678283691406, -0.053058624267578125, -0.04318046569824219, -0.03330230712890625, -0.023424148559570312, -0.013545989990234375, -0.0036678314208984375, 0.0062103271484375, 0.016088485717773438, 0.025966644287109375, 0.03584480285644531, 0.04572296142578125, 0.05560111999511719, 0.06547927856445312, 0.07535743713378906, 0.085235595703125, 0.09511375427246094, 0.10499191284179688, 0.11487007141113281, 0.12474822998046875, 0.1346263885498047, 0.14450454711914062, 0.15438270568847656, 0.1642608642578125, 0.17413902282714844, 0.18401718139648438, 0.1938953399658203, 0.20377349853515625, 0.2136516571044922, 0.22352981567382812, 0.23340797424316406, 0.2432861328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 8.0, 7.0, 12.0, 3.0, 17.0, 10.0, 15.0, 17.0, 20.0, 17.0, 24.0, 40.0, 37.0, 36.0, 45.0, 43.0, 57.0, 47.0, 57.0, 55.0, 59.0, 61.0, 49.0, 47.0, 39.0, 27.0, 21.0, 26.0, 21.0, 14.0, 17.0, 14.0, 7.0, 8.0, 7.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.2333984375, -0.227447509765625, -0.22149658203125, -0.215545654296875, -0.2095947265625, -0.203643798828125, -0.19769287109375, -0.191741943359375, -0.185791015625, -0.179840087890625, -0.17388916015625, -0.167938232421875, -0.1619873046875, -0.156036376953125, -0.15008544921875, -0.144134521484375, -0.13818359375, -0.132232666015625, -0.12628173828125, -0.120330810546875, -0.1143798828125, -0.108428955078125, -0.10247802734375, -0.096527099609375, -0.090576171875, -0.084625244140625, -0.07867431640625, -0.072723388671875, -0.0667724609375, -0.060821533203125, -0.05487060546875, -0.048919677734375, -0.04296875, -0.037017822265625, -0.03106689453125, -0.025115966796875, -0.0191650390625, -0.013214111328125, -0.00726318359375, -0.001312255859375, 0.004638671875, 0.010589599609375, 0.01654052734375, 0.022491455078125, 0.0284423828125, 0.034393310546875, 0.04034423828125, 0.046295166015625, 0.05224609375, 0.058197021484375, 0.06414794921875, 0.070098876953125, 0.0760498046875, 0.082000732421875, 0.08795166015625, 0.093902587890625, 0.099853515625, 0.105804443359375, 0.11175537109375, 0.117706298828125, 0.1236572265625, 0.129608154296875, 0.13555908203125, 0.141510009765625, 0.1474609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 2.0, 4.0, 2.0, 6.0, 10.0, 14.0, 18.0, 25.0, 38.0, 37.0, 78.0, 130.0, 228.0, 347.0, 552.0, 1000.0, 1679.0, 3358.0, 6831.0, 15343.0, 44412.0, 221437.0, 596931.0, 105985.0, 28066.0, 11000.0, 4990.0, 2575.0, 1413.0, 839.0, 464.0, 284.0, 162.0, 104.0, 75.0, 34.0, 32.0, 13.0, 17.0, 7.0, 6.0, 8.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1612548828125, -0.15593338012695312, -0.15061187744140625, -0.14529037475585938, -0.1399688720703125, -0.13464736938476562, -0.12932586669921875, -0.12400436401367188, -0.118682861328125, -0.11336135864257812, -0.10803985595703125, -0.10271835327148438, -0.0973968505859375, -0.09207534790039062, -0.08675384521484375, -0.08143234252929688, -0.07611083984375, -0.07078933715820312, -0.06546783447265625, -0.060146331787109375, -0.0548248291015625, -0.049503326416015625, -0.04418182373046875, -0.038860321044921875, -0.033538818359375, -0.028217315673828125, -0.02289581298828125, -0.017574310302734375, -0.0122528076171875, -0.006931304931640625, -0.00160980224609375, 0.003711700439453125, 0.009033203125, 0.014354705810546875, 0.01967620849609375, 0.024997711181640625, 0.0303192138671875, 0.035640716552734375, 0.04096221923828125, 0.046283721923828125, 0.051605224609375, 0.056926727294921875, 0.06224822998046875, 0.06756973266601562, 0.0728912353515625, 0.07821273803710938, 0.08353424072265625, 0.08885574340820312, 0.09417724609375, 0.09949874877929688, 0.10482025146484375, 0.11014175415039062, 0.1154632568359375, 0.12078475952148438, 0.12610626220703125, 0.13142776489257812, 0.136749267578125, 0.14207077026367188, 0.14739227294921875, 0.15271377563476562, 0.1580352783203125, 0.16335678100585938, 0.16867828369140625, 0.17399978637695312, 0.1793212890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 3.0, 14.0, 8.0, 11.0, 9.0, 12.0, 16.0, 10.0, 32.0, 21.0, 34.0, 48.0, 70.0, 89.0, 97.0, 95.0, 87.0, 55.0, 56.0, 44.0, 38.0, 23.0, 21.0, 27.0, 13.0, 12.0, 13.0, 12.0, 5.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000164031982421875, -0.00015877559781074524, -0.00015351921319961548, -0.00014826282858848572, -0.00014300644397735596, -0.0001377500593662262, -0.00013249367475509644, -0.00012723729014396667, -0.00012198090553283691, -0.00011672452092170715, -0.00011146813631057739, -0.00010621175169944763, -0.00010095536708831787, -9.569898247718811e-05, -9.044259786605835e-05, -8.518621325492859e-05, -7.992982864379883e-05, -7.467344403266907e-05, -6.94170594215393e-05, -6.416067481040955e-05, -5.8904290199279785e-05, -5.3647905588150024e-05, -4.8391520977020264e-05, -4.31351363658905e-05, -3.787875175476074e-05, -3.262236714363098e-05, -2.736598253250122e-05, -2.210959792137146e-05, -1.68532133102417e-05, -1.1596828699111938e-05, -6.340444087982178e-06, -1.084059476852417e-06, 4.172325134277344e-06, 9.428709745407104e-06, 1.4685094356536865e-05, 1.9941478967666626e-05, 2.5197863578796387e-05, 3.0454248189926147e-05, 3.571063280105591e-05, 4.096701741218567e-05, 4.622340202331543e-05, 5.147978663444519e-05, 5.673617124557495e-05, 6.199255585670471e-05, 6.724894046783447e-05, 7.250532507896423e-05, 7.7761709690094e-05, 8.301809430122375e-05, 8.827447891235352e-05, 9.353086352348328e-05, 9.878724813461304e-05, 0.0001040436327457428, 0.00010930001735687256, 0.00011455640196800232, 0.00011981278657913208, 0.00012506917119026184, 0.0001303255558013916, 0.00013558194041252136, 0.00014083832502365112, 0.00014609470963478088, 0.00015135109424591064, 0.0001566074788570404, 0.00016186386346817017, 0.00016712024807929993, 0.0001723766326904297]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 3.0, 10.0, 10.0, 18.0, 23.0, 28.0, 62.0, 69.0, 141.0, 248.0, 620.0, 1461.0, 4829.0, 22061.0, 236828.0, 730885.0, 39477.0, 8107.0, 2099.0, 786.0, 356.0, 166.0, 94.0, 60.0, 39.0, 18.0, 17.0, 10.0, 4.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.330078125, -0.3191375732421875, -0.308197021484375, -0.2972564697265625, -0.28631591796875, -0.2753753662109375, -0.264434814453125, -0.2534942626953125, -0.2425537109375, -0.2316131591796875, -0.220672607421875, -0.2097320556640625, -0.19879150390625, -0.1878509521484375, -0.176910400390625, -0.1659698486328125, -0.155029296875, -0.1440887451171875, -0.133148193359375, -0.1222076416015625, -0.11126708984375, -0.1003265380859375, -0.089385986328125, -0.0784454345703125, -0.0675048828125, -0.0565643310546875, -0.045623779296875, -0.0346832275390625, -0.02374267578125, -0.0128021240234375, -0.001861572265625, 0.0090789794921875, 0.02001953125, 0.0309600830078125, 0.041900634765625, 0.0528411865234375, 0.06378173828125, 0.0747222900390625, 0.085662841796875, 0.0966033935546875, 0.1075439453125, 0.1184844970703125, 0.129425048828125, 0.1403656005859375, 0.15130615234375, 0.1622467041015625, 0.173187255859375, 0.1841278076171875, 0.195068359375, 0.2060089111328125, 0.216949462890625, 0.2278900146484375, 0.23883056640625, 0.2497711181640625, 0.260711669921875, 0.2716522216796875, 0.2825927734375, 0.2935333251953125, 0.304473876953125, 0.3154144287109375, 0.32635498046875, 0.3372955322265625, 0.348236083984375, 0.3591766357421875, 0.3701171875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 4.0, 8.0, 4.0, 9.0, 11.0, 13.0, 12.0, 22.0, 27.0, 55.0, 57.0, 108.0, 153.0, 151.0, 107.0, 71.0, 37.0, 34.0, 36.0, 7.0, 12.0, 11.0, 7.0, 5.0, 6.0, 5.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.14990234375, -0.14521408081054688, -0.14052581787109375, -0.13583755493164062, -0.1311492919921875, -0.12646102905273438, -0.12177276611328125, -0.11708450317382812, -0.112396240234375, -0.10770797729492188, -0.10301971435546875, -0.09833145141601562, -0.0936431884765625, -0.08895492553710938, -0.08426666259765625, -0.07957839965820312, -0.07489013671875, -0.07020187377929688, -0.06551361083984375, -0.060825347900390625, -0.0561370849609375, -0.051448822021484375, -0.04676055908203125, -0.042072296142578125, -0.037384033203125, -0.032695770263671875, -0.02800750732421875, -0.023319244384765625, -0.0186309814453125, -0.013942718505859375, -0.00925445556640625, -0.004566192626953125, 0.0001220703125, 0.004810333251953125, 0.00949859619140625, 0.014186859130859375, 0.0188751220703125, 0.023563385009765625, 0.02825164794921875, 0.032939910888671875, 0.037628173828125, 0.042316436767578125, 0.04700469970703125, 0.051692962646484375, 0.0563812255859375, 0.061069488525390625, 0.06575775146484375, 0.07044601440429688, 0.07513427734375, 0.07982254028320312, 0.08451080322265625, 0.08919906616210938, 0.0938873291015625, 0.09857559204101562, 0.10326385498046875, 0.10795211791992188, 0.112640380859375, 0.11732864379882812, 0.12201690673828125, 0.12670516967773438, 0.1313934326171875, 0.13608169555664062, 0.14076995849609375, 0.14545822143554688, 0.150146484375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 12.0, 26.0, 44.0, 123.0, 261.0, 278.0, 136.0, 58.0, 37.0, 16.0, 7.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25489616394043, -5.124401569366455, -4.9939069747924805, -4.863412380218506, -4.732917785644531, -4.602423191070557, -4.471928596496582, -4.341434478759766, -4.210939407348633, -4.080444812774658, -3.9499502182006836, -3.819455623626709, -3.6889610290527344, -3.5584664344787598, -3.4279720783233643, -3.2974774837493896, -3.166983127593994, -3.0364885330200195, -2.905993938446045, -2.7754993438720703, -2.6450047492980957, -2.514510154724121, -2.3840157985687256, -2.253521203994751, -2.1230266094207764, -1.9925320148468018, -1.8620374202728271, -1.731542944908142, -1.6010483503341675, -1.4705537557601929, -1.3400592803955078, -1.2095646858215332, -1.0790703296661377, -0.9485757350921631, -0.8180812001228333, -0.6875866651535034, -0.5570920705795288, -0.4265974760055542, -0.29610294103622437, -0.16560840606689453, -0.03511381149291992, 0.0953807532787323, 0.22587531805038452, 0.35636988282203674, 0.48686444759368896, 0.6173590421676636, 0.7478535771369934, 0.8783481121063232, 1.0088427066802979, 1.1393373012542725, 1.269831895828247, 1.4003263711929321, 1.5308209657669067, 1.6613155603408813, 1.7918100357055664, 1.922304630279541, 2.0527992248535156, 2.1832938194274902, 2.313788414001465, 2.4442830085754395, 2.574777603149414, 2.7052721977233887, 2.835766553878784, 2.966261148452759, 3.0967557430267334]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 3.0, 3.0, 8.0, 7.0, 9.0, 14.0, 21.0, 29.0, 32.0, 21.0, 30.0, 36.0, 27.0, 28.0, 39.0, 51.0, 44.0, 47.0, 51.0, 40.0, 39.0, 46.0, 54.0, 40.0, 37.0, 33.0, 21.0, 28.0, 17.0, 18.0, 20.0, 22.0, 15.0, 17.0, 8.0, 7.0, 7.0, 6.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.0936529636383057, -1.0605049133300781, -1.0273569822311401, -0.9942089915275574, -0.9610610008239746, -0.9279129505157471, -0.8947649598121643, -0.8616169691085815, -0.8284689784049988, -0.795320987701416, -0.7621729969978333, -0.7290250062942505, -0.695876955986023, -0.662729024887085, -0.6295809745788574, -0.5964329838752747, -0.5632849931716919, -0.5301370024681091, -0.49698901176452637, -0.4638409912586212, -0.43069300055503845, -0.3975450098514557, -0.36439698934555054, -0.3312489986419678, -0.298101007938385, -0.26495301723480225, -0.2318050116300583, -0.19865700602531433, -0.16550901532173157, -0.1323610246181488, -0.09921301901340485, -0.06606501340866089, -0.032917022705078125, 0.0002309754490852356, 0.033378973603248596, 0.06652697175741196, 0.09967496991157532, 0.13282296061515808, 0.16597096621990204, 0.199118971824646, 0.23226696252822876, 0.2654149532318115, 0.2985629439353943, 0.33171096444129944, 0.3648589551448822, 0.39800694584846497, 0.4311549663543701, 0.4643029570579529, 0.49745094776153564, 0.5305989384651184, 0.5637469291687012, 0.5968949198722839, 0.6300429105758667, 0.6631909608840942, 0.696338951587677, 0.7294869422912598, 0.7626349329948425, 0.7957829236984253, 0.8289309144020081, 0.8620789051055908, 0.8952269554138184, 0.9283748865127563, 0.9615229368209839, 0.9946709275245667, 1.0278189182281494]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 6.0, 5.0, 9.0, 6.0, 11.0, 15.0, 16.0, 17.0, 43.0, 89.0, 156.0, 434.0, 1955.0, 12021.0, 3773816.0, 394972.0, 8403.0, 1347.0, 440.0, 203.0, 114.0, 70.0, 37.0, 23.0, 20.0, 12.0, 11.0, 6.0, 13.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87060546875, -0.8405075073242188, -0.8104095458984375, -0.7803115844726562, -0.750213623046875, -0.7201156616210938, -0.6900177001953125, -0.6599197387695312, -0.62982177734375, -0.5997238159179688, -0.5696258544921875, -0.5395278930664062, -0.509429931640625, -0.47933197021484375, -0.4492340087890625, -0.41913604736328125, -0.3890380859375, -0.35894012451171875, -0.3288421630859375, -0.29874420166015625, -0.268646240234375, -0.23854827880859375, -0.2084503173828125, -0.17835235595703125, -0.14825439453125, -0.11815643310546875, -0.0880584716796875, -0.05796051025390625, -0.027862548828125, 0.00223541259765625, 0.0323333740234375, 0.06243133544921875, 0.092529296875, 0.12262725830078125, 0.1527252197265625, 0.18282318115234375, 0.212921142578125, 0.24301910400390625, 0.2731170654296875, 0.30321502685546875, 0.33331298828125, 0.36341094970703125, 0.3935089111328125, 0.42360687255859375, 0.453704833984375, 0.48380279541015625, 0.5139007568359375, 0.5439987182617188, 0.5740966796875, 0.6041946411132812, 0.6342926025390625, 0.6643905639648438, 0.694488525390625, 0.7245864868164062, 0.7546844482421875, 0.7847824096679688, 0.81488037109375, 0.8449783325195312, 0.8750762939453125, 0.9051742553710938, 0.935272216796875, 0.9653701782226562, 0.9954681396484375, 1.0255661010742188, 1.0556640625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 5.0, 24.0, 19.0, 43.0, 69.0, 78.0, 94.0, 130.0, 100.0, 109.0, 114.0, 79.0, 48.0, 44.0, 20.0, 15.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07470703125, -0.07176971435546875, -0.0688323974609375, -0.06589508056640625, -0.062957763671875, -0.06002044677734375, -0.0570831298828125, -0.05414581298828125, -0.05120849609375, -0.04827117919921875, -0.0453338623046875, -0.04239654541015625, -0.039459228515625, -0.03652191162109375, -0.0335845947265625, -0.03064727783203125, -0.0277099609375, -0.02477264404296875, -0.0218353271484375, -0.01889801025390625, -0.015960693359375, -0.01302337646484375, -0.0100860595703125, -0.00714874267578125, -0.00421142578125, -0.00127410888671875, 0.0016632080078125, 0.00460052490234375, 0.007537841796875, 0.01047515869140625, 0.0134124755859375, 0.01634979248046875, 0.019287109375, 0.02222442626953125, 0.0251617431640625, 0.02809906005859375, 0.031036376953125, 0.03397369384765625, 0.0369110107421875, 0.03984832763671875, 0.04278564453125, 0.04572296142578125, 0.0486602783203125, 0.05159759521484375, 0.054534912109375, 0.05747222900390625, 0.0604095458984375, 0.06334686279296875, 0.0662841796875, 0.06922149658203125, 0.0721588134765625, 0.07509613037109375, 0.078033447265625, 0.08097076416015625, 0.0839080810546875, 0.08684539794921875, 0.08978271484375, 0.09272003173828125, 0.0956573486328125, 0.09859466552734375, 0.101531982421875, 0.10446929931640625, 0.1074066162109375, 0.11034393310546875, 0.11328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 15.0, 29.0, 43.0, 67.0, 132.0, 213.0, 393.0, 824.0, 2012.0, 5923.0, 26523.0, 864528.0, 3249279.0, 33027.0, 7095.0, 2264.0, 946.0, 448.0, 214.0, 112.0, 73.0, 46.0, 21.0, 15.0, 13.0, 6.0, 4.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.439453125, -0.4211883544921875, -0.402923583984375, -0.3846588134765625, -0.36639404296875, -0.3481292724609375, -0.329864501953125, -0.3115997314453125, -0.2933349609375, -0.2750701904296875, -0.256805419921875, -0.2385406494140625, -0.22027587890625, -0.2020111083984375, -0.183746337890625, -0.1654815673828125, -0.147216796875, -0.1289520263671875, -0.110687255859375, -0.0924224853515625, -0.07415771484375, -0.0558929443359375, -0.037628173828125, -0.0193634033203125, -0.0010986328125, 0.0171661376953125, 0.035430908203125, 0.0536956787109375, 0.07196044921875, 0.0902252197265625, 0.108489990234375, 0.1267547607421875, 0.14501953125, 0.1632843017578125, 0.181549072265625, 0.1998138427734375, 0.21807861328125, 0.2363433837890625, 0.254608154296875, 0.2728729248046875, 0.2911376953125, 0.3094024658203125, 0.327667236328125, 0.3459320068359375, 0.36419677734375, 0.3824615478515625, 0.400726318359375, 0.4189910888671875, 0.437255859375, 0.4555206298828125, 0.473785400390625, 0.4920501708984375, 0.51031494140625, 0.5285797119140625, 0.546844482421875, 0.5651092529296875, 0.5833740234375, 0.6016387939453125, 0.619903564453125, 0.6381683349609375, 0.65643310546875, 0.6746978759765625, 0.692962646484375, 0.7112274169921875, 0.7294921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 6.0, 13.0, 14.0, 23.0, 30.0, 50.0, 120.0, 324.0, 2186.0, 888.0, 207.0, 80.0, 38.0, 31.0, 21.0, 11.0, 7.0, 3.0, 13.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189208984375, -0.183258056640625, -0.17730712890625, -0.171356201171875, -0.1654052734375, -0.159454345703125, -0.15350341796875, -0.147552490234375, -0.1416015625, -0.135650634765625, -0.12969970703125, -0.123748779296875, -0.1177978515625, -0.111846923828125, -0.10589599609375, -0.099945068359375, -0.093994140625, -0.088043212890625, -0.08209228515625, -0.076141357421875, -0.0701904296875, -0.064239501953125, -0.05828857421875, -0.052337646484375, -0.04638671875, -0.040435791015625, -0.03448486328125, -0.028533935546875, -0.0225830078125, -0.016632080078125, -0.01068115234375, -0.004730224609375, 0.001220703125, 0.007171630859375, 0.01312255859375, 0.019073486328125, 0.0250244140625, 0.030975341796875, 0.03692626953125, 0.042877197265625, 0.048828125, 0.054779052734375, 0.06072998046875, 0.066680908203125, 0.0726318359375, 0.078582763671875, 0.08453369140625, 0.090484619140625, 0.096435546875, 0.102386474609375, 0.10833740234375, 0.114288330078125, 0.1202392578125, 0.126190185546875, 0.13214111328125, 0.138092041015625, 0.14404296875, 0.149993896484375, 0.15594482421875, 0.161895751953125, 0.1678466796875, 0.173797607421875, 0.17974853515625, 0.185699462890625, 0.191650390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 14.0, 33.0, 57.0, 130.0, 228.0, 242.0, 131.0, 86.0, 36.0, 18.0, 9.0, 8.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2889631986618042, -1.244719386100769, -1.2004756927490234, -1.1562318801879883, -1.1119880676269531, -1.0677443742752075, -1.0235005617141724, -0.979256808757782, -0.9350130558013916, -0.8907693028450012, -0.8465255498886108, -0.8022817373275757, -0.7580379843711853, -0.7137942314147949, -0.6695504188537598, -0.6253066658973694, -0.581062912940979, -0.5368191599845886, -0.49257537722587585, -0.4483315944671631, -0.4040878415107727, -0.3598440885543823, -0.31560030579566956, -0.2713565230369568, -0.2271127700805664, -0.18286900222301483, -0.13862523436546326, -0.09438146650791168, -0.05013769865036011, -0.005893930792808533, 0.03834983706474304, 0.08259361982345581, 0.1268373727798462, 0.17108114063739777, 0.21532490849494934, 0.2595686912536621, 0.3038124442100525, 0.34805619716644287, 0.39229997992515564, 0.4365437626838684, 0.4807875156402588, 0.5250312685966492, 0.5692750215530396, 0.6135188341140747, 0.6577625870704651, 0.7020063400268555, 0.7462501525878906, 0.790493905544281, 0.8347376585006714, 0.8789814114570618, 0.9232251644134521, 0.9674689769744873, 1.0117127895355225, 1.055956482887268, 1.1002002954483032, 1.1444439888000488, 1.188687801361084, 1.2329316139221191, 1.2771753072738647, 1.3214191198349, 1.3656628131866455, 1.4099066257476807, 1.4541504383087158, 1.498394250869751, 1.5426379442214966]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 15.0, 21.0, 17.0, 27.0, 26.0, 22.0, 43.0, 53.0, 45.0, 56.0, 50.0, 67.0, 71.0, 52.0, 47.0, 62.0, 42.0, 41.0, 36.0, 41.0, 24.0, 23.0, 14.0, 26.0, 10.0, 13.0, 11.0, 12.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4157258868217468, -0.400950163602829, -0.38617444038391113, -0.3713987171649933, -0.35662299394607544, -0.3418472409248352, -0.32707151770591736, -0.3122957944869995, -0.29752007126808167, -0.2827443480491638, -0.26796862483024597, -0.2531929016113281, -0.23841716349124908, -0.22364144027233124, -0.2088657021522522, -0.19408997893333435, -0.1793142557144165, -0.16453853249549866, -0.1497628092765808, -0.13498707115650177, -0.12021134793758392, -0.10543562471866608, -0.09065989404916763, -0.07588416337966919, -0.06110844016075134, -0.0463327132165432, -0.03155698627233505, -0.016781259328126907, -0.002005532383918762, 0.012770190834999084, 0.027545921504497528, 0.04232165217399597, 0.05709737539291382, 0.07187309861183167, 0.08664882928133011, 0.10142455995082855, 0.1162002831697464, 0.13097600638866425, 0.1457517445087433, 0.16052746772766113, 0.17530319094657898, 0.19007891416549683, 0.20485463738441467, 0.2196303755044937, 0.23440609872341156, 0.2491818219423294, 0.26395756006240845, 0.2787332832813263, 0.29350900650024414, 0.308284729719162, 0.32306045293807983, 0.3378361761569977, 0.3526118993759155, 0.36738765239715576, 0.3821633756160736, 0.39693909883499146, 0.4117148220539093, 0.42649054527282715, 0.441266268491745, 0.45604199171066284, 0.4708177447319031, 0.48559343814849854, 0.5003691911697388, 0.515144944190979, 0.5299206376075745]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 1.0, 0.0, 5.0, 5.0, 7.0, 9.0, 18.0, 22.0, 32.0, 35.0, 55.0, 87.0, 187.0, 390.0, 913.0, 2979.0, 15348.0, 175069.0, 784598.0, 58237.0, 7550.0, 1754.0, 595.0, 276.0, 130.0, 77.0, 47.0, 40.0, 25.0, 10.0, 9.0, 15.0, 10.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6498870849609375, -0.626922607421875, -0.6039581298828125, -0.58099365234375, -0.5580291748046875, -0.535064697265625, -0.5121002197265625, -0.4891357421875, -0.4661712646484375, -0.443206787109375, -0.4202423095703125, -0.39727783203125, -0.3743133544921875, -0.351348876953125, -0.3283843994140625, -0.305419921875, -0.2824554443359375, -0.259490966796875, -0.2365264892578125, -0.21356201171875, -0.1905975341796875, -0.167633056640625, -0.1446685791015625, -0.1217041015625, -0.0987396240234375, -0.075775146484375, -0.0528106689453125, -0.02984619140625, -0.0068817138671875, 0.016082763671875, 0.0390472412109375, 0.06201171875, 0.0849761962890625, 0.107940673828125, 0.1309051513671875, 0.15386962890625, 0.1768341064453125, 0.199798583984375, 0.2227630615234375, 0.2457275390625, 0.2686920166015625, 0.291656494140625, 0.3146209716796875, 0.33758544921875, 0.3605499267578125, 0.383514404296875, 0.4064788818359375, 0.429443359375, 0.4524078369140625, 0.475372314453125, 0.4983367919921875, 0.52130126953125, 0.5442657470703125, 0.567230224609375, 0.5901947021484375, 0.6131591796875, 0.6361236572265625, 0.659088134765625, 0.6820526123046875, 0.70501708984375, 0.7279815673828125, 0.750946044921875, 0.7739105224609375, 0.796875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 11.0, 11.0, 19.0, 47.0, 42.0, 61.0, 105.0, 95.0, 129.0, 95.0, 96.0, 96.0, 65.0, 63.0, 25.0, 14.0, 12.0, 11.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.073486328125, -0.07053375244140625, -0.0675811767578125, -0.06462860107421875, -0.061676025390625, -0.05872344970703125, -0.0557708740234375, -0.05281829833984375, -0.04986572265625, -0.04691314697265625, -0.0439605712890625, -0.04100799560546875, -0.038055419921875, -0.03510284423828125, -0.0321502685546875, -0.02919769287109375, -0.0262451171875, -0.02329254150390625, -0.0203399658203125, -0.01738739013671875, -0.014434814453125, -0.01148223876953125, -0.0085296630859375, -0.00557708740234375, -0.00262451171875, 0.00032806396484375, 0.0032806396484375, 0.00623321533203125, 0.009185791015625, 0.01213836669921875, 0.0150909423828125, 0.01804351806640625, 0.02099609375, 0.02394866943359375, 0.0269012451171875, 0.02985382080078125, 0.032806396484375, 0.03575897216796875, 0.0387115478515625, 0.04166412353515625, 0.04461669921875, 0.04756927490234375, 0.0505218505859375, 0.05347442626953125, 0.056427001953125, 0.05937957763671875, 0.0623321533203125, 0.06528472900390625, 0.0682373046875, 0.07118988037109375, 0.0741424560546875, 0.07709503173828125, 0.080047607421875, 0.08300018310546875, 0.0859527587890625, 0.08890533447265625, 0.09185791015625, 0.09481048583984375, 0.0977630615234375, 0.10071563720703125, 0.103668212890625, 0.10662078857421875, 0.1095733642578125, 0.11252593994140625, 0.115478515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 8.0, 6.0, 5.0, 8.0, 16.0, 25.0, 37.0, 49.0, 82.0, 194.0, 343.0, 652.0, 1696.0, 5303.0, 24113.0, 198637.0, 723222.0, 76250.0, 12402.0, 3286.0, 1108.0, 525.0, 237.0, 137.0, 73.0, 31.0, 33.0, 22.0, 10.0, 19.0, 4.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5703125, -0.5536842346191406, -0.5370559692382812, -0.5204277038574219, -0.5037994384765625, -0.4871711730957031, -0.47054290771484375, -0.4539146423339844, -0.437286376953125, -0.4206581115722656, -0.40402984619140625, -0.3874015808105469, -0.3707733154296875, -0.3541450500488281, -0.33751678466796875, -0.3208885192871094, -0.30426025390625, -0.2876319885253906, -0.27100372314453125, -0.2543754577636719, -0.2377471923828125, -0.22111892700195312, -0.20449066162109375, -0.18786239624023438, -0.171234130859375, -0.15460586547851562, -0.13797760009765625, -0.12134933471679688, -0.1047210693359375, -0.08809280395507812, -0.07146453857421875, -0.054836273193359375, -0.0382080078125, -0.021579742431640625, -0.00495147705078125, 0.011676788330078125, 0.0283050537109375, 0.044933319091796875, 0.06156158447265625, 0.07818984985351562, 0.094818115234375, 0.11144638061523438, 0.12807464599609375, 0.14470291137695312, 0.1613311767578125, 0.17795944213867188, 0.19458770751953125, 0.21121597290039062, 0.22784423828125, 0.24447250366210938, 0.26110076904296875, 0.2777290344238281, 0.2943572998046875, 0.3109855651855469, 0.32761383056640625, 0.3442420959472656, 0.360870361328125, 0.3774986267089844, 0.39412689208984375, 0.4107551574707031, 0.4273834228515625, 0.4440116882324219, 0.46063995361328125, 0.4772682189941406, 0.493896484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 6.0, 2.0, 1.0, 5.0, 10.0, 7.0, 13.0, 12.0, 24.0, 33.0, 34.0, 45.0, 50.0, 68.0, 64.0, 57.0, 70.0, 81.0, 69.0, 82.0, 52.0, 48.0, 36.0, 34.0, 22.0, 26.0, 22.0, 11.0, 7.0, 5.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.334228515625, -0.3251934051513672, -0.3161582946777344, -0.30712318420410156, -0.29808807373046875, -0.28905296325683594, -0.2800178527832031, -0.2709827423095703, -0.2619476318359375, -0.2529125213623047, -0.24387741088867188, -0.23484230041503906, -0.22580718994140625, -0.21677207946777344, -0.20773696899414062, -0.1987018585205078, -0.189666748046875, -0.1806316375732422, -0.17159652709960938, -0.16256141662597656, -0.15352630615234375, -0.14449119567871094, -0.13545608520507812, -0.1264209747314453, -0.1173858642578125, -0.10835075378417969, -0.09931564331054688, -0.09028053283691406, -0.08124542236328125, -0.07221031188964844, -0.06317520141601562, -0.05414009094238281, -0.04510498046875, -0.03606986999511719, -0.027034759521484375, -0.017999649047851562, -0.00896453857421875, 7.05718994140625e-05, 0.009105682373046875, 0.018140792846679688, 0.0271759033203125, 0.03621101379394531, 0.045246124267578125, 0.05428123474121094, 0.06331634521484375, 0.07235145568847656, 0.08138656616210938, 0.09042167663574219, 0.099456787109375, 0.10849189758300781, 0.11752700805664062, 0.12656211853027344, 0.13559722900390625, 0.14463233947753906, 0.15366744995117188, 0.1627025604248047, 0.1717376708984375, 0.1807727813720703, 0.18980789184570312, 0.19884300231933594, 0.20787811279296875, 0.21691322326660156, 0.22594833374023438, 0.2349834442138672, 0.2440185546875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 4.0, 13.0, 27.0, 30.0, 76.0, 119.0, 253.0, 460.0, 745.0, 1584.0, 3467.0, 8906.0, 31635.0, 409825.0, 540781.0, 34181.0, 9350.0, 3623.0, 1729.0, 800.0, 440.0, 227.0, 115.0, 73.0, 35.0, 19.0, 13.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.367919921875, -0.3579826354980469, -0.34804534912109375, -0.3381080627441406, -0.3281707763671875, -0.3182334899902344, -0.30829620361328125, -0.2983589172363281, -0.288421630859375, -0.2784843444824219, -0.26854705810546875, -0.2586097717285156, -0.2486724853515625, -0.23873519897460938, -0.22879791259765625, -0.21886062622070312, -0.20892333984375, -0.19898605346679688, -0.18904876708984375, -0.17911148071289062, -0.1691741943359375, -0.15923690795898438, -0.14929962158203125, -0.13936233520507812, -0.129425048828125, -0.11948776245117188, -0.10955047607421875, -0.09961318969726562, -0.0896759033203125, -0.07973861694335938, -0.06980133056640625, -0.059864044189453125, -0.0499267578125, -0.039989471435546875, -0.03005218505859375, -0.020114898681640625, -0.0101776123046875, -0.000240325927734375, 0.00969696044921875, 0.019634246826171875, 0.029571533203125, 0.039508819580078125, 0.04944610595703125, 0.059383392333984375, 0.0693206787109375, 0.07925796508789062, 0.08919525146484375, 0.09913253784179688, 0.10906982421875, 0.11900711059570312, 0.12894439697265625, 0.13888168334960938, 0.1488189697265625, 0.15875625610351562, 0.16869354248046875, 0.17863082885742188, 0.188568115234375, 0.19850540161132812, 0.20844268798828125, 0.21837997436523438, 0.2283172607421875, 0.23825454711914062, 0.24819183349609375, 0.2581291198730469, 0.26806640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 5.0, 7.0, 3.0, 6.0, 18.0, 20.0, 28.0, 30.0, 36.0, 48.0, 50.0, 94.0, 101.0, 113.0, 88.0, 81.0, 66.0, 42.0, 37.0, 29.0, 22.0, 13.0, 11.0, 4.0, 9.0, 3.0, 6.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00015211105346679688, -0.00014755688607692719, -0.0001430027186870575, -0.0001384485512971878, -0.00013389438390731812, -0.00012934021651744843, -0.00012478604912757874, -0.00012023188173770905, -0.00011567771434783936, -0.00011112354695796967, -0.00010656937956809998, -0.00010201521217823029, -9.74610447883606e-05, -9.29068773984909e-05, -8.835271000862122e-05, -8.379854261875153e-05, -7.924437522888184e-05, -7.469020783901215e-05, -7.013604044914246e-05, -6.558187305927277e-05, -6.1027705669403076e-05, -5.6473538279533386e-05, -5.1919370889663696e-05, -4.7365203499794006e-05, -4.2811036109924316e-05, -3.8256868720054626e-05, -3.3702701330184937e-05, -2.9148533940315247e-05, -2.4594366550445557e-05, -2.0040199160575867e-05, -1.5486031770706177e-05, -1.0931864380836487e-05, -6.377696990966797e-06, -1.823529601097107e-06, 2.730637788772583e-06, 7.284805178642273e-06, 1.1838972568511963e-05, 1.6393139958381653e-05, 2.0947307348251343e-05, 2.5501474738121033e-05, 3.0055642127990723e-05, 3.460980951786041e-05, 3.91639769077301e-05, 4.371814429759979e-05, 4.827231168746948e-05, 5.282647907733917e-05, 5.738064646720886e-05, 6.193481385707855e-05, 6.648898124694824e-05, 7.104314863681793e-05, 7.559731602668762e-05, 8.015148341655731e-05, 8.4705650806427e-05, 8.925981819629669e-05, 9.381398558616638e-05, 9.836815297603607e-05, 0.00010292232036590576, 0.00010747648775577545, 0.00011203065514564514, 0.00011658482253551483, 0.00012113898992538452, 0.0001256931573152542, 0.0001302473247051239, 0.0001348014920949936, 0.00013935565948486328]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 3.0, 6.0, 5.0, 5.0, 6.0, 8.0, 8.0, 6.0, 19.0, 22.0, 24.0, 35.0, 64.0, 95.0, 140.0, 336.0, 662.0, 1742.0, 4912.0, 18408.0, 155473.0, 821024.0, 33839.0, 7427.0, 2379.0, 856.0, 438.0, 204.0, 121.0, 91.0, 66.0, 35.0, 29.0, 21.0, 12.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.48876953125, -0.4759674072265625, -0.463165283203125, -0.4503631591796875, -0.43756103515625, -0.4247589111328125, -0.411956787109375, -0.3991546630859375, -0.3863525390625, -0.3735504150390625, -0.360748291015625, -0.3479461669921875, -0.33514404296875, -0.3223419189453125, -0.309539794921875, -0.2967376708984375, -0.283935546875, -0.2711334228515625, -0.258331298828125, -0.2455291748046875, -0.23272705078125, -0.2199249267578125, -0.207122802734375, -0.1943206787109375, -0.1815185546875, -0.1687164306640625, -0.155914306640625, -0.1431121826171875, -0.13031005859375, -0.1175079345703125, -0.104705810546875, -0.0919036865234375, -0.0791015625, -0.0662994384765625, -0.053497314453125, -0.0406951904296875, -0.02789306640625, -0.0150909423828125, -0.002288818359375, 0.0105133056640625, 0.0233154296875, 0.0361175537109375, 0.048919677734375, 0.0617218017578125, 0.07452392578125, 0.0873260498046875, 0.100128173828125, 0.1129302978515625, 0.125732421875, 0.1385345458984375, 0.151336669921875, 0.1641387939453125, 0.17694091796875, 0.1897430419921875, 0.202545166015625, 0.2153472900390625, 0.2281494140625, 0.2409515380859375, 0.253753662109375, 0.2665557861328125, 0.27935791015625, 0.2921600341796875, 0.304962158203125, 0.3177642822265625, 0.33056640625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 5.0, 2.0, 2.0, 8.0, 12.0, 7.0, 26.0, 20.0, 28.0, 43.0, 67.0, 255.0, 287.0, 79.0, 31.0, 32.0, 13.0, 17.0, 8.0, 10.0, 7.0, 7.0, 3.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0], "bins": [-0.329833984375, -0.32198524475097656, -0.3141365051269531, -0.3062877655029297, -0.29843902587890625, -0.2905902862548828, -0.2827415466308594, -0.27489280700683594, -0.2670440673828125, -0.25919532775878906, -0.2513465881347656, -0.2434978485107422, -0.23564910888671875, -0.2278003692626953, -0.21995162963867188, -0.21210289001464844, -0.204254150390625, -0.19640541076660156, -0.18855667114257812, -0.1807079315185547, -0.17285919189453125, -0.1650104522705078, -0.15716171264648438, -0.14931297302246094, -0.1414642333984375, -0.13361549377441406, -0.12576675415039062, -0.11791801452636719, -0.11006927490234375, -0.10222053527832031, -0.09437179565429688, -0.08652305603027344, -0.07867431640625, -0.07082557678222656, -0.06297683715820312, -0.05512809753417969, -0.04727935791015625, -0.03943061828613281, -0.031581878662109375, -0.023733139038085938, -0.0158843994140625, -0.008035659790039062, -0.000186920166015625, 0.0076618194580078125, 0.01551055908203125, 0.023359298706054688, 0.031208038330078125, 0.03905677795410156, 0.046905517578125, 0.05475425720214844, 0.06260299682617188, 0.07045173645019531, 0.07830047607421875, 0.08614921569824219, 0.09399795532226562, 0.10184669494628906, 0.1096954345703125, 0.11754417419433594, 0.12539291381835938, 0.1332416534423828, 0.14109039306640625, 0.1489391326904297, 0.15678787231445312, 0.16463661193847656, 0.1724853515625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 15.0, 39.0, 101.0, 246.0, 346.0, 163.0, 66.0, 22.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.880144119262695, -7.684372425079346, -7.488601207733154, -7.292829513549805, -7.097058296203613, -6.901286602020264, -6.705514907836914, -6.509743690490723, -6.313972473144531, -6.118200778961182, -5.92242956161499, -5.726657867431641, -5.530886650085449, -5.3351149559021, -5.13934326171875, -4.943572044372559, -4.747800350189209, -4.552028656005859, -4.356257438659668, -4.160485744476318, -3.964714527130127, -3.7689428329467773, -3.573171377182007, -3.3773999214172363, -3.181628465652466, -2.9858570098876953, -2.790085554122925, -2.5943140983581543, -2.3985424041748047, -2.2027711868286133, -2.0069994926452637, -1.8112280368804932, -1.6154565811157227, -1.4196851253509521, -1.2239136695861816, -1.0281420946121216, -0.8323706388473511, -0.6365991830825806, -0.4408276081085205, -0.24505615234375, -0.04928469657897949, 0.1464867889881134, 0.3422582745552063, 0.5380297899246216, 0.7338012456893921, 0.9295727014541626, 1.1253442764282227, 1.3211157321929932, 1.5168871879577637, 1.7126586437225342, 1.9084300994873047, 2.1042017936706543, 2.2999730110168457, 2.4957447052001953, 2.691516160964966, 2.8872876167297363, 3.083059072494507, 3.2788305282592773, 3.474601984024048, 3.6703734397888184, 3.866145133972168, 4.061916351318359, 4.257688045501709, 4.453459739685059, 4.64923095703125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 0.0, 2.0, 4.0, 3.0, 4.0, 2.0, 5.0, 7.0, 10.0, 11.0, 16.0, 13.0, 23.0, 26.0, 31.0, 42.0, 43.0, 55.0, 42.0, 63.0, 61.0, 48.0, 76.0, 58.0, 60.0, 54.0, 41.0, 34.0, 31.0, 22.0, 22.0, 25.0, 18.0, 17.0, 8.0, 15.0, 5.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.426655888557434, -1.376775860786438, -1.3268959522247314, -1.2770159244537354, -1.2271358966827393, -1.1772558689117432, -1.1273759603500366, -1.0774959325790405, -1.027616024017334, -0.9777360558509827, -0.9278560280799866, -0.8779760599136353, -0.8280960321426392, -0.7782160639762878, -0.7283360958099365, -0.6784560680389404, -0.6285760402679443, -0.578696072101593, -0.5288160443305969, -0.4789360761642456, -0.4290560781955719, -0.3791760802268982, -0.3292961120605469, -0.27941611409187317, -0.22953611612319946, -0.17965611815452576, -0.12977613508701324, -0.07989615201950073, -0.030016154050827026, 0.01986384391784668, 0.069743812084198, 0.1196238100528717, 0.16950368881225586, 0.21938368678092957, 0.26926368474960327, 0.3191436529159546, 0.3690236508846283, 0.418903648853302, 0.4687836170196533, 0.5186636447906494, 0.5685436129570007, 0.618423581123352, 0.6683036088943481, 0.7181835770606995, 0.7680635452270508, 0.8179435729980469, 0.8678235411643982, 0.9177035093307495, 0.9675835371017456, 1.0174635648727417, 1.0673434734344482, 1.1172235012054443, 1.1671035289764404, 1.2169835567474365, 1.266863465309143, 1.3167434930801392, 1.3666234016418457, 1.4165034294128418, 1.4663833379745483, 1.5162633657455444, 1.5661433935165405, 1.616023302078247, 1.6659033298492432, 1.7157833576202393, 1.7656633853912354]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 5.0, 7.0, 8.0, 17.0, 22.0, 39.0, 58.0, 139.0, 422.0, 1464.0, 7691.0, 139102.0, 4023482.0, 18026.0, 2527.0, 650.0, 275.0, 105.0, 78.0, 45.0, 27.0, 24.0, 11.0, 17.0, 5.0, 9.0, 1.0, 6.0, 2.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81982421875, -0.7907638549804688, -0.7617034912109375, -0.7326431274414062, -0.703582763671875, -0.6745223999023438, -0.6454620361328125, -0.6164016723632812, -0.58734130859375, -0.5582809448242188, -0.5292205810546875, -0.5001602172851562, -0.471099853515625, -0.44203948974609375, -0.4129791259765625, -0.38391876220703125, -0.3548583984375, -0.32579803466796875, -0.2967376708984375, -0.26767730712890625, -0.238616943359375, -0.20955657958984375, -0.1804962158203125, -0.15143585205078125, -0.12237548828125, -0.09331512451171875, -0.0642547607421875, -0.03519439697265625, -0.006134033203125, 0.02292633056640625, 0.0519866943359375, 0.08104705810546875, 0.110107421875, 0.13916778564453125, 0.1682281494140625, 0.19728851318359375, 0.226348876953125, 0.25540924072265625, 0.2844696044921875, 0.31352996826171875, 0.34259033203125, 0.37165069580078125, 0.4007110595703125, 0.42977142333984375, 0.458831787109375, 0.48789215087890625, 0.5169525146484375, 0.5460128784179688, 0.5750732421875, 0.6041336059570312, 0.6331939697265625, 0.6622543334960938, 0.691314697265625, 0.7203750610351562, 0.7494354248046875, 0.7784957885742188, 0.80755615234375, 0.8366165161132812, 0.8656768798828125, 0.8947372436523438, 0.923797607421875, 0.9528579711914062, 0.9819183349609375, 1.0109786987304688, 1.0400390625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 8.0, 10.0, 22.0, 34.0, 34.0, 58.0, 74.0, 68.0, 89.0, 118.0, 94.0, 83.0, 78.0, 73.0, 55.0, 29.0, 30.0, 21.0, 8.0, 14.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.072998046875, -0.06995201110839844, -0.06690597534179688, -0.06385993957519531, -0.06081390380859375, -0.05776786804199219, -0.054721832275390625, -0.05167579650878906, -0.0486297607421875, -0.04558372497558594, -0.042537689208984375, -0.03949165344238281, -0.03644561767578125, -0.03339958190917969, -0.030353546142578125, -0.027307510375976562, -0.024261474609375, -0.021215438842773438, -0.018169403076171875, -0.015123367309570312, -0.01207733154296875, -0.009031295776367188, -0.005985260009765625, -0.0029392242431640625, 0.0001068115234375, 0.0031528472900390625, 0.006198883056640625, 0.009244918823242188, 0.01229095458984375, 0.015336990356445312, 0.018383026123046875, 0.021429061889648438, 0.02447509765625, 0.027521133422851562, 0.030567169189453125, 0.03361320495605469, 0.03665924072265625, 0.03970527648925781, 0.042751312255859375, 0.04579734802246094, 0.0488433837890625, 0.05188941955566406, 0.054935455322265625, 0.05798149108886719, 0.06102752685546875, 0.06407356262207031, 0.06711959838867188, 0.07016563415527344, 0.073211669921875, 0.07625770568847656, 0.07930374145507812, 0.08234977722167969, 0.08539581298828125, 0.08844184875488281, 0.09148788452148438, 0.09453392028808594, 0.0975799560546875, 0.10062599182128906, 0.10367202758789062, 0.10671806335449219, 0.10976409912109375, 0.11281013488769531, 0.11585617065429688, 0.11890220642089844, 0.1219482421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 17.0, 18.0, 37.0, 40.0, 61.0, 103.0, 123.0, 223.0, 367.0, 707.0, 1722.0, 4787.0, 19423.0, 397548.0, 3727906.0, 30674.0, 6292.0, 2139.0, 939.0, 434.0, 241.0, 165.0, 103.0, 80.0, 56.0, 26.0, 18.0, 13.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64404296875, -0.6219253540039062, -0.5998077392578125, -0.5776901245117188, -0.555572509765625, -0.5334548950195312, -0.5113372802734375, -0.48921966552734375, -0.46710205078125, -0.44498443603515625, -0.4228668212890625, -0.40074920654296875, -0.378631591796875, -0.35651397705078125, -0.3343963623046875, -0.31227874755859375, -0.2901611328125, -0.26804351806640625, -0.2459259033203125, -0.22380828857421875, -0.201690673828125, -0.17957305908203125, -0.1574554443359375, -0.13533782958984375, -0.11322021484375, -0.09110260009765625, -0.0689849853515625, -0.04686737060546875, -0.024749755859375, -0.00263214111328125, 0.0194854736328125, 0.04160308837890625, 0.063720703125, 0.08583831787109375, 0.1079559326171875, 0.13007354736328125, 0.152191162109375, 0.17430877685546875, 0.1964263916015625, 0.21854400634765625, 0.24066162109375, 0.26277923583984375, 0.2848968505859375, 0.30701446533203125, 0.329132080078125, 0.35124969482421875, 0.3733673095703125, 0.39548492431640625, 0.4176025390625, 0.43972015380859375, 0.4618377685546875, 0.48395538330078125, 0.506072998046875, 0.5281906127929688, 0.5503082275390625, 0.5724258422851562, 0.59454345703125, 0.6166610717773438, 0.6387786865234375, 0.6608963012695312, 0.683013916015625, 0.7051315307617188, 0.7272491455078125, 0.7493667602539062, 0.771484375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 4.0, 5.0, 6.0, 11.0, 7.0, 19.0, 41.0, 55.0, 122.0, 375.0, 2681.0, 448.0, 131.0, 69.0, 35.0, 18.0, 10.0, 10.0, 4.0, 2.0, 5.0, 7.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1678466796875, -0.1621570587158203, -0.15646743774414062, -0.15077781677246094, -0.14508819580078125, -0.13939857482910156, -0.13370895385742188, -0.1280193328857422, -0.1223297119140625, -0.11664009094238281, -0.11095046997070312, -0.10526084899902344, -0.09957122802734375, -0.09388160705566406, -0.08819198608398438, -0.08250236511230469, -0.076812744140625, -0.07112312316894531, -0.06543350219726562, -0.05974388122558594, -0.05405426025390625, -0.04836463928222656, -0.042675018310546875, -0.03698539733886719, -0.0312957763671875, -0.025606155395507812, -0.019916534423828125, -0.014226913452148438, -0.00853729248046875, -0.0028476715087890625, 0.002841949462890625, 0.008531570434570312, 0.01422119140625, 0.019910812377929688, 0.025600433349609375, 0.03129005432128906, 0.03697967529296875, 0.04266929626464844, 0.048358917236328125, 0.05404853820800781, 0.0597381591796875, 0.06542778015136719, 0.07111740112304688, 0.07680702209472656, 0.08249664306640625, 0.08818626403808594, 0.09387588500976562, 0.09956550598144531, 0.105255126953125, 0.11094474792480469, 0.11663436889648438, 0.12232398986816406, 0.12801361083984375, 0.13370323181152344, 0.13939285278320312, 0.1450824737548828, 0.1507720947265625, 0.1564617156982422, 0.16215133666992188, 0.16784095764160156, 0.17353057861328125, 0.17922019958496094, 0.18490982055664062, 0.1905994415283203, 0.1962890625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 11.0, 7.0, 28.0, 31.0, 58.0, 105.0, 134.0, 168.0, 140.0, 89.0, 68.0, 58.0, 24.0, 21.0, 18.0, 10.0, 4.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0010321140289307, -0.9733657240867615, -0.9456993341445923, -0.9180329442024231, -0.8903665542602539, -0.8627001643180847, -0.8350337743759155, -0.8073674440383911, -0.7797009944915771, -0.752034604549408, -0.7243682146072388, -0.6967018246650696, -0.6690354347229004, -0.6413690447807312, -0.613702654838562, -0.5860363245010376, -0.5583699345588684, -0.5307035446166992, -0.50303715467453, -0.47537076473236084, -0.44770437479019165, -0.42003798484802246, -0.39237162470817566, -0.36470523476600647, -0.3370388448238373, -0.3093724548816681, -0.2817060649394989, -0.2540397047996521, -0.22637329995632172, -0.19870691001415253, -0.17104053497314453, -0.14337414503097534, -0.11570769548416138, -0.08804130554199219, -0.060374923050403595, -0.032708540558815, -0.005042150616645813, 0.022624239325523376, 0.05029061436653137, 0.07795700430870056, 0.10562339425086975, 0.13328978419303894, 0.16095617413520813, 0.18862254917621613, 0.21628893911838531, 0.2439553290605545, 0.2716217041015625, 0.2992880940437317, 0.3269544839859009, 0.35462087392807007, 0.38228726387023926, 0.40995365381240845, 0.43762004375457764, 0.4652864336967468, 0.49295279383659363, 0.5206191539764404, 0.5482856035232544, 0.5759519934654236, 0.6036183834075928, 0.631284773349762, 0.6589511632919312, 0.6866175532341003, 0.7142839431762695, 0.741950273513794, 0.7696166634559631]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 12.0, 7.0, 14.0, 22.0, 20.0, 32.0, 33.0, 50.0, 47.0, 50.0, 59.0, 66.0, 68.0, 68.0, 59.0, 51.0, 55.0, 56.0, 37.0, 49.0, 33.0, 29.0, 19.0, 20.0, 15.0, 15.0, 11.0, 9.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5085158944129944, -0.49086201190948486, -0.47320809960365295, -0.45555418729782104, -0.4379003047943115, -0.420246422290802, -0.4025925099849701, -0.3849385976791382, -0.36728471517562866, -0.34963083267211914, -0.33197692036628723, -0.3143230080604553, -0.2966691255569458, -0.2790152430534363, -0.26136133074760437, -0.24370743334293365, -0.22605353593826294, -0.20839963853359222, -0.1907457411289215, -0.1730918437242508, -0.15543794631958008, -0.13778404891490936, -0.12013015151023865, -0.10247625410556793, -0.08482235670089722, -0.0671684592962265, -0.049514561891555786, -0.03186066448688507, -0.014206767082214355, 0.00344713032245636, 0.021101027727127075, 0.03875492513179779, 0.05640876293182373, 0.07406266033649445, 0.09171655774116516, 0.10937045514583588, 0.1270243525505066, 0.1446782499551773, 0.16233214735984802, 0.17998604476451874, 0.19763994216918945, 0.21529383957386017, 0.23294773697853088, 0.2506016492843628, 0.2682555317878723, 0.28590941429138184, 0.30356332659721375, 0.32121723890304565, 0.3388711214065552, 0.3565250039100647, 0.3741789162158966, 0.3918328285217285, 0.40948671102523804, 0.42714059352874756, 0.44479450583457947, 0.4624484181404114, 0.4801023006439209, 0.4977561831474304, 0.5154100656509399, 0.5330640077590942, 0.5507178902626038, 0.5683717727661133, 0.5860257148742676, 0.6036795973777771, 0.6213334798812866]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 3.0, 1.0, 13.0, 12.0, 14.0, 15.0, 35.0, 41.0, 87.0, 150.0, 326.0, 775.0, 2721.0, 18347.0, 362345.0, 630818.0, 27589.0, 3529.0, 935.0, 356.0, 188.0, 86.0, 48.0, 32.0, 26.0, 13.0, 16.0, 5.0, 6.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8515625, -0.8241653442382812, -0.7967681884765625, -0.7693710327148438, -0.741973876953125, -0.7145767211914062, -0.6871795654296875, -0.6597824096679688, -0.63238525390625, -0.6049880981445312, -0.5775909423828125, -0.5501937866210938, -0.522796630859375, -0.49539947509765625, -0.4680023193359375, -0.44060516357421875, -0.4132080078125, -0.38581085205078125, -0.3584136962890625, -0.33101654052734375, -0.303619384765625, -0.27622222900390625, -0.2488250732421875, -0.22142791748046875, -0.19403076171875, -0.16663360595703125, -0.1392364501953125, -0.11183929443359375, -0.084442138671875, -0.05704498291015625, -0.0296478271484375, -0.00225067138671875, 0.025146484375, 0.05254364013671875, 0.0799407958984375, 0.10733795166015625, 0.134735107421875, 0.16213226318359375, 0.1895294189453125, 0.21692657470703125, 0.24432373046875, 0.27172088623046875, 0.2991180419921875, 0.32651519775390625, 0.353912353515625, 0.38130950927734375, 0.4087066650390625, 0.43610382080078125, 0.4635009765625, 0.49089813232421875, 0.5182952880859375, 0.5456924438476562, 0.573089599609375, 0.6004867553710938, 0.6278839111328125, 0.6552810668945312, 0.68267822265625, 0.7100753784179688, 0.7374725341796875, 0.7648696899414062, 0.792266845703125, 0.8196640014648438, 0.8470611572265625, 0.8744583129882812, 0.90185546875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 9.0, 8.0, 22.0, 34.0, 38.0, 65.0, 52.0, 68.0, 78.0, 119.0, 86.0, 74.0, 95.0, 66.0, 59.0, 40.0, 29.0, 18.0, 12.0, 18.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0772705078125, -0.07419395446777344, -0.07111740112304688, -0.06804084777832031, -0.06496429443359375, -0.06188774108886719, -0.058811187744140625, -0.05573463439941406, -0.0526580810546875, -0.04958152770996094, -0.046504974365234375, -0.04342842102050781, -0.04035186767578125, -0.03727531433105469, -0.034198760986328125, -0.031122207641601562, -0.028045654296875, -0.024969100952148438, -0.021892547607421875, -0.018815994262695312, -0.01573944091796875, -0.012662887573242188, -0.009586334228515625, -0.0065097808837890625, -0.0034332275390625, -0.0003566741943359375, 0.002719879150390625, 0.0057964324951171875, 0.00887298583984375, 0.011949539184570312, 0.015026092529296875, 0.018102645874023438, 0.02117919921875, 0.024255752563476562, 0.027332305908203125, 0.030408859252929688, 0.03348541259765625, 0.03656196594238281, 0.039638519287109375, 0.04271507263183594, 0.0457916259765625, 0.04886817932128906, 0.051944732666015625, 0.05502128601074219, 0.05809783935546875, 0.06117439270019531, 0.06425094604492188, 0.06732749938964844, 0.070404052734375, 0.07348060607910156, 0.07655715942382812, 0.07963371276855469, 0.08271026611328125, 0.08578681945800781, 0.08886337280273438, 0.09193992614746094, 0.0950164794921875, 0.09809303283691406, 0.10116958618164062, 0.10424613952636719, 0.10732269287109375, 0.11039924621582031, 0.11347579956054688, 0.11655235290527344, 0.11962890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 9.0, 5.0, 9.0, 9.0, 15.0, 27.0, 65.0, 119.0, 217.0, 490.0, 1152.0, 3067.0, 11226.0, 54622.0, 493793.0, 420034.0, 48474.0, 10272.0, 3002.0, 1067.0, 446.0, 200.0, 99.0, 48.0, 33.0, 14.0, 14.0, 4.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.395751953125, -0.3810768127441406, -0.36640167236328125, -0.3517265319824219, -0.3370513916015625, -0.3223762512207031, -0.30770111083984375, -0.2930259704589844, -0.278350830078125, -0.2636756896972656, -0.24900054931640625, -0.23432540893554688, -0.2196502685546875, -0.20497512817382812, -0.19029998779296875, -0.17562484741210938, -0.16094970703125, -0.14627456665039062, -0.13159942626953125, -0.11692428588867188, -0.1022491455078125, -0.08757400512695312, -0.07289886474609375, -0.058223724365234375, -0.043548583984375, -0.028873443603515625, -0.01419830322265625, 0.000476837158203125, 0.0151519775390625, 0.029827117919921875, 0.04450225830078125, 0.059177398681640625, 0.0738525390625, 0.08852767944335938, 0.10320281982421875, 0.11787796020507812, 0.1325531005859375, 0.14722824096679688, 0.16190338134765625, 0.17657852172851562, 0.191253662109375, 0.20592880249023438, 0.22060394287109375, 0.23527908325195312, 0.2499542236328125, 0.2646293640136719, 0.27930450439453125, 0.2939796447753906, 0.30865478515625, 0.3233299255371094, 0.33800506591796875, 0.3526802062988281, 0.3673553466796875, 0.3820304870605469, 0.39670562744140625, 0.4113807678222656, 0.426055908203125, 0.4407310485839844, 0.45540618896484375, 0.4700813293457031, 0.4847564697265625, 0.4994316101074219, 0.5141067504882812, 0.5287818908691406, 0.54345703125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 16.0, 9.0, 17.0, 14.0, 22.0, 30.0, 37.0, 45.0, 47.0, 48.0, 67.0, 48.0, 74.0, 60.0, 65.0, 69.0, 56.0, 64.0, 35.0, 39.0, 31.0, 22.0, 23.0, 11.0, 9.0, 7.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255615234375, -0.24627685546875, -0.2369384765625, -0.22760009765625, -0.21826171875, -0.20892333984375, -0.1995849609375, -0.19024658203125, -0.180908203125, -0.17156982421875, -0.1622314453125, -0.15289306640625, -0.1435546875, -0.13421630859375, -0.1248779296875, -0.11553955078125, -0.106201171875, -0.09686279296875, -0.0875244140625, -0.07818603515625, -0.06884765625, -0.05950927734375, -0.0501708984375, -0.04083251953125, -0.031494140625, -0.02215576171875, -0.0128173828125, -0.00347900390625, 0.005859375, 0.01519775390625, 0.0245361328125, 0.03387451171875, 0.043212890625, 0.05255126953125, 0.0618896484375, 0.07122802734375, 0.08056640625, 0.08990478515625, 0.0992431640625, 0.10858154296875, 0.117919921875, 0.12725830078125, 0.1365966796875, 0.14593505859375, 0.1552734375, 0.16461181640625, 0.1739501953125, 0.18328857421875, 0.192626953125, 0.20196533203125, 0.2113037109375, 0.22064208984375, 0.22998046875, 0.23931884765625, 0.2486572265625, 0.25799560546875, 0.267333984375, 0.27667236328125, 0.2860107421875, 0.29534912109375, 0.3046875, 0.31402587890625, 0.3233642578125, 0.33270263671875, 0.342041015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 7.0, 18.0, 29.0, 58.0, 92.0, 183.0, 414.0, 863.0, 2693.0, 10295.0, 62337.0, 890730.0, 65895.0, 10449.0, 2714.0, 954.0, 391.0, 164.0, 109.0, 55.0, 26.0, 24.0, 20.0, 10.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.376953125, -0.36716461181640625, -0.3573760986328125, -0.34758758544921875, -0.337799072265625, -0.32801055908203125, -0.3182220458984375, -0.30843353271484375, -0.29864501953125, -0.28885650634765625, -0.2790679931640625, -0.26927947998046875, -0.259490966796875, -0.24970245361328125, -0.2399139404296875, -0.23012542724609375, -0.2203369140625, -0.21054840087890625, -0.2007598876953125, -0.19097137451171875, -0.181182861328125, -0.17139434814453125, -0.1616058349609375, -0.15181732177734375, -0.14202880859375, -0.13224029541015625, -0.1224517822265625, -0.11266326904296875, -0.102874755859375, -0.09308624267578125, -0.0832977294921875, -0.07350921630859375, -0.063720703125, -0.05393218994140625, -0.0441436767578125, -0.03435516357421875, -0.024566650390625, -0.01477813720703125, -0.0049896240234375, 0.00479888916015625, 0.01458740234375, 0.02437591552734375, 0.0341644287109375, 0.04395294189453125, 0.053741455078125, 0.06352996826171875, 0.0733184814453125, 0.08310699462890625, 0.0928955078125, 0.10268402099609375, 0.1124725341796875, 0.12226104736328125, 0.132049560546875, 0.14183807373046875, 0.1516265869140625, 0.16141510009765625, 0.17120361328125, 0.18099212646484375, 0.1907806396484375, 0.20056915283203125, 0.210357666015625, 0.22014617919921875, 0.2299346923828125, 0.23972320556640625, 0.24951171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 13.0, 11.0, 6.0, 16.0, 24.0, 22.0, 36.0, 61.0, 86.0, 102.0, 133.0, 144.0, 98.0, 75.0, 32.0, 30.0, 24.0, 19.0, 15.0, 7.0, 4.0, 9.0, 6.0, 5.0, 3.0, 3.0, 0.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00019860267639160156, -0.0001937374472618103, -0.00018887221813201904, -0.00018400698900222778, -0.00017914175987243652, -0.00017427653074264526, -0.000169411301612854, -0.00016454607248306274, -0.00015968084335327148, -0.00015481561422348022, -0.00014995038509368896, -0.0001450851559638977, -0.00014021992683410645, -0.00013535469770431519, -0.00013048946857452393, -0.00012562423944473267, -0.0001207590103149414, -0.00011589378118515015, -0.00011102855205535889, -0.00010616332292556763, -0.00010129809379577637, -9.643286466598511e-05, -9.156763553619385e-05, -8.670240640640259e-05, -8.183717727661133e-05, -7.697194814682007e-05, -7.210671901702881e-05, -6.724148988723755e-05, -6.237626075744629e-05, -5.751103162765503e-05, -5.264580249786377e-05, -4.778057336807251e-05, -4.291534423828125e-05, -3.805011510848999e-05, -3.318488597869873e-05, -2.831965684890747e-05, -2.345442771911621e-05, -1.858919858932495e-05, -1.3723969459533691e-05, -8.858740329742432e-06, -3.993511199951172e-06, 8.717179298400879e-07, 5.736947059631348e-06, 1.0602176189422607e-05, 1.5467405319213867e-05, 2.0332634449005127e-05, 2.5197863578796387e-05, 3.0063092708587646e-05, 3.4928321838378906e-05, 3.9793550968170166e-05, 4.4658780097961426e-05, 4.9524009227752686e-05, 5.4389238357543945e-05, 5.9254467487335205e-05, 6.411969661712646e-05, 6.898492574691772e-05, 7.385015487670898e-05, 7.871538400650024e-05, 8.35806131362915e-05, 8.844584226608276e-05, 9.331107139587402e-05, 9.817630052566528e-05, 0.00010304152965545654, 0.0001079067587852478, 0.00011277198791503906]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 5.0, 7.0, 26.0, 40.0, 62.0, 115.0, 201.0, 476.0, 1205.0, 3729.0, 13609.0, 78408.0, 875967.0, 58500.0, 11187.0, 3050.0, 1062.0, 445.0, 204.0, 106.0, 54.0, 28.0, 19.0, 10.0, 13.0, 2.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.291748046875, -0.28275299072265625, -0.2737579345703125, -0.26476287841796875, -0.255767822265625, -0.24677276611328125, -0.2377777099609375, -0.22878265380859375, -0.21978759765625, -0.21079254150390625, -0.2017974853515625, -0.19280242919921875, -0.183807373046875, -0.17481231689453125, -0.1658172607421875, -0.15682220458984375, -0.1478271484375, -0.13883209228515625, -0.1298370361328125, -0.12084197998046875, -0.111846923828125, -0.10285186767578125, -0.0938568115234375, -0.08486175537109375, -0.07586669921875, -0.06687164306640625, -0.0578765869140625, -0.04888153076171875, -0.039886474609375, -0.03089141845703125, -0.0218963623046875, -0.01290130615234375, -0.00390625, 0.00508880615234375, 0.0140838623046875, 0.02307891845703125, 0.032073974609375, 0.04106903076171875, 0.0500640869140625, 0.05905914306640625, 0.06805419921875, 0.07704925537109375, 0.0860443115234375, 0.09503936767578125, 0.104034423828125, 0.11302947998046875, 0.1220245361328125, 0.13101959228515625, 0.1400146484375, 0.14900970458984375, 0.1580047607421875, 0.16699981689453125, 0.175994873046875, 0.18498992919921875, 0.1939849853515625, 0.20298004150390625, 0.21197509765625, 0.22097015380859375, 0.2299652099609375, 0.23896026611328125, 0.247955322265625, 0.25695037841796875, 0.2659454345703125, 0.27494049072265625, 0.283935546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 8.0, 13.0, 19.0, 23.0, 38.0, 67.0, 144.0, 288.0, 165.0, 81.0, 38.0, 26.0, 18.0, 15.0, 12.0, 10.0, 6.0, 6.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1688232421875, -0.1634960174560547, -0.15816879272460938, -0.15284156799316406, -0.14751434326171875, -0.14218711853027344, -0.13685989379882812, -0.1315326690673828, -0.1262054443359375, -0.12087821960449219, -0.11555099487304688, -0.11022377014160156, -0.10489654541015625, -0.09956932067871094, -0.09424209594726562, -0.08891487121582031, -0.083587646484375, -0.07826042175292969, -0.07293319702148438, -0.06760597229003906, -0.06227874755859375, -0.05695152282714844, -0.051624298095703125, -0.04629707336425781, -0.0409698486328125, -0.03564262390136719, -0.030315399169921875, -0.024988174438476562, -0.01966094970703125, -0.014333724975585938, -0.009006500244140625, -0.0036792755126953125, 0.00164794921875, 0.0069751739501953125, 0.012302398681640625, 0.017629623413085938, 0.02295684814453125, 0.028284072875976562, 0.033611297607421875, 0.03893852233886719, 0.0442657470703125, 0.04959297180175781, 0.054920196533203125, 0.06024742126464844, 0.06557464599609375, 0.07090187072753906, 0.07622909545898438, 0.08155632019042969, 0.086883544921875, 0.09221076965332031, 0.09753799438476562, 0.10286521911621094, 0.10819244384765625, 0.11351966857910156, 0.11884689331054688, 0.12417411804199219, 0.1295013427734375, 0.1348285675048828, 0.14015579223632812, 0.14548301696777344, 0.15081024169921875, 0.15613746643066406, 0.16146469116210938, 0.1667919158935547, 0.172119140625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 28.0, 80.0, 263.0, 363.0, 181.0, 46.0, 26.0, 9.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.628582954406738, -10.429034233093262, -10.229484558105469, -10.029935836791992, -9.8303861618042, -9.630837440490723, -9.43128776550293, -9.231739044189453, -9.032190322875977, -8.8326416015625, -8.633091926574707, -8.43354320526123, -8.233993530273438, -8.034444808959961, -7.834895610809326, -7.635346412658691, -7.435797214508057, -7.236248016357422, -7.036698818206787, -6.837149620056152, -6.637600898742676, -6.438051700592041, -6.238502502441406, -6.0389533042907715, -5.839404106140137, -5.639854907989502, -5.440305709838867, -5.240756988525391, -5.041207790374756, -4.841658592224121, -4.642109394073486, -4.442560195922852, -4.243011951446533, -4.043462753295898, -3.8439137935638428, -3.644364595413208, -3.4448156356811523, -3.2452664375305176, -3.045717239379883, -2.846168041229248, -2.6466190814971924, -2.4470698833465576, -2.247520923614502, -2.047971725463867, -1.848422646522522, -1.6488735675811768, -1.449324369430542, -1.2497752904891968, -1.0502262115478516, -0.8506771326065063, -0.6511279940605164, -0.45157885551452637, -0.25202977657318115, -0.05248069763183594, 0.14706850051879883, 0.34661757946014404, 0.5461666584014893, 0.7457157373428345, 0.9452648758888245, 1.1448140144348145, 1.3443630933761597, 1.5439121723175049, 1.7434613704681396, 1.9430104494094849, 2.14255952835083]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 2.0, 6.0, 5.0, 6.0, 10.0, 16.0, 21.0, 17.0, 23.0, 23.0, 34.0, 27.0, 40.0, 32.0, 44.0, 44.0, 49.0, 48.0, 43.0, 41.0, 46.0, 43.0, 47.0, 46.0, 45.0, 42.0, 31.0, 28.0, 28.0, 15.0, 17.0, 22.0, 8.0, 10.0, 10.0, 6.0, 9.0, 9.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2197015285491943, -1.1790683269500732, -1.1384351253509521, -1.097801923751831, -1.05716872215271, -1.0165355205535889, -0.9759023189544678, -0.9352691173553467, -0.8946359157562256, -0.8540027141571045, -0.8133695125579834, -0.7727363109588623, -0.7321031093597412, -0.6914699077606201, -0.650836706161499, -0.6102035045623779, -0.5695703029632568, -0.5289371013641357, -0.48830389976501465, -0.44767069816589355, -0.40703749656677246, -0.36640429496765137, -0.3257710933685303, -0.2851378917694092, -0.24450469017028809, -0.203871488571167, -0.1632382869720459, -0.1226050853729248, -0.08197188377380371, -0.04133868217468262, -0.0007054805755615234, 0.03992772102355957, 0.08056092262268066, 0.12119412422180176, 0.16182732582092285, 0.20246052742004395, 0.24309372901916504, 0.28372693061828613, 0.3243601322174072, 0.3649933338165283, 0.4056265354156494, 0.4462597370147705, 0.4868929386138916, 0.5275261402130127, 0.5681593418121338, 0.6087925434112549, 0.649425745010376, 0.6900589466094971, 0.7306921482086182, 0.7713253498077393, 0.8119585514068604, 0.8525917530059814, 0.8932249546051025, 0.9338581562042236, 0.9744913578033447, 1.0151245594024658, 1.055757761001587, 1.096390962600708, 1.137024164199829, 1.1776573657989502, 1.2182905673980713, 1.2589237689971924, 1.2995569705963135, 1.3401901721954346, 1.3808233737945557]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 7.0, 3.0, 6.0, 7.0, 15.0, 14.0, 21.0, 35.0, 53.0, 123.0, 261.0, 618.0, 1701.0, 6201.0, 35975.0, 4015942.0, 116554.0, 12134.0, 2889.0, 915.0, 336.0, 166.0, 94.0, 53.0, 38.0, 20.0, 19.0, 24.0, 7.0, 7.0, 11.0, 9.0, 1.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.96923828125, -0.9342727661132812, -0.8993072509765625, -0.8643417358398438, -0.829376220703125, -0.7944107055664062, -0.7594451904296875, -0.7244796752929688, -0.68951416015625, -0.6545486450195312, -0.6195831298828125, -0.5846176147460938, -0.549652099609375, -0.5146865844726562, -0.4797210693359375, -0.44475555419921875, -0.4097900390625, -0.37482452392578125, -0.3398590087890625, -0.30489349365234375, -0.269927978515625, -0.23496246337890625, -0.1999969482421875, -0.16503143310546875, -0.13006591796875, -0.09510040283203125, -0.0601348876953125, -0.02516937255859375, 0.009796142578125, 0.04476165771484375, 0.0797271728515625, 0.11469268798828125, 0.149658203125, 0.18462371826171875, 0.2195892333984375, 0.25455474853515625, 0.289520263671875, 0.32448577880859375, 0.3594512939453125, 0.39441680908203125, 0.42938232421875, 0.46434783935546875, 0.4993133544921875, 0.5342788696289062, 0.569244384765625, 0.6042098999023438, 0.6391754150390625, 0.6741409301757812, 0.7091064453125, 0.7440719604492188, 0.7790374755859375, 0.8140029907226562, 0.848968505859375, 0.8839340209960938, 0.9188995361328125, 0.9538650512695312, 0.98883056640625, 1.0237960815429688, 1.0587615966796875, 1.0937271118164062, 1.128692626953125, 1.1636581420898438, 1.1986236572265625, 1.2335891723632812, 1.2685546875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 15.0, 18.0, 17.0, 33.0, 50.0, 42.0, 61.0, 70.0, 73.0, 79.0, 82.0, 76.0, 78.0, 61.0, 52.0, 48.0, 36.0, 40.0, 18.0, 17.0, 6.0, 10.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07525634765625, -0.07249927520751953, -0.06974220275878906, -0.0669851303100586, -0.06422805786132812, -0.061470985412597656, -0.05871391296386719, -0.05595684051513672, -0.05319976806640625, -0.05044269561767578, -0.04768562316894531, -0.044928550720214844, -0.042171478271484375, -0.039414405822753906, -0.03665733337402344, -0.03390026092529297, -0.0311431884765625, -0.02838611602783203, -0.025629043579101562, -0.022871971130371094, -0.020114898681640625, -0.017357826232910156, -0.014600753784179688, -0.011843681335449219, -0.00908660888671875, -0.006329536437988281, -0.0035724639892578125, -0.0008153915405273438, 0.001941680908203125, 0.004698753356933594, 0.0074558258056640625, 0.010212898254394531, 0.012969970703125, 0.01572704315185547, 0.018484115600585938, 0.021241188049316406, 0.023998260498046875, 0.026755332946777344, 0.029512405395507812, 0.03226947784423828, 0.03502655029296875, 0.03778362274169922, 0.04054069519042969, 0.043297767639160156, 0.046054840087890625, 0.048811912536621094, 0.05156898498535156, 0.05432605743408203, 0.0570831298828125, 0.05984020233154297, 0.06259727478027344, 0.0653543472290039, 0.06811141967773438, 0.07086849212646484, 0.07362556457519531, 0.07638263702392578, 0.07913970947265625, 0.08189678192138672, 0.08465385437011719, 0.08741092681884766, 0.09016799926757812, 0.0929250717163086, 0.09568214416503906, 0.09843921661376953, 0.1011962890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 5.0, 5.0, 13.0, 9.0, 10.0, 14.0, 17.0, 16.0, 38.0, 46.0, 74.0, 114.0, 200.0, 377.0, 725.0, 1589.0, 3942.0, 12385.0, 59349.0, 3867411.0, 211903.0, 24654.0, 6737.0, 2449.0, 990.0, 477.0, 282.0, 148.0, 89.0, 45.0, 37.0, 26.0, 21.0, 20.0, 7.0, 10.0, 8.0, 13.0, 7.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.81201171875, -0.7872161865234375, -0.762420654296875, -0.7376251220703125, -0.71282958984375, -0.6880340576171875, -0.663238525390625, -0.6384429931640625, -0.6136474609375, -0.5888519287109375, -0.564056396484375, -0.5392608642578125, -0.51446533203125, -0.4896697998046875, -0.464874267578125, -0.4400787353515625, -0.415283203125, -0.3904876708984375, -0.365692138671875, -0.3408966064453125, -0.31610107421875, -0.2913055419921875, -0.266510009765625, -0.2417144775390625, -0.2169189453125, -0.1921234130859375, -0.167327880859375, -0.1425323486328125, -0.11773681640625, -0.0929412841796875, -0.068145751953125, -0.0433502197265625, -0.0185546875, 0.0062408447265625, 0.031036376953125, 0.0558319091796875, 0.08062744140625, 0.1054229736328125, 0.130218505859375, 0.1550140380859375, 0.1798095703125, 0.2046051025390625, 0.229400634765625, 0.2541961669921875, 0.27899169921875, 0.3037872314453125, 0.328582763671875, 0.3533782958984375, 0.378173828125, 0.4029693603515625, 0.427764892578125, 0.4525604248046875, 0.47735595703125, 0.5021514892578125, 0.526947021484375, 0.5517425537109375, 0.5765380859375, 0.6013336181640625, 0.626129150390625, 0.6509246826171875, 0.67572021484375, 0.7005157470703125, 0.725311279296875, 0.7501068115234375, 0.77490234375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 2.0, 9.0, 19.0, 22.0, 39.0, 62.0, 111.0, 386.0, 2973.0, 226.0, 99.0, 37.0, 24.0, 19.0, 9.0, 9.0, 5.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.372802734375, -0.36458587646484375, -0.3563690185546875, -0.34815216064453125, -0.339935302734375, -0.33171844482421875, -0.3235015869140625, -0.31528472900390625, -0.30706787109375, -0.29885101318359375, -0.2906341552734375, -0.28241729736328125, -0.274200439453125, -0.26598358154296875, -0.2577667236328125, -0.24954986572265625, -0.2413330078125, -0.23311614990234375, -0.2248992919921875, -0.21668243408203125, -0.208465576171875, -0.20024871826171875, -0.1920318603515625, -0.18381500244140625, -0.17559814453125, -0.16738128662109375, -0.1591644287109375, -0.15094757080078125, -0.142730712890625, -0.13451385498046875, -0.1262969970703125, -0.11808013916015625, -0.10986328125, -0.10164642333984375, -0.0934295654296875, -0.08521270751953125, -0.076995849609375, -0.06877899169921875, -0.0605621337890625, -0.05234527587890625, -0.04412841796875, -0.03591156005859375, -0.0276947021484375, -0.01947784423828125, -0.011260986328125, -0.00304412841796875, 0.0051727294921875, 0.01338958740234375, 0.0216064453125, 0.02982330322265625, 0.0380401611328125, 0.04625701904296875, 0.054473876953125, 0.06269073486328125, 0.0709075927734375, 0.07912445068359375, 0.08734130859375, 0.09555816650390625, 0.1037750244140625, 0.11199188232421875, 0.120208740234375, 0.12842559814453125, 0.1366424560546875, 0.14485931396484375, 0.153076171875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 7.0, 6.0, 25.0, 68.0, 182.0, 339.0, 229.0, 94.0, 25.0, 10.0, 11.0, 7.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5613980293273926, -2.493518114089966, -2.425638437271118, -2.3577585220336914, -2.2898788452148438, -2.221998929977417, -2.1541192531585693, -2.0862393379211426, -2.018359661102295, -1.9504798650741577, -1.8826000690460205, -1.8147202730178833, -1.746840476989746, -1.6789606809616089, -1.6110808849334717, -1.543200969696045, -1.4753211736679077, -1.4074413776397705, -1.3395615816116333, -1.271681785583496, -1.2038019895553589, -1.1359221935272217, -1.068042278289795, -1.0001626014709473, -0.9322827458381653, -0.8644029498100281, -0.7965231537818909, -0.7286432981491089, -0.6607635021209717, -0.5928837060928345, -0.5250039100646973, -0.45712411403656006, -0.3892444372177124, -0.3213646411895752, -0.253484845161438, -0.1856050193309784, -0.11772522330284119, -0.04984542727470398, 0.018034398555755615, 0.08591419458389282, 0.15379399061203003, 0.22167378664016724, 0.28955358266830444, 0.35743340849876404, 0.42531320452690125, 0.49319300055503845, 0.561072826385498, 0.6289526224136353, 0.6968324184417725, 0.7647122144699097, 0.8325920104980469, 0.9004718065261841, 0.9683516025543213, 1.0362313985824585, 1.1041111946105957, 1.1719911098480225, 1.2398707866668701, 1.3077505826950073, 1.3756303787231445, 1.4435101747512817, 1.511389970779419, 1.5792697668075562, 1.6471495628356934, 1.7150294780731201, 1.7829092741012573]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 3.0, 4.0, 7.0, 4.0, 8.0, 14.0, 18.0, 28.0, 37.0, 45.0, 40.0, 39.0, 61.0, 80.0, 51.0, 82.0, 62.0, 53.0, 76.0, 42.0, 56.0, 43.0, 40.0, 31.0, 16.0, 16.0, 12.0, 4.0, 12.0, 5.0, 4.0, 3.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6327791213989258, -0.6119665503501892, -0.5911539196968079, -0.5703413486480713, -0.5495287179946899, -0.5287161469459534, -0.507903516292572, -0.48709094524383545, -0.4662783443927765, -0.44546574354171753, -0.42465314269065857, -0.4038405418395996, -0.38302797079086304, -0.3622153401374817, -0.3414027690887451, -0.32059016823768616, -0.2997775673866272, -0.27896496653556824, -0.2581523656845093, -0.2373397797346115, -0.21652717888355255, -0.1957145780324936, -0.17490199208259583, -0.15408939123153687, -0.1332767903804779, -0.11246418952941895, -0.09165159612894058, -0.07083900272846222, -0.05002640187740326, -0.0292138010263443, -0.008401207625865936, 0.012411385774612427, 0.03322392702102661, 0.05403652414679527, 0.07484912127256393, 0.0956617146730423, 0.11647431552410126, 0.13728691637516022, 0.15809950232505798, 0.17891210317611694, 0.1997247040271759, 0.22053730487823486, 0.24134990572929382, 0.2621625065803528, 0.28297507762908936, 0.3037877082824707, 0.3246002793312073, 0.34541288018226624, 0.3662254810333252, 0.38703808188438416, 0.4078506827354431, 0.4286632835865021, 0.44947588443756104, 0.4702884554862976, 0.49110105633735657, 0.5119136571884155, 0.5327262878417969, 0.5535388588905334, 0.5743514895439148, 0.5951640605926514, 0.6159766912460327, 0.6367892622947693, 0.6576018929481506, 0.6784144639968872, 0.6992270350456238]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 15.0, 21.0, 11.0, 28.0, 31.0, 66.0, 87.0, 172.0, 347.0, 829.0, 2662.0, 12221.0, 98901.0, 763646.0, 148138.0, 16142.0, 3391.0, 1000.0, 363.0, 188.0, 91.0, 48.0, 43.0, 30.0, 21.0, 7.0, 8.0, 7.0, 7.0, 8.0, 4.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8798828125, -0.852020263671875, -0.82415771484375, -0.796295166015625, -0.7684326171875, -0.740570068359375, -0.71270751953125, -0.684844970703125, -0.656982421875, -0.629119873046875, -0.60125732421875, -0.573394775390625, -0.5455322265625, -0.517669677734375, -0.48980712890625, -0.461944580078125, -0.43408203125, -0.406219482421875, -0.37835693359375, -0.350494384765625, -0.3226318359375, -0.294769287109375, -0.26690673828125, -0.239044189453125, -0.211181640625, -0.183319091796875, -0.15545654296875, -0.127593994140625, -0.0997314453125, -0.071868896484375, -0.04400634765625, -0.016143798828125, 0.01171875, 0.039581298828125, 0.06744384765625, 0.095306396484375, 0.1231689453125, 0.151031494140625, 0.17889404296875, 0.206756591796875, 0.234619140625, 0.262481689453125, 0.29034423828125, 0.318206787109375, 0.3460693359375, 0.373931884765625, 0.40179443359375, 0.429656982421875, 0.45751953125, 0.485382080078125, 0.51324462890625, 0.541107177734375, 0.5689697265625, 0.596832275390625, 0.62469482421875, 0.652557373046875, 0.680419921875, 0.708282470703125, 0.73614501953125, 0.764007568359375, 0.7918701171875, 0.819732666015625, 0.84759521484375, 0.875457763671875, 0.9033203125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 4.0, 15.0, 13.0, 23.0, 30.0, 36.0, 42.0, 61.0, 65.0, 75.0, 86.0, 74.0, 75.0, 74.0, 65.0, 58.0, 43.0, 42.0, 34.0, 29.0, 19.0, 17.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07855224609375, -0.07559490203857422, -0.07263755798339844, -0.06968021392822266, -0.06672286987304688, -0.0637655258178711, -0.06080818176269531, -0.05785083770751953, -0.05489349365234375, -0.05193614959716797, -0.04897880554199219, -0.046021461486816406, -0.043064117431640625, -0.040106773376464844, -0.03714942932128906, -0.03419208526611328, -0.0312347412109375, -0.02827739715576172, -0.025320053100585938, -0.022362709045410156, -0.019405364990234375, -0.016448020935058594, -0.013490676879882812, -0.010533332824707031, -0.00757598876953125, -0.004618644714355469, -0.0016613006591796875, 0.0012960433959960938, 0.004253387451171875, 0.007210731506347656, 0.010168075561523438, 0.013125419616699219, 0.016082763671875, 0.01904010772705078, 0.021997451782226562, 0.024954795837402344, 0.027912139892578125, 0.030869483947753906, 0.03382682800292969, 0.03678417205810547, 0.03974151611328125, 0.04269886016845703, 0.04565620422363281, 0.048613548278808594, 0.051570892333984375, 0.054528236389160156, 0.05748558044433594, 0.06044292449951172, 0.0634002685546875, 0.06635761260986328, 0.06931495666503906, 0.07227230072021484, 0.07522964477539062, 0.0781869888305664, 0.08114433288574219, 0.08410167694091797, 0.08705902099609375, 0.09001636505126953, 0.09297370910644531, 0.0959310531616211, 0.09888839721679688, 0.10184574127197266, 0.10480308532714844, 0.10776042938232422, 0.1107177734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 10.0, 15.0, 22.0, 34.0, 58.0, 102.0, 188.0, 310.0, 714.0, 1711.0, 4489.0, 15055.0, 59394.0, 303487.0, 521364.0, 105999.0, 24301.0, 7025.0, 2359.0, 922.0, 434.0, 217.0, 123.0, 71.0, 50.0, 30.0, 25.0, 12.0, 5.0, 11.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5419921875, -0.529144287109375, -0.51629638671875, -0.503448486328125, -0.4906005859375, -0.477752685546875, -0.46490478515625, -0.452056884765625, -0.439208984375, -0.426361083984375, -0.41351318359375, -0.400665283203125, -0.3878173828125, -0.374969482421875, -0.36212158203125, -0.349273681640625, -0.33642578125, -0.323577880859375, -0.31072998046875, -0.297882080078125, -0.2850341796875, -0.272186279296875, -0.25933837890625, -0.246490478515625, -0.233642578125, -0.220794677734375, -0.20794677734375, -0.195098876953125, -0.1822509765625, -0.169403076171875, -0.15655517578125, -0.143707275390625, -0.130859375, -0.118011474609375, -0.10516357421875, -0.092315673828125, -0.0794677734375, -0.066619873046875, -0.05377197265625, -0.040924072265625, -0.028076171875, -0.015228271484375, -0.00238037109375, 0.010467529296875, 0.0233154296875, 0.036163330078125, 0.04901123046875, 0.061859130859375, 0.07470703125, 0.087554931640625, 0.10040283203125, 0.113250732421875, 0.1260986328125, 0.138946533203125, 0.15179443359375, 0.164642333984375, 0.177490234375, 0.190338134765625, 0.20318603515625, 0.216033935546875, 0.2288818359375, 0.241729736328125, 0.25457763671875, 0.267425537109375, 0.2802734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 8.0, 10.0, 15.0, 15.0, 17.0, 14.0, 27.0, 30.0, 35.0, 44.0, 40.0, 45.0, 59.0, 48.0, 48.0, 47.0, 47.0, 57.0, 45.0, 47.0, 49.0, 35.0, 34.0, 30.0, 31.0, 29.0, 18.0, 9.0, 14.0, 15.0, 7.0, 10.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.314208984375, -0.30422210693359375, -0.2942352294921875, -0.28424835205078125, -0.274261474609375, -0.26427459716796875, -0.2542877197265625, -0.24430084228515625, -0.23431396484375, -0.22432708740234375, -0.2143402099609375, -0.20435333251953125, -0.194366455078125, -0.18437957763671875, -0.1743927001953125, -0.16440582275390625, -0.1544189453125, -0.14443206787109375, -0.1344451904296875, -0.12445831298828125, -0.114471435546875, -0.10448455810546875, -0.0944976806640625, -0.08451080322265625, -0.07452392578125, -0.06453704833984375, -0.0545501708984375, -0.04456329345703125, -0.034576416015625, -0.02458953857421875, -0.0146026611328125, -0.00461578369140625, 0.00537109375, 0.01535797119140625, 0.0253448486328125, 0.03533172607421875, 0.045318603515625, 0.05530548095703125, 0.0652923583984375, 0.07527923583984375, 0.08526611328125, 0.09525299072265625, 0.1052398681640625, 0.11522674560546875, 0.125213623046875, 0.13520050048828125, 0.1451873779296875, 0.15517425537109375, 0.1651611328125, 0.17514801025390625, 0.1851348876953125, 0.19512176513671875, 0.205108642578125, 0.21509552001953125, 0.2250823974609375, 0.23506927490234375, 0.24505615234375, 0.25504302978515625, 0.2650299072265625, 0.27501678466796875, 0.285003662109375, 0.29499053955078125, 0.3049774169921875, 0.31496429443359375, 0.324951171875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 4.0, 6.0, 7.0, 13.0, 17.0, 26.0, 49.0, 46.0, 74.0, 125.0, 199.0, 348.0, 633.0, 1236.0, 2551.0, 6326.0, 17485.0, 65115.0, 351606.0, 488160.0, 80564.0, 20942.0, 7122.0, 2851.0, 1369.0, 714.0, 363.0, 223.0, 126.0, 74.0, 52.0, 43.0, 26.0, 18.0, 10.0, 13.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.174072265625, -0.16787147521972656, -0.16167068481445312, -0.1554698944091797, -0.14926910400390625, -0.1430683135986328, -0.13686752319335938, -0.13066673278808594, -0.1244659423828125, -0.11826515197753906, -0.11206436157226562, -0.10586357116699219, -0.09966278076171875, -0.09346199035644531, -0.08726119995117188, -0.08106040954589844, -0.074859619140625, -0.06865882873535156, -0.062458038330078125, -0.05625724792480469, -0.05005645751953125, -0.04385566711425781, -0.037654876708984375, -0.03145408630371094, -0.0252532958984375, -0.019052505493164062, -0.012851715087890625, -0.0066509246826171875, -0.00045013427734375, 0.0057506561279296875, 0.011951446533203125, 0.018152236938476562, 0.02435302734375, 0.030553817749023438, 0.036754608154296875, 0.04295539855957031, 0.04915618896484375, 0.05535697937011719, 0.061557769775390625, 0.06775856018066406, 0.0739593505859375, 0.08016014099121094, 0.08636093139648438, 0.09256172180175781, 0.09876251220703125, 0.10496330261230469, 0.11116409301757812, 0.11736488342285156, 0.123565673828125, 0.12976646423339844, 0.13596725463867188, 0.1421680450439453, 0.14836883544921875, 0.1545696258544922, 0.16077041625976562, 0.16697120666503906, 0.1731719970703125, 0.17937278747558594, 0.18557357788085938, 0.1917743682861328, 0.19797515869140625, 0.2041759490966797, 0.21037673950195312, 0.21657752990722656, 0.2227783203125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 9.0, 9.0, 8.0, 9.0, 11.0, 13.0, 16.0, 32.0, 33.0, 38.0, 51.0, 79.0, 78.0, 96.0, 107.0, 98.0, 68.0, 44.0, 34.0, 36.0, 28.0, 19.0, 15.0, 12.0, 12.0, 10.0, 7.0, 11.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00018644332885742188, -0.00018140673637390137, -0.00017637014389038086, -0.00017133355140686035, -0.00016629695892333984, -0.00016126036643981934, -0.00015622377395629883, -0.00015118718147277832, -0.0001461505889892578, -0.0001411139965057373, -0.0001360774040222168, -0.0001310408115386963, -0.00012600421905517578, -0.00012096762657165527, -0.00011593103408813477, -0.00011089444160461426, -0.00010585784912109375, -0.00010082125663757324, -9.578466415405273e-05, -9.074807167053223e-05, -8.571147918701172e-05, -8.067488670349121e-05, -7.56382942199707e-05, -7.06017017364502e-05, -6.556510925292969e-05, -6.052851676940918e-05, -5.549192428588867e-05, -5.0455331802368164e-05, -4.5418739318847656e-05, -4.038214683532715e-05, -3.534555435180664e-05, -3.0308961868286133e-05, -2.5272369384765625e-05, -2.0235776901245117e-05, -1.519918441772461e-05, -1.0162591934204102e-05, -5.125999450683594e-06, -8.940696716308594e-08, 4.947185516357422e-06, 9.98377799987793e-06, 1.5020370483398438e-05, 2.0056962966918945e-05, 2.5093555450439453e-05, 3.013014793395996e-05, 3.516674041748047e-05, 4.0203332901000977e-05, 4.5239925384521484e-05, 5.027651786804199e-05, 5.53131103515625e-05, 6.034970283508301e-05, 6.538629531860352e-05, 7.042288780212402e-05, 7.545948028564453e-05, 8.049607276916504e-05, 8.553266525268555e-05, 9.056925773620605e-05, 9.560585021972656e-05, 0.00010064244270324707, 0.00010567903518676758, 0.00011071562767028809, 0.0001157522201538086, 0.0001207888126373291, 0.0001258254051208496, 0.00013086199760437012, 0.00013589859008789062]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 6.0, 8.0, 19.0, 24.0, 29.0, 33.0, 53.0, 106.0, 150.0, 326.0, 604.0, 1203.0, 2724.0, 6288.0, 16733.0, 55144.0, 251632.0, 557433.0, 109253.0, 29324.0, 9766.0, 3891.0, 1878.0, 862.0, 429.0, 218.0, 140.0, 83.0, 62.0, 34.0, 26.0, 13.0, 9.0, 6.0, 5.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.21533203125, -0.20885467529296875, -0.2023773193359375, -0.19589996337890625, -0.189422607421875, -0.18294525146484375, -0.1764678955078125, -0.16999053955078125, -0.16351318359375, -0.15703582763671875, -0.1505584716796875, -0.14408111572265625, -0.137603759765625, -0.13112640380859375, -0.1246490478515625, -0.11817169189453125, -0.1116943359375, -0.10521697998046875, -0.0987396240234375, -0.09226226806640625, -0.085784912109375, -0.07930755615234375, -0.0728302001953125, -0.06635284423828125, -0.05987548828125, -0.05339813232421875, -0.0469207763671875, -0.04044342041015625, -0.033966064453125, -0.02748870849609375, -0.0210113525390625, -0.01453399658203125, -0.008056640625, -0.00157928466796875, 0.0048980712890625, 0.01137542724609375, 0.017852783203125, 0.02433013916015625, 0.0308074951171875, 0.03728485107421875, 0.04376220703125, 0.05023956298828125, 0.0567169189453125, 0.06319427490234375, 0.069671630859375, 0.07614898681640625, 0.0826263427734375, 0.08910369873046875, 0.0955810546875, 0.10205841064453125, 0.1085357666015625, 0.11501312255859375, 0.121490478515625, 0.12796783447265625, 0.1344451904296875, 0.14092254638671875, 0.14739990234375, 0.15387725830078125, 0.1603546142578125, 0.16683197021484375, 0.173309326171875, 0.17978668212890625, 0.1862640380859375, 0.19274139404296875, 0.19921875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 7.0, 12.0, 8.0, 13.0, 4.0, 24.0, 15.0, 30.0, 33.0, 41.0, 34.0, 66.0, 100.0, 84.0, 112.0, 84.0, 48.0, 43.0, 44.0, 23.0, 20.0, 20.0, 22.0, 16.0, 15.0, 16.0, 12.0, 2.0, 6.0, 10.0, 5.0, 3.0, 1.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1632080078125, -0.15826034545898438, -0.15331268310546875, -0.14836502075195312, -0.1434173583984375, -0.13846969604492188, -0.13352203369140625, -0.12857437133789062, -0.123626708984375, -0.11867904663085938, -0.11373138427734375, -0.10878372192382812, -0.1038360595703125, -0.09888839721679688, -0.09394073486328125, -0.08899307250976562, -0.08404541015625, -0.07909774780273438, -0.07415008544921875, -0.06920242309570312, -0.0642547607421875, -0.059307098388671875, -0.05435943603515625, -0.049411773681640625, -0.044464111328125, -0.039516448974609375, -0.03456878662109375, -0.029621124267578125, -0.0246734619140625, -0.019725799560546875, -0.01477813720703125, -0.009830474853515625, -0.0048828125, 6.4849853515625e-05, 0.00501251220703125, 0.009960174560546875, 0.0149078369140625, 0.019855499267578125, 0.02480316162109375, 0.029750823974609375, 0.034698486328125, 0.039646148681640625, 0.04459381103515625, 0.049541473388671875, 0.0544891357421875, 0.059436798095703125, 0.06438446044921875, 0.06933212280273438, 0.07427978515625, 0.07922744750976562, 0.08417510986328125, 0.08912277221679688, 0.0940704345703125, 0.09901809692382812, 0.10396575927734375, 0.10891342163085938, 0.113861083984375, 0.11880874633789062, 0.12375640869140625, 0.12870407104492188, 0.1336517333984375, 0.13859939575195312, 0.14354705810546875, 0.14849472045898438, 0.1534423828125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 11.0, 18.0, 28.0, 41.0, 80.0, 124.0, 133.0, 169.0, 128.0, 79.0, 62.0, 42.0, 33.0, 20.0, 10.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5010337829589844, -1.399809718132019, -1.2985855340957642, -1.1973614692687988, -1.096137285232544, -0.9949132204055786, -0.8936890959739685, -0.7924649715423584, -0.6912408471107483, -0.5900167226791382, -0.4887925982475281, -0.38756850361824036, -0.28634437918663025, -0.18512028455734253, -0.08389616012573242, 0.017327964305877686, 0.11855208873748779, 0.2197762131690979, 0.321000337600708, 0.4222244322299957, 0.5234485864639282, 0.6246726512908936, 0.7258967757225037, 0.8271209001541138, 0.9283450245857239, 1.029569149017334, 1.1307932138442993, 1.2320173978805542, 1.3332414627075195, 1.4344656467437744, 1.5356897115707397, 1.636913776397705, 1.73813796043396, 1.8393620252609253, 1.9405862092971802, 2.0418102741241455, 2.1430344581604004, 2.244258403778076, 2.345482587814331, 2.446706771850586, 2.547930955886841, 2.6491551399230957, 2.7503790855407715, 2.8516032695770264, 2.9528274536132812, 3.054051399230957, 3.155275583267212, 3.256499767303467, 3.3577237129211426, 3.4589478969573975, 3.5601718425750732, 3.661396026611328, 3.762620210647583, 3.863844394683838, 3.9650683403015137, 4.066292762756348, 4.167516708374023, 4.268740653991699, 4.369965076446533, 4.471189022064209, 4.572412967681885, 4.673637390136719, 4.7748613357543945, 4.87608528137207, 4.977309703826904]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 2.0, 6.0, 7.0, 5.0, 6.0, 8.0, 9.0, 4.0, 16.0, 12.0, 19.0, 12.0, 25.0, 24.0, 27.0, 29.0, 27.0, 47.0, 41.0, 37.0, 36.0, 42.0, 33.0, 37.0, 49.0, 43.0, 36.0, 34.0, 32.0, 31.0, 42.0, 32.0, 33.0, 25.0, 20.0, 19.0, 12.0, 16.0, 8.0, 8.0, 6.0, 12.0, 9.0, 7.0, 7.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.6171629428863525, -1.565836787223816, -1.5145106315612793, -1.4631845951080322, -1.4118584394454956, -1.360532283782959, -1.309206247329712, -1.2578800916671753, -1.2065539360046387, -1.155227780342102, -1.1039016246795654, -1.0525755882263184, -1.0012494325637817, -0.9499232769012451, -0.8985971808433533, -0.8472710847854614, -0.7959449291229248, -0.7446187734603882, -0.6932926774024963, -0.6419665813446045, -0.5906404256820679, -0.5393142700195312, -0.4879881739616394, -0.43666204810142517, -0.38533592224121094, -0.3340097963809967, -0.28268367052078247, -0.23135754466056824, -0.180031418800354, -0.12870529294013977, -0.07737916707992554, -0.026053041219711304, 0.02527296543121338, 0.07659909129142761, 0.12792521715164185, 0.17925134301185608, 0.2305774688720703, 0.28190359473228455, 0.3332297205924988, 0.384555846452713, 0.43588197231292725, 0.4872080981731415, 0.5385342240333557, 0.5898603200912476, 0.6411864757537842, 0.6925126314163208, 0.7438387274742126, 0.7951648235321045, 0.8464909791946411, 0.8978171348571777, 0.9491432309150696, 1.0004693269729614, 1.051795482635498, 1.1031216382980347, 1.1544477939605713, 1.2057738304138184, 1.257099986076355, 1.3084261417388916, 1.3597521781921387, 1.4110783338546753, 1.462404489517212, 1.5137306451797485, 1.5650568008422852, 1.6163828372955322, 1.6677089929580688]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 7.0, 8.0, 16.0, 17.0, 28.0, 44.0, 84.0, 145.0, 286.0, 758.0, 2376.0, 10032.0, 129398.0, 4002162.0, 40995.0, 5483.0, 1410.0, 486.0, 210.0, 114.0, 59.0, 44.0, 26.0, 20.0, 11.0, 10.0, 11.0, 8.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0966796875, -1.055023193359375, -1.01336669921875, -0.971710205078125, -0.9300537109375, -0.888397216796875, -0.84674072265625, -0.805084228515625, -0.763427734375, -0.721771240234375, -0.68011474609375, -0.638458251953125, -0.5968017578125, -0.555145263671875, -0.51348876953125, -0.471832275390625, -0.43017578125, -0.388519287109375, -0.34686279296875, -0.305206298828125, -0.2635498046875, -0.221893310546875, -0.18023681640625, -0.138580322265625, -0.096923828125, -0.055267333984375, -0.01361083984375, 0.028045654296875, 0.0697021484375, 0.111358642578125, 0.15301513671875, 0.194671630859375, 0.236328125, 0.277984619140625, 0.31964111328125, 0.361297607421875, 0.4029541015625, 0.444610595703125, 0.48626708984375, 0.527923583984375, 0.569580078125, 0.611236572265625, 0.65289306640625, 0.694549560546875, 0.7362060546875, 0.777862548828125, 0.81951904296875, 0.861175537109375, 0.90283203125, 0.944488525390625, 0.98614501953125, 1.027801513671875, 1.0694580078125, 1.111114501953125, 1.15277099609375, 1.194427490234375, 1.236083984375, 1.277740478515625, 1.31939697265625, 1.361053466796875, 1.4027099609375, 1.444366455078125, 1.48602294921875, 1.527679443359375, 1.5693359375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 9.0, 9.0, 6.0, 9.0, 13.0, 16.0, 22.0, 31.0, 30.0, 46.0, 44.0, 37.0, 65.0, 74.0, 66.0, 59.0, 57.0, 69.0, 60.0, 65.0, 51.0, 49.0, 31.0, 17.0, 17.0, 15.0, 20.0, 10.0, 2.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07684326171875, -0.07402515411376953, -0.07120704650878906, -0.0683889389038086, -0.06557083129882812, -0.06275272369384766, -0.05993461608886719, -0.05711650848388672, -0.05429840087890625, -0.05148029327392578, -0.04866218566894531, -0.045844078063964844, -0.043025970458984375, -0.040207862854003906, -0.03738975524902344, -0.03457164764404297, -0.0317535400390625, -0.02893543243408203, -0.026117324829101562, -0.023299217224121094, -0.020481109619140625, -0.017663002014160156, -0.014844894409179688, -0.012026786804199219, -0.00920867919921875, -0.006390571594238281, -0.0035724639892578125, -0.0007543563842773438, 0.002063751220703125, 0.004881858825683594, 0.0076999664306640625, 0.010518074035644531, 0.013336181640625, 0.01615428924560547, 0.018972396850585938, 0.021790504455566406, 0.024608612060546875, 0.027426719665527344, 0.030244827270507812, 0.03306293487548828, 0.03588104248046875, 0.03869915008544922, 0.04151725769042969, 0.044335365295410156, 0.047153472900390625, 0.049971580505371094, 0.05278968811035156, 0.05560779571533203, 0.0584259033203125, 0.06124401092529297, 0.06406211853027344, 0.0668802261352539, 0.06969833374023438, 0.07251644134521484, 0.07533454895019531, 0.07815265655517578, 0.08097076416015625, 0.08378887176513672, 0.08660697937011719, 0.08942508697509766, 0.09224319458007812, 0.0950613021850586, 0.09787940979003906, 0.10069751739501953, 0.103515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 3.0, 2.0, 12.0, 10.0, 12.0, 14.0, 29.0, 43.0, 70.0, 59.0, 101.0, 100.0, 137.0, 219.0, 314.0, 442.0, 615.0, 1017.0, 1556.0, 2413.0, 4026.0, 6862.0, 12198.0, 24668.0, 55800.0, 164070.0, 1869652.0, 1776967.0, 162186.0, 55782.0, 24607.0, 12261.0, 6836.0, 3974.0, 2513.0, 1524.0, 961.0, 646.0, 458.0, 307.0, 188.0, 179.0, 123.0, 89.0, 59.0, 47.0, 40.0, 30.0, 19.0, 18.0, 9.0, 7.0, 9.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.29248046875, -0.2827301025390625, -0.272979736328125, -0.2632293701171875, -0.25347900390625, -0.2437286376953125, -0.233978271484375, -0.2242279052734375, -0.2144775390625, -0.2047271728515625, -0.194976806640625, -0.1852264404296875, -0.17547607421875, -0.1657257080078125, -0.155975341796875, -0.1462249755859375, -0.136474609375, -0.1267242431640625, -0.116973876953125, -0.1072235107421875, -0.09747314453125, -0.0877227783203125, -0.077972412109375, -0.0682220458984375, -0.0584716796875, -0.0487213134765625, -0.038970947265625, -0.0292205810546875, -0.01947021484375, -0.0097198486328125, 3.0517578125e-05, 0.0097808837890625, 0.01953125, 0.0292816162109375, 0.039031982421875, 0.0487823486328125, 0.05853271484375, 0.0682830810546875, 0.078033447265625, 0.0877838134765625, 0.0975341796875, 0.1072845458984375, 0.117034912109375, 0.1267852783203125, 0.13653564453125, 0.1462860107421875, 0.156036376953125, 0.1657867431640625, 0.175537109375, 0.1852874755859375, 0.195037841796875, 0.2047882080078125, 0.21453857421875, 0.2242889404296875, 0.234039306640625, 0.2437896728515625, 0.2535400390625, 0.2632904052734375, 0.273040771484375, 0.2827911376953125, 0.29254150390625, 0.3022918701171875, 0.312042236328125, 0.3217926025390625, 0.33154296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 7.0, 4.0, 7.0, 11.0, 8.0, 18.0, 22.0, 31.0, 33.0, 59.0, 61.0, 92.0, 151.0, 326.0, 973.0, 1419.0, 317.0, 172.0, 105.0, 70.0, 48.0, 29.0, 35.0, 16.0, 14.0, 7.0, 7.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.178466796875, -0.17211341857910156, -0.16576004028320312, -0.1594066619873047, -0.15305328369140625, -0.1466999053955078, -0.14034652709960938, -0.13399314880371094, -0.1276397705078125, -0.12128639221191406, -0.11493301391601562, -0.10857963562011719, -0.10222625732421875, -0.09587287902832031, -0.08951950073242188, -0.08316612243652344, -0.076812744140625, -0.07045936584472656, -0.06410598754882812, -0.05775260925292969, -0.05139923095703125, -0.04504585266113281, -0.038692474365234375, -0.03233909606933594, -0.0259857177734375, -0.019632339477539062, -0.013278961181640625, -0.0069255828857421875, -0.00057220458984375, 0.0057811737060546875, 0.012134552001953125, 0.018487930297851562, 0.02484130859375, 0.031194686889648438, 0.037548065185546875, 0.04390144348144531, 0.05025482177734375, 0.05660820007324219, 0.06296157836914062, 0.06931495666503906, 0.0756683349609375, 0.08202171325683594, 0.08837509155273438, 0.09472846984863281, 0.10108184814453125, 0.10743522644042969, 0.11378860473632812, 0.12014198303222656, 0.126495361328125, 0.13284873962402344, 0.13920211791992188, 0.1455554962158203, 0.15190887451171875, 0.1582622528076172, 0.16461563110351562, 0.17096900939941406, 0.1773223876953125, 0.18367576599121094, 0.19002914428710938, 0.1963825225830078, 0.20273590087890625, 0.2090892791748047, 0.21544265747070312, 0.22179603576660156, 0.2281494140625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 16.0, 47.0, 118.0, 271.0, 318.0, 159.0, 56.0, 8.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.373052597045898, -6.235969543457031, -6.098886966705322, -5.961804389953613, -5.824721336364746, -5.687638282775879, -5.55055570602417, -5.413473129272461, -5.276390075683594, -5.139307022094727, -5.002224445343018, -4.865141868591309, -4.728058815002441, -4.590975761413574, -4.453893184661865, -4.316810607910156, -4.179727554321289, -4.042644500732422, -3.905561923980713, -3.768479108810425, -3.6313962936401367, -3.4943134784698486, -3.3572306632995605, -3.2201478481292725, -3.0830650329589844, -2.9459822177886963, -2.808899402618408, -2.67181658744812, -2.534733772277832, -2.397650957107544, -2.260568141937256, -2.1234853267669678, -1.9864027500152588, -1.8493199348449707, -1.7122371196746826, -1.5751543045043945, -1.4380714893341064, -1.3009886741638184, -1.1639058589935303, -1.0268230438232422, -0.8897402286529541, -0.752657413482666, -0.6155745983123779, -0.47849178314208984, -0.34140896797180176, -0.20432615280151367, -0.06724333763122559, 0.0698394775390625, 0.20692229270935059, 0.34400510787963867, 0.48108792304992676, 0.6181707382202148, 0.7552535533905029, 0.892336368560791, 1.029419183731079, 1.1665019989013672, 1.3035848140716553, 1.4406676292419434, 1.5777504444122314, 1.7148332595825195, 1.8519160747528076, 1.9889988899230957, 2.126081705093384, 2.263164520263672, 2.40024733543396]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 6.0, 7.0, 14.0, 20.0, 21.0, 25.0, 24.0, 35.0, 37.0, 36.0, 49.0, 48.0, 51.0, 55.0, 46.0, 39.0, 51.0, 41.0, 44.0, 41.0, 48.0, 48.0, 32.0, 40.0, 30.0, 21.0, 21.0, 16.0, 11.0, 10.0, 7.0, 8.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0187013149261475, -0.9874435663223267, -0.9561858773231506, -0.9249281287193298, -0.893670380115509, -0.862412691116333, -0.8311549425125122, -0.7998971939086914, -0.7686394453048706, -0.7373816967010498, -0.7061240077018738, -0.674866259098053, -0.6436085104942322, -0.6123508214950562, -0.5810930728912354, -0.5498353242874146, -0.5185776352882385, -0.4873199164867401, -0.4560621678829193, -0.4248044490814209, -0.3935467004776001, -0.3622889816761017, -0.33103126287460327, -0.29977351427078247, -0.26851579546928406, -0.23725806176662445, -0.20600032806396484, -0.17474260926246643, -0.14348487555980682, -0.11222714185714722, -0.0809694230556488, -0.0497116893529892, -0.018454015254974365, 0.012803714722394943, 0.04406144469976425, 0.07531917095184326, 0.10657690465450287, 0.13783463835716248, 0.1690923571586609, 0.2003500908613205, 0.2316078245639801, 0.2628655433654785, 0.2941232919692993, 0.32538101077079773, 0.35663872957229614, 0.38789647817611694, 0.41915419697761536, 0.45041191577911377, 0.48166966438293457, 0.5129274129867554, 0.5441851019859314, 0.5754428505897522, 0.606700599193573, 0.637958288192749, 0.6692160367965698, 0.7004737854003906, 0.7317315340042114, 0.7629892826080322, 0.7942469716072083, 0.825504720211029, 0.8567624688148499, 0.8880201578140259, 0.9192779064178467, 0.9505356550216675, 0.9817933440208435]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 8.0, 9.0, 7.0, 11.0, 15.0, 22.0, 31.0, 53.0, 87.0, 131.0, 208.0, 382.0, 1000.0, 2598.0, 7671.0, 26908.0, 114096.0, 439213.0, 347459.0, 79511.0, 19673.0, 5853.0, 1969.0, 795.0, 353.0, 179.0, 93.0, 68.0, 38.0, 26.0, 22.0, 10.0, 7.0, 9.0, 9.0, 10.0, 5.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46826171875, -0.4525909423828125, -0.436920166015625, -0.4212493896484375, -0.40557861328125, -0.3899078369140625, -0.374237060546875, -0.3585662841796875, -0.3428955078125, -0.3272247314453125, -0.311553955078125, -0.2958831787109375, -0.28021240234375, -0.2645416259765625, -0.248870849609375, -0.2332000732421875, -0.217529296875, -0.2018585205078125, -0.186187744140625, -0.1705169677734375, -0.15484619140625, -0.1391754150390625, -0.123504638671875, -0.1078338623046875, -0.0921630859375, -0.0764923095703125, -0.060821533203125, -0.0451507568359375, -0.02947998046875, -0.0138092041015625, 0.001861572265625, 0.0175323486328125, 0.033203125, 0.0488739013671875, 0.064544677734375, 0.0802154541015625, 0.09588623046875, 0.1115570068359375, 0.127227783203125, 0.1428985595703125, 0.1585693359375, 0.1742401123046875, 0.189910888671875, 0.2055816650390625, 0.22125244140625, 0.2369232177734375, 0.252593994140625, 0.2682647705078125, 0.283935546875, 0.2996063232421875, 0.315277099609375, 0.3309478759765625, 0.34661865234375, 0.3622894287109375, 0.377960205078125, 0.3936309814453125, 0.4093017578125, 0.4249725341796875, 0.440643310546875, 0.4563140869140625, 0.47198486328125, 0.4876556396484375, 0.503326416015625, 0.5189971923828125, 0.53466796875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 3.0, 7.0, 10.0, 17.0, 13.0, 19.0, 24.0, 30.0, 33.0, 44.0, 60.0, 62.0, 56.0, 61.0, 62.0, 71.0, 64.0, 71.0, 45.0, 60.0, 38.0, 35.0, 25.0, 17.0, 22.0, 15.0, 11.0, 12.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08648681640625, -0.08324527740478516, -0.08000373840332031, -0.07676219940185547, -0.07352066040039062, -0.07027912139892578, -0.06703758239746094, -0.0637960433959961, -0.06055450439453125, -0.057312965393066406, -0.05407142639160156, -0.05082988739013672, -0.047588348388671875, -0.04434680938720703, -0.04110527038574219, -0.037863731384277344, -0.0346221923828125, -0.031380653381347656, -0.028139114379882812, -0.02489757537841797, -0.021656036376953125, -0.01841449737548828, -0.015172958374023438, -0.011931419372558594, -0.00868988037109375, -0.005448341369628906, -0.0022068023681640625, 0.0010347366333007812, 0.004276275634765625, 0.007517814636230469, 0.010759353637695312, 0.014000892639160156, 0.017242431640625, 0.020483970642089844, 0.023725509643554688, 0.02696704864501953, 0.030208587646484375, 0.03345012664794922, 0.03669166564941406, 0.039933204650878906, 0.04317474365234375, 0.046416282653808594, 0.04965782165527344, 0.05289936065673828, 0.056140899658203125, 0.05938243865966797, 0.06262397766113281, 0.06586551666259766, 0.0691070556640625, 0.07234859466552734, 0.07559013366699219, 0.07883167266845703, 0.08207321166992188, 0.08531475067138672, 0.08855628967285156, 0.0917978286743164, 0.09503936767578125, 0.0982809066772461, 0.10152244567871094, 0.10476398468017578, 0.10800552368164062, 0.11124706268310547, 0.11448860168457031, 0.11773014068603516, 0.1209716796875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 6.0, 10.0, 14.0, 14.0, 27.0, 27.0, 50.0, 68.0, 95.0, 169.0, 290.0, 491.0, 960.0, 1974.0, 4491.0, 11304.0, 32037.0, 106703.0, 355190.0, 368542.0, 112166.0, 33374.0, 11708.0, 4483.0, 1982.0, 1012.0, 535.0, 299.0, 181.0, 102.0, 75.0, 62.0, 39.0, 16.0, 18.0, 16.0, 11.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.357666015625, -0.3453407287597656, -0.33301544189453125, -0.3206901550292969, -0.3083648681640625, -0.2960395812988281, -0.28371429443359375, -0.2713890075683594, -0.259063720703125, -0.24673843383789062, -0.23441314697265625, -0.22208786010742188, -0.2097625732421875, -0.19743728637695312, -0.18511199951171875, -0.17278671264648438, -0.16046142578125, -0.14813613891601562, -0.13581085205078125, -0.12348556518554688, -0.1111602783203125, -0.09883499145507812, -0.08650970458984375, -0.07418441772460938, -0.061859130859375, -0.049533843994140625, -0.03720855712890625, -0.024883270263671875, -0.0125579833984375, -0.000232696533203125, 0.01209259033203125, 0.024417877197265625, 0.0367431640625, 0.049068450927734375, 0.06139373779296875, 0.07371902465820312, 0.0860443115234375, 0.09836959838867188, 0.11069488525390625, 0.12302017211914062, 0.135345458984375, 0.14767074584960938, 0.15999603271484375, 0.17232131958007812, 0.1846466064453125, 0.19697189331054688, 0.20929718017578125, 0.22162246704101562, 0.23394775390625, 0.24627304077148438, 0.25859832763671875, 0.2709236145019531, 0.2832489013671875, 0.2955741882324219, 0.30789947509765625, 0.3202247619628906, 0.332550048828125, 0.3448753356933594, 0.35720062255859375, 0.3695259094238281, 0.3818511962890625, 0.3941764831542969, 0.40650177001953125, 0.4188270568847656, 0.43115234375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 6.0, 7.0, 8.0, 11.0, 9.0, 8.0, 17.0, 17.0, 13.0, 24.0, 25.0, 24.0, 25.0, 35.0, 34.0, 37.0, 41.0, 48.0, 40.0, 51.0, 33.0, 39.0, 42.0, 38.0, 46.0, 38.0, 31.0, 24.0, 36.0, 26.0, 31.0, 18.0, 21.0, 15.0, 16.0, 15.0, 10.0, 11.0, 7.0, 5.0, 9.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 6.0], "bins": [-0.4169921875, -0.4053916931152344, -0.39379119873046875, -0.3821907043457031, -0.3705902099609375, -0.3589897155761719, -0.34738922119140625, -0.3357887268066406, -0.324188232421875, -0.3125877380371094, -0.30098724365234375, -0.2893867492675781, -0.2777862548828125, -0.2661857604980469, -0.25458526611328125, -0.24298477172851562, -0.23138427734375, -0.21978378295898438, -0.20818328857421875, -0.19658279418945312, -0.1849822998046875, -0.17338180541992188, -0.16178131103515625, -0.15018081665039062, -0.138580322265625, -0.12697982788085938, -0.11537933349609375, -0.10377883911132812, -0.0921783447265625, -0.08057785034179688, -0.06897735595703125, -0.057376861572265625, -0.0457763671875, -0.034175872802734375, -0.02257537841796875, -0.010974884033203125, 0.0006256103515625, 0.012226104736328125, 0.02382659912109375, 0.035427093505859375, 0.047027587890625, 0.058628082275390625, 0.07022857666015625, 0.08182907104492188, 0.0934295654296875, 0.10503005981445312, 0.11663055419921875, 0.12823104858398438, 0.13983154296875, 0.15143203735351562, 0.16303253173828125, 0.17463302612304688, 0.1862335205078125, 0.19783401489257812, 0.20943450927734375, 0.22103500366210938, 0.232635498046875, 0.24423599243164062, 0.25583648681640625, 0.2674369812011719, 0.2790374755859375, 0.2906379699707031, 0.30223846435546875, 0.3138389587402344, 0.325439453125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 3.0, 9.0, 9.0, 19.0, 31.0, 54.0, 79.0, 158.0, 354.0, 1022.0, 3578.0, 17146.0, 177815.0, 766008.0, 69202.0, 9646.0, 2215.0, 661.0, 272.0, 105.0, 55.0, 45.0, 21.0, 19.0, 12.0, 2.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.716796875, -0.6998634338378906, -0.6829299926757812, -0.6659965515136719, -0.6490631103515625, -0.6321296691894531, -0.6151962280273438, -0.5982627868652344, -0.581329345703125, -0.5643959045410156, -0.5474624633789062, -0.5305290222167969, -0.5135955810546875, -0.4966621398925781, -0.47972869873046875, -0.4627952575683594, -0.44586181640625, -0.4289283752441406, -0.41199493408203125, -0.3950614929199219, -0.3781280517578125, -0.3611946105957031, -0.34426116943359375, -0.3273277282714844, -0.310394287109375, -0.2934608459472656, -0.27652740478515625, -0.2595939636230469, -0.2426605224609375, -0.22572708129882812, -0.20879364013671875, -0.19186019897460938, -0.1749267578125, -0.15799331665039062, -0.14105987548828125, -0.12412643432617188, -0.1071929931640625, -0.09025955200195312, -0.07332611083984375, -0.056392669677734375, -0.039459228515625, -0.022525787353515625, -0.00559234619140625, 0.011341094970703125, 0.0282745361328125, 0.045207977294921875, 0.06214141845703125, 0.07907485961914062, 0.09600830078125, 0.11294174194335938, 0.12987518310546875, 0.14680862426757812, 0.1637420654296875, 0.18067550659179688, 0.19760894775390625, 0.21454238891601562, 0.231475830078125, 0.24840927124023438, 0.26534271240234375, 0.2822761535644531, 0.2992095947265625, 0.3161430358886719, 0.33307647705078125, 0.3500099182128906, 0.366943359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 1.0, 5.0, 2.0, 8.0, 5.0, 12.0, 10.0, 13.0, 11.0, 11.0, 25.0, 22.0, 25.0, 32.0, 44.0, 42.0, 54.0, 69.0, 74.0, 82.0, 63.0, 75.0, 67.0, 40.0, 33.0, 34.0, 21.0, 20.0, 17.0, 8.0, 12.0, 5.0, 9.0, 13.0, 6.0, 6.0, 3.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.511543273925781e-05, -8.224882185459137e-05, -7.938221096992493e-05, -7.651560008525848e-05, -7.364898920059204e-05, -7.07823783159256e-05, -6.791576743125916e-05, -6.504915654659271e-05, -6.218254566192627e-05, -5.931593477725983e-05, -5.6449323892593384e-05, -5.358271300792694e-05, -5.07161021232605e-05, -4.7849491238594055e-05, -4.498288035392761e-05, -4.211626946926117e-05, -3.9249658584594727e-05, -3.6383047699928284e-05, -3.351643681526184e-05, -3.06498259305954e-05, -2.7783215045928955e-05, -2.4916604161262512e-05, -2.204999327659607e-05, -1.9183382391929626e-05, -1.6316771507263184e-05, -1.345016062259674e-05, -1.0583549737930298e-05, -7.716938853263855e-06, -4.850327968597412e-06, -1.9837170839309692e-06, 8.828938007354736e-07, 3.7495046854019165e-06, 6.616115570068359e-06, 9.482726454734802e-06, 1.2349337339401245e-05, 1.5215948224067688e-05, 1.808255910873413e-05, 2.0949169993400574e-05, 2.3815780878067017e-05, 2.668239176273346e-05, 2.9549002647399902e-05, 3.2415613532066345e-05, 3.528222441673279e-05, 3.814883530139923e-05, 4.1015446186065674e-05, 4.388205707073212e-05, 4.674866795539856e-05, 4.9615278840065e-05, 5.2481889724731445e-05, 5.534850060939789e-05, 5.821511149406433e-05, 6.108172237873077e-05, 6.394833326339722e-05, 6.681494414806366e-05, 6.96815550327301e-05, 7.254816591739655e-05, 7.541477680206299e-05, 7.828138768672943e-05, 8.114799857139587e-05, 8.401460945606232e-05, 8.688122034072876e-05, 8.97478312253952e-05, 9.261444211006165e-05, 9.548105299472809e-05, 9.834766387939453e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 4.0, 4.0, 18.0, 11.0, 12.0, 21.0, 27.0, 55.0, 74.0, 94.0, 156.0, 297.0, 511.0, 934.0, 1705.0, 3857.0, 10077.0, 32370.0, 165836.0, 605147.0, 175369.0, 33716.0, 10071.0, 4069.0, 1836.0, 929.0, 533.0, 274.0, 195.0, 114.0, 77.0, 54.0, 30.0, 24.0, 15.0, 7.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.3310546875, -0.3202056884765625, -0.309356689453125, -0.2985076904296875, -0.28765869140625, -0.2768096923828125, -0.265960693359375, -0.2551116943359375, -0.2442626953125, -0.2334136962890625, -0.222564697265625, -0.2117156982421875, -0.20086669921875, -0.1900177001953125, -0.179168701171875, -0.1683197021484375, -0.157470703125, -0.1466217041015625, -0.135772705078125, -0.1249237060546875, -0.11407470703125, -0.1032257080078125, -0.092376708984375, -0.0815277099609375, -0.0706787109375, -0.0598297119140625, -0.048980712890625, -0.0381317138671875, -0.02728271484375, -0.0164337158203125, -0.005584716796875, 0.0052642822265625, 0.01611328125, 0.0269622802734375, 0.037811279296875, 0.0486602783203125, 0.05950927734375, 0.0703582763671875, 0.081207275390625, 0.0920562744140625, 0.1029052734375, 0.1137542724609375, 0.124603271484375, 0.1354522705078125, 0.14630126953125, 0.1571502685546875, 0.167999267578125, 0.1788482666015625, 0.189697265625, 0.2005462646484375, 0.211395263671875, 0.2222442626953125, 0.23309326171875, 0.2439422607421875, 0.254791259765625, 0.2656402587890625, 0.2764892578125, 0.2873382568359375, 0.298187255859375, 0.3090362548828125, 0.31988525390625, 0.3307342529296875, 0.341583251953125, 0.3524322509765625, 0.36328125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 1.0, 3.0, 3.0, 4.0, 12.0, 9.0, 9.0, 16.0, 16.0, 23.0, 22.0, 41.0, 49.0, 58.0, 77.0, 91.0, 92.0, 98.0, 108.0, 56.0, 66.0, 41.0, 27.0, 14.0, 18.0, 14.0, 11.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28955078125, -0.2790870666503906, -0.26862335205078125, -0.2581596374511719, -0.2476959228515625, -0.23723220825195312, -0.22676849365234375, -0.21630477905273438, -0.205841064453125, -0.19537734985351562, -0.18491363525390625, -0.17444992065429688, -0.1639862060546875, -0.15352249145507812, -0.14305877685546875, -0.13259506225585938, -0.12213134765625, -0.11166763305664062, -0.10120391845703125, -0.09074020385742188, -0.0802764892578125, -0.06981277465820312, -0.05934906005859375, -0.048885345458984375, -0.038421630859375, -0.027957916259765625, -0.01749420166015625, -0.007030487060546875, 0.0034332275390625, 0.013896942138671875, 0.02436065673828125, 0.034824371337890625, 0.0452880859375, 0.055751800537109375, 0.06621551513671875, 0.07667922973632812, 0.0871429443359375, 0.09760665893554688, 0.10807037353515625, 0.11853408813476562, 0.128997802734375, 0.13946151733398438, 0.14992523193359375, 0.16038894653320312, 0.1708526611328125, 0.18131637573242188, 0.19178009033203125, 0.20224380493164062, 0.21270751953125, 0.22317123413085938, 0.23363494873046875, 0.24409866333007812, 0.2545623779296875, 0.2650260925292969, 0.27548980712890625, 0.2859535217285156, 0.296417236328125, 0.3068809509277344, 0.31734466552734375, 0.3278083801269531, 0.3382720947265625, 0.3487358093261719, 0.35919952392578125, 0.3696632385253906, 0.380126953125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 18.0, 39.0, 50.0, 90.0, 135.0, 157.0, 144.0, 141.0, 90.0, 64.0, 26.0, 25.0, 10.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.374970436096191, -5.2225871086120605, -5.0702033042907715, -4.917819976806641, -4.76543664932251, -4.613053321838379, -4.46066951751709, -4.308286190032959, -4.155902862548828, -4.003519535064697, -3.8511359691619873, -3.6987524032592773, -3.5463690757751465, -3.3939855098724365, -3.2416019439697266, -3.0892186164855957, -2.9368348121643066, -2.7844512462615967, -2.632067918777466, -2.479684352874756, -2.327301025390625, -2.174917459487915, -2.022533893585205, -1.8701504468917847, -1.7177670001983643, -1.5653835535049438, -1.4130001068115234, -1.2606165409088135, -1.108233094215393, -0.9558496475219727, -0.8034661412239075, -0.6510826349258423, -0.4986991882324219, -0.3463157117366791, -0.19393223524093628, -0.04154875874519348, 0.11083471775054932, 0.2632181644439697, 0.4156016707420349, 0.5679851770401001, 0.7203686237335205, 0.8727520704269409, 1.0251355171203613, 1.1775190830230713, 1.3299025297164917, 1.482285976409912, 1.634669542312622, 1.7870529890060425, 1.939436435699463, 2.091820001602173, 2.2442033290863037, 2.3965868949890137, 2.5489702224731445, 2.7013537883758545, 2.8537373542785645, 3.0061206817626953, 3.1585042476654053, 3.3108878135681152, 3.463271141052246, 3.615654706954956, 3.768038272857666, 3.920421600341797, 4.072804927825928, 4.225188732147217, 4.377572059631348]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 12.0, 5.0, 8.0, 12.0, 20.0, 14.0, 15.0, 30.0, 29.0, 30.0, 36.0, 31.0, 40.0, 35.0, 49.0, 46.0, 45.0, 52.0, 50.0, 52.0, 48.0, 44.0, 45.0, 30.0, 41.0, 19.0, 29.0, 21.0, 24.0, 15.0, 13.0, 6.0, 11.0, 5.0, 8.0, 8.0, 5.0, 1.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.269749164581299, -2.2009003162384033, -2.132051467895508, -2.0632026195526123, -1.9943537712097168, -1.9255049228668213, -1.8566560745239258, -1.7878072261810303, -1.7189583778381348, -1.6501095294952393, -1.5812606811523438, -1.5124118328094482, -1.4435629844665527, -1.3747141361236572, -1.3058652877807617, -1.2370164394378662, -1.1681677103042603, -1.0993188619613647, -1.0304700136184692, -0.9616211652755737, -0.8927723169326782, -0.8239234685897827, -0.755074679851532, -0.6862258315086365, -0.617376983165741, -0.5485281348228455, -0.47967928647994995, -0.41083046793937683, -0.3419816195964813, -0.2731327712535858, -0.2042839527130127, -0.1354351043701172, -0.06658625602722168, 0.002262584865093231, 0.07111142575740814, 0.13996025919914246, 0.20880910754203796, 0.27765795588493347, 0.3465067744255066, 0.4153556227684021, 0.4842044711112976, 0.5530533194541931, 0.6219021677970886, 0.6907509565353394, 0.7595998048782349, 0.8284486532211304, 0.8972975015640259, 0.9661463499069214, 1.034995198249817, 1.1038440465927124, 1.172692894935608, 1.2415417432785034, 1.310390591621399, 1.3792394399642944, 1.4480881690979004, 1.516937017440796, 1.5857858657836914, 1.654634714126587, 1.7234835624694824, 1.792332410812378, 1.8611812591552734, 1.930030107498169, 1.9988789558410645, 2.06772780418396, 2.1365766525268555]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 17.0, 26.0, 48.0, 131.0, 356.0, 2263.0, 4166656.0, 23440.0, 963.0, 207.0, 89.0, 35.0, 17.0, 6.0, 6.0, 8.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.70703125, -2.60601806640625, -2.5050048828125, -2.40399169921875, -2.302978515625, -2.20196533203125, -2.1009521484375, -1.99993896484375, -1.89892578125, -1.79791259765625, -1.6968994140625, -1.59588623046875, -1.494873046875, -1.39385986328125, -1.2928466796875, -1.19183349609375, -1.0908203125, -0.98980712890625, -0.8887939453125, -0.78778076171875, -0.686767578125, -0.58575439453125, -0.4847412109375, -0.38372802734375, -0.28271484375, -0.18170166015625, -0.0806884765625, 0.02032470703125, 0.121337890625, 0.22235107421875, 0.3233642578125, 0.42437744140625, 0.525390625, 0.62640380859375, 0.7274169921875, 0.82843017578125, 0.929443359375, 1.03045654296875, 1.1314697265625, 1.23248291015625, 1.33349609375, 1.43450927734375, 1.5355224609375, 1.63653564453125, 1.737548828125, 1.83856201171875, 1.9395751953125, 2.04058837890625, 2.1416015625, 2.24261474609375, 2.3436279296875, 2.44464111328125, 2.545654296875, 2.64666748046875, 2.7476806640625, 2.84869384765625, 2.94970703125, 3.05072021484375, 3.1517333984375, 3.25274658203125, 3.353759765625, 3.45477294921875, 3.5557861328125, 3.65679931640625, 3.7578125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 9.0, 6.0, 6.0, 6.0, 14.0, 11.0, 11.0, 24.0, 22.0, 28.0, 31.0, 28.0, 38.0, 31.0, 58.0, 59.0, 48.0, 51.0, 51.0, 56.0, 58.0, 53.0, 51.0, 40.0, 34.0, 40.0, 26.0, 28.0, 20.0, 14.0, 9.0, 10.0, 8.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.092041015625, -0.088623046875, -0.085205078125, -0.081787109375, -0.078369140625, -0.074951171875, -0.071533203125, -0.068115234375, -0.064697265625, -0.061279296875, -0.057861328125, -0.054443359375, -0.051025390625, -0.047607421875, -0.044189453125, -0.040771484375, -0.037353515625, -0.033935546875, -0.030517578125, -0.027099609375, -0.023681640625, -0.020263671875, -0.016845703125, -0.013427734375, -0.010009765625, -0.006591796875, -0.003173828125, 0.000244140625, 0.003662109375, 0.007080078125, 0.010498046875, 0.013916015625, 0.017333984375, 0.020751953125, 0.024169921875, 0.027587890625, 0.031005859375, 0.034423828125, 0.037841796875, 0.041259765625, 0.044677734375, 0.048095703125, 0.051513671875, 0.054931640625, 0.058349609375, 0.061767578125, 0.065185546875, 0.068603515625, 0.072021484375, 0.075439453125, 0.078857421875, 0.082275390625, 0.085693359375, 0.089111328125, 0.092529296875, 0.095947265625, 0.099365234375, 0.102783203125, 0.106201171875, 0.109619140625, 0.113037109375, 0.116455078125, 0.119873046875, 0.123291015625, 0.126708984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 14.0, 13.0, 22.0, 25.0, 51.0, 63.0, 77.0, 130.0, 189.0, 254.0, 413.0, 649.0, 987.0, 1583.0, 2567.0, 4980.0, 11648.0, 53988.0, 4013983.0, 75917.0, 13402.0, 5524.0, 2887.0, 1697.0, 1072.0, 725.0, 472.0, 281.0, 192.0, 136.0, 95.0, 61.0, 52.0, 37.0, 27.0, 19.0, 16.0, 8.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6904296875, -0.66986083984375, -0.6492919921875, -0.62872314453125, -0.608154296875, -0.58758544921875, -0.5670166015625, -0.54644775390625, -0.52587890625, -0.50531005859375, -0.4847412109375, -0.46417236328125, -0.443603515625, -0.42303466796875, -0.4024658203125, -0.38189697265625, -0.361328125, -0.34075927734375, -0.3201904296875, -0.29962158203125, -0.279052734375, -0.25848388671875, -0.2379150390625, -0.21734619140625, -0.19677734375, -0.17620849609375, -0.1556396484375, -0.13507080078125, -0.114501953125, -0.09393310546875, -0.0733642578125, -0.05279541015625, -0.0322265625, -0.01165771484375, 0.0089111328125, 0.02947998046875, 0.050048828125, 0.07061767578125, 0.0911865234375, 0.11175537109375, 0.13232421875, 0.15289306640625, 0.1734619140625, 0.19403076171875, 0.214599609375, 0.23516845703125, 0.2557373046875, 0.27630615234375, 0.296875, 0.31744384765625, 0.3380126953125, 0.35858154296875, 0.379150390625, 0.39971923828125, 0.4202880859375, 0.44085693359375, 0.46142578125, 0.48199462890625, 0.5025634765625, 0.52313232421875, 0.543701171875, 0.56427001953125, 0.5848388671875, 0.60540771484375, 0.6259765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 8.0, 16.0, 11.0, 32.0, 75.0, 425.0, 3294.0, 111.0, 31.0, 22.0, 10.0, 5.0, 3.0, 6.0, 5.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1253662109375, -0.12017631530761719, -0.11498641967773438, -0.10979652404785156, -0.10460662841796875, -0.09941673278808594, -0.09422683715820312, -0.08903694152832031, -0.0838470458984375, -0.07865715026855469, -0.07346725463867188, -0.06827735900878906, -0.06308746337890625, -0.05789756774902344, -0.052707672119140625, -0.04751777648925781, -0.042327880859375, -0.03713798522949219, -0.031948089599609375, -0.026758193969726562, -0.02156829833984375, -0.016378402709960938, -0.011188507080078125, -0.0059986114501953125, -0.0008087158203125, 0.0043811798095703125, 0.009571075439453125, 0.014760971069335938, 0.01995086669921875, 0.025140762329101562, 0.030330657958984375, 0.03552055358886719, 0.04071044921875, 0.04590034484863281, 0.051090240478515625, 0.05628013610839844, 0.06147003173828125, 0.06665992736816406, 0.07184982299804688, 0.07703971862792969, 0.0822296142578125, 0.08741950988769531, 0.09260940551757812, 0.09779930114746094, 0.10298919677734375, 0.10817909240722656, 0.11336898803710938, 0.11855888366699219, 0.123748779296875, 0.1289386749267578, 0.13412857055664062, 0.13931846618652344, 0.14450836181640625, 0.14969825744628906, 0.15488815307617188, 0.1600780487060547, 0.1652679443359375, 0.1704578399658203, 0.17564773559570312, 0.18083763122558594, 0.18602752685546875, 0.19121742248535156, 0.19640731811523438, 0.2015972137451172, 0.206787109375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 9.0, 33.0, 113.0, 271.0, 324.0, 153.0, 61.0, 22.0, 11.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3774867355823517, -0.33077162504196167, -0.28405648469924927, -0.23734137415885925, -0.19062626361846924, -0.14391115307807922, -0.09719601273536682, -0.05048090219497681, -0.003765791654586792, 0.04294932633638382, 0.08966444432735443, 0.13637956976890564, 0.18309468030929565, 0.22980979084968567, 0.27652493119239807, 0.3232400417327881, 0.3699551522731781, 0.4166702628135681, 0.4633854031562805, 0.5101004838943481, 0.5568156242370605, 0.603530764579773, 0.6502459049224854, 0.696960985660553, 0.7436760663986206, 0.790391206741333, 0.8371062874794006, 0.883821427822113, 0.9305365085601807, 0.9772516489028931, 1.0239667892456055, 1.0706819295883179, 1.1173970699310303, 1.1641122102737427, 1.210827350616455, 1.257542371749878, 1.3042575120925903, 1.3509726524353027, 1.3976877927780151, 1.4444029331207275, 1.4911179542541504, 1.5378330945968628, 1.5845482349395752, 1.631263256072998, 1.6779783964157104, 1.7246935367584229, 1.7714086771011353, 1.8181238174438477, 1.86483895778656, 1.9115540981292725, 1.9582692384719849, 2.0049843788146973, 2.05169939994812, 2.098414421081543, 2.145129680633545, 2.1918447017669678, 2.2385599613189697, 2.2852749824523926, 2.3319902420043945, 2.3787052631378174, 2.4254205226898193, 2.472135543823242, 2.518850803375244, 2.565565824508667, 2.61228084564209]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 6.0, 4.0, 7.0, 4.0, 6.0, 8.0, 10.0, 24.0, 14.0, 18.0, 34.0, 30.0, 33.0, 42.0, 57.0, 50.0, 50.0, 47.0, 47.0, 54.0, 54.0, 59.0, 37.0, 43.0, 46.0, 35.0, 35.0, 26.0, 19.0, 24.0, 14.0, 20.0, 11.0, 7.0, 6.0, 7.0, 8.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3685368299484253, -0.35679641366004944, -0.34505602717399597, -0.3333156108856201, -0.32157519459724426, -0.3098347783088684, -0.29809439182281494, -0.2863539755344391, -0.27461355924606323, -0.2628731429576874, -0.2511327564716339, -0.23939234018325806, -0.2276519238948822, -0.21591152250766754, -0.20417112112045288, -0.19243070483207703, -0.18069031834602356, -0.1689499169588089, -0.15720950067043304, -0.14546909928321838, -0.13372868299484253, -0.12198828160762787, -0.11024788022041321, -0.09850747138261795, -0.08676706254482269, -0.07502665370702744, -0.06328624486923218, -0.05154584348201752, -0.03980543464422226, -0.028065025806427002, -0.01632462441921234, -0.004584215581417084, 0.007156193256378174, 0.018896600231528282, 0.03063700720667839, 0.04237741231918335, 0.05411782115697861, 0.06585822999477386, 0.07759863138198853, 0.08933904021978378, 0.10107944905757904, 0.1128198578953743, 0.12456026673316956, 0.13630066812038422, 0.14804106950759888, 0.15978148579597473, 0.1715218871831894, 0.18326228857040405, 0.1950027048587799, 0.20674310624599457, 0.21848352253437042, 0.23022392392158508, 0.24196434020996094, 0.2537047266960144, 0.26544514298439026, 0.2771855592727661, 0.2889259457588196, 0.30066636204719543, 0.3124067485332489, 0.32414716482162476, 0.3358875811100006, 0.34762799739837646, 0.35936838388442993, 0.3711088001728058, 0.38284921646118164]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 7.0, 6.0, 20.0, 23.0, 29.0, 47.0, 72.0, 163.0, 237.0, 529.0, 1427.0, 4010.0, 13910.0, 59420.0, 301361.0, 507118.0, 123075.0, 26312.0, 6856.0, 2214.0, 845.0, 379.0, 189.0, 91.0, 47.0, 44.0, 27.0, 23.0, 19.0, 10.0, 4.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.6958541870117188, -0.6749114990234375, -0.6539688110351562, -0.633026123046875, -0.6120834350585938, -0.5911407470703125, -0.5701980590820312, -0.54925537109375, -0.5283126831054688, -0.5073699951171875, -0.48642730712890625, -0.465484619140625, -0.44454193115234375, -0.4235992431640625, -0.40265655517578125, -0.3817138671875, -0.36077117919921875, -0.3398284912109375, -0.31888580322265625, -0.297943115234375, -0.27700042724609375, -0.2560577392578125, -0.23511505126953125, -0.21417236328125, -0.19322967529296875, -0.1722869873046875, -0.15134429931640625, -0.130401611328125, -0.10945892333984375, -0.0885162353515625, -0.06757354736328125, -0.046630859375, -0.02568817138671875, -0.0047454833984375, 0.01619720458984375, 0.037139892578125, 0.05808258056640625, 0.0790252685546875, 0.09996795654296875, 0.12091064453125, 0.14185333251953125, 0.1627960205078125, 0.18373870849609375, 0.204681396484375, 0.22562408447265625, 0.2465667724609375, 0.26750946044921875, 0.2884521484375, 0.30939483642578125, 0.3303375244140625, 0.35128021240234375, 0.372222900390625, 0.39316558837890625, 0.4141082763671875, 0.43505096435546875, 0.45599365234375, 0.47693634033203125, 0.4978790283203125, 0.5188217163085938, 0.539764404296875, 0.5607070922851562, 0.5816497802734375, 0.6025924682617188, 0.62353515625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 10.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 6.0, 12.0, 13.0, 22.0, 15.0, 20.0, 31.0, 25.0, 43.0, 42.0, 38.0, 40.0, 49.0, 44.0, 54.0, 48.0, 48.0, 48.0, 41.0, 38.0, 41.0, 46.0, 32.0, 30.0, 35.0, 22.0, 16.0, 17.0, 6.0, 10.0, 8.0, 7.0, 6.0, 1.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10345458984375, -0.09978199005126953, -0.09610939025878906, -0.0924367904663086, -0.08876419067382812, -0.08509159088134766, -0.08141899108886719, -0.07774639129638672, -0.07407379150390625, -0.07040119171142578, -0.06672859191894531, -0.06305599212646484, -0.059383392333984375, -0.055710792541503906, -0.05203819274902344, -0.04836559295654297, -0.0446929931640625, -0.04102039337158203, -0.03734779357910156, -0.033675193786621094, -0.030002593994140625, -0.026329994201660156, -0.022657394409179688, -0.01898479461669922, -0.01531219482421875, -0.011639595031738281, -0.007966995239257812, -0.004294395446777344, -0.000621795654296875, 0.0030508041381835938, 0.0067234039306640625, 0.010396003723144531, 0.014068603515625, 0.01774120330810547, 0.021413803100585938, 0.025086402893066406, 0.028759002685546875, 0.032431602478027344, 0.03610420227050781, 0.03977680206298828, 0.04344940185546875, 0.04712200164794922, 0.05079460144042969, 0.054467201232910156, 0.058139801025390625, 0.061812400817871094, 0.06548500061035156, 0.06915760040283203, 0.0728302001953125, 0.07650279998779297, 0.08017539978027344, 0.0838479995727539, 0.08752059936523438, 0.09119319915771484, 0.09486579895019531, 0.09853839874267578, 0.10221099853515625, 0.10588359832763672, 0.10955619812011719, 0.11322879791259766, 0.11690139770507812, 0.1205739974975586, 0.12424659729003906, 0.12791919708251953, 0.131591796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 5.0, 3.0, 7.0, 12.0, 14.0, 20.0, 41.0, 51.0, 74.0, 119.0, 250.0, 418.0, 754.0, 1654.0, 3996.0, 11601.0, 40253.0, 175679.0, 543820.0, 202816.0, 46295.0, 12630.0, 4404.0, 1720.0, 841.0, 412.0, 254.0, 153.0, 67.0, 63.0, 41.0, 29.0, 19.0, 17.0, 10.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6533203125, -0.6349411010742188, -0.6165618896484375, -0.5981826782226562, -0.579803466796875, -0.5614242553710938, -0.5430450439453125, -0.5246658325195312, -0.50628662109375, -0.48790740966796875, -0.4695281982421875, -0.45114898681640625, -0.432769775390625, -0.41439056396484375, -0.3960113525390625, -0.37763214111328125, -0.3592529296875, -0.34087371826171875, -0.3224945068359375, -0.30411529541015625, -0.285736083984375, -0.26735687255859375, -0.2489776611328125, -0.23059844970703125, -0.21221923828125, -0.19384002685546875, -0.1754608154296875, -0.15708160400390625, -0.138702392578125, -0.12032318115234375, -0.1019439697265625, -0.08356475830078125, -0.065185546875, -0.04680633544921875, -0.0284271240234375, -0.01004791259765625, 0.008331298828125, 0.02671051025390625, 0.0450897216796875, 0.06346893310546875, 0.08184814453125, 0.10022735595703125, 0.1186065673828125, 0.13698577880859375, 0.155364990234375, 0.17374420166015625, 0.1921234130859375, 0.21050262451171875, 0.2288818359375, 0.24726104736328125, 0.2656402587890625, 0.28401947021484375, 0.302398681640625, 0.32077789306640625, 0.3391571044921875, 0.35753631591796875, 0.37591552734375, 0.39429473876953125, 0.4126739501953125, 0.43105316162109375, 0.449432373046875, 0.46781158447265625, 0.4861907958984375, 0.5045700073242188, 0.52294921875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 0.0, 5.0, 1.0, 6.0, 7.0, 10.0, 13.0, 19.0, 21.0, 22.0, 25.0, 31.0, 39.0, 37.0, 44.0, 47.0, 39.0, 52.0, 52.0, 56.0, 38.0, 47.0, 46.0, 41.0, 32.0, 48.0, 37.0, 38.0, 26.0, 26.0, 18.0, 20.0, 17.0, 12.0, 13.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.92724609375, -0.9027481079101562, -0.8782501220703125, -0.8537521362304688, -0.829254150390625, -0.8047561645507812, -0.7802581787109375, -0.7557601928710938, -0.73126220703125, -0.7067642211914062, -0.6822662353515625, -0.6577682495117188, -0.633270263671875, -0.6087722778320312, -0.5842742919921875, -0.5597763061523438, -0.5352783203125, -0.5107803344726562, -0.4862823486328125, -0.46178436279296875, -0.437286376953125, -0.41278839111328125, -0.3882904052734375, -0.36379241943359375, -0.33929443359375, -0.31479644775390625, -0.2902984619140625, -0.26580047607421875, -0.241302490234375, -0.21680450439453125, -0.1923065185546875, -0.16780853271484375, -0.143310546875, -0.11881256103515625, -0.0943145751953125, -0.06981658935546875, -0.045318603515625, -0.02082061767578125, 0.0036773681640625, 0.02817535400390625, 0.05267333984375, 0.07717132568359375, 0.1016693115234375, 0.12616729736328125, 0.150665283203125, 0.17516326904296875, 0.1996612548828125, 0.22415924072265625, 0.2486572265625, 0.27315521240234375, 0.2976531982421875, 0.32215118408203125, 0.346649169921875, 0.37114715576171875, 0.3956451416015625, 0.42014312744140625, 0.44464111328125, 0.46913909912109375, 0.4936370849609375, 0.5181350708007812, 0.542633056640625, 0.5671310424804688, 0.5916290283203125, 0.6161270141601562, 0.640625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 5.0, 13.0, 16.0, 22.0, 32.0, 61.0, 98.0, 161.0, 339.0, 717.0, 1767.0, 6564.0, 48253.0, 794060.0, 177894.0, 13618.0, 2933.0, 1045.0, 396.0, 209.0, 149.0, 82.0, 47.0, 23.0, 14.0, 10.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52587890625, -0.5069046020507812, -0.4879302978515625, -0.46895599365234375, -0.449981689453125, -0.43100738525390625, -0.4120330810546875, -0.39305877685546875, -0.37408447265625, -0.35511016845703125, -0.3361358642578125, -0.31716156005859375, -0.298187255859375, -0.27921295166015625, -0.2602386474609375, -0.24126434326171875, -0.2222900390625, -0.20331573486328125, -0.1843414306640625, -0.16536712646484375, -0.146392822265625, -0.12741851806640625, -0.1084442138671875, -0.08946990966796875, -0.07049560546875, -0.05152130126953125, -0.0325469970703125, -0.01357269287109375, 0.005401611328125, 0.02437591552734375, 0.0433502197265625, 0.06232452392578125, 0.081298828125, 0.10027313232421875, 0.1192474365234375, 0.13822174072265625, 0.157196044921875, 0.17617034912109375, 0.1951446533203125, 0.21411895751953125, 0.23309326171875, 0.25206756591796875, 0.2710418701171875, 0.29001617431640625, 0.308990478515625, 0.32796478271484375, 0.3469390869140625, 0.36591339111328125, 0.3848876953125, 0.40386199951171875, 0.4228363037109375, 0.44181060791015625, 0.460784912109375, 0.47975921630859375, 0.4987335205078125, 0.5177078247070312, 0.53668212890625, 0.5556564331054688, 0.5746307373046875, 0.5936050415039062, 0.612579345703125, 0.6315536499023438, 0.6505279541015625, 0.6695022583007812, 0.6884765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 6.0, 9.0, 8.0, 15.0, 23.0, 20.0, 34.0, 26.0, 41.0, 49.0, 73.0, 64.0, 77.0, 77.0, 100.0, 69.0, 54.0, 60.0, 30.0, 33.0, 20.0, 32.0, 10.0, 16.0, 8.0, 7.0, 5.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011336803436279297, -0.00010988861322402954, -0.00010640919208526611, -0.00010292977094650269, -9.945034980773926e-05, -9.597092866897583e-05, -9.24915075302124e-05, -8.901208639144897e-05, -8.553266525268555e-05, -8.205324411392212e-05, -7.857382297515869e-05, -7.509440183639526e-05, -7.161498069763184e-05, -6.813555955886841e-05, -6.465613842010498e-05, -6.117671728134155e-05, -5.7697296142578125e-05, -5.42178750038147e-05, -5.073845386505127e-05, -4.725903272628784e-05, -4.3779611587524414e-05, -4.0300190448760986e-05, -3.682076930999756e-05, -3.334134817123413e-05, -2.9861927032470703e-05, -2.6382505893707275e-05, -2.2903084754943848e-05, -1.942366361618042e-05, -1.5944242477416992e-05, -1.2464821338653564e-05, -8.985400199890137e-06, -5.505979061126709e-06, -2.0265579223632812e-06, 1.4528632164001465e-06, 4.932284355163574e-06, 8.411705493927002e-06, 1.189112663269043e-05, 1.5370547771453857e-05, 1.8849968910217285e-05, 2.2329390048980713e-05, 2.580881118774414e-05, 2.928823232650757e-05, 3.2767653465270996e-05, 3.6247074604034424e-05, 3.972649574279785e-05, 4.320591688156128e-05, 4.668533802032471e-05, 5.0164759159088135e-05, 5.364418029785156e-05, 5.712360143661499e-05, 6.060302257537842e-05, 6.408244371414185e-05, 6.756186485290527e-05, 7.10412859916687e-05, 7.452070713043213e-05, 7.800012826919556e-05, 8.147954940795898e-05, 8.495897054672241e-05, 8.843839168548584e-05, 9.191781282424927e-05, 9.53972339630127e-05, 9.887665510177612e-05, 0.00010235607624053955, 0.00010583549737930298, 0.0001093149185180664]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 7.0, 22.0, 15.0, 30.0, 52.0, 73.0, 105.0, 197.0, 338.0, 757.0, 1816.0, 5989.0, 37589.0, 660157.0, 314179.0, 20290.0, 4130.0, 1438.0, 613.0, 290.0, 186.0, 100.0, 62.0, 43.0, 29.0, 13.0, 10.0, 7.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6201171875, -0.6028251647949219, -0.5855331420898438, -0.5682411193847656, -0.5509490966796875, -0.5336570739746094, -0.5163650512695312, -0.4990730285644531, -0.481781005859375, -0.4644889831542969, -0.44719696044921875, -0.4299049377441406, -0.4126129150390625, -0.3953208923339844, -0.37802886962890625, -0.3607368469238281, -0.34344482421875, -0.3261528015136719, -0.30886077880859375, -0.2915687561035156, -0.2742767333984375, -0.2569847106933594, -0.23969268798828125, -0.22240066528320312, -0.205108642578125, -0.18781661987304688, -0.17052459716796875, -0.15323257446289062, -0.1359405517578125, -0.11864852905273438, -0.10135650634765625, -0.08406448364257812, -0.0667724609375, -0.049480438232421875, -0.03218841552734375, -0.014896392822265625, 0.0023956298828125, 0.019687652587890625, 0.03697967529296875, 0.054271697998046875, 0.071563720703125, 0.08885574340820312, 0.10614776611328125, 0.12343978881835938, 0.1407318115234375, 0.15802383422851562, 0.17531585693359375, 0.19260787963867188, 0.20989990234375, 0.22719192504882812, 0.24448394775390625, 0.2617759704589844, 0.2790679931640625, 0.2963600158691406, 0.31365203857421875, 0.3309440612792969, 0.348236083984375, 0.3655281066894531, 0.38282012939453125, 0.4001121520996094, 0.4174041748046875, 0.4346961975097656, 0.45198822021484375, 0.4692802429199219, 0.486572265625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 7.0, 7.0, 20.0, 42.0, 52.0, 115.0, 212.0, 234.0, 147.0, 68.0, 38.0, 27.0, 13.0, 1.0, 9.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0009765625, -0.972442626953125, -0.94390869140625, -0.915374755859375, -0.8868408203125, -0.858306884765625, -0.82977294921875, -0.801239013671875, -0.772705078125, -0.744171142578125, -0.71563720703125, -0.687103271484375, -0.6585693359375, -0.630035400390625, -0.60150146484375, -0.572967529296875, -0.54443359375, -0.515899658203125, -0.48736572265625, -0.458831787109375, -0.4302978515625, -0.401763916015625, -0.37322998046875, -0.344696044921875, -0.316162109375, -0.287628173828125, -0.25909423828125, -0.230560302734375, -0.2020263671875, -0.173492431640625, -0.14495849609375, -0.116424560546875, -0.087890625, -0.059356689453125, -0.03082275390625, -0.002288818359375, 0.0262451171875, 0.054779052734375, 0.08331298828125, 0.111846923828125, 0.140380859375, 0.168914794921875, 0.19744873046875, 0.225982666015625, 0.2545166015625, 0.283050537109375, 0.31158447265625, 0.340118408203125, 0.36865234375, 0.397186279296875, 0.42572021484375, 0.454254150390625, 0.4827880859375, 0.511322021484375, 0.53985595703125, 0.568389892578125, 0.596923828125, 0.625457763671875, 0.65399169921875, 0.682525634765625, 0.7110595703125, 0.739593505859375, 0.76812744140625, 0.796661376953125, 0.8251953125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 10.0, 33.0, 65.0, 123.0, 167.0, 200.0, 173.0, 118.0, 56.0, 29.0, 17.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.487395286560059, -6.2320942878723145, -5.9767937660217285, -5.721492767333984, -5.466192245483398, -5.210891246795654, -4.95559024810791, -4.700289726257324, -4.44498872756958, -4.189687728881836, -3.93438720703125, -3.679086208343506, -3.423785448074341, -3.168484687805176, -2.9131836891174316, -2.6578829288482666, -2.4025821685791016, -2.1472814083099365, -1.891980528831482, -1.6366796493530273, -1.3813788890838623, -1.1260781288146973, -0.8707772493362427, -0.6154763698577881, -0.36017560958862305, -0.10487478971481323, 0.15042603015899658, 0.4057268500328064, 0.6610276699066162, 0.9163284301757812, 1.1716293096542358, 1.4269301891326904, 1.682229995727539, 1.937530755996704, 2.192831516265869, 2.4481325149536133, 2.7034332752227783, 2.9587340354919434, 3.2140350341796875, 3.4693357944488525, 3.7246365547180176, 3.9799373149871826, 4.235238075256348, 4.490539073944092, 4.745840072631836, 5.001140594482422, 5.256441593170166, 5.51174259185791, 5.767043113708496, 6.02234411239624, 6.277644634246826, 6.53294563293457, 6.788246154785156, 7.0435471534729, 7.2988481521606445, 7.5541486740112305, 7.809449672698975, 8.064750671386719, 8.320051193237305, 8.57535171508789, 8.830653190612793, 9.085953712463379, 9.341254234313965, 9.596555709838867, 9.851856231689453]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 5.0, 12.0, 6.0, 9.0, 8.0, 15.0, 12.0, 15.0, 24.0, 27.0, 19.0, 32.0, 37.0, 39.0, 32.0, 44.0, 26.0, 44.0, 49.0, 48.0, 43.0, 45.0, 34.0, 46.0, 41.0, 36.0, 38.0, 28.0, 32.0, 23.0, 23.0, 13.0, 14.0, 12.0, 11.0, 8.0, 12.0, 6.0, 8.0, 11.0, 6.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4015274047851562, -3.2882487773895264, -3.1749703884124756, -3.0616917610168457, -2.948413372039795, -2.835134744644165, -2.7218563556671143, -2.6085777282714844, -2.4952993392944336, -2.3820207118988037, -2.268742322921753, -2.155463695526123, -2.0421853065490723, -1.9289066791534424, -1.8156282901763916, -1.7023496627807617, -1.5890711545944214, -1.475792646408081, -1.3625141382217407, -1.2492356300354004, -1.13595712184906, -1.0226786136627197, -0.9094000458717346, -0.7961215376853943, -0.682843029499054, -0.5695645213127136, -0.4562860131263733, -0.34300747513771057, -0.22972896695137024, -0.11645042896270752, -0.0031719207763671875, 0.11010658740997314, 0.22338509559631348, 0.3366636037826538, 0.44994211196899414, 0.5632206201553345, 0.6764991283416748, 0.7897776961326599, 0.9030562043190002, 1.0163347721099854, 1.1296131610870361, 1.2428916692733765, 1.3561701774597168, 1.4694486856460571, 1.5827271938323975, 1.6960058212280273, 1.8092842102050781, 1.922562837600708, 2.035841464996338, 2.1491200923919678, 2.2623984813690186, 2.3756771087646484, 2.488955497741699, 2.602234125137329, 2.71551251411438, 2.8287911415100098, 2.9420695304870605, 3.0553481578826904, 3.168626546859741, 3.281905174255371, 3.395183563232422, 3.5084621906280518, 3.6217405796051025, 3.7350192070007324, 3.848297595977783]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 8.0, 6.0, 21.0, 21.0, 63.0, 133.0, 289.0, 1144.0, 12436.0, 4171479.0, 7292.0, 862.0, 293.0, 129.0, 46.0, 26.0, 9.0, 5.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.071990966796875, -1.99359130859375, -1.915191650390625, -1.8367919921875, -1.758392333984375, -1.67999267578125, -1.601593017578125, -1.523193359375, -1.444793701171875, -1.36639404296875, -1.287994384765625, -1.2095947265625, -1.131195068359375, -1.05279541015625, -0.974395751953125, -0.89599609375, -0.817596435546875, -0.73919677734375, -0.660797119140625, -0.5823974609375, -0.503997802734375, -0.42559814453125, -0.347198486328125, -0.268798828125, -0.190399169921875, -0.11199951171875, -0.033599853515625, 0.0447998046875, 0.123199462890625, 0.20159912109375, 0.279998779296875, 0.3583984375, 0.436798095703125, 0.51519775390625, 0.593597412109375, 0.6719970703125, 0.750396728515625, 0.82879638671875, 0.907196044921875, 0.985595703125, 1.063995361328125, 1.14239501953125, 1.220794677734375, 1.2991943359375, 1.377593994140625, 1.45599365234375, 1.534393310546875, 1.61279296875, 1.691192626953125, 1.76959228515625, 1.847991943359375, 1.9263916015625, 2.004791259765625, 2.08319091796875, 2.161590576171875, 2.239990234375, 2.318389892578125, 2.39678955078125, 2.475189208984375, 2.5535888671875, 2.631988525390625, 2.71038818359375, 2.788787841796875, 2.8671875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 2.0, 3.0, 6.0, 7.0, 11.0, 12.0, 11.0, 14.0, 17.0, 15.0, 24.0, 45.0, 40.0, 47.0, 51.0, 56.0, 59.0, 64.0, 71.0, 59.0, 71.0, 65.0, 47.0, 33.0, 45.0, 24.0, 18.0, 28.0, 11.0, 5.0, 13.0, 2.0, 5.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1728515625, -0.167266845703125, -0.16168212890625, -0.156097412109375, -0.1505126953125, -0.144927978515625, -0.13934326171875, -0.133758544921875, -0.128173828125, -0.122589111328125, -0.11700439453125, -0.111419677734375, -0.1058349609375, -0.100250244140625, -0.09466552734375, -0.089080810546875, -0.08349609375, -0.077911376953125, -0.07232666015625, -0.066741943359375, -0.0611572265625, -0.055572509765625, -0.04998779296875, -0.044403076171875, -0.038818359375, -0.033233642578125, -0.02764892578125, -0.022064208984375, -0.0164794921875, -0.010894775390625, -0.00531005859375, 0.000274658203125, 0.005859375, 0.011444091796875, 0.01702880859375, 0.022613525390625, 0.0281982421875, 0.033782958984375, 0.03936767578125, 0.044952392578125, 0.050537109375, 0.056121826171875, 0.06170654296875, 0.067291259765625, 0.0728759765625, 0.078460693359375, 0.08404541015625, 0.089630126953125, 0.09521484375, 0.100799560546875, 0.10638427734375, 0.111968994140625, 0.1175537109375, 0.123138427734375, 0.12872314453125, 0.134307861328125, 0.139892578125, 0.145477294921875, 0.15106201171875, 0.156646728515625, 0.1622314453125, 0.167816162109375, 0.17340087890625, 0.178985595703125, 0.1845703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 4.0, 12.0, 10.0, 16.0, 26.0, 29.0, 44.0, 72.0, 147.0, 193.0, 318.0, 518.0, 816.0, 1371.0, 2547.0, 6040.0, 18815.0, 111411.0, 3935552.0, 88389.0, 16561.0, 5602.0, 2404.0, 1342.0, 700.0, 498.0, 296.0, 186.0, 119.0, 68.0, 63.0, 43.0, 19.0, 12.0, 14.0, 10.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432373046875, -0.4146919250488281, -0.39701080322265625, -0.3793296813964844, -0.3616485595703125, -0.3439674377441406, -0.32628631591796875, -0.3086051940917969, -0.290924072265625, -0.2732429504394531, -0.25556182861328125, -0.23788070678710938, -0.2201995849609375, -0.20251846313476562, -0.18483734130859375, -0.16715621948242188, -0.14947509765625, -0.13179397583007812, -0.11411285400390625, -0.09643173217773438, -0.0787506103515625, -0.061069488525390625, -0.04338836669921875, -0.025707244873046875, -0.008026123046875, 0.009654998779296875, 0.02733612060546875, 0.045017242431640625, 0.0626983642578125, 0.08037948608398438, 0.09806060791015625, 0.11574172973632812, 0.1334228515625, 0.15110397338867188, 0.16878509521484375, 0.18646621704101562, 0.2041473388671875, 0.22182846069335938, 0.23950958251953125, 0.2571907043457031, 0.274871826171875, 0.2925529479980469, 0.31023406982421875, 0.3279151916503906, 0.3455963134765625, 0.3632774353027344, 0.38095855712890625, 0.3986396789550781, 0.41632080078125, 0.4340019226074219, 0.45168304443359375, 0.4693641662597656, 0.4870452880859375, 0.5047264099121094, 0.5224075317382812, 0.5400886535644531, 0.557769775390625, 0.5754508972167969, 0.5931320190429688, 0.6108131408691406, 0.6284942626953125, 0.6461753845214844, 0.6638565063476562, 0.6815376281738281, 0.69921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 10.0, 12.0, 18.0, 10.0, 32.0, 54.0, 92.0, 310.0, 3030.0, 322.0, 63.0, 40.0, 25.0, 16.0, 15.0, 5.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1285400390625, -0.12403106689453125, -0.1195220947265625, -0.11501312255859375, -0.110504150390625, -0.10599517822265625, -0.1014862060546875, -0.09697723388671875, -0.09246826171875, -0.08795928955078125, -0.0834503173828125, -0.07894134521484375, -0.074432373046875, -0.06992340087890625, -0.0654144287109375, -0.06090545654296875, -0.056396484375, -0.05188751220703125, -0.0473785400390625, -0.04286956787109375, -0.038360595703125, -0.03385162353515625, -0.0293426513671875, -0.02483367919921875, -0.02032470703125, -0.01581573486328125, -0.0113067626953125, -0.00679779052734375, -0.002288818359375, 0.00222015380859375, 0.0067291259765625, 0.01123809814453125, 0.0157470703125, 0.02025604248046875, 0.0247650146484375, 0.02927398681640625, 0.033782958984375, 0.03829193115234375, 0.0428009033203125, 0.04730987548828125, 0.05181884765625, 0.05632781982421875, 0.0608367919921875, 0.06534576416015625, 0.069854736328125, 0.07436370849609375, 0.0788726806640625, 0.08338165283203125, 0.087890625, 0.09239959716796875, 0.0969085693359375, 0.10141754150390625, 0.105926513671875, 0.11043548583984375, 0.1149444580078125, 0.11945343017578125, 0.12396240234375, 0.12847137451171875, 0.1329803466796875, 0.13748931884765625, 0.141998291015625, 0.14650726318359375, 0.1510162353515625, 0.15552520751953125, 0.1600341796875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 8.0, 19.0, 36.0, 55.0, 107.0, 165.0, 168.0, 172.0, 128.0, 66.0, 37.0, 14.0, 13.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.437459945678711, -1.4099187850952148, -1.3823776245117188, -1.3548364639282227, -1.327295184135437, -1.299754023551941, -1.2722128629684448, -1.2446717023849487, -1.2171305418014526, -1.1895893812179565, -1.1620482206344604, -1.1345070600509644, -1.1069657802581787, -1.0794246196746826, -1.0518834590911865, -1.0243422985076904, -0.9968011379241943, -0.9692599773406982, -0.9417187571525574, -0.9141775965690613, -0.8866364359855652, -0.8590952157974243, -0.8315540552139282, -0.8040128946304321, -0.7764716744422913, -0.7489305138587952, -0.7213892936706543, -0.6938481330871582, -0.6663069725036621, -0.638765811920166, -0.6112245917320251, -0.583683431148529, -0.556142270565033, -0.5286011099815369, -0.501059889793396, -0.4735187292098999, -0.4459775686264038, -0.4184363782405853, -0.39089518785476685, -0.36335402727127075, -0.33581286668777466, -0.3082716763019562, -0.2807305157184601, -0.2531893253326416, -0.2256481647491455, -0.19810697436332703, -0.17056579887866974, -0.14302462339401245, -0.11548343300819397, -0.08794225752353668, -0.060401078313589096, -0.03285989910364151, -0.005318723618984222, 0.022222459316253662, 0.04976363480091095, 0.07730481028556824, 0.10484598577022552, 0.1323871612548828, 0.1599283367395401, 0.1874695122241974, 0.21501070261001587, 0.24255187809467316, 0.27009305357933044, 0.2976342439651489, 0.325175404548645]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 5.0, 11.0, 19.0, 17.0, 10.0, 21.0, 23.0, 27.0, 40.0, 33.0, 43.0, 39.0, 45.0, 45.0, 45.0, 48.0, 48.0, 50.0, 41.0, 43.0, 44.0, 32.0, 26.0, 30.0, 31.0, 35.0, 23.0, 19.0, 19.0, 23.0, 15.0, 8.0, 12.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.40835845470428467, -0.39749452471733093, -0.3866305649280548, -0.3757666349411011, -0.36490267515182495, -0.3540387451648712, -0.3431748151779175, -0.33231085538864136, -0.32144689559936523, -0.3105829656124115, -0.2997190058231354, -0.28885507583618164, -0.2779911160469055, -0.2671271860599518, -0.25626325607299805, -0.24539929628372192, -0.2345353662967682, -0.22367142140865326, -0.21280747652053833, -0.2019435465335846, -0.19107958674430847, -0.18021565675735474, -0.1693517118692398, -0.15848776698112488, -0.14762382209300995, -0.13675987720489502, -0.1258959323167801, -0.11503199487924576, -0.10416804999113083, -0.0933041051030159, -0.08244016766548157, -0.07157622277736664, -0.06071227788925171, -0.04984833300113678, -0.03898439183831215, -0.02812045067548752, -0.01725650578737259, -0.00639256089925766, 0.004471376538276672, 0.015335321426391602, 0.02619926631450653, 0.03706321120262146, 0.04792715236544609, 0.05879109352827072, 0.06965503841638565, 0.08051898330450058, 0.09138292074203491, 0.10224686563014984, 0.11311081051826477, 0.1239747554063797, 0.13483870029449463, 0.14570263028144836, 0.1565665900707245, 0.16743052005767822, 0.17829446494579315, 0.18915840983390808, 0.200022354722023, 0.21088629961013794, 0.22175024449825287, 0.2326141893863678, 0.24347811937332153, 0.25434207916259766, 0.2652060091495514, 0.2760699391365051, 0.28693389892578125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 9.0, 7.0, 12.0, 13.0, 30.0, 40.0, 44.0, 88.0, 141.0, 200.0, 381.0, 688.0, 1217.0, 2602.0, 5560.0, 13901.0, 40633.0, 145975.0, 447575.0, 278179.0, 72749.0, 22485.0, 8435.0, 3630.0, 1733.0, 935.0, 480.0, 330.0, 173.0, 109.0, 62.0, 47.0, 28.0, 21.0, 9.0, 14.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.57958984375, -0.5642318725585938, -0.5488739013671875, -0.5335159301757812, -0.518157958984375, -0.5027999877929688, -0.4874420166015625, -0.47208404541015625, -0.45672607421875, -0.44136810302734375, -0.4260101318359375, -0.41065216064453125, -0.395294189453125, -0.37993621826171875, -0.3645782470703125, -0.34922027587890625, -0.3338623046875, -0.31850433349609375, -0.3031463623046875, -0.28778839111328125, -0.272430419921875, -0.25707244873046875, -0.2417144775390625, -0.22635650634765625, -0.21099853515625, -0.19564056396484375, -0.1802825927734375, -0.16492462158203125, -0.149566650390625, -0.13420867919921875, -0.1188507080078125, -0.10349273681640625, -0.088134765625, -0.07277679443359375, -0.0574188232421875, -0.04206085205078125, -0.026702880859375, -0.01134490966796875, 0.0040130615234375, 0.01937103271484375, 0.03472900390625, 0.05008697509765625, 0.0654449462890625, 0.08080291748046875, 0.096160888671875, 0.11151885986328125, 0.1268768310546875, 0.14223480224609375, 0.1575927734375, 0.17295074462890625, 0.1883087158203125, 0.20366668701171875, 0.219024658203125, 0.23438262939453125, 0.2497406005859375, 0.26509857177734375, 0.28045654296875, 0.29581451416015625, 0.3111724853515625, 0.32653045654296875, 0.341888427734375, 0.35724639892578125, 0.3726043701171875, 0.38796234130859375, 0.4033203125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 6.0, 8.0, 9.0, 17.0, 25.0, 24.0, 29.0, 36.0, 43.0, 46.0, 57.0, 68.0, 76.0, 71.0, 69.0, 65.0, 59.0, 58.0, 42.0, 41.0, 29.0, 24.0, 15.0, 14.0, 12.0, 12.0, 9.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.183837890625, -0.17761993408203125, -0.1714019775390625, -0.16518402099609375, -0.158966064453125, -0.15274810791015625, -0.1465301513671875, -0.14031219482421875, -0.13409423828125, -0.12787628173828125, -0.1216583251953125, -0.11544036865234375, -0.109222412109375, -0.10300445556640625, -0.0967864990234375, -0.09056854248046875, -0.0843505859375, -0.07813262939453125, -0.0719146728515625, -0.06569671630859375, -0.059478759765625, -0.05326080322265625, -0.0470428466796875, -0.04082489013671875, -0.03460693359375, -0.02838897705078125, -0.0221710205078125, -0.01595306396484375, -0.009735107421875, -0.00351715087890625, 0.0027008056640625, 0.00891876220703125, 0.01513671875, 0.02135467529296875, 0.0275726318359375, 0.03379058837890625, 0.040008544921875, 0.04622650146484375, 0.0524444580078125, 0.05866241455078125, 0.06488037109375, 0.07109832763671875, 0.0773162841796875, 0.08353424072265625, 0.089752197265625, 0.09597015380859375, 0.1021881103515625, 0.10840606689453125, 0.1146240234375, 0.12084197998046875, 0.1270599365234375, 0.13327789306640625, 0.139495849609375, 0.14571380615234375, 0.1519317626953125, 0.15814971923828125, 0.16436767578125, 0.17058563232421875, 0.1768035888671875, 0.18302154541015625, 0.189239501953125, 0.19545745849609375, 0.2016754150390625, 0.20789337158203125, 0.214111328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 4.0, 7.0, 12.0, 16.0, 28.0, 37.0, 52.0, 83.0, 104.0, 201.0, 313.0, 541.0, 1049.0, 2291.0, 5866.0, 18373.0, 74408.0, 414101.0, 425267.0, 76620.0, 18511.0, 5827.0, 2317.0, 1106.0, 555.0, 310.0, 184.0, 136.0, 75.0, 47.0, 32.0, 17.0, 20.0, 11.0, 12.0, 4.0, 1.0, 3.0, 2.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5478515625, -0.5295944213867188, -0.5113372802734375, -0.49308013916015625, -0.474822998046875, -0.45656585693359375, -0.4383087158203125, -0.42005157470703125, -0.40179443359375, -0.38353729248046875, -0.3652801513671875, -0.34702301025390625, -0.328765869140625, -0.31050872802734375, -0.2922515869140625, -0.27399444580078125, -0.2557373046875, -0.23748016357421875, -0.2192230224609375, -0.20096588134765625, -0.182708740234375, -0.16445159912109375, -0.1461944580078125, -0.12793731689453125, -0.10968017578125, -0.09142303466796875, -0.0731658935546875, -0.05490875244140625, -0.036651611328125, -0.01839447021484375, -0.0001373291015625, 0.01811981201171875, 0.036376953125, 0.05463409423828125, 0.0728912353515625, 0.09114837646484375, 0.109405517578125, 0.12766265869140625, 0.1459197998046875, 0.16417694091796875, 0.18243408203125, 0.20069122314453125, 0.2189483642578125, 0.23720550537109375, 0.255462646484375, 0.27371978759765625, 0.2919769287109375, 0.31023406982421875, 0.3284912109375, 0.34674835205078125, 0.3650054931640625, 0.38326263427734375, 0.401519775390625, 0.41977691650390625, 0.4380340576171875, 0.45629119873046875, 0.47454833984375, 0.49280548095703125, 0.5110626220703125, 0.5293197631835938, 0.547576904296875, 0.5658340454101562, 0.5840911865234375, 0.6023483276367188, 0.62060546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 16.0, 11.0, 8.0, 12.0, 18.0, 15.0, 21.0, 32.0, 36.0, 44.0, 41.0, 46.0, 48.0, 52.0, 40.0, 65.0, 56.0, 50.0, 52.0, 54.0, 32.0, 30.0, 40.0, 40.0, 30.0, 22.0, 17.0, 11.0, 13.0, 6.0, 10.0, 5.0, 6.0, 1.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79931640625, -0.7733078002929688, -0.7472991943359375, -0.7212905883789062, -0.695281982421875, -0.6692733764648438, -0.6432647705078125, -0.6172561645507812, -0.59124755859375, -0.5652389526367188, -0.5392303466796875, -0.5132217407226562, -0.487213134765625, -0.46120452880859375, -0.4351959228515625, -0.40918731689453125, -0.3831787109375, -0.35717010498046875, -0.3311614990234375, -0.30515289306640625, -0.279144287109375, -0.25313568115234375, -0.2271270751953125, -0.20111846923828125, -0.17510986328125, -0.14910125732421875, -0.1230926513671875, -0.09708404541015625, -0.071075439453125, -0.04506683349609375, -0.0190582275390625, 0.00695037841796875, 0.032958984375, 0.05896759033203125, 0.0849761962890625, 0.11098480224609375, 0.136993408203125, 0.16300201416015625, 0.1890106201171875, 0.21501922607421875, 0.24102783203125, 0.26703643798828125, 0.2930450439453125, 0.31905364990234375, 0.345062255859375, 0.37107086181640625, 0.3970794677734375, 0.42308807373046875, 0.4490966796875, 0.47510528564453125, 0.5011138916015625, 0.5271224975585938, 0.553131103515625, 0.5791397094726562, 0.6051483154296875, 0.6311569213867188, 0.65716552734375, 0.6831741333007812, 0.7091827392578125, 0.7351913452148438, 0.761199951171875, 0.7872085571289062, 0.8132171630859375, 0.8392257690429688, 0.865234375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 8.0, 9.0, 12.0, 23.0, 34.0, 74.0, 153.0, 332.0, 955.0, 4324.0, 42796.0, 869844.0, 119925.0, 7832.0, 1416.0, 449.0, 178.0, 73.0, 49.0, 25.0, 16.0, 10.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44873046875, -0.428009033203125, -0.40728759765625, -0.386566162109375, -0.3658447265625, -0.345123291015625, -0.32440185546875, -0.303680419921875, -0.282958984375, -0.262237548828125, -0.24151611328125, -0.220794677734375, -0.2000732421875, -0.179351806640625, -0.15863037109375, -0.137908935546875, -0.1171875, -0.096466064453125, -0.07574462890625, -0.055023193359375, -0.0343017578125, -0.013580322265625, 0.00714111328125, 0.027862548828125, 0.048583984375, 0.069305419921875, 0.09002685546875, 0.110748291015625, 0.1314697265625, 0.152191162109375, 0.17291259765625, 0.193634033203125, 0.21435546875, 0.235076904296875, 0.25579833984375, 0.276519775390625, 0.2972412109375, 0.317962646484375, 0.33868408203125, 0.359405517578125, 0.380126953125, 0.400848388671875, 0.42156982421875, 0.442291259765625, 0.4630126953125, 0.483734130859375, 0.50445556640625, 0.525177001953125, 0.5458984375, 0.566619873046875, 0.58734130859375, 0.608062744140625, 0.6287841796875, 0.649505615234375, 0.67022705078125, 0.690948486328125, 0.711669921875, 0.732391357421875, 0.75311279296875, 0.773834228515625, 0.7945556640625, 0.815277099609375, 0.83599853515625, 0.856719970703125, 0.87744140625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 1.0, 3.0, 6.0, 6.0, 14.0, 12.0, 10.0, 21.0, 18.0, 23.0, 37.0, 36.0, 49.0, 49.0, 80.0, 60.0, 87.0, 62.0, 89.0, 53.0, 52.0, 35.0, 40.0, 27.0, 24.0, 21.0, 14.0, 20.0, 10.0, 9.0, 6.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.812810897827148e-05, -6.632879376411438e-05, -6.452947854995728e-05, -6.273016333580017e-05, -6.0930848121643066e-05, -5.913153290748596e-05, -5.733221769332886e-05, -5.553290247917175e-05, -5.373358726501465e-05, -5.1934272050857544e-05, -5.013495683670044e-05, -4.8335641622543335e-05, -4.653632640838623e-05, -4.4737011194229126e-05, -4.293769598007202e-05, -4.113838076591492e-05, -3.933906555175781e-05, -3.753975033760071e-05, -3.5740435123443604e-05, -3.39411199092865e-05, -3.2141804695129395e-05, -3.034248948097229e-05, -2.8543174266815186e-05, -2.674385905265808e-05, -2.4944543838500977e-05, -2.3145228624343872e-05, -2.1345913410186768e-05, -1.9546598196029663e-05, -1.774728298187256e-05, -1.5947967767715454e-05, -1.414865255355835e-05, -1.2349337339401245e-05, -1.055002212524414e-05, -8.750706911087036e-06, -6.951391696929932e-06, -5.152076482772827e-06, -3.3527612686157227e-06, -1.5534460544586182e-06, 2.4586915969848633e-07, 2.045184373855591e-06, 3.844499588012695e-06, 5.6438148021698e-06, 7.443130016326904e-06, 9.242445230484009e-06, 1.1041760444641113e-05, 1.2841075658798218e-05, 1.4640390872955322e-05, 1.6439706087112427e-05, 1.823902130126953e-05, 2.0038336515426636e-05, 2.183765172958374e-05, 2.3636966943740845e-05, 2.543628215789795e-05, 2.7235597372055054e-05, 2.9034912586212158e-05, 3.083422780036926e-05, 3.263354301452637e-05, 3.443285822868347e-05, 3.6232173442840576e-05, 3.803148865699768e-05, 3.9830803871154785e-05, 4.163011908531189e-05, 4.3429434299468994e-05, 4.52287495136261e-05, 4.70280647277832e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 7.0, 11.0, 19.0, 39.0, 64.0, 162.0, 313.0, 1013.0, 6016.0, 147894.0, 864487.0, 25119.0, 2425.0, 548.0, 221.0, 104.0, 54.0, 27.0, 15.0, 12.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99462890625, -0.9721603393554688, -0.9496917724609375, -0.9272232055664062, -0.904754638671875, -0.8822860717773438, -0.8598175048828125, -0.8373489379882812, -0.81488037109375, -0.7924118041992188, -0.7699432373046875, -0.7474746704101562, -0.725006103515625, -0.7025375366210938, -0.6800689697265625, -0.6576004028320312, -0.6351318359375, -0.6126632690429688, -0.5901947021484375, -0.5677261352539062, -0.545257568359375, -0.5227890014648438, -0.5003204345703125, -0.47785186767578125, -0.45538330078125, -0.43291473388671875, -0.4104461669921875, -0.38797760009765625, -0.365509033203125, -0.34304046630859375, -0.3205718994140625, -0.29810333251953125, -0.275634765625, -0.25316619873046875, -0.2306976318359375, -0.20822906494140625, -0.185760498046875, -0.16329193115234375, -0.1408233642578125, -0.11835479736328125, -0.09588623046875, -0.07341766357421875, -0.0509490966796875, -0.02848052978515625, -0.006011962890625, 0.01645660400390625, 0.0389251708984375, 0.06139373779296875, 0.0838623046875, 0.10633087158203125, 0.1287994384765625, 0.15126800537109375, 0.173736572265625, 0.19620513916015625, 0.2186737060546875, 0.24114227294921875, 0.26361083984375, 0.28607940673828125, 0.3085479736328125, 0.33101654052734375, 0.353485107421875, 0.37595367431640625, 0.3984222412109375, 0.42089080810546875, 0.443359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 10.0, 17.0, 24.0, 43.0, 75.0, 137.0, 156.0, 155.0, 129.0, 100.0, 68.0, 40.0, 21.0, 14.0, 10.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91845703125, -0.899444580078125, -0.88043212890625, -0.861419677734375, -0.8424072265625, -0.823394775390625, -0.80438232421875, -0.785369873046875, -0.766357421875, -0.747344970703125, -0.72833251953125, -0.709320068359375, -0.6903076171875, -0.671295166015625, -0.65228271484375, -0.633270263671875, -0.6142578125, -0.595245361328125, -0.57623291015625, -0.557220458984375, -0.5382080078125, -0.519195556640625, -0.50018310546875, -0.481170654296875, -0.462158203125, -0.443145751953125, -0.42413330078125, -0.405120849609375, -0.3861083984375, -0.367095947265625, -0.34808349609375, -0.329071044921875, -0.31005859375, -0.291046142578125, -0.27203369140625, -0.253021240234375, -0.2340087890625, -0.214996337890625, -0.19598388671875, -0.176971435546875, -0.157958984375, -0.138946533203125, -0.11993408203125, -0.100921630859375, -0.0819091796875, -0.062896728515625, -0.04388427734375, -0.024871826171875, -0.005859375, 0.013153076171875, 0.03216552734375, 0.051177978515625, 0.0701904296875, 0.089202880859375, 0.10821533203125, 0.127227783203125, 0.146240234375, 0.165252685546875, 0.18426513671875, 0.203277587890625, 0.2222900390625, 0.241302490234375, 0.26031494140625, 0.279327392578125, 0.29833984375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 39.0, 139.0, 394.0, 324.0, 84.0, 19.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71856689453125, -24.211984634399414, -23.705402374267578, -23.198822021484375, -22.69223976135254, -22.185657501220703, -21.6790771484375, -21.172494888305664, -20.665912628173828, -20.159330368041992, -19.652748107910156, -19.146167755126953, -18.639585494995117, -18.13300323486328, -17.626422882080078, -17.119840621948242, -16.613258361816406, -16.10667610168457, -15.60009479522705, -15.093513488769531, -14.586931228637695, -14.08034896850586, -13.57376766204834, -13.06718635559082, -12.560604095458984, -12.054021835327148, -11.547440528869629, -11.04085922241211, -10.534276962280273, -10.027694702148438, -9.521113395690918, -9.014532089233398, -8.507948875427246, -8.001367568969727, -7.494785308837891, -6.988203525543213, -6.481621742248535, -5.975039958953857, -5.46845817565918, -4.961876392364502, -4.455294609069824, -3.9487128257751465, -3.4421310424804688, -2.935549259185791, -2.4289674758911133, -1.9223856925964355, -1.4158039093017578, -0.9092221260070801, -0.40264034271240234, 0.10394144058227539, 0.6105232238769531, 1.1171050071716309, 1.6236867904663086, 2.1302685737609863, 2.636850357055664, 3.143432140350342, 3.6500139236450195, 4.156595706939697, 4.663177490234375, 5.169759273529053, 5.6763410568237305, 6.182922840118408, 6.689504623413086, 7.196086406707764, 7.702668190002441]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 8.0, 5.0, 4.0, 6.0, 8.0, 11.0, 14.0, 13.0, 20.0, 23.0, 12.0, 22.0, 33.0, 34.0, 31.0, 37.0, 39.0, 55.0, 47.0, 45.0, 46.0, 55.0, 49.0, 46.0, 39.0, 34.0, 45.0, 33.0, 24.0, 19.0, 24.0, 18.0, 25.0, 20.0, 15.0, 10.0, 8.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1863694190979004, -3.081331491470337, -2.9762935638427734, -2.87125563621521, -2.7662177085876465, -2.661179542541504, -2.5561418533325195, -2.451103687286377, -2.3460657596588135, -2.24102783203125, -2.1359899044036865, -2.030951976776123, -1.92591392993927, -1.8208760023117065, -1.715838074684143, -1.61080002784729, -1.5057622194290161, -1.4007242918014526, -1.2956863641738892, -1.1906483173370361, -1.0856103897094727, -0.9805724620819092, -0.8755345344543457, -0.7704965472221375, -0.665458619594574, -0.5604206919670105, -0.45538270473480225, -0.35034477710723877, -0.2453068196773529, -0.14026886224746704, -0.035230934619903564, 0.06980705261230469, 0.17484498023986816, 0.27988293766975403, 0.3849208950996399, 0.48995882272720337, 0.5949968099594116, 0.7000347375869751, 0.8050726652145386, 0.9101106524467468, 1.015148639678955, 1.1201865673065186, 1.225224494934082, 1.3302624225616455, 1.4353004693984985, 1.540338397026062, 1.6453763246536255, 1.7504143714904785, 1.8554521799087524, 1.960490107536316, 2.065528154373169, 2.1705660820007324, 2.275604009628296, 2.3806419372558594, 2.485679864883423, 2.5907177925109863, 2.69575572013855, 2.8007936477661133, 2.9058315753936768, 3.0108695030212402, 3.1159074306488037, 3.220945358276367, 3.3259835243225098, 3.4310214519500732, 3.5360593795776367]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 19.0, 18.0, 35.0, 54.0, 121.0, 255.0, 648.0, 1883.0, 7579.0, 118170.0, 4046612.0, 14492.0, 2751.0, 868.0, 384.0, 156.0, 79.0, 61.0, 38.0, 19.0, 12.0, 4.0, 6.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79052734375, -0.7603225708007812, -0.7301177978515625, -0.6999130249023438, -0.669708251953125, -0.6395034790039062, -0.6092987060546875, -0.5790939331054688, -0.54888916015625, -0.5186843872070312, -0.4884796142578125, -0.45827484130859375, -0.428070068359375, -0.39786529541015625, -0.3676605224609375, -0.33745574951171875, -0.3072509765625, -0.27704620361328125, -0.2468414306640625, -0.21663665771484375, -0.186431884765625, -0.15622711181640625, -0.1260223388671875, -0.09581756591796875, -0.06561279296875, -0.03540802001953125, -0.0052032470703125, 0.02500152587890625, 0.055206298828125, 0.08541107177734375, 0.1156158447265625, 0.14582061767578125, 0.176025390625, 0.20623016357421875, 0.2364349365234375, 0.26663970947265625, 0.296844482421875, 0.32704925537109375, 0.3572540283203125, 0.38745880126953125, 0.41766357421875, 0.44786834716796875, 0.4780731201171875, 0.5082778930664062, 0.538482666015625, 0.5686874389648438, 0.5988922119140625, 0.6290969848632812, 0.6593017578125, 0.6895065307617188, 0.7197113037109375, 0.7499160766601562, 0.780120849609375, 0.8103256225585938, 0.8405303955078125, 0.8707351684570312, 0.90093994140625, 0.9311447143554688, 0.9613494873046875, 0.9915542602539062, 1.021759033203125, 1.0519638061523438, 1.0821685791015625, 1.1123733520507812, 1.142578125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 8.0, 13.0, 13.0, 17.0, 20.0, 33.0, 28.0, 44.0, 50.0, 40.0, 54.0, 56.0, 53.0, 54.0, 85.0, 50.0, 75.0, 46.0, 32.0, 32.0, 34.0, 34.0, 27.0, 17.0, 18.0, 17.0, 6.0, 4.0, 7.0, 8.0, 2.0, 2.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2003173828125, -0.1948699951171875, -0.189422607421875, -0.1839752197265625, -0.17852783203125, -0.1730804443359375, -0.167633056640625, -0.1621856689453125, -0.15673828125, -0.1512908935546875, -0.145843505859375, -0.1403961181640625, -0.13494873046875, -0.1295013427734375, -0.124053955078125, -0.1186065673828125, -0.1131591796875, -0.1077117919921875, -0.102264404296875, -0.0968170166015625, -0.09136962890625, -0.0859222412109375, -0.080474853515625, -0.0750274658203125, -0.069580078125, -0.0641326904296875, -0.058685302734375, -0.0532379150390625, -0.04779052734375, -0.0423431396484375, -0.036895751953125, -0.0314483642578125, -0.0260009765625, -0.0205535888671875, -0.015106201171875, -0.0096588134765625, -0.00421142578125, 0.0012359619140625, 0.006683349609375, 0.0121307373046875, 0.017578125, 0.0230255126953125, 0.028472900390625, 0.0339202880859375, 0.03936767578125, 0.0448150634765625, 0.050262451171875, 0.0557098388671875, 0.0611572265625, 0.0666046142578125, 0.072052001953125, 0.0774993896484375, 0.08294677734375, 0.0883941650390625, 0.093841552734375, 0.0992889404296875, 0.104736328125, 0.1101837158203125, 0.115631103515625, 0.1210784912109375, 0.12652587890625, 0.1319732666015625, 0.137420654296875, 0.1428680419921875, 0.1483154296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 4.0, 10.0, 13.0, 15.0, 33.0, 43.0, 65.0, 79.0, 151.0, 220.0, 311.0, 509.0, 915.0, 1957.0, 5236.0, 21281.0, 389690.0, 3736840.0, 26236.0, 5945.0, 2123.0, 1023.0, 561.0, 364.0, 225.0, 126.0, 100.0, 67.0, 50.0, 28.0, 14.0, 14.0, 7.0, 9.0, 4.0, 3.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75341796875, -0.72991943359375, -0.7064208984375, -0.68292236328125, -0.659423828125, -0.63592529296875, -0.6124267578125, -0.58892822265625, -0.5654296875, -0.54193115234375, -0.5184326171875, -0.49493408203125, -0.471435546875, -0.44793701171875, -0.4244384765625, -0.40093994140625, -0.37744140625, -0.35394287109375, -0.3304443359375, -0.30694580078125, -0.283447265625, -0.25994873046875, -0.2364501953125, -0.21295166015625, -0.189453125, -0.16595458984375, -0.1424560546875, -0.11895751953125, -0.095458984375, -0.07196044921875, -0.0484619140625, -0.02496337890625, -0.00146484375, 0.02203369140625, 0.0455322265625, 0.06903076171875, 0.092529296875, 0.11602783203125, 0.1395263671875, 0.16302490234375, 0.1865234375, 0.21002197265625, 0.2335205078125, 0.25701904296875, 0.280517578125, 0.30401611328125, 0.3275146484375, 0.35101318359375, 0.37451171875, 0.39801025390625, 0.4215087890625, 0.44500732421875, 0.468505859375, 0.49200439453125, 0.5155029296875, 0.53900146484375, 0.5625, 0.58599853515625, 0.6094970703125, 0.63299560546875, 0.656494140625, 0.67999267578125, 0.7034912109375, 0.72698974609375, 0.75048828125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 14.0, 19.0, 27.0, 57.0, 134.0, 3326.0, 334.0, 65.0, 39.0, 14.0, 12.0, 6.0, 8.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.23583984375, -0.23005294799804688, -0.22426605224609375, -0.21847915649414062, -0.2126922607421875, -0.20690536499023438, -0.20111846923828125, -0.19533157348632812, -0.189544677734375, -0.18375778198242188, -0.17797088623046875, -0.17218399047851562, -0.1663970947265625, -0.16061019897460938, -0.15482330322265625, -0.14903640747070312, -0.14324951171875, -0.13746261596679688, -0.13167572021484375, -0.12588882446289062, -0.1201019287109375, -0.11431503295898438, -0.10852813720703125, -0.10274124145507812, -0.096954345703125, -0.09116744995117188, -0.08538055419921875, -0.07959365844726562, -0.0738067626953125, -0.06801986694335938, -0.06223297119140625, -0.056446075439453125, -0.0506591796875, -0.044872283935546875, -0.03908538818359375, -0.033298492431640625, -0.0275115966796875, -0.021724700927734375, -0.01593780517578125, -0.010150909423828125, -0.004364013671875, 0.001422882080078125, 0.00720977783203125, 0.012996673583984375, 0.0187835693359375, 0.024570465087890625, 0.03035736083984375, 0.036144256591796875, 0.04193115234375, 0.047718048095703125, 0.05350494384765625, 0.059291839599609375, 0.0650787353515625, 0.07086563110351562, 0.07665252685546875, 0.08243942260742188, 0.088226318359375, 0.09401321411132812, 0.09980010986328125, 0.10558700561523438, 0.1113739013671875, 0.11716079711914062, 0.12294769287109375, 0.12873458862304688, 0.134521484375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 2.0, 12.0, 23.0, 30.0, 67.0, 125.0, 189.0, 217.0, 169.0, 91.0, 42.0, 23.0, 10.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3320741057395935, -0.30270153284072876, -0.2733289897441864, -0.24395643174648285, -0.2145838737487793, -0.18521131575107574, -0.1558387577533722, -0.12646619975566864, -0.09709364175796509, -0.06772108376026154, -0.03834852576255798, -0.008975967764854431, 0.02039659023284912, 0.04976914823055267, 0.07914170622825623, 0.10851426422595978, 0.13788682222366333, 0.16725938022136688, 0.19663193821907043, 0.226004496216774, 0.25537705421447754, 0.2847496271133423, 0.31412217020988464, 0.343494713306427, 0.37286728620529175, 0.4022398591041565, 0.43161240220069885, 0.4609849452972412, 0.49035751819610596, 0.5197300910949707, 0.5491026639938354, 0.5784751772880554, 0.6078476905822754, 0.6372202634811401, 0.6665928363800049, 0.6959653496742249, 0.7253379225730896, 0.7547104954719543, 0.7840830087661743, 0.8134555816650391, 0.8428281545639038, 0.8722007274627686, 0.9015733003616333, 0.9309458136558533, 0.960318386554718, 0.9896909594535828, 1.0190634727478027, 1.0484360456466675, 1.0778086185455322, 1.107181191444397, 1.1365537643432617, 1.1659263372421265, 1.1952989101409912, 1.2246713638305664, 1.2540439367294312, 1.283416509628296, 1.3127890825271606, 1.3421616554260254, 1.3715342283248901, 1.4009068012237549, 1.43027925491333, 1.4596518278121948, 1.4890244007110596, 1.5183969736099243, 1.547769546508789]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 5.0, 12.0, 10.0, 10.0, 12.0, 11.0, 19.0, 19.0, 19.0, 22.0, 23.0, 38.0, 46.0, 38.0, 41.0, 42.0, 54.0, 37.0, 46.0, 37.0, 32.0, 42.0, 29.0, 39.0, 41.0, 28.0, 27.0, 27.0, 26.0, 26.0, 25.0, 25.0, 14.0, 10.0, 15.0, 8.0, 10.0, 3.0, 5.0, 8.0, 2.0, 5.0, 10.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2520633935928345, -0.2437812238931656, -0.2354990392923355, -0.22721686959266663, -0.21893468499183655, -0.21065251529216766, -0.20237034559249878, -0.1940881609916687, -0.18580599129199982, -0.17752382159233093, -0.16924163699150085, -0.16095946729183197, -0.15267729759216309, -0.144395112991333, -0.13611294329166412, -0.12783077359199524, -0.11954858899116516, -0.11126641184091568, -0.1029842346906662, -0.09470206499099731, -0.08641988784074783, -0.07813771069049835, -0.06985554099082947, -0.06157336384057999, -0.053291186690330505, -0.045009009540081024, -0.03672683611512184, -0.02844466082751751, -0.020162485539913177, -0.011880308389663696, -0.0035981349647045135, 0.004684038460254669, 0.01296621561050415, 0.021248390898108482, 0.029530566185712814, 0.037812739610672, 0.04609491676092148, 0.05437709391117096, 0.06265926361083984, 0.07094144076108932, 0.0792236179113388, 0.08750579506158829, 0.09578797221183777, 0.10407014191150665, 0.11235231906175613, 0.12063449621200562, 0.1289166659116745, 0.13719883561134338, 0.14548102021217346, 0.15376318991184235, 0.16204537451267242, 0.1703275442123413, 0.1786097288131714, 0.18689189851284027, 0.19517406821250916, 0.20345625281333923, 0.21173842251300812, 0.220020592212677, 0.22830277681350708, 0.23658494651317596, 0.24486711621284485, 0.2531493008136749, 0.261431485414505, 0.2697136402130127, 0.2779958248138428]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 1.0, 12.0, 7.0, 13.0, 13.0, 28.0, 36.0, 64.0, 68.0, 127.0, 196.0, 364.0, 655.0, 1278.0, 2722.0, 6114.0, 15138.0, 42868.0, 137754.0, 406513.0, 297053.0, 89012.0, 28947.0, 10592.0, 4589.0, 2054.0, 979.0, 558.0, 308.0, 164.0, 104.0, 74.0, 45.0, 23.0, 25.0, 12.0, 11.0, 6.0, 6.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35888671875, -0.3468513488769531, -0.33481597900390625, -0.3227806091308594, -0.3107452392578125, -0.2987098693847656, -0.28667449951171875, -0.2746391296386719, -0.262603759765625, -0.2505683898925781, -0.23853302001953125, -0.22649765014648438, -0.2144622802734375, -0.20242691040039062, -0.19039154052734375, -0.17835617065429688, -0.16632080078125, -0.15428543090820312, -0.14225006103515625, -0.13021469116210938, -0.1181793212890625, -0.10614395141601562, -0.09410858154296875, -0.08207321166992188, -0.070037841796875, -0.058002471923828125, -0.04596710205078125, -0.033931732177734375, -0.0218963623046875, -0.009860992431640625, 0.00217437744140625, 0.014209747314453125, 0.0262451171875, 0.038280487060546875, 0.05031585693359375, 0.062351226806640625, 0.0743865966796875, 0.08642196655273438, 0.09845733642578125, 0.11049270629882812, 0.122528076171875, 0.13456344604492188, 0.14659881591796875, 0.15863418579101562, 0.1706695556640625, 0.18270492553710938, 0.19474029541015625, 0.20677566528320312, 0.21881103515625, 0.23084640502929688, 0.24288177490234375, 0.2549171447753906, 0.2669525146484375, 0.2789878845214844, 0.29102325439453125, 0.3030586242675781, 0.315093994140625, 0.3271293640136719, 0.33916473388671875, 0.3512001037597656, 0.3632354736328125, 0.3752708435058594, 0.38730621337890625, 0.3993415832519531, 0.411376953125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 0.0, 5.0, 6.0, 8.0, 8.0, 11.0, 18.0, 18.0, 17.0, 21.0, 22.0, 40.0, 45.0, 33.0, 50.0, 50.0, 58.0, 44.0, 53.0, 64.0, 54.0, 48.0, 41.0, 34.0, 28.0, 45.0, 35.0, 26.0, 17.0, 25.0, 13.0, 11.0, 14.0, 8.0, 8.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.188232421875, -0.18310165405273438, -0.17797088623046875, -0.17284011840820312, -0.1677093505859375, -0.16257858276367188, -0.15744781494140625, -0.15231704711914062, -0.147186279296875, -0.14205551147460938, -0.13692474365234375, -0.13179397583007812, -0.1266632080078125, -0.12153244018554688, -0.11640167236328125, -0.11127090454101562, -0.10614013671875, -0.10100936889648438, -0.09587860107421875, -0.09074783325195312, -0.0856170654296875, -0.08048629760742188, -0.07535552978515625, -0.07022476196289062, -0.065093994140625, -0.059963226318359375, -0.05483245849609375, -0.049701690673828125, -0.0445709228515625, -0.039440155029296875, -0.03430938720703125, -0.029178619384765625, -0.0240478515625, -0.018917083740234375, -0.01378631591796875, -0.008655548095703125, -0.0035247802734375, 0.001605987548828125, 0.00673675537109375, 0.011867523193359375, 0.016998291015625, 0.022129058837890625, 0.02725982666015625, 0.032390594482421875, 0.0375213623046875, 0.042652130126953125, 0.04778289794921875, 0.052913665771484375, 0.05804443359375, 0.06317520141601562, 0.06830596923828125, 0.07343673706054688, 0.0785675048828125, 0.08369827270507812, 0.08882904052734375, 0.09395980834960938, 0.099090576171875, 0.10422134399414062, 0.10935211181640625, 0.11448287963867188, 0.1196136474609375, 0.12474441528320312, 0.12987518310546875, 0.13500595092773438, 0.14013671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 15.0, 9.0, 16.0, 19.0, 41.0, 47.0, 80.0, 124.0, 191.0, 332.0, 634.0, 1255.0, 2606.0, 7041.0, 23344.0, 109216.0, 589633.0, 250629.0, 43782.0, 11703.0, 4034.0, 1738.0, 845.0, 470.0, 242.0, 170.0, 93.0, 72.0, 52.0, 33.0, 16.0, 16.0, 10.0, 10.0, 5.0, 3.0, 4.0, 2.0, 3.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.529296875, -0.5126113891601562, -0.4959259033203125, -0.47924041748046875, -0.462554931640625, -0.44586944580078125, -0.4291839599609375, -0.41249847412109375, -0.39581298828125, -0.37912750244140625, -0.3624420166015625, -0.34575653076171875, -0.329071044921875, -0.31238555908203125, -0.2957000732421875, -0.27901458740234375, -0.2623291015625, -0.24564361572265625, -0.2289581298828125, -0.21227264404296875, -0.195587158203125, -0.17890167236328125, -0.1622161865234375, -0.14553070068359375, -0.12884521484375, -0.11215972900390625, -0.0954742431640625, -0.07878875732421875, -0.062103271484375, -0.04541778564453125, -0.0287322998046875, -0.01204681396484375, 0.004638671875, 0.02132415771484375, 0.0380096435546875, 0.05469512939453125, 0.071380615234375, 0.08806610107421875, 0.1047515869140625, 0.12143707275390625, 0.13812255859375, 0.15480804443359375, 0.1714935302734375, 0.18817901611328125, 0.204864501953125, 0.22154998779296875, 0.2382354736328125, 0.25492095947265625, 0.2716064453125, 0.28829193115234375, 0.3049774169921875, 0.32166290283203125, 0.338348388671875, 0.35503387451171875, 0.3717193603515625, 0.38840484619140625, 0.40509033203125, 0.42177581787109375, 0.4384613037109375, 0.45514678955078125, 0.471832275390625, 0.48851776123046875, 0.5052032470703125, 0.5218887329101562, 0.53857421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 1.0, 1.0, 7.0, 4.0, 8.0, 14.0, 14.0, 26.0, 18.0, 20.0, 35.0, 37.0, 38.0, 31.0, 45.0, 47.0, 56.0, 51.0, 46.0, 61.0, 50.0, 42.0, 43.0, 46.0, 45.0, 30.0, 34.0, 25.0, 21.0, 21.0, 16.0, 17.0, 18.0, 6.0, 8.0, 9.0, 5.0, 0.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67041015625, -0.6444091796875, -0.618408203125, -0.5924072265625, -0.56640625, -0.5404052734375, -0.514404296875, -0.4884033203125, -0.46240234375, -0.4364013671875, -0.410400390625, -0.3843994140625, -0.3583984375, -0.3323974609375, -0.306396484375, -0.2803955078125, -0.25439453125, -0.2283935546875, -0.202392578125, -0.1763916015625, -0.150390625, -0.1243896484375, -0.098388671875, -0.0723876953125, -0.04638671875, -0.0203857421875, 0.005615234375, 0.0316162109375, 0.0576171875, 0.0836181640625, 0.109619140625, 0.1356201171875, 0.16162109375, 0.1876220703125, 0.213623046875, 0.2396240234375, 0.265625, 0.2916259765625, 0.317626953125, 0.3436279296875, 0.36962890625, 0.3956298828125, 0.421630859375, 0.4476318359375, 0.4736328125, 0.4996337890625, 0.525634765625, 0.5516357421875, 0.57763671875, 0.6036376953125, 0.629638671875, 0.6556396484375, 0.681640625, 0.7076416015625, 0.733642578125, 0.7596435546875, 0.78564453125, 0.8116455078125, 0.837646484375, 0.8636474609375, 0.8896484375, 0.9156494140625, 0.941650390625, 0.9676513671875, 0.99365234375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 10.0, 10.0, 24.0, 45.0, 94.0, 166.0, 501.0, 1343.0, 6661.0, 119850.0, 892773.0, 22684.0, 3069.0, 797.0, 279.0, 116.0, 56.0, 21.0, 19.0, 7.0, 7.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83349609375, -0.8117141723632812, -0.7899322509765625, -0.7681503295898438, -0.746368408203125, -0.7245864868164062, -0.7028045654296875, -0.6810226440429688, -0.65924072265625, -0.6374588012695312, -0.6156768798828125, -0.5938949584960938, -0.572113037109375, -0.5503311157226562, -0.5285491943359375, -0.5067672729492188, -0.4849853515625, -0.46320343017578125, -0.4414215087890625, -0.41963958740234375, -0.397857666015625, -0.37607574462890625, -0.3542938232421875, -0.33251190185546875, -0.31072998046875, -0.28894805908203125, -0.2671661376953125, -0.24538421630859375, -0.223602294921875, -0.20182037353515625, -0.1800384521484375, -0.15825653076171875, -0.136474609375, -0.11469268798828125, -0.0929107666015625, -0.07112884521484375, -0.049346923828125, -0.02756500244140625, -0.0057830810546875, 0.01599884033203125, 0.03778076171875, 0.05956268310546875, 0.0813446044921875, 0.10312652587890625, 0.124908447265625, 0.14669036865234375, 0.1684722900390625, 0.19025421142578125, 0.2120361328125, 0.23381805419921875, 0.2555999755859375, 0.27738189697265625, 0.299163818359375, 0.32094573974609375, 0.3427276611328125, 0.36450958251953125, 0.38629150390625, 0.40807342529296875, 0.4298553466796875, 0.45163726806640625, 0.473419189453125, 0.49520111083984375, 0.5169830322265625, 0.5387649536132812, 0.560546875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 10.0, 18.0, 20.0, 21.0, 28.0, 54.0, 61.0, 92.0, 92.0, 117.0, 142.0, 90.0, 70.0, 47.0, 27.0, 26.0, 22.0, 9.0, 12.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.355213165283203e-05, -7.114652544260025e-05, -6.874091923236847e-05, -6.633531302213669e-05, -6.392970681190491e-05, -6.152410060167313e-05, -5.9118494391441345e-05, -5.6712888181209564e-05, -5.430728197097778e-05, -5.1901675760746e-05, -4.949606955051422e-05, -4.709046334028244e-05, -4.468485713005066e-05, -4.227925091981888e-05, -3.98736447095871e-05, -3.7468038499355316e-05, -3.5062432289123535e-05, -3.2656826078891754e-05, -3.0251219868659973e-05, -2.7845613658428192e-05, -2.544000744819641e-05, -2.303440123796463e-05, -2.062879502773285e-05, -1.8223188817501068e-05, -1.5817582607269287e-05, -1.3411976397037506e-05, -1.1006370186805725e-05, -8.600763976573944e-06, -6.195157766342163e-06, -3.789551556110382e-06, -1.383945345878601e-06, 1.02166086435318e-06, 3.427267074584961e-06, 5.832873284816742e-06, 8.238479495048523e-06, 1.0644085705280304e-05, 1.3049691915512085e-05, 1.5455298125743866e-05, 1.7860904335975647e-05, 2.0266510546207428e-05, 2.267211675643921e-05, 2.507772296667099e-05, 2.748332917690277e-05, 2.9888935387134552e-05, 3.229454159736633e-05, 3.4700147807598114e-05, 3.7105754017829895e-05, 3.9511360228061676e-05, 4.191696643829346e-05, 4.432257264852524e-05, 4.672817885875702e-05, 4.91337850689888e-05, 5.153939127922058e-05, 5.394499748945236e-05, 5.635060369968414e-05, 5.8756209909915924e-05, 6.11618161201477e-05, 6.356742233037949e-05, 6.597302854061127e-05, 6.837863475084305e-05, 7.078424096107483e-05, 7.318984717130661e-05, 7.559545338153839e-05, 7.800105959177017e-05, 8.040666580200195e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 10.0, 31.0, 17.0, 50.0, 88.0, 158.0, 341.0, 1095.0, 4738.0, 51601.0, 922562.0, 60612.0, 5268.0, 1190.0, 432.0, 146.0, 76.0, 48.0, 28.0, 19.0, 12.0, 11.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.86279296875, -0.843414306640625, -0.82403564453125, -0.804656982421875, -0.7852783203125, -0.765899658203125, -0.74652099609375, -0.727142333984375, -0.707763671875, -0.688385009765625, -0.66900634765625, -0.649627685546875, -0.6302490234375, -0.610870361328125, -0.59149169921875, -0.572113037109375, -0.552734375, -0.533355712890625, -0.51397705078125, -0.494598388671875, -0.4752197265625, -0.455841064453125, -0.43646240234375, -0.417083740234375, -0.397705078125, -0.378326416015625, -0.35894775390625, -0.339569091796875, -0.3201904296875, -0.300811767578125, -0.28143310546875, -0.262054443359375, -0.24267578125, -0.223297119140625, -0.20391845703125, -0.184539794921875, -0.1651611328125, -0.145782470703125, -0.12640380859375, -0.107025146484375, -0.087646484375, -0.068267822265625, -0.04888916015625, -0.029510498046875, -0.0101318359375, 0.009246826171875, 0.02862548828125, 0.048004150390625, 0.0673828125, 0.086761474609375, 0.10614013671875, 0.125518798828125, 0.1448974609375, 0.164276123046875, 0.18365478515625, 0.203033447265625, 0.222412109375, 0.241790771484375, 0.26116943359375, 0.280548095703125, 0.2999267578125, 0.319305419921875, 0.33868408203125, 0.358062744140625, 0.37744140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 9.0, 6.0, 7.0, 17.0, 32.0, 58.0, 115.0, 173.0, 198.0, 170.0, 105.0, 48.0, 22.0, 18.0, 7.0, 9.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8701171875, -0.8495750427246094, -0.8290328979492188, -0.8084907531738281, -0.7879486083984375, -0.7674064636230469, -0.7468643188476562, -0.7263221740722656, -0.705780029296875, -0.6852378845214844, -0.6646957397460938, -0.6441535949707031, -0.6236114501953125, -0.6030693054199219, -0.5825271606445312, -0.5619850158691406, -0.54144287109375, -0.5209007263183594, -0.5003585815429688, -0.4798164367675781, -0.4592742919921875, -0.4387321472167969, -0.41819000244140625, -0.3976478576660156, -0.377105712890625, -0.3565635681152344, -0.33602142333984375, -0.3154792785644531, -0.2949371337890625, -0.2743949890136719, -0.25385284423828125, -0.23331069946289062, -0.2127685546875, -0.19222640991210938, -0.17168426513671875, -0.15114212036132812, -0.1305999755859375, -0.11005783081054688, -0.08951568603515625, -0.06897354125976562, -0.048431396484375, -0.027889251708984375, -0.00734710693359375, 0.013195037841796875, 0.0337371826171875, 0.054279327392578125, 0.07482147216796875, 0.09536361694335938, 0.11590576171875, 0.13644790649414062, 0.15699005126953125, 0.17753219604492188, 0.1980743408203125, 0.21861648559570312, 0.23915863037109375, 0.2597007751464844, 0.280242919921875, 0.3007850646972656, 0.32132720947265625, 0.3418693542480469, 0.3624114990234375, 0.3829536437988281, 0.40349578857421875, 0.4240379333496094, 0.444580078125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 5.0, 10.0, 25.0, 34.0, 56.0, 80.0, 103.0, 170.0, 141.0, 124.0, 82.0, 73.0, 37.0, 20.0, 11.0, 5.0, 4.0, 8.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.760673522949219, -4.623292446136475, -4.4859113693237305, -4.348530292510986, -4.211149215698242, -4.073768138885498, -3.936387300491333, -3.799006223678589, -3.6616251468658447, -3.5242440700531006, -3.3868629932403564, -3.2494819164276123, -3.1121010780334473, -2.974720001220703, -2.837338924407959, -2.699957847595215, -2.5625767707824707, -2.4251956939697266, -2.2878146171569824, -2.1504335403442383, -2.013052463531494, -1.8756715059280396, -1.738290548324585, -1.6009094715118408, -1.4635283946990967, -1.3261473178863525, -1.1887662410736084, -1.0513852834701538, -0.9140042066574097, -0.7766231298446655, -0.6392421126365662, -0.5018610954284668, -0.36448049545288086, -0.2270994484424591, -0.08971840143203735, 0.0476626455783844, 0.18504369258880615, 0.3224247694015503, 0.45980578660964966, 0.597186803817749, 0.7345678806304932, 0.8719489574432373, 1.0093300342559814, 1.146710991859436, 1.2840920686721802, 1.4214731454849243, 1.558854103088379, 1.696235179901123, 1.8336162567138672, 1.9709973335266113, 2.1083784103393555, 2.2457594871520996, 2.3831405639648438, 2.520521640777588, 2.657902479171753, 2.795283555984497, 2.932664632797241, 3.0700457096099854, 3.2074267864227295, 3.3448078632354736, 3.4821887016296387, 3.619569778442383, 3.756950855255127, 3.894331932067871, 4.031713008880615]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 11.0, 7.0, 10.0, 24.0, 23.0, 23.0, 36.0, 34.0, 45.0, 54.0, 70.0, 62.0, 54.0, 63.0, 64.0, 69.0, 73.0, 48.0, 44.0, 38.0, 35.0, 33.0, 13.0, 22.0, 5.0, 12.0, 6.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.619312286376953, -4.472311019897461, -4.325309753417969, -4.178308486938477, -4.031307220458984, -3.884305953979492, -3.7373046875, -3.590303421020508, -3.4433021545410156, -3.2963008880615234, -3.1492996215820312, -3.002298355102539, -2.855297088623047, -2.7082958221435547, -2.5612945556640625, -2.4142932891845703, -2.2672922611236572, -2.120290994644165, -1.9732897281646729, -1.8262884616851807, -1.6792871952056885, -1.5322859287261963, -1.3852847814559937, -1.2382835149765015, -1.0912822484970093, -0.9442809820175171, -0.7972797155380249, -0.6502785086631775, -0.5032772421836853, -0.3562759757041931, -0.2092747688293457, -0.062273502349853516, 0.08472776412963867, 0.23172901570796967, 0.37873026728630066, 0.5257315039634705, 0.6727327704429626, 0.8197340369224548, 0.9667352437973022, 1.1137365102767944, 1.2607377767562866, 1.4077390432357788, 1.554740309715271, 1.7017414569854736, 1.8487427234649658, 1.995743989944458, 2.14274525642395, 2.2897465229034424, 2.4367477893829346, 2.5837490558624268, 2.730750322341919, 2.877751588821411, 3.0247528553009033, 3.1717541217803955, 3.3187551498413086, 3.465756416320801, 3.612757682800293, 3.759758949279785, 3.9067602157592773, 4.0537614822387695, 4.200762748718262, 4.347764015197754, 4.494765281677246, 4.641766548156738, 4.7887678146362305]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 15.0, 21.0, 34.0, 83.0, 178.0, 463.0, 1590.0, 26611.0, 4159233.0, 4589.0, 852.0, 323.0, 124.0, 71.0, 33.0, 22.0, 16.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8671875, -1.7987060546875, -1.730224609375, -1.6617431640625, -1.59326171875, -1.5247802734375, -1.456298828125, -1.3878173828125, -1.3193359375, -1.2508544921875, -1.182373046875, -1.1138916015625, -1.04541015625, -0.9769287109375, -0.908447265625, -0.8399658203125, -0.771484375, -0.7030029296875, -0.634521484375, -0.5660400390625, -0.49755859375, -0.4290771484375, -0.360595703125, -0.2921142578125, -0.2236328125, -0.1551513671875, -0.086669921875, -0.0181884765625, 0.05029296875, 0.1187744140625, 0.187255859375, 0.2557373046875, 0.32421875, 0.3927001953125, 0.461181640625, 0.5296630859375, 0.59814453125, 0.6666259765625, 0.735107421875, 0.8035888671875, 0.8720703125, 0.9405517578125, 1.009033203125, 1.0775146484375, 1.14599609375, 1.2144775390625, 1.282958984375, 1.3514404296875, 1.419921875, 1.4884033203125, 1.556884765625, 1.6253662109375, 1.69384765625, 1.7623291015625, 1.830810546875, 1.8992919921875, 1.9677734375, 2.0362548828125, 2.104736328125, 2.1732177734375, 2.24169921875, 2.3101806640625, 2.378662109375, 2.4471435546875, 2.515625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 5.0, 8.0, 14.0, 16.0, 32.0, 32.0, 48.0, 59.0, 71.0, 81.0, 88.0, 102.0, 106.0, 66.0, 70.0, 46.0, 44.0, 32.0, 17.0, 18.0, 12.0, 12.0, 8.0, 1.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2100830078125, -0.2018566131591797, -0.19363021850585938, -0.18540382385253906, -0.17717742919921875, -0.16895103454589844, -0.16072463989257812, -0.1524982452392578, -0.1442718505859375, -0.1360454559326172, -0.12781906127929688, -0.11959266662597656, -0.11136627197265625, -0.10313987731933594, -0.09491348266601562, -0.08668708801269531, -0.078460693359375, -0.07023429870605469, -0.062007904052734375, -0.05378150939941406, -0.04555511474609375, -0.03732872009277344, -0.029102325439453125, -0.020875930786132812, -0.0126495361328125, -0.0044231414794921875, 0.003803253173828125, 0.012029647827148438, 0.02025604248046875, 0.028482437133789062, 0.036708831787109375, 0.04493522644042969, 0.05316162109375, 0.06138801574707031, 0.06961441040039062, 0.07784080505371094, 0.08606719970703125, 0.09429359436035156, 0.10251998901367188, 0.11074638366699219, 0.1189727783203125, 0.1271991729736328, 0.13542556762695312, 0.14365196228027344, 0.15187835693359375, 0.16010475158691406, 0.16833114624023438, 0.1765575408935547, 0.184783935546875, 0.1930103302001953, 0.20123672485351562, 0.20946311950683594, 0.21768951416015625, 0.22591590881347656, 0.23414230346679688, 0.2423686981201172, 0.2505950927734375, 0.2588214874267578, 0.2670478820800781, 0.27527427673339844, 0.28350067138671875, 0.29172706604003906, 0.2999534606933594, 0.3081798553466797, 0.31640625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 7.0, 4.0, 12.0, 8.0, 17.0, 22.0, 33.0, 39.0, 64.0, 97.0, 147.0, 249.0, 425.0, 908.0, 2317.0, 7141.0, 31065.0, 3608392.0, 509721.0, 24046.0, 5847.0, 1890.0, 767.0, 385.0, 183.0, 137.0, 103.0, 51.0, 47.0, 49.0, 22.0, 17.0, 15.0, 11.0, 6.0, 8.0, 5.0, 10.0, 2.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.572265625, -0.5510101318359375, -0.529754638671875, -0.5084991455078125, -0.48724365234375, -0.4659881591796875, -0.444732666015625, -0.4234771728515625, -0.4022216796875, -0.3809661865234375, -0.359710693359375, -0.3384552001953125, -0.31719970703125, -0.2959442138671875, -0.274688720703125, -0.2534332275390625, -0.232177734375, -0.2109222412109375, -0.189666748046875, -0.1684112548828125, -0.14715576171875, -0.1259002685546875, -0.104644775390625, -0.0833892822265625, -0.0621337890625, -0.0408782958984375, -0.019622802734375, 0.0016326904296875, 0.02288818359375, 0.0441436767578125, 0.065399169921875, 0.0866546630859375, 0.10791015625, 0.1291656494140625, 0.150421142578125, 0.1716766357421875, 0.19293212890625, 0.2141876220703125, 0.235443115234375, 0.2566986083984375, 0.2779541015625, 0.2992095947265625, 0.320465087890625, 0.3417205810546875, 0.36297607421875, 0.3842315673828125, 0.405487060546875, 0.4267425537109375, 0.447998046875, 0.4692535400390625, 0.490509033203125, 0.5117645263671875, 0.53302001953125, 0.5542755126953125, 0.575531005859375, 0.5967864990234375, 0.6180419921875, 0.6392974853515625, 0.660552978515625, 0.6818084716796875, 0.70306396484375, 0.7243194580078125, 0.745574951171875, 0.7668304443359375, 0.7880859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 7.0, 11.0, 7.0, 14.0, 21.0, 45.0, 110.0, 343.0, 2988.0, 312.0, 78.0, 58.0, 18.0, 14.0, 18.0, 11.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1895751953125, -0.18114662170410156, -0.17271804809570312, -0.1642894744873047, -0.15586090087890625, -0.1474323272705078, -0.13900375366210938, -0.13057518005371094, -0.1221466064453125, -0.11371803283691406, -0.10528945922851562, -0.09686088562011719, -0.08843231201171875, -0.08000373840332031, -0.07157516479492188, -0.06314659118652344, -0.054718017578125, -0.04628944396972656, -0.037860870361328125, -0.029432296752929688, -0.02100372314453125, -0.012575149536132812, -0.004146575927734375, 0.0042819976806640625, 0.0127105712890625, 0.021139144897460938, 0.029567718505859375, 0.03799629211425781, 0.04642486572265625, 0.05485343933105469, 0.06328201293945312, 0.07171058654785156, 0.08013916015625, 0.08856773376464844, 0.09699630737304688, 0.10542488098144531, 0.11385345458984375, 0.12228202819824219, 0.13071060180664062, 0.13913917541503906, 0.1475677490234375, 0.15599632263183594, 0.16442489624023438, 0.1728534698486328, 0.18128204345703125, 0.1897106170654297, 0.19813919067382812, 0.20656776428222656, 0.214996337890625, 0.22342491149902344, 0.23185348510742188, 0.2402820587158203, 0.24871063232421875, 0.2571392059326172, 0.2655677795410156, 0.27399635314941406, 0.2824249267578125, 0.29085350036621094, 0.2992820739746094, 0.3077106475830078, 0.31613922119140625, 0.3245677947998047, 0.3329963684082031, 0.34142494201660156, 0.349853515625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 15.0, 38.0, 73.0, 166.0, 227.0, 196.0, 148.0, 72.0, 24.0, 22.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4027714729309082, -1.3457975387573242, -1.2888234853744507, -1.2318495512008667, -1.1748754978179932, -1.1179015636444092, -1.0609276294708252, -1.0039535760879517, -0.9469795823097229, -0.8900055885314941, -0.8330315947532654, -0.7760576009750366, -0.7190836668014526, -0.6621096134185791, -0.6051356792449951, -0.5481616854667664, -0.4911876916885376, -0.43421369791030884, -0.3772397041320801, -0.3202657401561737, -0.26329174637794495, -0.2063177525997162, -0.14934378862380981, -0.09236979484558105, -0.035395801067352295, 0.021578185260295868, 0.07855217158794403, 0.1355261504650116, 0.19250014424324036, 0.24947413802146912, 0.3064481019973755, 0.36342209577560425, 0.420396089553833, 0.47737008333206177, 0.5343440771102905, 0.5913180112838745, 0.648292064666748, 0.705265998840332, 0.7622399926185608, 0.8192139863967896, 0.8761879801750183, 0.9331619739532471, 0.9901359677314758, 1.0471099615097046, 1.1040838956832886, 1.161057949066162, 1.218031883239746, 1.27500581741333, 1.3319798707962036, 1.3889538049697876, 1.4459278583526611, 1.5029017925262451, 1.5598758459091187, 1.6168497800827026, 1.6738238334655762, 1.7307977676391602, 1.7877717018127441, 1.8447456359863281, 1.9017196893692017, 1.9586936235427856, 2.015667676925659, 2.072641611099243, 2.129615545272827, 2.1865897178649902, 2.243563652038574]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 9.0, 10.0, 8.0, 19.0, 21.0, 23.0, 23.0, 36.0, 25.0, 33.0, 37.0, 42.0, 45.0, 50.0, 37.0, 55.0, 54.0, 54.0, 48.0, 39.0, 53.0, 37.0, 48.0, 25.0, 24.0, 23.0, 12.0, 26.0, 15.0, 17.0, 5.0, 16.0, 11.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6615283489227295, -0.6415097713470459, -0.6214911937713623, -0.6014726758003235, -0.5814540982246399, -0.5614355206489563, -0.5414169430732727, -0.5213984251022339, -0.5013798475265503, -0.4813612699508667, -0.4613427221775055, -0.4413241446018219, -0.4213055968284607, -0.4012870192527771, -0.3812684416770935, -0.3612498939037323, -0.3412313163280487, -0.3212127387523651, -0.3011941909790039, -0.2811756134033203, -0.2611570656299591, -0.2411384880542755, -0.2211199253797531, -0.2011013627052307, -0.1810828000307083, -0.1610642373561859, -0.1410456746816635, -0.12102710455656052, -0.10100854188203812, -0.08098997920751572, -0.06097140908241272, -0.04095284640789032, -0.02093428373336792, -0.0009157191962003708, 0.01910284534096718, 0.03912141174077988, 0.05913997441530228, 0.07915853708982468, 0.09917710721492767, 0.11919566988945007, 0.13921423256397247, 0.15923279523849487, 0.17925135791301727, 0.19926992058753967, 0.21928849816322327, 0.23930704593658447, 0.25932562351226807, 0.27934420108795166, 0.29936274886131287, 0.31938132643699646, 0.33939987421035767, 0.35941845178604126, 0.37943699955940247, 0.39945557713508606, 0.41947412490844727, 0.43949270248413086, 0.45951128005981445, 0.47952985763549805, 0.49954840540885925, 0.5195669531822205, 0.539585530757904, 0.5596041083335876, 0.5796226859092712, 0.5996412038803101, 0.6196597814559937]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 10.0, 6.0, 10.0, 12.0, 25.0, 32.0, 41.0, 86.0, 127.0, 260.0, 505.0, 1098.0, 3042.0, 10523.0, 53009.0, 377393.0, 508035.0, 74220.0, 13814.0, 3751.0, 1286.0, 582.0, 280.0, 136.0, 99.0, 54.0, 46.0, 24.0, 12.0, 13.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.72314453125, -0.7025375366210938, -0.6819305419921875, -0.6613235473632812, -0.640716552734375, -0.6201095581054688, -0.5995025634765625, -0.5788955688476562, -0.55828857421875, -0.5376815795898438, -0.5170745849609375, -0.49646759033203125, -0.475860595703125, -0.45525360107421875, -0.4346466064453125, -0.41403961181640625, -0.3934326171875, -0.37282562255859375, -0.3522186279296875, -0.33161163330078125, -0.311004638671875, -0.29039764404296875, -0.2697906494140625, -0.24918365478515625, -0.22857666015625, -0.20796966552734375, -0.1873626708984375, -0.16675567626953125, -0.146148681640625, -0.12554168701171875, -0.1049346923828125, -0.08432769775390625, -0.063720703125, -0.04311370849609375, -0.0225067138671875, -0.00189971923828125, 0.018707275390625, 0.03931427001953125, 0.0599212646484375, 0.08052825927734375, 0.10113525390625, 0.12174224853515625, 0.1423492431640625, 0.16295623779296875, 0.183563232421875, 0.20417022705078125, 0.2247772216796875, 0.24538421630859375, 0.2659912109375, 0.28659820556640625, 0.3072052001953125, 0.32781219482421875, 0.348419189453125, 0.36902618408203125, 0.3896331787109375, 0.41024017333984375, 0.43084716796875, 0.45145416259765625, 0.4720611572265625, 0.49266815185546875, 0.513275146484375, 0.5338821411132812, 0.5544891357421875, 0.5750961303710938, 0.595703125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 7.0, 12.0, 26.0, 27.0, 35.0, 37.0, 45.0, 54.0, 65.0, 74.0, 89.0, 99.0, 85.0, 74.0, 52.0, 61.0, 42.0, 33.0, 21.0, 15.0, 12.0, 8.0, 8.0, 4.0, 8.0, 1.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.225341796875, -0.21707534790039062, -0.20880889892578125, -0.20054244995117188, -0.1922760009765625, -0.18400955200195312, -0.17574310302734375, -0.16747665405273438, -0.159210205078125, -0.15094375610351562, -0.14267730712890625, -0.13441085815429688, -0.1261444091796875, -0.11787796020507812, -0.10961151123046875, -0.10134506225585938, -0.09307861328125, -0.08481216430664062, -0.07654571533203125, -0.06827926635742188, -0.0600128173828125, -0.051746368408203125, -0.04347991943359375, -0.035213470458984375, -0.026947021484375, -0.018680572509765625, -0.01041412353515625, -0.002147674560546875, 0.0061187744140625, 0.014385223388671875, 0.02265167236328125, 0.030918121337890625, 0.0391845703125, 0.047451019287109375, 0.05571746826171875, 0.06398391723632812, 0.0722503662109375, 0.08051681518554688, 0.08878326416015625, 0.09704971313476562, 0.105316162109375, 0.11358261108398438, 0.12184906005859375, 0.13011550903320312, 0.1383819580078125, 0.14664840698242188, 0.15491485595703125, 0.16318130493164062, 0.17144775390625, 0.17971420288085938, 0.18798065185546875, 0.19624710083007812, 0.2045135498046875, 0.21277999877929688, 0.22104644775390625, 0.22931289672851562, 0.237579345703125, 0.24584579467773438, 0.25411224365234375, 0.2623786926269531, 0.2706451416015625, 0.2789115905761719, 0.28717803955078125, 0.2954444885253906, 0.3037109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 3.0, 3.0, 9.0, 8.0, 10.0, 14.0, 16.0, 32.0, 40.0, 49.0, 70.0, 112.0, 145.0, 224.0, 367.0, 544.0, 993.0, 1903.0, 4539.0, 14609.0, 66620.0, 465258.0, 410261.0, 60193.0, 13685.0, 4439.0, 1911.0, 938.0, 516.0, 345.0, 203.0, 151.0, 105.0, 63.0, 43.0, 33.0, 25.0, 22.0, 13.0, 6.0, 9.0, 7.0, 2.0, 7.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.537109375, -0.5191879272460938, -0.5012664794921875, -0.48334503173828125, -0.465423583984375, -0.44750213623046875, -0.4295806884765625, -0.41165924072265625, -0.39373779296875, -0.37581634521484375, -0.3578948974609375, -0.33997344970703125, -0.322052001953125, -0.30413055419921875, -0.2862091064453125, -0.26828765869140625, -0.2503662109375, -0.23244476318359375, -0.2145233154296875, -0.19660186767578125, -0.178680419921875, -0.16075897216796875, -0.1428375244140625, -0.12491607666015625, -0.10699462890625, -0.08907318115234375, -0.0711517333984375, -0.05323028564453125, -0.035308837890625, -0.01738739013671875, 0.0005340576171875, 0.01845550537109375, 0.036376953125, 0.05429840087890625, 0.0722198486328125, 0.09014129638671875, 0.108062744140625, 0.12598419189453125, 0.1439056396484375, 0.16182708740234375, 0.17974853515625, 0.19766998291015625, 0.2155914306640625, 0.23351287841796875, 0.251434326171875, 0.26935577392578125, 0.2872772216796875, 0.30519866943359375, 0.3231201171875, 0.34104156494140625, 0.3589630126953125, 0.37688446044921875, 0.394805908203125, 0.41272735595703125, 0.4306488037109375, 0.44857025146484375, 0.46649169921875, 0.48441314697265625, 0.5023345947265625, 0.5202560424804688, 0.538177490234375, 0.5560989379882812, 0.5740203857421875, 0.5919418334960938, 0.60986328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 7.0, 8.0, 12.0, 22.0, 24.0, 25.0, 31.0, 33.0, 38.0, 37.0, 35.0, 40.0, 59.0, 55.0, 58.0, 50.0, 46.0, 58.0, 43.0, 49.0, 44.0, 41.0, 34.0, 25.0, 23.0, 21.0, 18.0, 7.0, 15.0, 7.0, 6.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7216796875, -0.6967391967773438, -0.6717987060546875, -0.6468582153320312, -0.621917724609375, -0.5969772338867188, -0.5720367431640625, -0.5470962524414062, -0.52215576171875, -0.49721527099609375, -0.4722747802734375, -0.44733428955078125, -0.422393798828125, -0.39745330810546875, -0.3725128173828125, -0.34757232666015625, -0.3226318359375, -0.29769134521484375, -0.2727508544921875, -0.24781036376953125, -0.222869873046875, -0.19792938232421875, -0.1729888916015625, -0.14804840087890625, -0.12310791015625, -0.09816741943359375, -0.0732269287109375, -0.04828643798828125, -0.023345947265625, 0.00159454345703125, 0.0265350341796875, 0.05147552490234375, 0.076416015625, 0.10135650634765625, 0.1262969970703125, 0.15123748779296875, 0.176177978515625, 0.20111846923828125, 0.2260589599609375, 0.25099945068359375, 0.27593994140625, 0.30088043212890625, 0.3258209228515625, 0.35076141357421875, 0.375701904296875, 0.40064239501953125, 0.4255828857421875, 0.45052337646484375, 0.4754638671875, 0.5004043579101562, 0.5253448486328125, 0.5502853393554688, 0.575225830078125, 0.6001663208007812, 0.6251068115234375, 0.6500473022460938, 0.67498779296875, 0.6999282836914062, 0.7248687744140625, 0.7498092651367188, 0.774749755859375, 0.7996902465820312, 0.8246307373046875, 0.8495712280273438, 0.87451171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 12.0, 6.0, 12.0, 14.0, 23.0, 29.0, 41.0, 57.0, 103.0, 199.0, 393.0, 793.0, 2256.0, 9444.0, 78730.0, 805910.0, 132777.0, 12823.0, 2996.0, 1012.0, 392.0, 185.0, 129.0, 68.0, 37.0, 31.0, 22.0, 13.0, 8.0, 13.0, 7.0, 3.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2705078125, -0.26070404052734375, -0.2509002685546875, -0.24109649658203125, -0.231292724609375, -0.22148895263671875, -0.2116851806640625, -0.20188140869140625, -0.19207763671875, -0.18227386474609375, -0.1724700927734375, -0.16266632080078125, -0.152862548828125, -0.14305877685546875, -0.1332550048828125, -0.12345123291015625, -0.1136474609375, -0.10384368896484375, -0.0940399169921875, -0.08423614501953125, -0.074432373046875, -0.06462860107421875, -0.0548248291015625, -0.04502105712890625, -0.03521728515625, -0.02541351318359375, -0.0156097412109375, -0.00580596923828125, 0.003997802734375, 0.01380157470703125, 0.0236053466796875, 0.03340911865234375, 0.043212890625, 0.05301666259765625, 0.0628204345703125, 0.07262420654296875, 0.082427978515625, 0.09223175048828125, 0.1020355224609375, 0.11183929443359375, 0.12164306640625, 0.13144683837890625, 0.1412506103515625, 0.15105438232421875, 0.160858154296875, 0.17066192626953125, 0.1804656982421875, 0.19026947021484375, 0.2000732421875, 0.20987701416015625, 0.2196807861328125, 0.22948455810546875, 0.239288330078125, 0.24909210205078125, 0.2588958740234375, 0.26869964599609375, 0.27850341796875, 0.28830718994140625, 0.2981109619140625, 0.30791473388671875, 0.317718505859375, 0.32752227783203125, 0.3373260498046875, 0.34712982177734375, 0.35693359375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 13.0, 11.0, 5.0, 20.0, 15.0, 14.0, 32.0, 35.0, 62.0, 77.0, 96.0, 96.0, 119.0, 82.0, 80.0, 69.0, 52.0, 23.0, 27.0, 18.0, 10.0, 11.0, 7.0, 6.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.172325134277344e-05, -3.983639180660248e-05, -3.794953227043152e-05, -3.606267273426056e-05, -3.41758131980896e-05, -3.228895366191864e-05, -3.040209412574768e-05, -2.851523458957672e-05, -2.6628375053405762e-05, -2.4741515517234802e-05, -2.2854655981063843e-05, -2.0967796444892883e-05, -1.9080936908721924e-05, -1.7194077372550964e-05, -1.5307217836380005e-05, -1.3420358300209045e-05, -1.1533498764038086e-05, -9.646639227867126e-06, -7.759779691696167e-06, -5.8729201555252075e-06, -3.986060619354248e-06, -2.0992010831832886e-06, -2.123415470123291e-07, 1.6745179891586304e-06, 3.56137752532959e-06, 5.448237061500549e-06, 7.335096597671509e-06, 9.221956133842468e-06, 1.1108815670013428e-05, 1.2995675206184387e-05, 1.4882534742355347e-05, 1.6769394278526306e-05, 1.8656253814697266e-05, 2.0543113350868225e-05, 2.2429972887039185e-05, 2.4316832423210144e-05, 2.6203691959381104e-05, 2.8090551495552063e-05, 2.9977411031723022e-05, 3.186427056789398e-05, 3.375113010406494e-05, 3.56379896402359e-05, 3.752484917640686e-05, 3.941170871257782e-05, 4.129856824874878e-05, 4.318542778491974e-05, 4.50722873210907e-05, 4.695914685726166e-05, 4.884600639343262e-05, 5.073286592960358e-05, 5.2619725465774536e-05, 5.4506585001945496e-05, 5.6393444538116455e-05, 5.8280304074287415e-05, 6.0167163610458374e-05, 6.205402314662933e-05, 6.394088268280029e-05, 6.582774221897125e-05, 6.771460175514221e-05, 6.960146129131317e-05, 7.148832082748413e-05, 7.337518036365509e-05, 7.526203989982605e-05, 7.714889943599701e-05, 7.903575897216797e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 6.0, 14.0, 14.0, 33.0, 48.0, 91.0, 158.0, 350.0, 897.0, 2930.0, 18521.0, 435703.0, 562887.0, 21734.0, 3343.0, 997.0, 396.0, 183.0, 98.0, 53.0, 38.0, 21.0, 11.0, 7.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275390625, -0.262298583984375, -0.24920654296875, -0.236114501953125, -0.2230224609375, -0.209930419921875, -0.19683837890625, -0.183746337890625, -0.170654296875, -0.157562255859375, -0.14447021484375, -0.131378173828125, -0.1182861328125, -0.105194091796875, -0.09210205078125, -0.079010009765625, -0.06591796875, -0.052825927734375, -0.03973388671875, -0.026641845703125, -0.0135498046875, -0.000457763671875, 0.01263427734375, 0.025726318359375, 0.038818359375, 0.051910400390625, 0.06500244140625, 0.078094482421875, 0.0911865234375, 0.104278564453125, 0.11737060546875, 0.130462646484375, 0.1435546875, 0.156646728515625, 0.16973876953125, 0.182830810546875, 0.1959228515625, 0.209014892578125, 0.22210693359375, 0.235198974609375, 0.248291015625, 0.261383056640625, 0.27447509765625, 0.287567138671875, 0.3006591796875, 0.313751220703125, 0.32684326171875, 0.339935302734375, 0.35302734375, 0.366119384765625, 0.37921142578125, 0.392303466796875, 0.4053955078125, 0.418487548828125, 0.43157958984375, 0.444671630859375, 0.457763671875, 0.470855712890625, 0.48394775390625, 0.497039794921875, 0.5101318359375, 0.523223876953125, 0.53631591796875, 0.549407958984375, 0.5625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 13.0, 10.0, 17.0, 27.0, 45.0, 57.0, 60.0, 65.0, 111.0, 120.0, 117.0, 83.0, 64.0, 52.0, 45.0, 30.0, 12.0, 17.0, 15.0, 11.0, 7.0, 3.0, 8.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3720703125, -0.36244964599609375, -0.3528289794921875, -0.34320831298828125, -0.333587646484375, -0.32396697998046875, -0.3143463134765625, -0.30472564697265625, -0.29510498046875, -0.28548431396484375, -0.2758636474609375, -0.26624298095703125, -0.256622314453125, -0.24700164794921875, -0.2373809814453125, -0.22776031494140625, -0.2181396484375, -0.20851898193359375, -0.1988983154296875, -0.18927764892578125, -0.179656982421875, -0.17003631591796875, -0.1604156494140625, -0.15079498291015625, -0.14117431640625, -0.13155364990234375, -0.1219329833984375, -0.11231231689453125, -0.102691650390625, -0.09307098388671875, -0.0834503173828125, -0.07382965087890625, -0.064208984375, -0.05458831787109375, -0.0449676513671875, -0.03534698486328125, -0.025726318359375, -0.01610565185546875, -0.0064849853515625, 0.00313568115234375, 0.01275634765625, 0.02237701416015625, 0.0319976806640625, 0.04161834716796875, 0.051239013671875, 0.06085968017578125, 0.0704803466796875, 0.08010101318359375, 0.0897216796875, 0.09934234619140625, 0.1089630126953125, 0.11858367919921875, 0.128204345703125, 0.13782501220703125, 0.1474456787109375, 0.15706634521484375, 0.16668701171875, 0.17630767822265625, 0.1859283447265625, 0.19554901123046875, 0.205169677734375, 0.21479034423828125, 0.2244110107421875, 0.23403167724609375, 0.24365234375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 9.0, 20.0, 24.0, 57.0, 84.0, 113.0, 160.0, 160.0, 141.0, 87.0, 44.0, 37.0, 19.0, 9.0, 6.0, 11.0, 1.0, 4.0, 1.0, 0.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4722366333007812, -2.3181440830230713, -2.1640515327453613, -2.0099592208862305, -1.8558666706085205, -1.7017741203308105, -1.5476816892623901, -1.3935892581939697, -1.2394967079162598, -1.0854041576385498, -0.9313117265701294, -0.7772192358970642, -0.623126745223999, -0.46903425455093384, -0.31494176387786865, -0.16084933280944824, -0.006756782531738281, 0.1473357081413269, 0.3014281988143921, 0.4555206894874573, 0.6096131801605225, 0.7637056708335876, 0.9177981615066528, 1.0718905925750732, 1.2259831428527832, 1.3800756931304932, 1.5341681241989136, 1.688260555267334, 1.842353105545044, 1.996445655822754, 2.1505379676818848, 2.3046305179595947, 2.4587230682373047, 2.6128156185150146, 2.7669081687927246, 2.9210004806518555, 3.0750930309295654, 3.2291855812072754, 3.3832778930664062, 3.537370443344116, 3.691462993621826, 3.845555543899536, 3.999648094177246, 4.153740406036377, 4.307832717895508, 4.461925506591797, 4.616017818450928, 4.770110130310059, 4.924202919006348, 5.0782952308654785, 5.232388019561768, 5.386480331420898, 5.5405731201171875, 5.694665431976318, 5.848757743835449, 6.002850532531738, 6.156942844390869, 6.31103515625, 6.465127944946289, 6.61922025680542, 6.773312568664551, 6.92740535736084, 7.081497669219971, 7.235589981079102, 7.389682769775391]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 7.0, 12.0, 5.0, 10.0, 19.0, 22.0, 25.0, 34.0, 31.0, 39.0, 38.0, 56.0, 62.0, 48.0, 70.0, 54.0, 66.0, 60.0, 57.0, 56.0, 36.0, 39.0, 25.0, 31.0, 28.0, 15.0, 6.0, 11.0, 12.0, 9.0, 1.0, 7.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.9957969188690186, -3.8682360649108887, -3.740675449371338, -3.613114833831787, -3.4855539798736572, -3.3579931259155273, -3.2304325103759766, -3.102871894836426, -2.975311040878296, -2.847750186920166, -2.7201895713806152, -2.5926289558410645, -2.4650681018829346, -2.3375072479248047, -2.209946632385254, -2.082386016845703, -1.9548251628875732, -1.827264428138733, -1.6997036933898926, -1.5721429586410522, -1.444582223892212, -1.3170214891433716, -1.1894607543945312, -1.061900019645691, -0.9343392848968506, -0.8067785501480103, -0.6792178153991699, -0.5516570806503296, -0.42409634590148926, -0.2965356111526489, -0.1689748764038086, -0.04141414165496826, 0.08614635467529297, 0.2137070894241333, 0.34126782417297363, 0.46882855892181396, 0.5963892936706543, 0.7239500284194946, 0.851510763168335, 0.9790714979171753, 1.1066322326660156, 1.234192967414856, 1.3617537021636963, 1.4893144369125366, 1.616875171661377, 1.7444359064102173, 1.8719966411590576, 1.999557375907898, 2.1271181106567383, 2.254678726196289, 2.382239580154419, 2.509800434112549, 2.6373610496520996, 2.7649216651916504, 2.8924825191497803, 3.02004337310791, 3.147603988647461, 3.2751646041870117, 3.4027254581451416, 3.5302863121032715, 3.6578469276428223, 3.785407543182373, 3.912968397140503, 4.040529251098633, 4.168089866638184]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 8.0, 7.0, 16.0, 25.0, 53.0, 76.0, 136.0, 307.0, 781.0, 2777.0, 15864.0, 373906.0, 3754764.0, 37628.0, 5207.0, 1430.0, 579.0, 293.0, 154.0, 88.0, 49.0, 45.0, 22.0, 18.0, 7.0, 12.0, 6.0, 8.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.71240234375, -0.6841354370117188, -0.6558685302734375, -0.6276016235351562, -0.599334716796875, -0.5710678100585938, -0.5428009033203125, -0.5145339965820312, -0.48626708984375, -0.45800018310546875, -0.4297332763671875, -0.40146636962890625, -0.373199462890625, -0.34493255615234375, -0.3166656494140625, -0.28839874267578125, -0.2601318359375, -0.23186492919921875, -0.2035980224609375, -0.17533111572265625, -0.147064208984375, -0.11879730224609375, -0.0905303955078125, -0.06226348876953125, -0.03399658203125, -0.00572967529296875, 0.0225372314453125, 0.05080413818359375, 0.079071044921875, 0.10733795166015625, 0.1356048583984375, 0.16387176513671875, 0.192138671875, 0.22040557861328125, 0.2486724853515625, 0.27693939208984375, 0.305206298828125, 0.33347320556640625, 0.3617401123046875, 0.39000701904296875, 0.41827392578125, 0.44654083251953125, 0.4748077392578125, 0.5030746459960938, 0.531341552734375, 0.5596084594726562, 0.5878753662109375, 0.6161422729492188, 0.6444091796875, 0.6726760864257812, 0.7009429931640625, 0.7292098999023438, 0.757476806640625, 0.7857437133789062, 0.8140106201171875, 0.8422775268554688, 0.87054443359375, 0.8988113403320312, 0.9270782470703125, 0.9553451538085938, 0.983612060546875, 1.0118789672851562, 1.0401458740234375, 1.0684127807617188, 1.0966796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 16.0, 16.0, 33.0, 53.0, 60.0, 73.0, 85.0, 104.0, 116.0, 97.0, 94.0, 86.0, 51.0, 30.0, 28.0, 25.0, 12.0, 6.0, 7.0, 8.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2144775390625, -0.20458412170410156, -0.19469070434570312, -0.1847972869873047, -0.17490386962890625, -0.1650104522705078, -0.15511703491210938, -0.14522361755371094, -0.1353302001953125, -0.12543678283691406, -0.11554336547851562, -0.10564994812011719, -0.09575653076171875, -0.08586311340332031, -0.07596969604492188, -0.06607627868652344, -0.056182861328125, -0.04628944396972656, -0.036396026611328125, -0.026502609252929688, -0.01660919189453125, -0.0067157745361328125, 0.003177642822265625, 0.013071060180664062, 0.0229644775390625, 0.03285789489746094, 0.042751312255859375, 0.05264472961425781, 0.06253814697265625, 0.07243156433105469, 0.08232498168945312, 0.09221839904785156, 0.10211181640625, 0.11200523376464844, 0.12189865112304688, 0.1317920684814453, 0.14168548583984375, 0.1515789031982422, 0.16147232055664062, 0.17136573791503906, 0.1812591552734375, 0.19115257263183594, 0.20104598999023438, 0.2109394073486328, 0.22083282470703125, 0.2307262420654297, 0.24061965942382812, 0.25051307678222656, 0.260406494140625, 0.27029991149902344, 0.2801933288574219, 0.2900867462158203, 0.29998016357421875, 0.3098735809326172, 0.3197669982910156, 0.32966041564941406, 0.3395538330078125, 0.34944725036621094, 0.3593406677246094, 0.3692340850830078, 0.37912750244140625, 0.3890209197998047, 0.3989143371582031, 0.40880775451660156, 0.418701171875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 14.0, 9.0, 24.0, 46.0, 113.0, 205.0, 496.0, 1315.0, 4824.0, 33885.0, 3489155.0, 640202.0, 19593.0, 3025.0, 839.0, 269.0, 109.0, 47.0, 33.0, 23.0, 14.0, 7.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.18359375, -1.1506118774414062, -1.1176300048828125, -1.0846481323242188, -1.051666259765625, -1.0186843872070312, -0.9857025146484375, -0.9527206420898438, -0.91973876953125, -0.8867568969726562, -0.8537750244140625, -0.8207931518554688, -0.787811279296875, -0.7548294067382812, -0.7218475341796875, -0.6888656616210938, -0.6558837890625, -0.6229019165039062, -0.5899200439453125, -0.5569381713867188, -0.523956298828125, -0.49097442626953125, -0.4579925537109375, -0.42501068115234375, -0.39202880859375, -0.35904693603515625, -0.3260650634765625, -0.29308319091796875, -0.260101318359375, -0.22711944580078125, -0.1941375732421875, -0.16115570068359375, -0.128173828125, -0.09519195556640625, -0.0622100830078125, -0.02922821044921875, 0.003753662109375, 0.03673553466796875, 0.0697174072265625, 0.10269927978515625, 0.13568115234375, 0.16866302490234375, 0.2016448974609375, 0.23462677001953125, 0.267608642578125, 0.30059051513671875, 0.3335723876953125, 0.36655426025390625, 0.3995361328125, 0.43251800537109375, 0.4654998779296875, 0.49848175048828125, 0.531463623046875, 0.5644454956054688, 0.5974273681640625, 0.6304092407226562, 0.66339111328125, 0.6963729858398438, 0.7293548583984375, 0.7623367309570312, 0.795318603515625, 0.8283004760742188, 0.8612823486328125, 0.8942642211914062, 0.92724609375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 6.0, 2.0, 5.0, 5.0, 4.0, 8.0, 21.0, 11.0, 17.0, 26.0, 41.0, 61.0, 89.0, 196.0, 538.0, 1402.0, 934.0, 334.0, 145.0, 74.0, 51.0, 27.0, 19.0, 17.0, 10.0, 10.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.83544921875, -0.8149604797363281, -0.7944717407226562, -0.7739830017089844, -0.7534942626953125, -0.7330055236816406, -0.7125167846679688, -0.6920280456542969, -0.671539306640625, -0.6510505676269531, -0.6305618286132812, -0.6100730895996094, -0.5895843505859375, -0.5690956115722656, -0.5486068725585938, -0.5281181335449219, -0.50762939453125, -0.4871406555175781, -0.46665191650390625, -0.4461631774902344, -0.4256744384765625, -0.4051856994628906, -0.38469696044921875, -0.3642082214355469, -0.343719482421875, -0.3232307434082031, -0.30274200439453125, -0.2822532653808594, -0.2617645263671875, -0.24127578735351562, -0.22078704833984375, -0.20029830932617188, -0.1798095703125, -0.15932083129882812, -0.13883209228515625, -0.11834335327148438, -0.0978546142578125, -0.07736587524414062, -0.05687713623046875, -0.036388397216796875, -0.015899658203125, 0.004589080810546875, 0.02507781982421875, 0.045566558837890625, 0.0660552978515625, 0.08654403686523438, 0.10703277587890625, 0.12752151489257812, 0.14801025390625, 0.16849899291992188, 0.18898773193359375, 0.20947647094726562, 0.2299652099609375, 0.2504539489746094, 0.27094268798828125, 0.2914314270019531, 0.311920166015625, 0.3324089050292969, 0.35289764404296875, 0.3733863830566406, 0.3938751220703125, 0.4143638610839844, 0.43485260009765625, 0.4553413391113281, 0.475830078125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 21.0, 43.0, 146.0, 311.0, 295.0, 120.0, 33.0, 8.0, 8.0, 7.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.209362030029297, -11.918783187866211, -11.628205299377441, -11.337626457214355, -11.04704761505127, -10.7564697265625, -10.465890884399414, -10.175312042236328, -9.884733200073242, -9.594154357910156, -9.303576469421387, -9.0129976272583, -8.722418785095215, -8.431840896606445, -8.14126205444336, -7.850683212280273, -7.560105323791504, -7.269526958465576, -6.97894811630249, -6.6883697509765625, -6.397790908813477, -6.107212543487549, -5.816634178161621, -5.526055335998535, -5.235476970672607, -4.94489860534668, -4.654319763183594, -4.363741397857666, -4.073163032531738, -3.7825841903686523, -3.4920058250427246, -3.2014272212982178, -2.910849094390869, -2.6202704906463623, -2.3296918869018555, -2.0391135215759277, -1.748534917831421, -1.457956314086914, -1.1673778295516968, -0.8767993450164795, -0.5862207412719727, -0.2956421971321106, -0.005063652992248535, 0.2855148911476135, 0.5760934352874756, 0.8666720390319824, 1.1572505235671997, 1.447829008102417, 1.7384076118469238, 2.0289862155914307, 2.3195648193359375, 2.6101431846618652, 2.900721788406372, 3.191300392150879, 3.4818787574768066, 3.7724573612213135, 4.06303596496582, 4.353614330291748, 4.644193172454834, 4.934771537780762, 5.225350379943848, 5.515928745269775, 5.806507110595703, 6.097085952758789, 6.387664318084717]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 5.0, 3.0, 3.0, 5.0, 10.0, 19.0, 20.0, 26.0, 24.0, 39.0, 39.0, 49.0, 43.0, 48.0, 60.0, 80.0, 62.0, 72.0, 60.0, 62.0, 45.0, 59.0, 34.0, 33.0, 14.0, 16.0, 17.0, 15.0, 7.0, 11.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.943206787109375, -3.8272318840026855, -3.711256742477417, -3.5952818393707275, -3.479306936264038, -3.3633317947387695, -3.24735689163208, -3.1313819885253906, -3.015407085418701, -2.8994321823120117, -2.783457040786743, -2.6674821376800537, -2.5515072345733643, -2.4355320930480957, -2.3195571899414062, -2.203582286834717, -2.0876071453094482, -1.9716321229934692, -1.8556572198867798, -1.7396821975708008, -1.6237072944641113, -1.5077322721481323, -1.3917572498321533, -1.2757823467254639, -1.1598073244094849, -1.0438323020935059, -0.9278573989868164, -0.8118823766708374, -0.6959074139595032, -0.579932451248169, -0.46395742893218994, -0.3479824662208557, -0.23200750350952148, -0.11603252589702606, -5.754828453063965e-05, 0.11591744422912598, 0.2318924069404602, 0.34786736965179443, 0.46384239196777344, 0.5798173546791077, 0.6957923173904419, 0.8117672801017761, 0.9277422428131104, 1.0437172651290894, 1.1596922874450684, 1.2756671905517578, 1.3916422128677368, 1.5076172351837158, 1.6235921382904053, 1.7395671606063843, 1.8555420637130737, 1.9715170860290527, 2.087491989135742, 2.2034668922424316, 2.3194420337677, 2.4354169368743896, 2.551392078399658, 2.6673669815063477, 2.783342123031616, 2.8993170261383057, 3.015291929244995, 3.1312670707702637, 3.247241973876953, 3.3632168769836426, 3.479191780090332]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 5.0, 12.0, 12.0, 20.0, 25.0, 35.0, 59.0, 55.0, 146.0, 248.0, 440.0, 751.0, 1501.0, 2927.0, 6757.0, 16667.0, 45311.0, 130864.0, 358745.0, 311475.0, 108826.0, 37908.0, 14368.0, 5866.0, 2596.0, 1296.0, 656.0, 406.0, 206.0, 110.0, 88.0, 55.0, 39.0, 17.0, 13.0, 10.0, 8.0, 9.0, 2.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.369873046875, -0.3589668273925781, -0.34806060791015625, -0.3371543884277344, -0.3262481689453125, -0.3153419494628906, -0.30443572998046875, -0.2935295104980469, -0.282623291015625, -0.2717170715332031, -0.26081085205078125, -0.24990463256835938, -0.2389984130859375, -0.22809219360351562, -0.21718597412109375, -0.20627975463867188, -0.19537353515625, -0.18446731567382812, -0.17356109619140625, -0.16265487670898438, -0.1517486572265625, -0.14084243774414062, -0.12993621826171875, -0.11902999877929688, -0.108123779296875, -0.09721755981445312, -0.08631134033203125, -0.07540512084960938, -0.0644989013671875, -0.053592681884765625, -0.04268646240234375, -0.031780242919921875, -0.0208740234375, -0.009967803955078125, 0.00093841552734375, 0.011844635009765625, 0.0227508544921875, 0.033657073974609375, 0.04456329345703125, 0.055469512939453125, 0.066375732421875, 0.07728195190429688, 0.08818817138671875, 0.09909439086914062, 0.1100006103515625, 0.12090682983398438, 0.13181304931640625, 0.14271926879882812, 0.15362548828125, 0.16453170776367188, 0.17543792724609375, 0.18634414672851562, 0.1972503662109375, 0.20815658569335938, 0.21906280517578125, 0.22996902465820312, 0.240875244140625, 0.2517814636230469, 0.26268768310546875, 0.2735939025878906, 0.2845001220703125, 0.2954063415527344, 0.30631256103515625, 0.3172187805175781, 0.328125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 9.0, 11.0, 15.0, 15.0, 20.0, 25.0, 41.0, 34.0, 51.0, 47.0, 70.0, 68.0, 63.0, 57.0, 56.0, 50.0, 59.0, 47.0, 61.0, 29.0, 40.0, 26.0, 24.0, 20.0, 16.0, 7.0, 9.0, 10.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.2467041015625, -0.2401447296142578, -0.23358535766601562, -0.22702598571777344, -0.22046661376953125, -0.21390724182128906, -0.20734786987304688, -0.2007884979248047, -0.1942291259765625, -0.1876697540283203, -0.18111038208007812, -0.17455101013183594, -0.16799163818359375, -0.16143226623535156, -0.15487289428710938, -0.1483135223388672, -0.141754150390625, -0.1351947784423828, -0.12863540649414062, -0.12207603454589844, -0.11551666259765625, -0.10895729064941406, -0.10239791870117188, -0.09583854675292969, -0.0892791748046875, -0.08271980285644531, -0.07616043090820312, -0.06960105895996094, -0.06304168701171875, -0.05648231506347656, -0.049922943115234375, -0.04336357116699219, -0.03680419921875, -0.030244827270507812, -0.023685455322265625, -0.017126083374023438, -0.01056671142578125, -0.0040073394775390625, 0.002552032470703125, 0.009111404418945312, 0.0156707763671875, 0.022230148315429688, 0.028789520263671875, 0.03534889221191406, 0.04190826416015625, 0.04846763610839844, 0.055027008056640625, 0.06158638000488281, 0.068145751953125, 0.07470512390136719, 0.08126449584960938, 0.08782386779785156, 0.09438323974609375, 0.10094261169433594, 0.10750198364257812, 0.11406135559082031, 0.1206207275390625, 0.1271800994873047, 0.13373947143554688, 0.14029884338378906, 0.14685821533203125, 0.15341758728027344, 0.15997695922851562, 0.1665363311767578, 0.173095703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 9.0, 6.0, 15.0, 15.0, 21.0, 23.0, 37.0, 51.0, 70.0, 107.0, 135.0, 213.0, 349.0, 510.0, 897.0, 1792.0, 4189.0, 14090.0, 81507.0, 674099.0, 228493.0, 29258.0, 7067.0, 2519.0, 1187.0, 658.0, 354.0, 260.0, 177.0, 124.0, 83.0, 64.0, 50.0, 31.0, 22.0, 19.0, 20.0, 10.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.732421875, -0.711334228515625, -0.69024658203125, -0.669158935546875, -0.6480712890625, -0.626983642578125, -0.60589599609375, -0.584808349609375, -0.563720703125, -0.542633056640625, -0.52154541015625, -0.500457763671875, -0.4793701171875, -0.458282470703125, -0.43719482421875, -0.416107177734375, -0.39501953125, -0.373931884765625, -0.35284423828125, -0.331756591796875, -0.3106689453125, -0.289581298828125, -0.26849365234375, -0.247406005859375, -0.226318359375, -0.205230712890625, -0.18414306640625, -0.163055419921875, -0.1419677734375, -0.120880126953125, -0.09979248046875, -0.078704833984375, -0.0576171875, -0.036529541015625, -0.01544189453125, 0.005645751953125, 0.0267333984375, 0.047821044921875, 0.06890869140625, 0.089996337890625, 0.111083984375, 0.132171630859375, 0.15325927734375, 0.174346923828125, 0.1954345703125, 0.216522216796875, 0.23760986328125, 0.258697509765625, 0.27978515625, 0.300872802734375, 0.32196044921875, 0.343048095703125, 0.3641357421875, 0.385223388671875, 0.40631103515625, 0.427398681640625, 0.448486328125, 0.469573974609375, 0.49066162109375, 0.511749267578125, 0.5328369140625, 0.553924560546875, 0.57501220703125, 0.596099853515625, 0.6171875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 8.0, 6.0, 15.0, 7.0, 9.0, 16.0, 18.0, 30.0, 22.0, 33.0, 36.0, 36.0, 41.0, 31.0, 40.0, 52.0, 50.0, 49.0, 41.0, 48.0, 56.0, 40.0, 49.0, 36.0, 35.0, 25.0, 28.0, 17.0, 23.0, 22.0, 14.0, 5.0, 10.0, 11.0, 2.0, 5.0, 4.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0], "bins": [-0.9169921875, -0.8912353515625, -0.865478515625, -0.8397216796875, -0.81396484375, -0.7882080078125, -0.762451171875, -0.7366943359375, -0.7109375, -0.6851806640625, -0.659423828125, -0.6336669921875, -0.60791015625, -0.5821533203125, -0.556396484375, -0.5306396484375, -0.5048828125, -0.4791259765625, -0.453369140625, -0.4276123046875, -0.40185546875, -0.3760986328125, -0.350341796875, -0.3245849609375, -0.298828125, -0.2730712890625, -0.247314453125, -0.2215576171875, -0.19580078125, -0.1700439453125, -0.144287109375, -0.1185302734375, -0.0927734375, -0.0670166015625, -0.041259765625, -0.0155029296875, 0.01025390625, 0.0360107421875, 0.061767578125, 0.0875244140625, 0.11328125, 0.1390380859375, 0.164794921875, 0.1905517578125, 0.21630859375, 0.2420654296875, 0.267822265625, 0.2935791015625, 0.3193359375, 0.3450927734375, 0.370849609375, 0.3966064453125, 0.42236328125, 0.4481201171875, 0.473876953125, 0.4996337890625, 0.525390625, 0.5511474609375, 0.576904296875, 0.6026611328125, 0.62841796875, 0.6541748046875, 0.679931640625, 0.7056884765625, 0.7314453125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 12.0, 20.0, 29.0, 60.0, 105.0, 225.0, 539.0, 1912.0, 10411.0, 254766.0, 756896.0, 19469.0, 2700.0, 782.0, 287.0, 139.0, 72.0, 35.0, 23.0, 16.0, 9.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.552734375, -0.538238525390625, -0.52374267578125, -0.509246826171875, -0.4947509765625, -0.480255126953125, -0.46575927734375, -0.451263427734375, -0.436767578125, -0.422271728515625, -0.40777587890625, -0.393280029296875, -0.3787841796875, -0.364288330078125, -0.34979248046875, -0.335296630859375, -0.32080078125, -0.306304931640625, -0.29180908203125, -0.277313232421875, -0.2628173828125, -0.248321533203125, -0.23382568359375, -0.219329833984375, -0.204833984375, -0.190338134765625, -0.17584228515625, -0.161346435546875, -0.1468505859375, -0.132354736328125, -0.11785888671875, -0.103363037109375, -0.0888671875, -0.074371337890625, -0.05987548828125, -0.045379638671875, -0.0308837890625, -0.016387939453125, -0.00189208984375, 0.012603759765625, 0.027099609375, 0.041595458984375, 0.05609130859375, 0.070587158203125, 0.0850830078125, 0.099578857421875, 0.11407470703125, 0.128570556640625, 0.14306640625, 0.157562255859375, 0.17205810546875, 0.186553955078125, 0.2010498046875, 0.215545654296875, 0.23004150390625, 0.244537353515625, 0.259033203125, 0.273529052734375, 0.28802490234375, 0.302520751953125, 0.3170166015625, 0.331512451171875, 0.34600830078125, 0.360504150390625, 0.375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 3.0, 4.0, 5.0, 8.0, 8.0, 12.0, 19.0, 41.0, 46.0, 85.0, 123.0, 160.0, 159.0, 110.0, 73.0, 38.0, 23.0, 13.0, 16.0, 13.0, 11.0, 3.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.916854858398438e-05, -8.595548570156097e-05, -8.274242281913757e-05, -7.952935993671417e-05, -7.631629705429077e-05, -7.310323417186737e-05, -6.989017128944397e-05, -6.667710840702057e-05, -6.346404552459717e-05, -6.025098264217377e-05, -5.7037919759750366e-05, -5.3824856877326965e-05, -5.0611793994903564e-05, -4.7398731112480164e-05, -4.418566823005676e-05, -4.097260534763336e-05, -3.775954246520996e-05, -3.454647958278656e-05, -3.133341670036316e-05, -2.8120353817939758e-05, -2.4907290935516357e-05, -2.1694228053092957e-05, -1.8481165170669556e-05, -1.5268102288246155e-05, -1.2055039405822754e-05, -8.841976523399353e-06, -5.628913640975952e-06, -2.4158507585525513e-06, 7.972121238708496e-07, 4.0102750062942505e-06, 7.223337888717651e-06, 1.0436400771141052e-05, 1.3649463653564453e-05, 1.6862526535987854e-05, 2.0075589418411255e-05, 2.3288652300834656e-05, 2.6501715183258057e-05, 2.9714778065681458e-05, 3.292784094810486e-05, 3.614090383052826e-05, 3.935396671295166e-05, 4.256702959537506e-05, 4.578009247779846e-05, 4.899315536022186e-05, 5.2206218242645264e-05, 5.5419281125068665e-05, 5.8632344007492065e-05, 6.184540688991547e-05, 6.505846977233887e-05, 6.827153265476227e-05, 7.148459553718567e-05, 7.469765841960907e-05, 7.791072130203247e-05, 8.112378418445587e-05, 8.433684706687927e-05, 8.754990994930267e-05, 9.076297283172607e-05, 9.397603571414948e-05, 9.718909859657288e-05, 0.00010040216147899628, 0.00010361522436141968, 0.00010682828724384308, 0.00011004135012626648, 0.00011325441300868988, 0.00011646747589111328]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 9.0, 5.0, 10.0, 12.0, 12.0, 29.0, 33.0, 54.0, 65.0, 111.0, 168.0, 307.0, 599.0, 1282.0, 3448.0, 13432.0, 109987.0, 800469.0, 99558.0, 12903.0, 3304.0, 1305.0, 571.0, 307.0, 171.0, 115.0, 78.0, 57.0, 49.0, 24.0, 15.0, 13.0, 14.0, 9.0, 3.0, 5.0, 2.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.338134765625, -0.3277244567871094, -0.31731414794921875, -0.3069038391113281, -0.2964935302734375, -0.2860832214355469, -0.27567291259765625, -0.2652626037597656, -0.254852294921875, -0.24444198608398438, -0.23403167724609375, -0.22362136840820312, -0.2132110595703125, -0.20280075073242188, -0.19239044189453125, -0.18198013305664062, -0.17156982421875, -0.16115951538085938, -0.15074920654296875, -0.14033889770507812, -0.1299285888671875, -0.11951828002929688, -0.10910797119140625, -0.09869766235351562, -0.088287353515625, -0.07787704467773438, -0.06746673583984375, -0.057056427001953125, -0.0466461181640625, -0.036235809326171875, -0.02582550048828125, -0.015415191650390625, -0.0050048828125, 0.005405426025390625, 0.01581573486328125, 0.026226043701171875, 0.0366363525390625, 0.047046661376953125, 0.05745697021484375, 0.06786727905273438, 0.078277587890625, 0.08868789672851562, 0.09909820556640625, 0.10950851440429688, 0.1199188232421875, 0.13032913208007812, 0.14073944091796875, 0.15114974975585938, 0.16156005859375, 0.17197036743164062, 0.18238067626953125, 0.19279098510742188, 0.2032012939453125, 0.21361160278320312, 0.22402191162109375, 0.23443222045898438, 0.244842529296875, 0.2552528381347656, 0.26566314697265625, 0.2760734558105469, 0.2864837646484375, 0.2968940734863281, 0.30730438232421875, 0.3177146911621094, 0.328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 9.0, 9.0, 15.0, 13.0, 28.0, 34.0, 56.0, 55.0, 84.0, 96.0, 110.0, 123.0, 95.0, 73.0, 51.0, 45.0, 33.0, 19.0, 16.0, 7.0, 6.0, 10.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.335693359375, -0.3247032165527344, -0.31371307373046875, -0.3027229309082031, -0.2917327880859375, -0.2807426452636719, -0.26975250244140625, -0.2587623596191406, -0.247772216796875, -0.23678207397460938, -0.22579193115234375, -0.21480178833007812, -0.2038116455078125, -0.19282150268554688, -0.18183135986328125, -0.17084121704101562, -0.15985107421875, -0.14886093139648438, -0.13787078857421875, -0.12688064575195312, -0.1158905029296875, -0.10490036010742188, -0.09391021728515625, -0.08292007446289062, -0.071929931640625, -0.060939788818359375, -0.04994964599609375, -0.038959503173828125, -0.0279693603515625, -0.016979217529296875, -0.00598907470703125, 0.005001068115234375, 0.0159912109375, 0.026981353759765625, 0.03797149658203125, 0.048961639404296875, 0.0599517822265625, 0.07094192504882812, 0.08193206787109375, 0.09292221069335938, 0.103912353515625, 0.11490249633789062, 0.12589263916015625, 0.13688278198242188, 0.1478729248046875, 0.15886306762695312, 0.16985321044921875, 0.18084335327148438, 0.19183349609375, 0.20282363891601562, 0.21381378173828125, 0.22480392456054688, 0.2357940673828125, 0.24678421020507812, 0.25777435302734375, 0.2687644958496094, 0.279754638671875, 0.2907447814941406, 0.30173492431640625, 0.3127250671386719, 0.3237152099609375, 0.3347053527832031, 0.34569549560546875, 0.3566856384277344, 0.36767578125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 9.0, 45.0, 243.0, 542.0, 132.0, 21.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.13543701171875, -11.639826774597168, -11.144216537475586, -10.648606300354004, -10.152996063232422, -9.657386779785156, -9.161776542663574, -8.666166305541992, -8.17055606842041, -7.674945831298828, -7.179335594177246, -6.683725833892822, -6.18811559677124, -5.692505359649658, -5.196895599365234, -4.701285362243652, -4.20567512512207, -3.7100648880004883, -3.2144548892974854, -2.7188448905944824, -2.2232346534729004, -1.7276244163513184, -1.2320144176483154, -0.7364044189453125, -0.24079418182373047, 0.254815936088562, 0.7504260540008545, 1.246036171913147, 1.7416462898254395, 2.2372565269470215, 2.7328665256500244, 3.2284765243530273, 3.7240867614746094, 4.219696998596191, 4.715307235717773, 5.210916996002197, 5.706527233123779, 6.202137470245361, 6.697747230529785, 7.193357467651367, 7.688967704772949, 8.184577941894531, 8.680188179016113, 9.175798416137695, 9.671407699584961, 10.16701889038086, 10.662628173828125, 11.158238410949707, 11.653848648071289, 12.149458885192871, 12.645069122314453, 13.140679359436035, 13.636289596557617, 14.131898880004883, 14.627509117126465, 15.123119354248047, 15.618729591369629, 16.11433982849121, 16.609949111938477, 17.105560302734375, 17.60116958618164, 18.09678077697754, 18.592390060424805, 19.088001251220703, 19.58361053466797]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 9.0, 13.0, 21.0, 21.0, 30.0, 42.0, 52.0, 49.0, 68.0, 70.0, 83.0, 79.0, 96.0, 71.0, 64.0, 51.0, 43.0, 35.0, 21.0, 34.0, 16.0, 11.0, 7.0, 6.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.211576461791992, -5.023486137390137, -4.835395812988281, -4.647305488586426, -4.45921516418457, -4.271124839782715, -4.083034515380859, -3.894944190979004, -3.7068538665771484, -3.518763542175293, -3.3306732177734375, -3.142582893371582, -2.9544925689697266, -2.766402244567871, -2.5783119201660156, -2.39022159576416, -2.2021310329437256, -2.01404070854187, -1.8259503841400146, -1.6378600597381592, -1.4497697353363037, -1.2616794109344482, -1.0735889673233032, -0.8854986429214478, -0.6974083185195923, -0.5093179941177368, -0.32122763991355896, -0.1331372857093811, 0.054953038692474365, 0.24304336309432983, 0.4311337471008301, 0.6192240715026855, 0.807314395904541, 0.9954047203063965, 1.183495044708252, 1.3715853691101074, 1.559675693511963, 1.7477660179138184, 1.9358564615249634, 2.1239466667175293, 2.3120369911193848, 2.5001273155212402, 2.6882176399230957, 2.876307964324951, 3.0643982887268066, 3.252488613128662, 3.4405789375305176, 3.628669261932373, 3.8167598247528076, 4.004850387573242, 4.192940711975098, 4.381031036376953, 4.569121360778809, 4.757211685180664, 4.9453020095825195, 5.133392333984375, 5.3214826583862305, 5.509572982788086, 5.697663307189941, 5.885753631591797, 6.073843955993652, 6.261934280395508, 6.450024604797363, 6.638114929199219, 6.826205253601074]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 7.0, 3.0, 3.0, 12.0, 9.0, 24.0, 24.0, 42.0, 57.0, 102.0, 207.0, 450.0, 1283.0, 4574.0, 25020.0, 1090526.0, 3019244.0, 43331.0, 6542.0, 1808.0, 587.0, 219.0, 95.0, 36.0, 23.0, 12.0, 9.0, 5.0, 6.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.72216796875, -0.7032127380371094, -0.6842575073242188, -0.6653022766113281, -0.6463470458984375, -0.6273918151855469, -0.6084365844726562, -0.5894813537597656, -0.570526123046875, -0.5515708923339844, -0.5326156616210938, -0.5136604309082031, -0.4947052001953125, -0.4757499694824219, -0.45679473876953125, -0.4378395080566406, -0.41888427734375, -0.3999290466308594, -0.38097381591796875, -0.3620185852050781, -0.3430633544921875, -0.3241081237792969, -0.30515289306640625, -0.2861976623535156, -0.267242431640625, -0.24828720092773438, -0.22933197021484375, -0.21037673950195312, -0.1914215087890625, -0.17246627807617188, -0.15351104736328125, -0.13455581665039062, -0.1156005859375, -0.09664535522460938, -0.07769012451171875, -0.058734893798828125, -0.0397796630859375, -0.020824432373046875, -0.00186920166015625, 0.017086029052734375, 0.036041259765625, 0.054996490478515625, 0.07395172119140625, 0.09290695190429688, 0.1118621826171875, 0.13081741333007812, 0.14977264404296875, 0.16872787475585938, 0.18768310546875, 0.20663833618164062, 0.22559356689453125, 0.24454879760742188, 0.2635040283203125, 0.2824592590332031, 0.30141448974609375, 0.3203697204589844, 0.339324951171875, 0.3582801818847656, 0.37723541259765625, 0.3961906433105469, 0.4151458740234375, 0.4341011047363281, 0.45305633544921875, 0.4720115661621094, 0.490966796875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 12.0, 18.0, 47.0, 121.0, 217.0, 227.0, 180.0, 111.0, 54.0, 13.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90625, -0.8825912475585938, -0.8589324951171875, -0.8352737426757812, -0.811614990234375, -0.7879562377929688, -0.7642974853515625, -0.7406387329101562, -0.71697998046875, -0.6933212280273438, -0.6696624755859375, -0.6460037231445312, -0.622344970703125, -0.5986862182617188, -0.5750274658203125, -0.5513687133789062, -0.5277099609375, -0.5040512084960938, -0.4803924560546875, -0.45673370361328125, -0.433074951171875, -0.40941619873046875, -0.3857574462890625, -0.36209869384765625, -0.33843994140625, -0.31478118896484375, -0.2911224365234375, -0.26746368408203125, -0.243804931640625, -0.22014617919921875, -0.1964874267578125, -0.17282867431640625, -0.149169921875, -0.12551116943359375, -0.1018524169921875, -0.07819366455078125, -0.054534912109375, -0.03087615966796875, -0.0072174072265625, 0.01644134521484375, 0.04010009765625, 0.06375885009765625, 0.0874176025390625, 0.11107635498046875, 0.134735107421875, 0.15839385986328125, 0.1820526123046875, 0.20571136474609375, 0.2293701171875, 0.25302886962890625, 0.2766876220703125, 0.30034637451171875, 0.324005126953125, 0.34766387939453125, 0.3713226318359375, 0.39498138427734375, 0.41864013671875, 0.44229888916015625, 0.4659576416015625, 0.48961639404296875, 0.513275146484375, 0.5369338989257812, 0.5605926513671875, 0.5842514038085938, 0.60791015625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 0.0, 5.0, 8.0, 9.0, 22.0, 22.0, 55.0, 71.0, 163.0, 232.0, 458.0, 829.0, 1837.0, 4070.0, 11908.0, 47521.0, 534357.0, 3397950.0, 156927.0, 25005.0, 7437.0, 2750.0, 1329.0, 609.0, 319.0, 164.0, 112.0, 50.0, 25.0, 17.0, 8.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47412109375, -0.4598846435546875, -0.445648193359375, -0.4314117431640625, -0.41717529296875, -0.4029388427734375, -0.388702392578125, -0.3744659423828125, -0.3602294921875, -0.3459930419921875, -0.331756591796875, -0.3175201416015625, -0.30328369140625, -0.2890472412109375, -0.274810791015625, -0.2605743408203125, -0.246337890625, -0.2321014404296875, -0.217864990234375, -0.2036285400390625, -0.18939208984375, -0.1751556396484375, -0.160919189453125, -0.1466827392578125, -0.1324462890625, -0.1182098388671875, -0.103973388671875, -0.0897369384765625, -0.07550048828125, -0.0612640380859375, -0.047027587890625, -0.0327911376953125, -0.0185546875, -0.0043182373046875, 0.009918212890625, 0.0241546630859375, 0.03839111328125, 0.0526275634765625, 0.066864013671875, 0.0811004638671875, 0.0953369140625, 0.1095733642578125, 0.123809814453125, 0.1380462646484375, 0.15228271484375, 0.1665191650390625, 0.180755615234375, 0.1949920654296875, 0.209228515625, 0.2234649658203125, 0.237701416015625, 0.2519378662109375, 0.26617431640625, 0.2804107666015625, 0.294647216796875, 0.3088836669921875, 0.3231201171875, 0.3373565673828125, 0.351593017578125, 0.3658294677734375, 0.38006591796875, 0.3943023681640625, 0.408538818359375, 0.4227752685546875, 0.43701171875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 8.0, 11.0, 15.0, 18.0, 27.0, 43.0, 101.0, 135.0, 358.0, 765.0, 1180.0, 721.0, 324.0, 142.0, 87.0, 35.0, 21.0, 14.0, 13.0, 14.0, 5.0, 2.0, 5.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.578125, -0.56134033203125, -0.5445556640625, -0.52777099609375, -0.510986328125, -0.49420166015625, -0.4774169921875, -0.46063232421875, -0.44384765625, -0.42706298828125, -0.4102783203125, -0.39349365234375, -0.376708984375, -0.35992431640625, -0.3431396484375, -0.32635498046875, -0.3095703125, -0.29278564453125, -0.2760009765625, -0.25921630859375, -0.242431640625, -0.22564697265625, -0.2088623046875, -0.19207763671875, -0.17529296875, -0.15850830078125, -0.1417236328125, -0.12493896484375, -0.108154296875, -0.09136962890625, -0.0745849609375, -0.05780029296875, -0.041015625, -0.02423095703125, -0.0074462890625, 0.00933837890625, 0.026123046875, 0.04290771484375, 0.0596923828125, 0.07647705078125, 0.09326171875, 0.11004638671875, 0.1268310546875, 0.14361572265625, 0.160400390625, 0.17718505859375, 0.1939697265625, 0.21075439453125, 0.2275390625, 0.24432373046875, 0.2611083984375, 0.27789306640625, 0.294677734375, 0.31146240234375, 0.3282470703125, 0.34503173828125, 0.36181640625, 0.37860107421875, 0.3953857421875, 0.41217041015625, 0.428955078125, 0.44573974609375, 0.4625244140625, 0.47930908203125, 0.49609375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 1.0, 8.0, 6.0, 7.0, 19.0, 46.0, 120.0, 266.0, 327.0, 138.0, 39.0, 12.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.333754539489746, -9.119314193725586, -8.90487289428711, -8.69043254852295, -8.475991249084473, -8.261550903320312, -8.047109603881836, -7.832668781280518, -7.618227958679199, -7.403787136077881, -7.1893463134765625, -6.974905490875244, -6.760464668273926, -6.546023845672607, -6.331583023071289, -6.117142200469971, -5.902701377868652, -5.688260555267334, -5.473819732666016, -5.259378910064697, -5.044938087463379, -4.8304972648620605, -4.616056442260742, -4.401615619659424, -4.187175273895264, -3.9727344512939453, -3.758293628692627, -3.5438528060913086, -3.3294119834899902, -3.114971160888672, -2.9005303382873535, -2.686089515686035, -2.471648693084717, -2.2572078704833984, -2.04276704788208, -1.8283262252807617, -1.6138854026794434, -1.3994446992874146, -1.1850038766860962, -0.9705630540847778, -0.7561222314834595, -0.5416814088821411, -0.32724061608314514, -0.11279982328414917, 0.10164099931716919, 0.3160817623138428, 0.5305225849151611, 0.7449634075164795, 0.9594042301177979, 1.1738450527191162, 1.3882858753204346, 1.602726697921753, 1.8171675205230713, 2.0316081047058105, 2.246048927307129, 2.4604897499084473, 2.6749305725097656, 2.889371395111084, 3.1038122177124023, 3.3182530403137207, 3.532693862915039, 3.7471346855163574, 3.961575508117676, 4.176016330718994, 4.3904571533203125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 5.0, 12.0, 9.0, 18.0, 36.0, 44.0, 54.0, 71.0, 76.0, 81.0, 96.0, 104.0, 77.0, 64.0, 66.0, 45.0, 32.0, 31.0, 25.0, 19.0, 11.0, 5.0, 7.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4142866134643555, -2.293680191040039, -2.1730735301971436, -2.052467107772827, -1.9318605661392212, -1.8112540245056152, -1.6906476020812988, -1.5700410604476929, -1.449434518814087, -1.328827977180481, -1.2082215547561646, -1.0876150131225586, -0.9670084714889526, -0.8464019894599915, -0.7257955074310303, -0.6051889657974243, -0.4845825433731079, -0.36397603154182434, -0.24336953461170197, -0.12276303768157959, -0.0021565258502960205, 0.11844998598098755, 0.23905646800994873, 0.3596630096435547, 0.48026949167251587, 0.600875973701477, 0.721482515335083, 0.8420889973640442, 0.9626954793930054, 1.0833020210266113, 1.2039084434509277, 1.3245151042938232, 1.4451215267181396, 1.5657280683517456, 1.686334490776062, 1.806941032409668, 1.927547574043274, 2.04815411567688, 2.1687605381011963, 2.289367198944092, 2.409973621368408, 2.5305800437927246, 2.65118670463562, 2.7717931270599365, 2.892399549484253, 3.0130062103271484, 3.133612632751465, 3.2542190551757812, 3.3748254776000977, 3.495431900024414, 3.6160385608673096, 3.736644983291626, 3.8572514057159424, 3.977858066558838, 4.098464488983154, 4.219070911407471, 4.339677810668945, 4.460284233093262, 4.580890655517578, 4.7014970779418945, 4.822103977203369, 4.9427103996276855, 5.063316822052002, 5.183923244476318, 5.304529666900635]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 5.0, 4.0, 9.0, 9.0, 5.0, 10.0, 9.0, 20.0, 37.0, 47.0, 71.0, 124.0, 217.0, 367.0, 637.0, 1303.0, 2444.0, 6012.0, 14778.0, 40205.0, 122495.0, 379995.0, 323640.0, 100551.0, 33176.0, 12448.0, 5114.0, 2214.0, 1122.0, 592.0, 344.0, 203.0, 109.0, 79.0, 51.0, 33.0, 10.0, 24.0, 15.0, 8.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3388671875, -0.3285713195800781, -0.31827545166015625, -0.3079795837402344, -0.2976837158203125, -0.2873878479003906, -0.27709197998046875, -0.2667961120605469, -0.256500244140625, -0.24620437622070312, -0.23590850830078125, -0.22561264038085938, -0.2153167724609375, -0.20502090454101562, -0.19472503662109375, -0.18442916870117188, -0.17413330078125, -0.16383743286132812, -0.15354156494140625, -0.14324569702148438, -0.1329498291015625, -0.12265396118164062, -0.11235809326171875, -0.10206222534179688, -0.091766357421875, -0.08147048950195312, -0.07117462158203125, -0.060878753662109375, -0.0505828857421875, -0.040287017822265625, -0.02999114990234375, -0.019695281982421875, -0.0093994140625, 0.000896453857421875, 0.01119232177734375, 0.021488189697265625, 0.0317840576171875, 0.042079925537109375, 0.05237579345703125, 0.06267166137695312, 0.072967529296875, 0.08326339721679688, 0.09355926513671875, 0.10385513305664062, 0.1141510009765625, 0.12444686889648438, 0.13474273681640625, 0.14503860473632812, 0.15533447265625, 0.16563034057617188, 0.17592620849609375, 0.18622207641601562, 0.1965179443359375, 0.20681381225585938, 0.21710968017578125, 0.22740554809570312, 0.237701416015625, 0.24799728393554688, 0.25829315185546875, 0.2685890197753906, 0.2788848876953125, 0.2891807556152344, 0.29947662353515625, 0.3097724914550781, 0.320068359375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 11.0, 7.0, 10.0, 19.0, 31.0, 41.0, 54.0, 66.0, 71.0, 80.0, 88.0, 84.0, 83.0, 82.0, 60.0, 65.0, 47.0, 34.0, 29.0, 16.0, 15.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1973876953125, -0.1881427764892578, -0.17889785766601562, -0.16965293884277344, -0.16040802001953125, -0.15116310119628906, -0.14191818237304688, -0.1326732635498047, -0.1234283447265625, -0.11418342590332031, -0.10493850708007812, -0.09569358825683594, -0.08644866943359375, -0.07720375061035156, -0.06795883178710938, -0.05871391296386719, -0.049468994140625, -0.04022407531738281, -0.030979156494140625, -0.021734237670898438, -0.01248931884765625, -0.0032444000244140625, 0.006000518798828125, 0.015245437622070312, 0.0244903564453125, 0.03373527526855469, 0.042980194091796875, 0.05222511291503906, 0.06147003173828125, 0.07071495056152344, 0.07995986938476562, 0.08920478820800781, 0.09844970703125, 0.10769462585449219, 0.11693954467773438, 0.12618446350097656, 0.13542938232421875, 0.14467430114746094, 0.15391921997070312, 0.1631641387939453, 0.1724090576171875, 0.1816539764404297, 0.19089889526367188, 0.20014381408691406, 0.20938873291015625, 0.21863365173339844, 0.22787857055664062, 0.2371234893798828, 0.246368408203125, 0.2556133270263672, 0.2648582458496094, 0.27410316467285156, 0.28334808349609375, 0.29259300231933594, 0.3018379211425781, 0.3110828399658203, 0.3203277587890625, 0.3295726776123047, 0.3388175964355469, 0.34806251525878906, 0.35730743408203125, 0.36655235290527344, 0.3757972717285156, 0.3850421905517578, 0.394287109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 9.0, 13.0, 24.0, 36.0, 58.0, 93.0, 130.0, 244.0, 444.0, 889.0, 2071.0, 7003.0, 41108.0, 597077.0, 359502.0, 30456.0, 5747.0, 1848.0, 765.0, 443.0, 216.0, 150.0, 77.0, 47.0, 28.0, 15.0, 18.0, 11.0, 7.0, 5.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8544921875, -0.8313522338867188, -0.8082122802734375, -0.7850723266601562, -0.761932373046875, -0.7387924194335938, -0.7156524658203125, -0.6925125122070312, -0.66937255859375, -0.6462326049804688, -0.6230926513671875, -0.5999526977539062, -0.576812744140625, -0.5536727905273438, -0.5305328369140625, -0.5073928833007812, -0.4842529296875, -0.46111297607421875, -0.4379730224609375, -0.41483306884765625, -0.391693115234375, -0.36855316162109375, -0.3454132080078125, -0.32227325439453125, -0.29913330078125, -0.27599334716796875, -0.2528533935546875, -0.22971343994140625, -0.206573486328125, -0.18343353271484375, -0.1602935791015625, -0.13715362548828125, -0.114013671875, -0.09087371826171875, -0.0677337646484375, -0.04459381103515625, -0.021453857421875, 0.00168609619140625, 0.0248260498046875, 0.04796600341796875, 0.07110595703125, 0.09424591064453125, 0.1173858642578125, 0.14052581787109375, 0.163665771484375, 0.18680572509765625, 0.2099456787109375, 0.23308563232421875, 0.2562255859375, 0.27936553955078125, 0.3025054931640625, 0.32564544677734375, 0.348785400390625, 0.37192535400390625, 0.3950653076171875, 0.41820526123046875, 0.44134521484375, 0.46448516845703125, 0.4876251220703125, 0.5107650756835938, 0.533905029296875, 0.5570449829101562, 0.5801849365234375, 0.6033248901367188, 0.62646484375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 6.0, 1.0, 7.0, 6.0, 12.0, 17.0, 18.0, 29.0, 25.0, 31.0, 36.0, 41.0, 46.0, 51.0, 62.0, 64.0, 62.0, 55.0, 60.0, 44.0, 46.0, 38.0, 44.0, 41.0, 35.0, 30.0, 14.0, 12.0, 11.0, 18.0, 11.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.78466796875, -0.760650634765625, -0.73663330078125, -0.712615966796875, -0.6885986328125, -0.664581298828125, -0.64056396484375, -0.616546630859375, -0.592529296875, -0.568511962890625, -0.54449462890625, -0.520477294921875, -0.4964599609375, -0.472442626953125, -0.44842529296875, -0.424407958984375, -0.400390625, -0.376373291015625, -0.35235595703125, -0.328338623046875, -0.3043212890625, -0.280303955078125, -0.25628662109375, -0.232269287109375, -0.208251953125, -0.184234619140625, -0.16021728515625, -0.136199951171875, -0.1121826171875, -0.088165283203125, -0.06414794921875, -0.040130615234375, -0.01611328125, 0.007904052734375, 0.03192138671875, 0.055938720703125, 0.0799560546875, 0.103973388671875, 0.12799072265625, 0.152008056640625, 0.176025390625, 0.200042724609375, 0.22406005859375, 0.248077392578125, 0.2720947265625, 0.296112060546875, 0.32012939453125, 0.344146728515625, 0.3681640625, 0.392181396484375, 0.41619873046875, 0.440216064453125, 0.4642333984375, 0.488250732421875, 0.51226806640625, 0.536285400390625, 0.560302734375, 0.584320068359375, 0.60833740234375, 0.632354736328125, 0.6563720703125, 0.680389404296875, 0.70440673828125, 0.728424072265625, 0.75244140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 8.0, 5.0, 12.0, 14.0, 14.0, 40.0, 72.0, 127.0, 344.0, 1425.0, 16057.0, 1002699.0, 25345.0, 1691.0, 372.0, 148.0, 57.0, 37.0, 17.0, 16.0, 10.0, 6.0, 8.0, 4.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7431640625, -0.7216567993164062, -0.7001495361328125, -0.6786422729492188, -0.657135009765625, -0.6356277465820312, -0.6141204833984375, -0.5926132202148438, -0.57110595703125, -0.5495986938476562, -0.5280914306640625, -0.5065841674804688, -0.485076904296875, -0.46356964111328125, -0.4420623779296875, -0.42055511474609375, -0.3990478515625, -0.37754058837890625, -0.3560333251953125, -0.33452606201171875, -0.313018798828125, -0.29151153564453125, -0.2700042724609375, -0.24849700927734375, -0.22698974609375, -0.20548248291015625, -0.1839752197265625, -0.16246795654296875, -0.140960693359375, -0.11945343017578125, -0.0979461669921875, -0.07643890380859375, -0.054931640625, -0.03342437744140625, -0.0119171142578125, 0.00959014892578125, 0.031097412109375, 0.05260467529296875, 0.0741119384765625, 0.09561920166015625, 0.11712646484375, 0.13863372802734375, 0.1601409912109375, 0.18164825439453125, 0.203155517578125, 0.22466278076171875, 0.2461700439453125, 0.26767730712890625, 0.2891845703125, 0.31069183349609375, 0.3321990966796875, 0.35370635986328125, 0.375213623046875, 0.39672088623046875, 0.4182281494140625, 0.43973541259765625, 0.46124267578125, 0.48274993896484375, 0.5042572021484375, 0.5257644653320312, 0.547271728515625, 0.5687789916992188, 0.5902862548828125, 0.6117935180664062, 0.63330078125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 4.0, 10.0, 4.0, 9.0, 7.0, 14.0, 23.0, 36.0, 42.0, 78.0, 120.0, 184.0, 151.0, 104.0, 67.0, 41.0, 24.0, 9.0, 16.0, 8.0, 13.0, 6.0, 3.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.66787338256836e-05, -9.354948997497559e-05, -9.042024612426758e-05, -8.729100227355957e-05, -8.416175842285156e-05, -8.103251457214355e-05, -7.790327072143555e-05, -7.477402687072754e-05, -7.164478302001953e-05, -6.851553916931152e-05, -6.538629531860352e-05, -6.225705146789551e-05, -5.91278076171875e-05, -5.599856376647949e-05, -5.2869319915771484e-05, -4.9740076065063477e-05, -4.661083221435547e-05, -4.348158836364746e-05, -4.035234451293945e-05, -3.7223100662231445e-05, -3.409385681152344e-05, -3.096461296081543e-05, -2.7835369110107422e-05, -2.4706125259399414e-05, -2.1576881408691406e-05, -1.84476375579834e-05, -1.531839370727539e-05, -1.2189149856567383e-05, -9.059906005859375e-06, -5.930662155151367e-06, -2.8014183044433594e-06, 3.2782554626464844e-07, 3.4570693969726562e-06, 6.586313247680664e-06, 9.715557098388672e-06, 1.284480094909668e-05, 1.5974044799804688e-05, 1.9103288650512695e-05, 2.2232532501220703e-05, 2.536177635192871e-05, 2.849102020263672e-05, 3.1620264053344727e-05, 3.4749507904052734e-05, 3.787875175476074e-05, 4.100799560546875e-05, 4.413723945617676e-05, 4.7266483306884766e-05, 5.0395727157592773e-05, 5.352497100830078e-05, 5.665421485900879e-05, 5.97834587097168e-05, 6.29127025604248e-05, 6.604194641113281e-05, 6.917119026184082e-05, 7.230043411254883e-05, 7.542967796325684e-05, 7.855892181396484e-05, 8.168816566467285e-05, 8.481740951538086e-05, 8.794665336608887e-05, 9.107589721679688e-05, 9.420514106750488e-05, 9.733438491821289e-05, 0.0001004636287689209, 0.0001035928726196289]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 6.0, 17.0, 5.0, 27.0, 21.0, 38.0, 55.0, 119.0, 182.0, 342.0, 730.0, 1974.0, 8007.0, 90528.0, 874021.0, 62800.0, 6481.0, 1793.0, 681.0, 294.0, 156.0, 85.0, 54.0, 40.0, 28.0, 13.0, 15.0, 12.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.349365234375, -0.339508056640625, -0.32965087890625, -0.319793701171875, -0.3099365234375, -0.300079345703125, -0.29022216796875, -0.280364990234375, -0.2705078125, -0.260650634765625, -0.25079345703125, -0.240936279296875, -0.2310791015625, -0.221221923828125, -0.21136474609375, -0.201507568359375, -0.191650390625, -0.181793212890625, -0.17193603515625, -0.162078857421875, -0.1522216796875, -0.142364501953125, -0.13250732421875, -0.122650146484375, -0.11279296875, -0.102935791015625, -0.09307861328125, -0.083221435546875, -0.0733642578125, -0.063507080078125, -0.05364990234375, -0.043792724609375, -0.033935546875, -0.024078369140625, -0.01422119140625, -0.004364013671875, 0.0054931640625, 0.015350341796875, 0.02520751953125, 0.035064697265625, 0.044921875, 0.054779052734375, 0.06463623046875, 0.074493408203125, 0.0843505859375, 0.094207763671875, 0.10406494140625, 0.113922119140625, 0.123779296875, 0.133636474609375, 0.14349365234375, 0.153350830078125, 0.1632080078125, 0.173065185546875, 0.18292236328125, 0.192779541015625, 0.20263671875, 0.212493896484375, 0.22235107421875, 0.232208251953125, 0.2420654296875, 0.251922607421875, 0.26177978515625, 0.271636962890625, 0.281494140625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 18.0, 37.0, 55.0, 81.0, 110.0, 140.0, 152.0, 134.0, 109.0, 60.0, 39.0, 18.0, 15.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3466796875, -0.33713531494140625, -0.3275909423828125, -0.31804656982421875, -0.308502197265625, -0.29895782470703125, -0.2894134521484375, -0.27986907958984375, -0.27032470703125, -0.26078033447265625, -0.2512359619140625, -0.24169158935546875, -0.232147216796875, -0.22260284423828125, -0.2130584716796875, -0.20351409912109375, -0.1939697265625, -0.18442535400390625, -0.1748809814453125, -0.16533660888671875, -0.155792236328125, -0.14624786376953125, -0.1367034912109375, -0.12715911865234375, -0.11761474609375, -0.10807037353515625, -0.0985260009765625, -0.08898162841796875, -0.079437255859375, -0.06989288330078125, -0.0603485107421875, -0.05080413818359375, -0.041259765625, -0.03171539306640625, -0.0221710205078125, -0.01262664794921875, -0.003082275390625, 0.00646209716796875, 0.0160064697265625, 0.02555084228515625, 0.03509521484375, 0.04463958740234375, 0.0541839599609375, 0.06372833251953125, 0.073272705078125, 0.08281707763671875, 0.0923614501953125, 0.10190582275390625, 0.1114501953125, 0.12099456787109375, 0.1305389404296875, 0.14008331298828125, 0.149627685546875, 0.15917205810546875, 0.1687164306640625, 0.17826080322265625, 0.18780517578125, 0.19734954833984375, 0.2068939208984375, 0.21643829345703125, 0.225982666015625, 0.23552703857421875, 0.2450714111328125, 0.25461578369140625, 0.26416015625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 6.0, 3.0, 1.0, 3.0, 6.0, 15.0, 28.0, 94.0, 285.0, 355.0, 154.0, 42.0, 8.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.229070663452148, -8.975621223449707, -8.722171783447266, -8.46872329711914, -8.2152738571167, -7.961824417114258, -7.708375453948975, -7.454926490783691, -7.20147705078125, -6.948027610778809, -6.694578647613525, -6.441129684448242, -6.187680244445801, -5.934230804443359, -5.680781841278076, -5.427332878112793, -5.173883438110352, -4.92043399810791, -4.666985034942627, -4.413536071777344, -4.160086631774902, -3.90663743019104, -3.6531882286071777, -3.3997390270233154, -3.146289825439453, -2.892840623855591, -2.6393914222717285, -2.385942220687866, -2.132493019104004, -1.8790438175201416, -1.6255946159362793, -1.372145414352417, -1.118697166442871, -0.8652479648590088, -0.6117987632751465, -0.3583495616912842, -0.10490036010742188, 0.14854884147644043, 0.40199804306030273, 0.655447244644165, 0.9088964462280273, 1.1623456478118896, 1.415794849395752, 1.6692440509796143, 1.9226932525634766, 2.176142454147339, 2.429591655731201, 2.6830408573150635, 2.936490058898926, 3.189939260482788, 3.4433884620666504, 3.6968376636505127, 3.950286865234375, 4.203736305236816, 4.4571852684021, 4.710634231567383, 4.964083671569824, 5.217533111572266, 5.470982074737549, 5.724431037902832, 5.977880477905273, 6.231329917907715, 6.484778881072998, 6.738227844238281, 6.991677284240723]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 6.0, 13.0, 19.0, 33.0, 28.0, 47.0, 49.0, 71.0, 81.0, 95.0, 112.0, 93.0, 66.0, 73.0, 55.0, 41.0, 41.0, 22.0, 19.0, 15.0, 15.0, 2.0, 1.0, 6.0, 1.0, 1.0, 2.0], "bins": [-7.168698310852051, -7.0177226066589355, -6.866746425628662, -6.715770721435547, -6.564794540405273, -6.413818836212158, -6.262842655181885, -6.1118669509887695, -5.960890769958496, -5.809915065765381, -5.658938884735107, -5.507963180541992, -5.356986999511719, -5.2060112953186035, -5.05503511428833, -4.904059410095215, -4.753083229064941, -4.602107524871826, -4.451131343841553, -4.3001556396484375, -4.149179458618164, -3.9982035160064697, -3.8472275733947754, -3.69625186920166, -3.545276165008545, -3.3943002223968506, -3.2433242797851562, -3.092348337173462, -2.9413723945617676, -2.7903964519500732, -2.639420509338379, -2.4884448051452637, -2.3374688625335693, -2.186492919921875, -2.0355169773101807, -1.8845410346984863, -1.733565092086792, -1.5825891494750977, -1.4316133260726929, -1.2806373834609985, -1.1296614408493042, -0.9786854982376099, -0.8277095556259155, -0.676733672618866, -0.5257577300071716, -0.3747817873954773, -0.22380590438842773, -0.0728299617767334, 0.07814598083496094, 0.22912190854549408, 0.3800978362560272, 0.5310737490653992, 0.6820496916770935, 0.8330256342887878, 0.9840015172958374, 1.1349774599075317, 1.285953402519226, 1.4369293451309204, 1.5879052877426147, 1.7388811111450195, 1.8898570537567139, 2.040832996368408, 2.1918089389801025, 2.342784881591797, 2.493760824203491]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 3.0, 7.0, 5.0, 19.0, 25.0, 44.0, 86.0, 144.0, 364.0, 1126.0, 3684.0, 17577.0, 204274.0, 3615151.0, 321277.0, 23278.0, 5004.0, 1471.0, 434.0, 165.0, 57.0, 44.0, 12.0, 9.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432373046875, -0.4190940856933594, -0.40581512451171875, -0.3925361633300781, -0.3792572021484375, -0.3659782409667969, -0.35269927978515625, -0.3394203186035156, -0.326141357421875, -0.3128623962402344, -0.29958343505859375, -0.2863044738769531, -0.2730255126953125, -0.2597465515136719, -0.24646759033203125, -0.23318862915039062, -0.21990966796875, -0.20663070678710938, -0.19335174560546875, -0.18007278442382812, -0.1667938232421875, -0.15351486206054688, -0.14023590087890625, -0.12695693969726562, -0.113677978515625, -0.10039901733398438, -0.08712005615234375, -0.07384109497070312, -0.0605621337890625, -0.047283172607421875, -0.03400421142578125, -0.020725250244140625, -0.0074462890625, 0.005832672119140625, 0.01911163330078125, 0.032390594482421875, 0.0456695556640625, 0.058948516845703125, 0.07222747802734375, 0.08550643920898438, 0.098785400390625, 0.11206436157226562, 0.12534332275390625, 0.13862228393554688, 0.1519012451171875, 0.16518020629882812, 0.17845916748046875, 0.19173812866210938, 0.20501708984375, 0.21829605102539062, 0.23157501220703125, 0.24485397338867188, 0.2581329345703125, 0.2714118957519531, 0.28469085693359375, 0.2979698181152344, 0.311248779296875, 0.3245277404785156, 0.33780670166015625, 0.3510856628417969, 0.3643646240234375, 0.3776435852050781, 0.39092254638671875, 0.4042015075683594, 0.41748046875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 13.0, 17.0, 21.0, 40.0, 57.0, 72.0, 80.0, 102.0, 116.0, 111.0, 100.0, 87.0, 74.0, 43.0, 28.0, 21.0, 12.0, 9.0, 4.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.5390625, -0.5282325744628906, -0.5174026489257812, -0.5065727233886719, -0.4957427978515625, -0.4849128723144531, -0.47408294677734375, -0.4632530212402344, -0.452423095703125, -0.4415931701660156, -0.43076324462890625, -0.4199333190917969, -0.4091033935546875, -0.3982734680175781, -0.38744354248046875, -0.3766136169433594, -0.36578369140625, -0.3549537658691406, -0.34412384033203125, -0.3332939147949219, -0.3224639892578125, -0.3116340637207031, -0.30080413818359375, -0.2899742126464844, -0.279144287109375, -0.2683143615722656, -0.25748443603515625, -0.24665451049804688, -0.2358245849609375, -0.22499465942382812, -0.21416473388671875, -0.20333480834960938, -0.1925048828125, -0.18167495727539062, -0.17084503173828125, -0.16001510620117188, -0.1491851806640625, -0.13835525512695312, -0.12752532958984375, -0.11669540405273438, -0.105865478515625, -0.09503555297851562, -0.08420562744140625, -0.07337570190429688, -0.0625457763671875, -0.051715850830078125, -0.04088592529296875, -0.030055999755859375, -0.01922607421875, -0.008396148681640625, 0.00243377685546875, 0.013263702392578125, 0.0240936279296875, 0.034923553466796875, 0.04575347900390625, 0.056583404541015625, 0.067413330078125, 0.07824325561523438, 0.08907318115234375, 0.09990310668945312, 0.1107330322265625, 0.12156295776367188, 0.13239288330078125, 0.14322280883789062, 0.154052734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 11.0, 22.0, 28.0, 48.0, 49.0, 110.0, 193.0, 343.0, 709.0, 1605.0, 4205.0, 13620.0, 60209.0, 639840.0, 3244060.0, 185104.0, 31014.0, 8205.0, 2691.0, 1130.0, 481.0, 266.0, 116.0, 88.0, 34.0, 32.0, 23.0, 19.0, 4.0, 8.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50927734375, -0.49694061279296875, -0.4846038818359375, -0.47226715087890625, -0.459930419921875, -0.44759368896484375, -0.4352569580078125, -0.42292022705078125, -0.41058349609375, -0.39824676513671875, -0.3859100341796875, -0.37357330322265625, -0.361236572265625, -0.34889984130859375, -0.3365631103515625, -0.32422637939453125, -0.3118896484375, -0.29955291748046875, -0.2872161865234375, -0.27487945556640625, -0.262542724609375, -0.25020599365234375, -0.2378692626953125, -0.22553253173828125, -0.21319580078125, -0.20085906982421875, -0.1885223388671875, -0.17618560791015625, -0.163848876953125, -0.15151214599609375, -0.1391754150390625, -0.12683868408203125, -0.114501953125, -0.10216522216796875, -0.0898284912109375, -0.07749176025390625, -0.065155029296875, -0.05281829833984375, -0.0404815673828125, -0.02814483642578125, -0.01580810546875, -0.00347137451171875, 0.0088653564453125, 0.02120208740234375, 0.033538818359375, 0.04587554931640625, 0.0582122802734375, 0.07054901123046875, 0.0828857421875, 0.09522247314453125, 0.1075592041015625, 0.11989593505859375, 0.132232666015625, 0.14456939697265625, 0.1569061279296875, 0.16924285888671875, 0.18157958984375, 0.19391632080078125, 0.2062530517578125, 0.21858978271484375, 0.230926513671875, 0.24326324462890625, 0.2555999755859375, 0.26793670654296875, 0.2802734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 7.0, 6.0, 10.0, 12.0, 19.0, 28.0, 37.0, 50.0, 71.0, 131.0, 176.0, 364.0, 572.0, 848.0, 672.0, 406.0, 229.0, 113.0, 74.0, 58.0, 46.0, 38.0, 29.0, 12.0, 7.0, 14.0, 13.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.423828125, -0.410858154296875, -0.39788818359375, -0.384918212890625, -0.3719482421875, -0.358978271484375, -0.34600830078125, -0.333038330078125, -0.320068359375, -0.307098388671875, -0.29412841796875, -0.281158447265625, -0.2681884765625, -0.255218505859375, -0.24224853515625, -0.229278564453125, -0.21630859375, -0.203338623046875, -0.19036865234375, -0.177398681640625, -0.1644287109375, -0.151458740234375, -0.13848876953125, -0.125518798828125, -0.112548828125, -0.099578857421875, -0.08660888671875, -0.073638916015625, -0.0606689453125, -0.047698974609375, -0.03472900390625, -0.021759033203125, -0.0087890625, 0.004180908203125, 0.01715087890625, 0.030120849609375, 0.0430908203125, 0.056060791015625, 0.06903076171875, 0.082000732421875, 0.094970703125, 0.107940673828125, 0.12091064453125, 0.133880615234375, 0.1468505859375, 0.159820556640625, 0.17279052734375, 0.185760498046875, 0.19873046875, 0.211700439453125, 0.22467041015625, 0.237640380859375, 0.2506103515625, 0.263580322265625, 0.27655029296875, 0.289520263671875, 0.302490234375, 0.315460205078125, 0.32843017578125, 0.341400146484375, 0.3543701171875, 0.367340087890625, 0.38031005859375, 0.393280029296875, 0.40625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 7.0, 10.0, 28.0, 67.0, 164.0, 259.0, 257.0, 111.0, 54.0, 17.0, 10.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.897769927978516, -6.7234272956848145, -6.5490851402282715, -6.37474250793457, -6.200399875640869, -6.026057243347168, -5.851715087890625, -5.677372455596924, -5.503029823303223, -5.3286871910095215, -5.1543450355529785, -4.980002403259277, -4.805659770965576, -4.631317138671875, -4.456974983215332, -4.282632350921631, -4.108290195465088, -3.933947801589966, -3.7596051692962646, -3.5852627754211426, -3.4109201431274414, -3.2365777492523193, -3.0622353553771973, -2.887892723083496, -2.713550329208374, -2.539207935333252, -2.364865303039551, -2.1905229091644287, -2.0161805152893066, -1.8418378829956055, -1.6674954891204834, -1.4931529760360718, -1.3188109397888184, -1.1444684267044067, -0.9701259732246399, -0.795783519744873, -0.6214410066604614, -0.4470984935760498, -0.27275609970092773, -0.09841358661651611, 0.07592892646789551, 0.25027140974998474, 0.424613893032074, 0.5989563465118408, 0.7732988595962524, 0.9476413726806641, 1.1219837665557861, 1.2963262796401978, 1.4706687927246094, 1.645011305809021, 1.8193538188934326, 1.9936962127685547, 2.168038845062256, 2.342381238937378, 2.5167236328125, 2.691066265106201, 2.8654086589813232, 3.0397510528564453, 3.2140936851501465, 3.3884360790252686, 3.5627784729003906, 3.737121105194092, 3.911463499069214, 4.085805892944336, 4.260148525238037]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 11.0, 18.0, 20.0, 26.0, 36.0, 49.0, 42.0, 54.0, 54.0, 60.0, 61.0, 54.0, 60.0, 64.0, 66.0, 66.0, 43.0, 40.0, 40.0, 31.0, 28.0, 15.0, 16.0, 14.0, 14.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5479464530944824, -1.4687660932540894, -1.3895858526229858, -1.3104054927825928, -1.2312252521514893, -1.1520448923110962, -1.0728645324707031, -0.9936842918395996, -0.9145039916038513, -0.835323691368103, -0.7561433911323547, -0.6769630908966064, -0.5977827310562134, -0.5186024904251099, -0.4394221305847168, -0.3602418303489685, -0.2810615301132202, -0.20188122987747192, -0.12270091474056244, -0.043520599603652954, 0.03565970063209534, 0.11484000086784363, 0.1940203309059143, 0.2732006311416626, 0.3523809313774109, 0.4315612316131592, 0.5107415318489075, 0.5899218320846558, 0.6691021919250488, 0.7482824325561523, 0.8274627923965454, 0.9066430926322937, 0.985823392868042, 1.065003752708435, 1.1441839933395386, 1.2233643531799316, 1.3025445938110352, 1.3817249536514282, 1.4609053134918213, 1.5400855541229248, 1.6192657947540283, 1.6984461545944214, 1.777626395225525, 1.856806755065918, 1.9359869956970215, 2.015167236328125, 2.0943477153778076, 2.173527956008911, 2.2527084350585938, 2.3318886756896973, 2.41106915473938, 2.4902493953704834, 2.569429636001587, 2.6486098766326904, 2.727790355682373, 2.8069705963134766, 2.88615083694458, 2.9653310775756836, 3.044511556625366, 3.1236917972564697, 3.2028720378875732, 3.2820522785186768, 3.3612327575683594, 3.440412998199463, 3.5195932388305664]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 4.0, 11.0, 19.0, 28.0, 51.0, 87.0, 164.0, 298.0, 554.0, 1129.0, 2601.0, 6625.0, 18498.0, 53917.0, 160824.0, 391511.0, 269526.0, 92997.0, 31162.0, 10995.0, 4145.0, 1733.0, 814.0, 373.0, 185.0, 133.0, 66.0, 36.0, 19.0, 17.0, 9.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3330078125, -0.32369232177734375, -0.3143768310546875, -0.30506134033203125, -0.295745849609375, -0.28643035888671875, -0.2771148681640625, -0.26779937744140625, -0.25848388671875, -0.24916839599609375, -0.2398529052734375, -0.23053741455078125, -0.221221923828125, -0.21190643310546875, -0.2025909423828125, -0.19327545166015625, -0.1839599609375, -0.17464447021484375, -0.1653289794921875, -0.15601348876953125, -0.146697998046875, -0.13738250732421875, -0.1280670166015625, -0.11875152587890625, -0.10943603515625, -0.10012054443359375, -0.0908050537109375, -0.08148956298828125, -0.072174072265625, -0.06285858154296875, -0.0535430908203125, -0.04422760009765625, -0.034912109375, -0.02559661865234375, -0.0162811279296875, -0.00696563720703125, 0.002349853515625, 0.01166534423828125, 0.0209808349609375, 0.03029632568359375, 0.03961181640625, 0.04892730712890625, 0.0582427978515625, 0.06755828857421875, 0.076873779296875, 0.08618927001953125, 0.0955047607421875, 0.10482025146484375, 0.1141357421875, 0.12345123291015625, 0.1327667236328125, 0.14208221435546875, 0.151397705078125, 0.16071319580078125, 0.1700286865234375, 0.17934417724609375, 0.18865966796875, 0.19797515869140625, 0.2072906494140625, 0.21660614013671875, 0.225921630859375, 0.23523712158203125, 0.2445526123046875, 0.25386810302734375, 0.26318359375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 10.0, 11.0, 9.0, 13.0, 13.0, 21.0, 23.0, 26.0, 39.0, 30.0, 27.0, 42.0, 59.0, 44.0, 50.0, 48.0, 50.0, 67.0, 57.0, 67.0, 48.0, 38.0, 39.0, 30.0, 32.0, 23.0, 17.0, 16.0, 10.0, 14.0, 9.0, 7.0, 8.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1807861328125, -0.17549514770507812, -0.17020416259765625, -0.16491317749023438, -0.1596221923828125, -0.15433120727539062, -0.14904022216796875, -0.14374923706054688, -0.138458251953125, -0.13316726684570312, -0.12787628173828125, -0.12258529663085938, -0.1172943115234375, -0.11200332641601562, -0.10671234130859375, -0.10142135620117188, -0.09613037109375, -0.09083938598632812, -0.08554840087890625, -0.08025741577148438, -0.0749664306640625, -0.06967544555664062, -0.06438446044921875, -0.059093475341796875, -0.053802490234375, -0.048511505126953125, -0.04322052001953125, -0.037929534912109375, -0.0326385498046875, -0.027347564697265625, -0.02205657958984375, -0.016765594482421875, -0.011474609375, -0.006183624267578125, -0.00089263916015625, 0.004398345947265625, 0.0096893310546875, 0.014980316162109375, 0.02027130126953125, 0.025562286376953125, 0.030853271484375, 0.036144256591796875, 0.04143524169921875, 0.046726226806640625, 0.0520172119140625, 0.057308197021484375, 0.06259918212890625, 0.06789016723632812, 0.07318115234375, 0.07847213745117188, 0.08376312255859375, 0.08905410766601562, 0.0943450927734375, 0.09963607788085938, 0.10492706298828125, 0.11021804809570312, 0.115509033203125, 0.12080001831054688, 0.12609100341796875, 0.13138198852539062, 0.1366729736328125, 0.14196395874023438, 0.14725494384765625, 0.15254592895507812, 0.1578369140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 9.0, 9.0, 18.0, 8.0, 20.0, 46.0, 36.0, 67.0, 56.0, 86.0, 143.0, 181.0, 286.0, 366.0, 535.0, 773.0, 1311.0, 2944.0, 8012.0, 39496.0, 341286.0, 582538.0, 52888.0, 9900.0, 3172.0, 1544.0, 828.0, 537.0, 388.0, 298.0, 222.0, 153.0, 102.0, 77.0, 54.0, 47.0, 30.0, 25.0, 19.0, 11.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.52685546875, -0.5104293823242188, -0.4940032958984375, -0.47757720947265625, -0.461151123046875, -0.44472503662109375, -0.4282989501953125, -0.41187286376953125, -0.39544677734375, -0.37902069091796875, -0.3625946044921875, -0.34616851806640625, -0.329742431640625, -0.31331634521484375, -0.2968902587890625, -0.28046417236328125, -0.2640380859375, -0.24761199951171875, -0.2311859130859375, -0.21475982666015625, -0.198333740234375, -0.18190765380859375, -0.1654815673828125, -0.14905548095703125, -0.13262939453125, -0.11620330810546875, -0.0997772216796875, -0.08335113525390625, -0.066925048828125, -0.05049896240234375, -0.0340728759765625, -0.01764678955078125, -0.001220703125, 0.01520538330078125, 0.0316314697265625, 0.04805755615234375, 0.064483642578125, 0.08090972900390625, 0.0973358154296875, 0.11376190185546875, 0.13018798828125, 0.14661407470703125, 0.1630401611328125, 0.17946624755859375, 0.195892333984375, 0.21231842041015625, 0.2287445068359375, 0.24517059326171875, 0.2615966796875, 0.27802276611328125, 0.2944488525390625, 0.31087493896484375, 0.327301025390625, 0.34372711181640625, 0.3601531982421875, 0.37657928466796875, 0.39300537109375, 0.40943145751953125, 0.4258575439453125, 0.44228363037109375, 0.458709716796875, 0.47513580322265625, 0.4915618896484375, 0.5079879760742188, 0.5244140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 6.0, 4.0, 7.0, 7.0, 11.0, 11.0, 13.0, 23.0, 24.0, 26.0, 45.0, 31.0, 38.0, 42.0, 49.0, 42.0, 37.0, 49.0, 43.0, 55.0, 47.0, 46.0, 48.0, 48.0, 29.0, 30.0, 26.0, 27.0, 28.0, 21.0, 19.0, 16.0, 7.0, 12.0, 7.0, 8.0, 3.0, 9.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71826171875, -0.6978836059570312, -0.6775054931640625, -0.6571273803710938, -0.636749267578125, -0.6163711547851562, -0.5959930419921875, -0.5756149291992188, -0.55523681640625, -0.5348587036132812, -0.5144805908203125, -0.49410247802734375, -0.473724365234375, -0.45334625244140625, -0.4329681396484375, -0.41259002685546875, -0.3922119140625, -0.37183380126953125, -0.3514556884765625, -0.33107757568359375, -0.310699462890625, -0.29032135009765625, -0.2699432373046875, -0.24956512451171875, -0.22918701171875, -0.20880889892578125, -0.1884307861328125, -0.16805267333984375, -0.147674560546875, -0.12729644775390625, -0.1069183349609375, -0.08654022216796875, -0.066162109375, -0.04578399658203125, -0.0254058837890625, -0.00502777099609375, 0.015350341796875, 0.03572845458984375, 0.0561065673828125, 0.07648468017578125, 0.09686279296875, 0.11724090576171875, 0.1376190185546875, 0.15799713134765625, 0.178375244140625, 0.19875335693359375, 0.2191314697265625, 0.23950958251953125, 0.2598876953125, 0.28026580810546875, 0.3006439208984375, 0.32102203369140625, 0.341400146484375, 0.36177825927734375, 0.3821563720703125, 0.40253448486328125, 0.42291259765625, 0.44329071044921875, 0.4636688232421875, 0.48404693603515625, 0.504425048828125, 0.5248031616210938, 0.5451812744140625, 0.5655593872070312, 0.5859375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 8.0, 8.0, 8.0, 18.0, 23.0, 30.0, 41.0, 57.0, 94.0, 189.0, 340.0, 877.0, 3080.0, 19742.0, 324893.0, 663585.0, 29728.0, 3903.0, 1026.0, 407.0, 182.0, 117.0, 71.0, 46.0, 26.0, 18.0, 15.0, 8.0, 1.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2320556640625, -0.22544097900390625, -0.2188262939453125, -0.21221160888671875, -0.205596923828125, -0.19898223876953125, -0.1923675537109375, -0.18575286865234375, -0.17913818359375, -0.17252349853515625, -0.1659088134765625, -0.15929412841796875, -0.152679443359375, -0.14606475830078125, -0.1394500732421875, -0.13283538818359375, -0.126220703125, -0.11960601806640625, -0.1129913330078125, -0.10637664794921875, -0.099761962890625, -0.09314727783203125, -0.0865325927734375, -0.07991790771484375, -0.07330322265625, -0.06668853759765625, -0.0600738525390625, -0.05345916748046875, -0.046844482421875, -0.04022979736328125, -0.0336151123046875, -0.02700042724609375, -0.0203857421875, -0.01377105712890625, -0.0071563720703125, -0.00054168701171875, 0.006072998046875, 0.01268768310546875, 0.0193023681640625, 0.02591705322265625, 0.03253173828125, 0.03914642333984375, 0.0457611083984375, 0.05237579345703125, 0.058990478515625, 0.06560516357421875, 0.0722198486328125, 0.07883453369140625, 0.08544921875, 0.09206390380859375, 0.0986785888671875, 0.10529327392578125, 0.111907958984375, 0.11852264404296875, 0.1251373291015625, 0.13175201416015625, 0.13836669921875, 0.14498138427734375, 0.1515960693359375, 0.15821075439453125, 0.164825439453125, 0.17144012451171875, 0.1780548095703125, 0.18466949462890625, 0.1912841796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 5.0, 1.0, 7.0, 4.0, 11.0, 4.0, 6.0, 7.0, 7.0, 8.0, 15.0, 22.0, 15.0, 9.0, 15.0, 19.0, 36.0, 56.0, 117.0, 191.0, 158.0, 85.0, 40.0, 28.0, 17.0, 19.0, 18.0, 13.0, 9.0, 12.0, 10.0, 3.0, 7.0, 6.0, 7.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001399517059326172, -0.00013565830886363983, -0.00013136491179466248, -0.00012707151472568512, -0.00012277811765670776, -0.00011848472058773041, -0.00011419132351875305, -0.0001098979264497757, -0.00010560452938079834, -0.00010131113231182098, -9.701773524284363e-05, -9.272433817386627e-05, -8.843094110488892e-05, -8.413754403591156e-05, -7.98441469669342e-05, -7.555074989795685e-05, -7.125735282897949e-05, -6.696395576000214e-05, -6.267055869102478e-05, -5.8377161622047424e-05, -5.408376455307007e-05, -4.979036748409271e-05, -4.5496970415115356e-05, -4.1203573346138e-05, -3.6910176277160645e-05, -3.261677920818329e-05, -2.8323382139205933e-05, -2.4029985070228577e-05, -1.973658800125122e-05, -1.5443190932273865e-05, -1.1149793863296509e-05, -6.856396794319153e-06, -2.562999725341797e-06, 1.730397343635559e-06, 6.023794412612915e-06, 1.0317191481590271e-05, 1.4610588550567627e-05, 1.8903985619544983e-05, 2.319738268852234e-05, 2.7490779757499695e-05, 3.178417682647705e-05, 3.607757389545441e-05, 4.037097096443176e-05, 4.466436803340912e-05, 4.8957765102386475e-05, 5.325116217136383e-05, 5.7544559240341187e-05, 6.183795630931854e-05, 6.61313533782959e-05, 7.042475044727325e-05, 7.471814751625061e-05, 7.901154458522797e-05, 8.330494165420532e-05, 8.759833872318268e-05, 9.189173579216003e-05, 9.618513286113739e-05, 0.00010047852993011475, 0.0001047719269990921, 0.00010906532406806946, 0.00011335872113704681, 0.00011765211820602417, 0.00012194551527500153, 0.00012623891234397888, 0.00013053230941295624, 0.0001348257064819336]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 13.0, 20.0, 17.0, 22.0, 28.0, 43.0, 56.0, 84.0, 108.0, 138.0, 238.0, 329.0, 597.0, 973.0, 1807.0, 4386.0, 13590.0, 64080.0, 580896.0, 317551.0, 45519.0, 10465.0, 3645.0, 1577.0, 849.0, 481.0, 324.0, 200.0, 138.0, 89.0, 69.0, 62.0, 35.0, 17.0, 17.0, 15.0, 11.0, 14.0, 7.0, 4.0, 5.0, 7.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.1270751953125, -0.12282562255859375, -0.1185760498046875, -0.11432647705078125, -0.110076904296875, -0.10582733154296875, -0.1015777587890625, -0.09732818603515625, -0.09307861328125, -0.08882904052734375, -0.0845794677734375, -0.08032989501953125, -0.076080322265625, -0.07183074951171875, -0.0675811767578125, -0.06333160400390625, -0.05908203125, -0.05483245849609375, -0.0505828857421875, -0.04633331298828125, -0.042083740234375, -0.03783416748046875, -0.0335845947265625, -0.02933502197265625, -0.02508544921875, -0.02083587646484375, -0.0165863037109375, -0.01233673095703125, -0.008087158203125, -0.00383758544921875, 0.0004119873046875, 0.00466156005859375, 0.0089111328125, 0.01316070556640625, 0.0174102783203125, 0.02165985107421875, 0.025909423828125, 0.03015899658203125, 0.0344085693359375, 0.03865814208984375, 0.04290771484375, 0.04715728759765625, 0.0514068603515625, 0.05565643310546875, 0.059906005859375, 0.06415557861328125, 0.0684051513671875, 0.07265472412109375, 0.076904296875, 0.08115386962890625, 0.0854034423828125, 0.08965301513671875, 0.093902587890625, 0.09815216064453125, 0.1024017333984375, 0.10665130615234375, 0.11090087890625, 0.11515045166015625, 0.1194000244140625, 0.12364959716796875, 0.127899169921875, 0.13214874267578125, 0.1363983154296875, 0.14064788818359375, 0.1448974609375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 8.0, 4.0, 5.0, 9.0, 16.0, 17.0, 19.0, 24.0, 28.0, 28.0, 46.0, 56.0, 51.0, 66.0, 86.0, 97.0, 70.0, 64.0, 57.0, 46.0, 47.0, 32.0, 28.0, 18.0, 16.0, 19.0, 11.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12030029296875, -0.11610698699951172, -0.11191368103027344, -0.10772037506103516, -0.10352706909179688, -0.0993337631225586, -0.09514045715332031, -0.09094715118408203, -0.08675384521484375, -0.08256053924560547, -0.07836723327636719, -0.0741739273071289, -0.06998062133789062, -0.06578731536865234, -0.06159400939941406, -0.05740070343017578, -0.0532073974609375, -0.04901409149169922, -0.04482078552246094, -0.040627479553222656, -0.036434173583984375, -0.032240867614746094, -0.028047561645507812, -0.02385425567626953, -0.01966094970703125, -0.015467643737792969, -0.011274337768554688, -0.007081031799316406, -0.002887725830078125, 0.0013055801391601562, 0.0054988861083984375, 0.009692192077636719, 0.013885498046875, 0.01807880401611328, 0.022272109985351562, 0.026465415954589844, 0.030658721923828125, 0.034852027893066406, 0.03904533386230469, 0.04323863983154297, 0.04743194580078125, 0.05162525177001953, 0.05581855773925781, 0.060011863708496094, 0.06420516967773438, 0.06839847564697266, 0.07259178161621094, 0.07678508758544922, 0.0809783935546875, 0.08517169952392578, 0.08936500549316406, 0.09355831146240234, 0.09775161743164062, 0.1019449234008789, 0.10613822937011719, 0.11033153533935547, 0.11452484130859375, 0.11871814727783203, 0.12291145324707031, 0.1271047592163086, 0.13129806518554688, 0.13549137115478516, 0.13968467712402344, 0.14387798309326172, 0.1480712890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 9.0, 29.0, 78.0, 169.0, 385.0, 189.0, 76.0, 28.0, 21.0, 6.0, 1.0, 6.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5342133045196533, -2.358384132385254, -2.1825547218322754, -2.006725549697876, -1.8308961391448975, -1.655066967010498, -1.479237675666809, -1.3034083843231201, -1.1275790929794312, -0.9517498016357422, -0.7759205102920532, -0.600091278553009, -0.42426198720932007, -0.2484326958656311, -0.07260346412658691, 0.10322582721710205, 0.279055118560791, 0.45488440990448, 0.630713701248169, 0.8065429329872131, 0.9823722243309021, 1.1582014560699463, 1.3340307474136353, 1.5098600387573242, 1.6856893301010132, 1.8615186214447021, 2.0373477935791016, 2.21317720413208, 2.3890063762664795, 2.564835786819458, 2.7406649589538574, 2.916494369506836, 3.0923237800598145, 3.268152952194214, 3.4439823627471924, 3.619811534881592, 3.7956409454345703, 3.9714701175689697, 4.147299289703369, 4.323128700256348, 4.498958110809326, 4.674787521362305, 4.850616455078125, 5.0264458656311035, 5.202275276184082, 5.3781046867370605, 5.553933620452881, 5.729763031005859, 5.90559196472168, 6.081421375274658, 6.2572503089904785, 6.433079719543457, 6.6089091300964355, 6.784738540649414, 6.960567474365234, 7.136396884918213, 7.312226295471191, 7.48805570602417, 7.66388463973999, 7.839714050292969, 8.015542984008789, 8.191372871398926, 8.367201805114746, 8.543031692504883, 8.718860626220703]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 9.0, 11.0, 17.0, 13.0, 16.0, 23.0, 28.0, 36.0, 51.0, 58.0, 80.0, 98.0, 118.0, 83.0, 65.0, 51.0, 49.0, 55.0, 36.0, 34.0, 26.0, 16.0, 10.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7334065437316895, -2.612025737762451, -2.490644931793213, -2.3692641258239746, -2.2478833198547363, -2.126502513885498, -2.0051217079162598, -1.8837409019470215, -1.7623600959777832, -1.640979290008545, -1.5195984840393066, -1.3982176780700684, -1.27683687210083, -1.1554560661315918, -1.0340752601623535, -0.9126943945884705, -0.7913135290145874, -0.6699327230453491, -0.5485519170761108, -0.42717108130455017, -0.3057902753353119, -0.18440943956375122, -0.06302863359451294, 0.05835217237472534, 0.17973297834396362, 0.3011137843132019, 0.4224945902824402, 0.5438754558563232, 0.6652562618255615, 0.7866370677947998, 0.9080178737640381, 1.0293986797332764, 1.1507794857025146, 1.272160291671753, 1.3935410976409912, 1.5149219036102295, 1.6363027095794678, 1.757683515548706, 1.8790643215179443, 2.0004451274871826, 2.121825933456421, 2.243206739425659, 2.3645875453948975, 2.4859683513641357, 2.607349157333374, 2.7287299633026123, 2.8501107692718506, 2.971491575241089, 3.0928726196289062, 3.2142534255981445, 3.335634231567383, 3.457015037536621, 3.5783958435058594, 3.6997766494750977, 3.821157455444336, 3.942538261413574, 4.0639190673828125, 4.185299873352051, 4.306680679321289, 4.428061485290527, 4.549442291259766, 4.670823097229004, 4.792203903198242, 4.9135847091674805, 5.034965515136719]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 3.0, 6.0, 7.0, 11.0, 21.0, 34.0, 54.0, 116.0, 173.0, 343.0, 713.0, 1821.0, 5408.0, 19559.0, 114707.0, 2181478.0, 1748455.0, 97465.0, 16612.0, 4339.0, 1512.0, 623.0, 328.0, 165.0, 95.0, 75.0, 43.0, 39.0, 21.0, 12.0, 12.0, 10.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2171630859375, -0.2077045440673828, -0.19824600219726562, -0.18878746032714844, -0.17932891845703125, -0.16987037658691406, -0.16041183471679688, -0.1509532928466797, -0.1414947509765625, -0.1320362091064453, -0.12257766723632812, -0.11311912536621094, -0.10366058349609375, -0.09420204162597656, -0.08474349975585938, -0.07528495788574219, -0.065826416015625, -0.05636787414550781, -0.046909332275390625, -0.03745079040527344, -0.02799224853515625, -0.018533706665039062, -0.009075164794921875, 0.0003833770751953125, 0.0098419189453125, 0.019300460815429688, 0.028759002685546875, 0.03821754455566406, 0.04767608642578125, 0.05713462829589844, 0.06659317016601562, 0.07605171203613281, 0.08551025390625, 0.09496879577636719, 0.10442733764648438, 0.11388587951660156, 0.12334442138671875, 0.13280296325683594, 0.14226150512695312, 0.1517200469970703, 0.1611785888671875, 0.1706371307373047, 0.18009567260742188, 0.18955421447753906, 0.19901275634765625, 0.20847129821777344, 0.21792984008789062, 0.2273883819580078, 0.236846923828125, 0.2463054656982422, 0.2557640075683594, 0.26522254943847656, 0.27468109130859375, 0.28413963317871094, 0.2935981750488281, 0.3030567169189453, 0.3125152587890625, 0.3219738006591797, 0.3314323425292969, 0.34089088439941406, 0.35034942626953125, 0.35980796813964844, 0.3692665100097656, 0.3787250518798828, 0.38818359375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 8.0, 12.0, 30.0, 40.0, 44.0, 70.0, 94.0, 86.0, 108.0, 113.0, 91.0, 97.0, 75.0, 59.0, 36.0, 19.0, 14.0, 7.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156005859375, -0.14626312255859375, -0.1365203857421875, -0.12677764892578125, -0.117034912109375, -0.10729217529296875, -0.0975494384765625, -0.08780670166015625, -0.07806396484375, -0.06832122802734375, -0.0585784912109375, -0.04883575439453125, -0.039093017578125, -0.02935028076171875, -0.0196075439453125, -0.00986480712890625, -0.0001220703125, 0.00962066650390625, 0.0193634033203125, 0.02910614013671875, 0.038848876953125, 0.04859161376953125, 0.0583343505859375, 0.06807708740234375, 0.07781982421875, 0.08756256103515625, 0.0973052978515625, 0.10704803466796875, 0.116790771484375, 0.12653350830078125, 0.1362762451171875, 0.14601898193359375, 0.15576171875, 0.16550445556640625, 0.1752471923828125, 0.18498992919921875, 0.194732666015625, 0.20447540283203125, 0.2142181396484375, 0.22396087646484375, 0.23370361328125, 0.24344635009765625, 0.2531890869140625, 0.26293182373046875, 0.272674560546875, 0.28241729736328125, 0.2921600341796875, 0.30190277099609375, 0.3116455078125, 0.32138824462890625, 0.3311309814453125, 0.34087371826171875, 0.350616455078125, 0.36035919189453125, 0.3701019287109375, 0.37984466552734375, 0.38958740234375, 0.39933013916015625, 0.4090728759765625, 0.41881561279296875, 0.428558349609375, 0.43830108642578125, 0.4480438232421875, 0.45778656005859375, 0.467529296875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 1.0, 10.0, 9.0, 17.0, 23.0, 45.0, 56.0, 94.0, 142.0, 236.0, 422.0, 824.0, 1888.0, 4895.0, 17631.0, 96444.0, 2133714.0, 1834569.0, 82783.0, 14068.0, 3798.0, 1373.0, 553.0, 290.0, 177.0, 92.0, 45.0, 36.0, 14.0, 10.0, 10.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.453857421875, -0.4425048828125, -0.43115234375, -0.4197998046875, -0.408447265625, -0.3970947265625, -0.3857421875, -0.3743896484375, -0.363037109375, -0.3516845703125, -0.34033203125, -0.3289794921875, -0.317626953125, -0.3062744140625, -0.294921875, -0.2835693359375, -0.272216796875, -0.2608642578125, -0.24951171875, -0.2381591796875, -0.226806640625, -0.2154541015625, -0.2041015625, -0.1927490234375, -0.181396484375, -0.1700439453125, -0.15869140625, -0.1473388671875, -0.135986328125, -0.1246337890625, -0.11328125, -0.1019287109375, -0.090576171875, -0.0792236328125, -0.06787109375, -0.0565185546875, -0.045166015625, -0.0338134765625, -0.0224609375, -0.0111083984375, 0.000244140625, 0.0115966796875, 0.02294921875, 0.0343017578125, 0.045654296875, 0.0570068359375, 0.068359375, 0.0797119140625, 0.091064453125, 0.1024169921875, 0.11376953125, 0.1251220703125, 0.136474609375, 0.1478271484375, 0.1591796875, 0.1705322265625, 0.181884765625, 0.1932373046875, 0.20458984375, 0.2159423828125, 0.227294921875, 0.2386474609375, 0.25, 0.2613525390625, 0.272705078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 3.0, 4.0, 7.0, 17.0, 25.0, 24.0, 32.0, 68.0, 97.0, 152.0, 274.0, 597.0, 1046.0, 827.0, 402.0, 215.0, 104.0, 70.0, 31.0, 28.0, 18.0, 10.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5615234375, -0.5473747253417969, -0.5332260131835938, -0.5190773010253906, -0.5049285888671875, -0.4907798767089844, -0.47663116455078125, -0.4624824523925781, -0.448333740234375, -0.4341850280761719, -0.42003631591796875, -0.4058876037597656, -0.3917388916015625, -0.3775901794433594, -0.36344146728515625, -0.3492927551269531, -0.33514404296875, -0.3209953308105469, -0.30684661865234375, -0.2926979064941406, -0.2785491943359375, -0.2644004821777344, -0.25025177001953125, -0.23610305786132812, -0.221954345703125, -0.20780563354492188, -0.19365692138671875, -0.17950820922851562, -0.1653594970703125, -0.15121078491210938, -0.13706207275390625, -0.12291336059570312, -0.1087646484375, -0.09461593627929688, -0.08046722412109375, -0.06631851196289062, -0.0521697998046875, -0.038021087646484375, -0.02387237548828125, -0.009723663330078125, 0.004425048828125, 0.018573760986328125, 0.03272247314453125, 0.046871185302734375, 0.0610198974609375, 0.07516860961914062, 0.08931732177734375, 0.10346603393554688, 0.11761474609375, 0.13176345825195312, 0.14591217041015625, 0.16006088256835938, 0.1742095947265625, 0.18835830688476562, 0.20250701904296875, 0.21665573120117188, 0.230804443359375, 0.24495315551757812, 0.25910186767578125, 0.2732505798339844, 0.2873992919921875, 0.3015480041503906, 0.31569671630859375, 0.3298454284667969, 0.343994140625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 12.0, 17.0, 47.0, 106.0, 257.0, 276.0, 144.0, 86.0, 24.0, 12.0, 3.0, 6.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.865827560424805, -4.718526840209961, -4.571226119995117, -4.423925399780273, -4.27662467956543, -4.129323482513428, -3.982022762298584, -3.8347220420837402, -3.6874213218688965, -3.5401206016540527, -3.392819881439209, -3.245518922805786, -3.0982182025909424, -2.9509174823760986, -2.803616523742676, -2.656315803527832, -2.5090150833129883, -2.3617143630981445, -2.214413642883301, -2.067112684249878, -1.9198119640350342, -1.7725112438201904, -1.6252104043960571, -1.4779095649719238, -1.33060884475708, -1.1833081245422363, -1.036007285118103, -0.8887065052986145, -0.741405725479126, -0.5941049456596375, -0.4468041658401489, -0.2995033264160156, -0.15220308303833008, -0.004902303218841553, 0.14239847660064697, 0.2896992564201355, 0.437000036239624, 0.5843008160591125, 0.7316015958786011, 0.8789024353027344, 1.0262031555175781, 1.1735038757324219, 1.3208047151565552, 1.4681055545806885, 1.6154062747955322, 1.762706995010376, 1.9100078344345093, 2.0573086738586426, 2.2046093940734863, 2.35191011428833, 2.499210834503174, 2.6465117931365967, 2.7938125133514404, 2.941113233566284, 3.088414192199707, 3.235714912414551, 3.3830156326293945, 3.5303163528442383, 3.677617073059082, 3.824918031692505, 3.9722187519073486, 4.1195197105407715, 4.266820430755615, 4.414121150970459, 4.561421871185303]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 9.0, 10.0, 16.0, 20.0, 21.0, 38.0, 52.0, 52.0, 52.0, 58.0, 68.0, 70.0, 77.0, 81.0, 69.0, 79.0, 56.0, 50.0, 29.0, 28.0, 22.0, 14.0, 15.0, 13.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.076953887939453, -2.996114492416382, -2.9152750968933105, -2.8344359397888184, -2.753596544265747, -2.672757148742676, -2.5919177532196045, -2.511078357696533, -2.430239200592041, -2.3493998050689697, -2.2685604095458984, -2.1877212524414062, -2.106881856918335, -2.0260424613952637, -1.9452030658721924, -1.864363670349121, -1.7835242748260498, -1.7026848793029785, -1.6218456029891968, -1.5410062074661255, -1.4601669311523438, -1.3793275356292725, -1.2984881401062012, -1.2176487445831299, -1.1368094682693481, -1.0559700727462769, -0.9751307964324951, -0.8942914009094238, -0.8134520649909973, -0.7326127290725708, -0.6517733335494995, -0.570933997631073, -0.4900949001312256, -0.4092555642127991, -0.32841619849205017, -0.24757684767246246, -0.16673749685287476, -0.08589816093444824, -0.005058795213699341, 0.07578057050704956, 0.15661990642547607, 0.23745925724506378, 0.3182986080646515, 0.3991379737854004, 0.4799773097038269, 0.5608166456222534, 0.6416560411453247, 0.7224953770637512, 0.8033347129821777, 0.8841740489006042, 0.9650133848190308, 1.045852780342102, 1.1266920566558838, 1.207531452178955, 1.2883708477020264, 1.3692102432250977, 1.4500495195388794, 1.5308889150619507, 1.6117281913757324, 1.6925675868988037, 1.773406982421875, 1.8542462587356567, 1.935085654258728, 2.0159249305725098, 2.096764326095581]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 6.0, 16.0, 6.0, 14.0, 19.0, 17.0, 40.0, 56.0, 73.0, 133.0, 230.0, 391.0, 687.0, 1269.0, 2735.0, 6028.0, 14541.0, 37799.0, 104684.0, 302930.0, 363871.0, 134259.0, 47182.0, 17633.0, 7208.0, 3235.0, 1599.0, 818.0, 469.0, 215.0, 144.0, 77.0, 51.0, 35.0, 23.0, 23.0, 14.0, 7.0, 6.0, 2.0, 2.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.237548828125, -0.22938919067382812, -0.22122955322265625, -0.21306991577148438, -0.2049102783203125, -0.19675064086914062, -0.18859100341796875, -0.18043136596679688, -0.172271728515625, -0.16411209106445312, -0.15595245361328125, -0.14779281616210938, -0.1396331787109375, -0.13147354125976562, -0.12331390380859375, -0.11515426635742188, -0.10699462890625, -0.09883499145507812, -0.09067535400390625, -0.08251571655273438, -0.0743560791015625, -0.06619644165039062, -0.05803680419921875, -0.049877166748046875, -0.041717529296875, -0.033557891845703125, -0.02539825439453125, -0.017238616943359375, -0.0090789794921875, -0.000919342041015625, 0.00724029541015625, 0.015399932861328125, 0.0235595703125, 0.031719207763671875, 0.03987884521484375, 0.048038482666015625, 0.0561981201171875, 0.06435775756835938, 0.07251739501953125, 0.08067703247070312, 0.088836669921875, 0.09699630737304688, 0.10515594482421875, 0.11331558227539062, 0.1214752197265625, 0.12963485717773438, 0.13779449462890625, 0.14595413208007812, 0.15411376953125, 0.16227340698242188, 0.17043304443359375, 0.17859268188476562, 0.1867523193359375, 0.19491195678710938, 0.20307159423828125, 0.21123123168945312, 0.219390869140625, 0.22755050659179688, 0.23571014404296875, 0.24386978149414062, 0.2520294189453125, 0.2601890563964844, 0.26834869384765625, 0.2765083312988281, 0.28466796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 2.0, 5.0, 16.0, 6.0, 17.0, 17.0, 19.0, 31.0, 29.0, 28.0, 32.0, 46.0, 42.0, 55.0, 53.0, 49.0, 56.0, 48.0, 60.0, 52.0, 47.0, 36.0, 42.0, 39.0, 33.0, 35.0, 24.0, 18.0, 12.0, 11.0, 17.0, 10.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1683349609375, -0.16349029541015625, -0.1586456298828125, -0.15380096435546875, -0.148956298828125, -0.14411163330078125, -0.1392669677734375, -0.13442230224609375, -0.12957763671875, -0.12473297119140625, -0.1198883056640625, -0.11504364013671875, -0.110198974609375, -0.10535430908203125, -0.1005096435546875, -0.09566497802734375, -0.0908203125, -0.08597564697265625, -0.0811309814453125, -0.07628631591796875, -0.071441650390625, -0.06659698486328125, -0.0617523193359375, -0.05690765380859375, -0.05206298828125, -0.04721832275390625, -0.0423736572265625, -0.03752899169921875, -0.032684326171875, -0.02783966064453125, -0.0229949951171875, -0.01815032958984375, -0.0133056640625, -0.00846099853515625, -0.0036163330078125, 0.00122833251953125, 0.006072998046875, 0.01091766357421875, 0.0157623291015625, 0.02060699462890625, 0.02545166015625, 0.03029632568359375, 0.0351409912109375, 0.03998565673828125, 0.044830322265625, 0.04967498779296875, 0.0545196533203125, 0.05936431884765625, 0.064208984375, 0.06905364990234375, 0.0738983154296875, 0.07874298095703125, 0.083587646484375, 0.08843231201171875, 0.0932769775390625, 0.09812164306640625, 0.10296630859375, 0.10781097412109375, 0.1126556396484375, 0.11750030517578125, 0.122344970703125, 0.12718963623046875, 0.1320343017578125, 0.13687896728515625, 0.1417236328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 7.0, 10.0, 11.0, 18.0, 36.0, 41.0, 71.0, 104.0, 169.0, 273.0, 484.0, 875.0, 1864.0, 6057.0, 48739.0, 826252.0, 146642.0, 11645.0, 2698.0, 1136.0, 578.0, 333.0, 187.0, 114.0, 74.0, 43.0, 33.0, 18.0, 16.0, 8.0, 7.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.85302734375, -0.8291244506835938, -0.8052215576171875, -0.7813186645507812, -0.757415771484375, -0.7335128784179688, -0.7096099853515625, -0.6857070922851562, -0.66180419921875, -0.6379013061523438, -0.6139984130859375, -0.5900955200195312, -0.566192626953125, -0.5422897338867188, -0.5183868408203125, -0.49448394775390625, -0.4705810546875, -0.44667816162109375, -0.4227752685546875, -0.39887237548828125, -0.374969482421875, -0.35106658935546875, -0.3271636962890625, -0.30326080322265625, -0.27935791015625, -0.25545501708984375, -0.2315521240234375, -0.20764923095703125, -0.183746337890625, -0.15984344482421875, -0.1359405517578125, -0.11203765869140625, -0.088134765625, -0.06423187255859375, -0.0403289794921875, -0.01642608642578125, 0.007476806640625, 0.03137969970703125, 0.0552825927734375, 0.07918548583984375, 0.10308837890625, 0.12699127197265625, 0.1508941650390625, 0.17479705810546875, 0.198699951171875, 0.22260284423828125, 0.2465057373046875, 0.27040863037109375, 0.2943115234375, 0.31821441650390625, 0.3421173095703125, 0.36602020263671875, 0.389923095703125, 0.41382598876953125, 0.4377288818359375, 0.46163177490234375, 0.48553466796875, 0.5094375610351562, 0.5333404541015625, 0.5572433471679688, 0.581146240234375, 0.6050491333007812, 0.6289520263671875, 0.6528549194335938, 0.6767578125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 6.0, 5.0, 15.0, 18.0, 13.0, 26.0, 17.0, 19.0, 28.0, 33.0, 44.0, 46.0, 42.0, 57.0, 40.0, 50.0, 54.0, 64.0, 38.0, 54.0, 42.0, 47.0, 39.0, 33.0, 30.0, 24.0, 23.0, 20.0, 17.0, 10.0, 10.0, 11.0, 5.0, 2.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55712890625, -0.5389938354492188, -0.5208587646484375, -0.5027236938476562, -0.484588623046875, -0.46645355224609375, -0.4483184814453125, -0.43018341064453125, -0.41204833984375, -0.39391326904296875, -0.3757781982421875, -0.35764312744140625, -0.339508056640625, -0.32137298583984375, -0.3032379150390625, -0.28510284423828125, -0.2669677734375, -0.24883270263671875, -0.2306976318359375, -0.21256256103515625, -0.194427490234375, -0.17629241943359375, -0.1581573486328125, -0.14002227783203125, -0.12188720703125, -0.10375213623046875, -0.0856170654296875, -0.06748199462890625, -0.049346923828125, -0.03121185302734375, -0.0130767822265625, 0.00505828857421875, 0.023193359375, 0.04132843017578125, 0.0594635009765625, 0.07759857177734375, 0.095733642578125, 0.11386871337890625, 0.1320037841796875, 0.15013885498046875, 0.16827392578125, 0.18640899658203125, 0.2045440673828125, 0.22267913818359375, 0.240814208984375, 0.25894927978515625, 0.2770843505859375, 0.29521942138671875, 0.3133544921875, 0.33148956298828125, 0.3496246337890625, 0.36775970458984375, 0.385894775390625, 0.40402984619140625, 0.4221649169921875, 0.44029998779296875, 0.45843505859375, 0.47657012939453125, 0.4947052001953125, 0.5128402709960938, 0.530975341796875, 0.5491104125976562, 0.5672454833984375, 0.5853805541992188, 0.603515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 4.0, 7.0, 12.0, 18.0, 22.0, 29.0, 34.0, 69.0, 120.0, 227.0, 393.0, 1030.0, 3479.0, 19264.0, 213378.0, 747682.0, 52577.0, 7204.0, 1698.0, 598.0, 236.0, 158.0, 73.0, 60.0, 44.0, 26.0, 20.0, 13.0, 14.0, 12.0, 9.0, 7.0, 9.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1876220703125, -0.18141555786132812, -0.17520904541015625, -0.16900253295898438, -0.1627960205078125, -0.15658950805664062, -0.15038299560546875, -0.14417648315429688, -0.137969970703125, -0.13176345825195312, -0.12555694580078125, -0.11935043334960938, -0.1131439208984375, -0.10693740844726562, -0.10073089599609375, -0.09452438354492188, -0.08831787109375, -0.08211135864257812, -0.07590484619140625, -0.06969833374023438, -0.0634918212890625, -0.057285308837890625, -0.05107879638671875, -0.044872283935546875, -0.038665771484375, -0.032459259033203125, -0.02625274658203125, -0.020046234130859375, -0.0138397216796875, -0.007633209228515625, -0.00142669677734375, 0.004779815673828125, 0.010986328125, 0.017192840576171875, 0.02339935302734375, 0.029605865478515625, 0.0358123779296875, 0.042018890380859375, 0.04822540283203125, 0.054431915283203125, 0.060638427734375, 0.06684494018554688, 0.07305145263671875, 0.07925796508789062, 0.0854644775390625, 0.09167098999023438, 0.09787750244140625, 0.10408401489257812, 0.11029052734375, 0.11649703979492188, 0.12270355224609375, 0.12891006469726562, 0.1351165771484375, 0.14132308959960938, 0.14752960205078125, 0.15373611450195312, 0.159942626953125, 0.16614913940429688, 0.17235565185546875, 0.17856216430664062, 0.1847686767578125, 0.19097518920898438, 0.19718170166015625, 0.20338821411132812, 0.2095947265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 8.0, 3.0, 8.0, 6.0, 8.0, 8.0, 12.0, 18.0, 22.0, 30.0, 68.0, 102.0, 203.0, 186.0, 105.0, 64.0, 37.0, 21.0, 12.0, 9.0, 12.0, 15.0, 7.0, 8.0, 6.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001316070556640625, -0.00012722983956336975, -0.000122852623462677, -0.00011847540736198425, -0.0001140981912612915, -0.00010972097516059875, -0.000105343759059906, -0.00010096654295921326, -9.658932685852051e-05, -9.221211075782776e-05, -8.783489465713501e-05, -8.345767855644226e-05, -7.908046245574951e-05, -7.470324635505676e-05, -7.032603025436401e-05, -6.594881415367126e-05, -6.157159805297852e-05, -5.7194381952285767e-05, -5.281716585159302e-05, -4.843994975090027e-05, -4.406273365020752e-05, -3.968551754951477e-05, -3.530830144882202e-05, -3.093108534812927e-05, -2.6553869247436523e-05, -2.2176653146743774e-05, -1.7799437046051025e-05, -1.3422220945358276e-05, -9.045004844665527e-06, -4.667788743972778e-06, -2.905726432800293e-07, 4.08664345741272e-06, 8.463859558105469e-06, 1.2841075658798218e-05, 1.7218291759490967e-05, 2.1595507860183716e-05, 2.5972723960876465e-05, 3.0349940061569214e-05, 3.472715616226196e-05, 3.910437226295471e-05, 4.348158836364746e-05, 4.785880446434021e-05, 5.223602056503296e-05, 5.661323666572571e-05, 6.099045276641846e-05, 6.53676688671112e-05, 6.974488496780396e-05, 7.41221010684967e-05, 7.849931716918945e-05, 8.28765332698822e-05, 8.725374937057495e-05, 9.16309654712677e-05, 9.600818157196045e-05, 0.0001003853976726532, 0.00010476261377334595, 0.0001091398298740387, 0.00011351704597473145, 0.0001178942620754242, 0.00012227147817611694, 0.0001266486942768097, 0.00013102591037750244, 0.0001354031264781952, 0.00013978034257888794, 0.0001441575586795807, 0.00014853477478027344]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 14.0, 22.0, 34.0, 29.0, 81.0, 119.0, 192.0, 404.0, 892.0, 2258.0, 8089.0, 64546.0, 777801.0, 172257.0, 15695.0, 3582.0, 1280.0, 567.0, 263.0, 142.0, 90.0, 53.0, 40.0, 26.0, 28.0, 17.0, 11.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1412353515625, -0.1355133056640625, -0.129791259765625, -0.1240692138671875, -0.11834716796875, -0.1126251220703125, -0.106903076171875, -0.1011810302734375, -0.095458984375, -0.0897369384765625, -0.084014892578125, -0.0782928466796875, -0.07257080078125, -0.0668487548828125, -0.061126708984375, -0.0554046630859375, -0.0496826171875, -0.0439605712890625, -0.038238525390625, -0.0325164794921875, -0.02679443359375, -0.0210723876953125, -0.015350341796875, -0.0096282958984375, -0.00390625, 0.0018157958984375, 0.007537841796875, 0.0132598876953125, 0.01898193359375, 0.0247039794921875, 0.030426025390625, 0.0361480712890625, 0.0418701171875, 0.0475921630859375, 0.053314208984375, 0.0590362548828125, 0.06475830078125, 0.0704803466796875, 0.076202392578125, 0.0819244384765625, 0.087646484375, 0.0933685302734375, 0.099090576171875, 0.1048126220703125, 0.11053466796875, 0.1162567138671875, 0.121978759765625, 0.1277008056640625, 0.1334228515625, 0.1391448974609375, 0.144866943359375, 0.1505889892578125, 0.15631103515625, 0.1620330810546875, 0.167755126953125, 0.1734771728515625, 0.17919921875, 0.1849212646484375, 0.190643310546875, 0.1963653564453125, 0.20208740234375, 0.2078094482421875, 0.213531494140625, 0.2192535400390625, 0.2249755859375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 6.0, 10.0, 29.0, 19.0, 20.0, 24.0, 17.0, 31.0, 51.0, 59.0, 61.0, 61.0, 64.0, 63.0, 70.0, 61.0, 55.0, 39.0, 44.0, 36.0, 32.0, 30.0, 19.0, 14.0, 10.0, 16.0, 12.0, 9.0, 3.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.08135986328125, -0.07824420928955078, -0.07512855529785156, -0.07201290130615234, -0.06889724731445312, -0.0657815933227539, -0.06266593933105469, -0.05955028533935547, -0.05643463134765625, -0.05331897735595703, -0.05020332336425781, -0.047087669372558594, -0.043972015380859375, -0.040856361389160156, -0.03774070739746094, -0.03462505340576172, -0.0315093994140625, -0.02839374542236328, -0.025278091430664062, -0.022162437438964844, -0.019046783447265625, -0.015931129455566406, -0.012815475463867188, -0.009699821472167969, -0.00658416748046875, -0.0034685134887695312, -0.0003528594970703125, 0.0027627944946289062, 0.005878448486328125, 0.008994102478027344, 0.012109756469726562, 0.015225410461425781, 0.018341064453125, 0.02145671844482422, 0.024572372436523438, 0.027688026428222656, 0.030803680419921875, 0.033919334411621094, 0.03703498840332031, 0.04015064239501953, 0.04326629638671875, 0.04638195037841797, 0.04949760437011719, 0.052613258361816406, 0.055728912353515625, 0.058844566345214844, 0.06196022033691406, 0.06507587432861328, 0.0681915283203125, 0.07130718231201172, 0.07442283630371094, 0.07753849029541016, 0.08065414428710938, 0.0837697982788086, 0.08688545227050781, 0.09000110626220703, 0.09311676025390625, 0.09623241424560547, 0.09934806823730469, 0.1024637222290039, 0.10557937622070312, 0.10869503021240234, 0.11181068420410156, 0.11492633819580078, 0.1180419921875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 2.0, 5.0, 9.0, 16.0, 72.0, 182.0, 428.0, 171.0, 64.0, 30.0, 7.0, 5.0, 6.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.9220685958862305, -5.745709419250488, -5.569350242614746, -5.392991065979004, -5.21663236618042, -5.040273189544678, -4.8639140129089355, -4.687554836273193, -4.511195659637451, -4.334836483001709, -4.158477306365967, -3.9821183681488037, -3.8057591915130615, -3.6294002532958984, -3.4530410766601562, -3.276681900024414, -3.100322961807251, -2.923963785171509, -2.7476048469543457, -2.5712456703186035, -2.3948864936828613, -2.218527317047119, -2.042168378829956, -1.8658092021942139, -1.6894501447677612, -1.5130910873413086, -1.3367319107055664, -1.1603728532791138, -0.9840137362480164, -0.807654619216919, -0.6312955617904663, -0.4549363851547241, -0.2785773277282715, -0.10221822559833527, 0.07414087653160095, 0.250499963760376, 0.4268590807914734, 0.6032181978225708, 0.7795772552490234, 0.9559364318847656, 1.1322954893112183, 1.308654546737671, 1.485013723373413, 1.6613727807998657, 1.8377318382263184, 2.0140910148620605, 2.1904501914978027, 2.366809368133545, 2.543168306350708, 2.71952748298645, 2.8958864212036133, 3.0722455978393555, 3.2486047744750977, 3.42496395111084, 3.601322889328003, 3.777682065963745, 3.954041004180908, 4.13040018081665, 4.306759357452393, 4.483118057250977, 4.659477233886719, 4.835836410522461, 5.012195587158203, 5.188554763793945, 5.3649139404296875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 11.0, 10.0, 11.0, 18.0, 25.0, 24.0, 30.0, 24.0, 41.0, 44.0, 49.0, 59.0, 80.0, 90.0, 82.0, 63.0, 50.0, 39.0, 26.0, 28.0, 38.0, 23.0, 24.0, 18.0, 17.0, 7.0, 9.0, 13.0, 11.0, 6.0, 3.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.6947264671325684, -2.616408586502075, -2.538090467453003, -2.4597725868225098, -2.3814547061920166, -2.3031368255615234, -2.224818706512451, -2.146500825881958, -2.068182945251465, -1.9898649454116821, -1.911547064781189, -1.8332290649414062, -1.754911184310913, -1.6765931844711304, -1.5982751846313477, -1.5199573040008545, -1.4416391849517822, -1.3633211851119995, -1.2850033044815063, -1.2066853046417236, -1.1283674240112305, -1.0500494241714478, -0.971731424331665, -0.8934134840965271, -0.8150955438613892, -0.7367776036262512, -0.6584596633911133, -0.5801416635513306, -0.5018237233161926, -0.4235057830810547, -0.34518781304359436, -0.26686984300613403, -0.1885519027709961, -0.11023394763469696, -0.03191599249839783, 0.046401962637901306, 0.12471991777420044, 0.20303785800933838, 0.2813558280467987, 0.35967379808425903, 0.437991738319397, 0.5163096785545349, 0.5946276187896729, 0.6729456186294556, 0.7512635588645935, 0.8295814990997314, 0.9078994989395142, 0.9862174391746521, 1.06453537940979, 1.1428533792495728, 1.221171259880066, 1.2994892597198486, 1.3778071403503418, 1.4561251401901245, 1.5344431400299072, 1.6127610206604004, 1.691079020500183, 1.7693970203399658, 1.847714900970459, 1.9260329008102417, 2.0043509006500244, 2.0826687812805176, 2.1609866619110107, 2.239304780960083, 2.317622661590576]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 9.0, 10.0, 12.0, 30.0, 28.0, 38.0, 55.0, 71.0, 130.0, 216.0, 439.0, 996.0, 2741.0, 10367.0, 59246.0, 1146357.0, 2800718.0, 146594.0, 18974.0, 4448.0, 1476.0, 579.0, 289.0, 163.0, 85.0, 57.0, 44.0, 30.0, 29.0, 20.0, 18.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27490234375, -0.2666168212890625, -0.258331298828125, -0.2500457763671875, -0.24176025390625, -0.2334747314453125, -0.225189208984375, -0.2169036865234375, -0.2086181640625, -0.2003326416015625, -0.192047119140625, -0.1837615966796875, -0.17547607421875, -0.1671905517578125, -0.158905029296875, -0.1506195068359375, -0.142333984375, -0.1340484619140625, -0.125762939453125, -0.1174774169921875, -0.10919189453125, -0.1009063720703125, -0.092620849609375, -0.0843353271484375, -0.0760498046875, -0.0677642822265625, -0.059478759765625, -0.0511932373046875, -0.04290771484375, -0.0346221923828125, -0.026336669921875, -0.0180511474609375, -0.009765625, -0.0014801025390625, 0.006805419921875, 0.0150909423828125, 0.02337646484375, 0.0316619873046875, 0.039947509765625, 0.0482330322265625, 0.0565185546875, 0.0648040771484375, 0.073089599609375, 0.0813751220703125, 0.08966064453125, 0.0979461669921875, 0.106231689453125, 0.1145172119140625, 0.122802734375, 0.1310882568359375, 0.139373779296875, 0.1476593017578125, 0.15594482421875, 0.1642303466796875, 0.172515869140625, 0.1808013916015625, 0.1890869140625, 0.1973724365234375, 0.205657958984375, 0.2139434814453125, 0.22222900390625, 0.2305145263671875, 0.238800048828125, 0.2470855712890625, 0.25537109375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 6.0, 12.0, 15.0, 22.0, 24.0, 27.0, 20.0, 29.0, 35.0, 48.0, 37.0, 46.0, 46.0, 62.0, 66.0, 60.0, 72.0, 43.0, 46.0, 55.0, 35.0, 31.0, 33.0, 36.0, 20.0, 13.0, 19.0, 11.0, 11.0, 4.0, 8.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1688232421875, -0.1640949249267578, -0.15936660766601562, -0.15463829040527344, -0.14990997314453125, -0.14518165588378906, -0.14045333862304688, -0.1357250213623047, -0.1309967041015625, -0.1262683868408203, -0.12154006958007812, -0.11681175231933594, -0.11208343505859375, -0.10735511779785156, -0.10262680053710938, -0.09789848327636719, -0.093170166015625, -0.08844184875488281, -0.08371353149414062, -0.07898521423339844, -0.07425689697265625, -0.06952857971191406, -0.06480026245117188, -0.06007194519042969, -0.0553436279296875, -0.05061531066894531, -0.045886993408203125, -0.04115867614746094, -0.03643035888671875, -0.03170204162597656, -0.026973724365234375, -0.022245407104492188, -0.01751708984375, -0.012788772583007812, -0.008060455322265625, -0.0033321380615234375, 0.00139617919921875, 0.0061244964599609375, 0.010852813720703125, 0.015581130981445312, 0.0203094482421875, 0.025037765502929688, 0.029766082763671875, 0.03449440002441406, 0.03922271728515625, 0.04395103454589844, 0.048679351806640625, 0.05340766906738281, 0.058135986328125, 0.06286430358886719, 0.06759262084960938, 0.07232093811035156, 0.07704925537109375, 0.08177757263183594, 0.08650588989257812, 0.09123420715332031, 0.0959625244140625, 0.10069084167480469, 0.10541915893554688, 0.11014747619628906, 0.11487579345703125, 0.11960411071777344, 0.12433242797851562, 0.1290607452392578, 0.1337890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 9.0, 24.0, 33.0, 72.0, 106.0, 261.0, 493.0, 1130.0, 3840.0, 17952.0, 169671.0, 3770026.0, 208067.0, 17245.0, 3372.0, 1066.0, 444.0, 201.0, 117.0, 54.0, 22.0, 17.0, 15.0, 12.0, 2.0, 2.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.4736328125, -0.4610137939453125, -0.448394775390625, -0.4357757568359375, -0.42315673828125, -0.4105377197265625, -0.397918701171875, -0.3852996826171875, -0.3726806640625, -0.3600616455078125, -0.347442626953125, -0.3348236083984375, -0.32220458984375, -0.3095855712890625, -0.296966552734375, -0.2843475341796875, -0.271728515625, -0.2591094970703125, -0.246490478515625, -0.2338714599609375, -0.22125244140625, -0.2086334228515625, -0.196014404296875, -0.1833953857421875, -0.1707763671875, -0.1581573486328125, -0.145538330078125, -0.1329193115234375, -0.12030029296875, -0.1076812744140625, -0.095062255859375, -0.0824432373046875, -0.06982421875, -0.0572052001953125, -0.044586181640625, -0.0319671630859375, -0.01934814453125, -0.0067291259765625, 0.005889892578125, 0.0185089111328125, 0.0311279296875, 0.0437469482421875, 0.056365966796875, 0.0689849853515625, 0.08160400390625, 0.0942230224609375, 0.106842041015625, 0.1194610595703125, 0.132080078125, 0.1446990966796875, 0.157318115234375, 0.1699371337890625, 0.18255615234375, 0.1951751708984375, 0.207794189453125, 0.2204132080078125, 0.2330322265625, 0.2456512451171875, 0.258270263671875, 0.2708892822265625, 0.28350830078125, 0.2961273193359375, 0.308746337890625, 0.3213653564453125, 0.333984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 3.0, 8.0, 3.0, 9.0, 9.0, 14.0, 17.0, 14.0, 21.0, 40.0, 42.0, 72.0, 102.0, 212.0, 391.0, 725.0, 945.0, 639.0, 357.0, 177.0, 95.0, 58.0, 44.0, 23.0, 16.0, 15.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2744140625, -0.26436614990234375, -0.2543182373046875, -0.24427032470703125, -0.234222412109375, -0.22417449951171875, -0.2141265869140625, -0.20407867431640625, -0.19403076171875, -0.18398284912109375, -0.1739349365234375, -0.16388702392578125, -0.153839111328125, -0.14379119873046875, -0.1337432861328125, -0.12369537353515625, -0.1136474609375, -0.10359954833984375, -0.0935516357421875, -0.08350372314453125, -0.073455810546875, -0.06340789794921875, -0.0533599853515625, -0.04331207275390625, -0.03326416015625, -0.02321624755859375, -0.0131683349609375, -0.00312042236328125, 0.006927490234375, 0.01697540283203125, 0.0270233154296875, 0.03707122802734375, 0.047119140625, 0.05716705322265625, 0.0672149658203125, 0.07726287841796875, 0.087310791015625, 0.09735870361328125, 0.1074066162109375, 0.11745452880859375, 0.12750244140625, 0.13755035400390625, 0.1475982666015625, 0.15764617919921875, 0.167694091796875, 0.17774200439453125, 0.1877899169921875, 0.19783782958984375, 0.2078857421875, 0.21793365478515625, 0.2279815673828125, 0.23802947998046875, 0.248077392578125, 0.25812530517578125, 0.2681732177734375, 0.27822113037109375, 0.28826904296875, 0.29831695556640625, 0.3083648681640625, 0.31841278076171875, 0.328460693359375, 0.33850860595703125, 0.3485565185546875, 0.35860443115234375, 0.36865234375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 11.0, 23.0, 98.0, 441.0, 338.0, 62.0, 16.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.616742134094238, -6.40238094329834, -6.188019752502441, -5.973658561706543, -5.7592973709106445, -5.544936180114746, -5.3305745124816895, -5.116213321685791, -4.901852130889893, -4.687490940093994, -4.473129749298096, -4.258768558502197, -4.044406890869141, -3.8300459384918213, -3.6156845092773438, -3.4013233184814453, -3.186962127685547, -2.9726009368896484, -2.75823974609375, -2.5438783168792725, -2.329517126083374, -2.1151559352874756, -1.9007946252822876, -1.6864333152770996, -1.4720721244812012, -1.2577109336853027, -1.0433496236801147, -0.8289883732795715, -0.6146271228790283, -0.4002659320831299, -0.1859046220779419, 0.028456687927246094, 0.24281740188598633, 0.45717865228652954, 0.6715399026870728, 0.885901153087616, 1.1002624034881592, 1.3146235942840576, 1.5289849042892456, 1.7433462142944336, 1.957707405090332, 2.1720685958862305, 2.386429786682129, 2.6007912158966064, 2.815152406692505, 3.0295135974884033, 3.243875026702881, 3.4582362174987793, 3.6725974082946777, 3.886958599090576, 4.101319789886475, 4.315680980682373, 4.53004264831543, 4.744403839111328, 4.958765029907227, 5.173126220703125, 5.387487411499023, 5.601848602294922, 5.81620979309082, 6.030570983886719, 6.244932174682617, 6.459293365478516, 6.673655033111572, 6.888016223907471, 7.102377414703369]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 9.0, 10.0, 1.0, 9.0, 9.0, 2.0, 21.0, 13.0, 16.0, 23.0, 26.0, 21.0, 31.0, 30.0, 36.0, 39.0, 49.0, 41.0, 38.0, 45.0, 43.0, 36.0, 44.0, 31.0, 35.0, 51.0, 49.0, 26.0, 28.0, 31.0, 25.0, 15.0, 18.0, 13.0, 15.0, 12.0, 12.0, 9.0, 8.0, 11.0, 6.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1541190147399902, -1.1190747022628784, -1.0840303897857666, -1.0489860773086548, -1.013941764831543, -0.9788974523544312, -0.9438531994819641, -0.9088088870048523, -0.8737645745277405, -0.8387202620506287, -0.8036759495735168, -0.768631637096405, -0.733587384223938, -0.6985430717468262, -0.6634987592697144, -0.6284544467926025, -0.5934101343154907, -0.5583658218383789, -0.5233215093612671, -0.48827722668647766, -0.45323291420936584, -0.41818860173225403, -0.3831443190574646, -0.3481000065803528, -0.31305569410324097, -0.27801138162612915, -0.24296708405017853, -0.2079227864742279, -0.1728784739971161, -0.13783416152000427, -0.10278986394405365, -0.06774556636810303, -0.03270125389099121, 0.0023430511355400085, 0.03738735616207123, 0.07243166118860245, 0.10747596621513367, 0.14252027869224548, 0.1775645762681961, 0.21260887384414673, 0.24765318632125854, 0.28269749879837036, 0.3177418112754822, 0.3527860939502716, 0.3878304064273834, 0.42287471890449524, 0.45791900157928467, 0.4929633140563965, 0.5280076265335083, 0.5630519390106201, 0.5980962514877319, 0.6331405639648438, 0.6681848764419556, 0.7032291889190674, 0.7382734417915344, 0.7733177542686462, 0.8083620667457581, 0.8434063792228699, 0.8784506916999817, 0.9134950041770935, 0.9485392570495605, 0.9835835695266724, 1.0186278820037842, 1.053672194480896, 1.0887165069580078]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 3.0, 10.0, 7.0, 6.0, 16.0, 23.0, 51.0, 65.0, 115.0, 204.0, 424.0, 908.0, 2233.0, 6753.0, 24027.0, 104060.0, 428032.0, 368776.0, 83476.0, 19928.0, 5753.0, 1995.0, 836.0, 381.0, 199.0, 117.0, 48.0, 26.0, 26.0, 12.0, 11.0, 5.0, 7.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.337646484375, -0.32798004150390625, -0.3183135986328125, -0.30864715576171875, -0.298980712890625, -0.28931427001953125, -0.2796478271484375, -0.26998138427734375, -0.26031494140625, -0.25064849853515625, -0.2409820556640625, -0.23131561279296875, -0.221649169921875, -0.21198272705078125, -0.2023162841796875, -0.19264984130859375, -0.1829833984375, -0.17331695556640625, -0.1636505126953125, -0.15398406982421875, -0.144317626953125, -0.13465118408203125, -0.1249847412109375, -0.11531829833984375, -0.10565185546875, -0.09598541259765625, -0.0863189697265625, -0.07665252685546875, -0.066986083984375, -0.05731964111328125, -0.0476531982421875, -0.03798675537109375, -0.0283203125, -0.01865386962890625, -0.0089874267578125, 0.00067901611328125, 0.010345458984375, 0.02001190185546875, 0.0296783447265625, 0.03934478759765625, 0.04901123046875, 0.05867767333984375, 0.0683441162109375, 0.07801055908203125, 0.087677001953125, 0.09734344482421875, 0.1070098876953125, 0.11667633056640625, 0.1263427734375, 0.13600921630859375, 0.1456756591796875, 0.15534210205078125, 0.165008544921875, 0.17467498779296875, 0.1843414306640625, 0.19400787353515625, 0.20367431640625, 0.21334075927734375, 0.2230072021484375, 0.23267364501953125, 0.242340087890625, 0.25200653076171875, 0.2616729736328125, 0.27133941650390625, 0.281005859375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 9.0, 9.0, 10.0, 14.0, 15.0, 22.0, 14.0, 29.0, 26.0, 41.0, 25.0, 49.0, 36.0, 60.0, 61.0, 61.0, 49.0, 44.0, 66.0, 40.0, 42.0, 48.0, 42.0, 41.0, 28.0, 20.0, 17.0, 20.0, 21.0, 10.0, 12.0, 9.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1904296875, -0.1857290267944336, -0.1810283660888672, -0.17632770538330078, -0.17162704467773438, -0.16692638397216797, -0.16222572326660156, -0.15752506256103516, -0.15282440185546875, -0.14812374114990234, -0.14342308044433594, -0.13872241973876953, -0.13402175903320312, -0.12932109832763672, -0.12462043762207031, -0.1199197769165039, -0.1152191162109375, -0.1105184555053711, -0.10581779479980469, -0.10111713409423828, -0.09641647338867188, -0.09171581268310547, -0.08701515197753906, -0.08231449127197266, -0.07761383056640625, -0.07291316986083984, -0.06821250915527344, -0.06351184844970703, -0.058811187744140625, -0.05411052703857422, -0.04940986633300781, -0.044709205627441406, -0.040008544921875, -0.035307884216308594, -0.030607223510742188, -0.02590656280517578, -0.021205902099609375, -0.01650524139404297, -0.011804580688476562, -0.007103919982910156, -0.00240325927734375, 0.0022974014282226562, 0.0069980621337890625, 0.011698722839355469, 0.016399383544921875, 0.02110004425048828, 0.025800704956054688, 0.030501365661621094, 0.0352020263671875, 0.039902687072753906, 0.04460334777832031, 0.04930400848388672, 0.054004669189453125, 0.05870532989501953, 0.06340599060058594, 0.06810665130615234, 0.07280731201171875, 0.07750797271728516, 0.08220863342285156, 0.08690929412841797, 0.09160995483398438, 0.09631061553955078, 0.10101127624511719, 0.1057119369506836, 0.11041259765625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 4.0, 6.0, 14.0, 7.0, 14.0, 22.0, 24.0, 25.0, 34.0, 58.0, 85.0, 110.0, 200.0, 284.0, 559.0, 1289.0, 3721.0, 12993.0, 66104.0, 588302.0, 313165.0, 46228.0, 10032.0, 2947.0, 1066.0, 463.0, 275.0, 147.0, 97.0, 66.0, 55.0, 28.0, 39.0, 25.0, 7.0, 12.0, 11.0, 3.0, 5.0, 3.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.37890625, -0.36772918701171875, -0.3565521240234375, -0.34537506103515625, -0.334197998046875, -0.32302093505859375, -0.3118438720703125, -0.30066680908203125, -0.28948974609375, -0.27831268310546875, -0.2671356201171875, -0.25595855712890625, -0.244781494140625, -0.23360443115234375, -0.2224273681640625, -0.21125030517578125, -0.2000732421875, -0.18889617919921875, -0.1777191162109375, -0.16654205322265625, -0.155364990234375, -0.14418792724609375, -0.1330108642578125, -0.12183380126953125, -0.11065673828125, -0.09947967529296875, -0.0883026123046875, -0.07712554931640625, -0.065948486328125, -0.05477142333984375, -0.0435943603515625, -0.03241729736328125, -0.021240234375, -0.01006317138671875, 0.0011138916015625, 0.01229095458984375, 0.023468017578125, 0.03464508056640625, 0.0458221435546875, 0.05699920654296875, 0.06817626953125, 0.07935333251953125, 0.0905303955078125, 0.10170745849609375, 0.112884521484375, 0.12406158447265625, 0.1352386474609375, 0.14641571044921875, 0.1575927734375, 0.16876983642578125, 0.1799468994140625, 0.19112396240234375, 0.202301025390625, 0.21347808837890625, 0.2246551513671875, 0.23583221435546875, 0.24700927734375, 0.25818634033203125, 0.2693634033203125, 0.28054046630859375, 0.291717529296875, 0.30289459228515625, 0.3140716552734375, 0.32524871826171875, 0.33642578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 7.0, 2.0, 6.0, 5.0, 3.0, 6.0, 7.0, 9.0, 5.0, 8.0, 21.0, 18.0, 26.0, 28.0, 36.0, 42.0, 43.0, 41.0, 50.0, 54.0, 40.0, 46.0, 44.0, 47.0, 45.0, 45.0, 47.0, 49.0, 39.0, 37.0, 12.0, 27.0, 22.0, 14.0, 19.0, 15.0, 8.0, 8.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.465576171875, -0.4518852233886719, -0.43819427490234375, -0.4245033264160156, -0.4108123779296875, -0.3971214294433594, -0.38343048095703125, -0.3697395324707031, -0.356048583984375, -0.3423576354980469, -0.32866668701171875, -0.3149757385253906, -0.3012847900390625, -0.2875938415527344, -0.27390289306640625, -0.2602119445800781, -0.24652099609375, -0.23283004760742188, -0.21913909912109375, -0.20544815063476562, -0.1917572021484375, -0.17806625366210938, -0.16437530517578125, -0.15068435668945312, -0.136993408203125, -0.12330245971679688, -0.10961151123046875, -0.09592056274414062, -0.0822296142578125, -0.06853866577148438, -0.05484771728515625, -0.041156768798828125, -0.0274658203125, -0.013774871826171875, -8.392333984375e-05, 0.013607025146484375, 0.0272979736328125, 0.040988922119140625, 0.05467987060546875, 0.06837081909179688, 0.082061767578125, 0.09575271606445312, 0.10944366455078125, 0.12313461303710938, 0.1368255615234375, 0.15051651000976562, 0.16420745849609375, 0.17789840698242188, 0.19158935546875, 0.20528030395507812, 0.21897125244140625, 0.23266220092773438, 0.2463531494140625, 0.2600440979003906, 0.27373504638671875, 0.2874259948730469, 0.301116943359375, 0.3148078918457031, 0.32849884033203125, 0.3421897888183594, 0.3558807373046875, 0.3695716857910156, 0.38326263427734375, 0.3969535827636719, 0.41064453125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 8.0, 11.0, 8.0, 28.0, 26.0, 37.0, 85.0, 138.0, 282.0, 600.0, 1595.0, 5291.0, 23143.0, 139911.0, 705436.0, 140653.0, 23092.0, 5360.0, 1624.0, 619.0, 252.0, 118.0, 85.0, 48.0, 31.0, 20.0, 9.0, 12.0, 9.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09246826171875, -0.08922386169433594, -0.08597946166992188, -0.08273506164550781, -0.07949066162109375, -0.07624626159667969, -0.07300186157226562, -0.06975746154785156, -0.0665130615234375, -0.06326866149902344, -0.060024261474609375, -0.05677986145019531, -0.05353546142578125, -0.05029106140136719, -0.047046661376953125, -0.04380226135253906, -0.040557861328125, -0.03731346130371094, -0.034069061279296875, -0.030824661254882812, -0.02758026123046875, -0.024335861206054688, -0.021091461181640625, -0.017847061157226562, -0.0146026611328125, -0.011358261108398438, -0.008113861083984375, -0.0048694610595703125, -0.00162506103515625, 0.0016193389892578125, 0.004863739013671875, 0.008108139038085938, 0.0113525390625, 0.014596939086914062, 0.017841339111328125, 0.021085739135742188, 0.02433013916015625, 0.027574539184570312, 0.030818939208984375, 0.03406333923339844, 0.0373077392578125, 0.04055213928222656, 0.043796539306640625, 0.04704093933105469, 0.05028533935546875, 0.05352973937988281, 0.056774139404296875, 0.06001853942871094, 0.063262939453125, 0.06650733947753906, 0.06975173950195312, 0.07299613952636719, 0.07624053955078125, 0.07948493957519531, 0.08272933959960938, 0.08597373962402344, 0.0892181396484375, 0.09246253967285156, 0.09570693969726562, 0.09895133972167969, 0.10219573974609375, 0.10544013977050781, 0.10868453979492188, 0.11192893981933594, 0.11517333984375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 2.0, 5.0, 5.0, 5.0, 13.0, 13.0, 25.0, 42.0, 61.0, 109.0, 148.0, 149.0, 142.0, 103.0, 58.0, 46.0, 26.0, 13.0, 15.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.736682891845703e-05, -7.523968815803528e-05, -7.311254739761353e-05, -7.098540663719177e-05, -6.885826587677002e-05, -6.673112511634827e-05, -6.460398435592651e-05, -6.247684359550476e-05, -6.034970283508301e-05, -5.8222562074661255e-05, -5.60954213142395e-05, -5.396828055381775e-05, -5.1841139793395996e-05, -4.971399903297424e-05, -4.758685827255249e-05, -4.545971751213074e-05, -4.3332576751708984e-05, -4.120543599128723e-05, -3.907829523086548e-05, -3.6951154470443726e-05, -3.482401371002197e-05, -3.269687294960022e-05, -3.056973218917847e-05, -2.8442591428756714e-05, -2.631545066833496e-05, -2.4188309907913208e-05, -2.2061169147491455e-05, -1.9934028387069702e-05, -1.780688762664795e-05, -1.5679746866226196e-05, -1.3552606105804443e-05, -1.142546534538269e-05, -9.298324584960938e-06, -7.1711838245391846e-06, -5.044043064117432e-06, -2.9169023036956787e-06, -7.897615432739258e-07, 1.3373792171478271e-06, 3.46451997756958e-06, 5.591660737991333e-06, 7.718801498413086e-06, 9.845942258834839e-06, 1.1973083019256592e-05, 1.4100223779678345e-05, 1.6227364540100098e-05, 1.835450530052185e-05, 2.0481646060943604e-05, 2.2608786821365356e-05, 2.473592758178711e-05, 2.6863068342208862e-05, 2.8990209102630615e-05, 3.111734986305237e-05, 3.324449062347412e-05, 3.5371631383895874e-05, 3.749877214431763e-05, 3.962591290473938e-05, 4.175305366516113e-05, 4.3880194425582886e-05, 4.600733518600464e-05, 4.813447594642639e-05, 5.0261616706848145e-05, 5.23887574672699e-05, 5.451589822769165e-05, 5.66430389881134e-05, 5.8770179748535156e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 9.0, 9.0, 11.0, 19.0, 20.0, 32.0, 49.0, 90.0, 147.0, 291.0, 640.0, 1543.0, 4308.0, 16021.0, 87644.0, 659951.0, 230696.0, 34706.0, 7974.0, 2483.0, 968.0, 404.0, 183.0, 136.0, 54.0, 54.0, 26.0, 23.0, 16.0, 7.0, 7.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1204833984375, -0.11701583862304688, -0.11354827880859375, -0.11008071899414062, -0.1066131591796875, -0.10314559936523438, -0.09967803955078125, -0.09621047973632812, -0.092742919921875, -0.08927536010742188, -0.08580780029296875, -0.08234024047851562, -0.0788726806640625, -0.07540512084960938, -0.07193756103515625, -0.06847000122070312, -0.06500244140625, -0.061534881591796875, -0.05806732177734375, -0.054599761962890625, -0.0511322021484375, -0.047664642333984375, -0.04419708251953125, -0.040729522705078125, -0.037261962890625, -0.033794403076171875, -0.03032684326171875, -0.026859283447265625, -0.0233917236328125, -0.019924163818359375, -0.01645660400390625, -0.012989044189453125, -0.009521484375, -0.006053924560546875, -0.00258636474609375, 0.000881195068359375, 0.0043487548828125, 0.007816314697265625, 0.01128387451171875, 0.014751434326171875, 0.018218994140625, 0.021686553955078125, 0.02515411376953125, 0.028621673583984375, 0.0320892333984375, 0.035556793212890625, 0.03902435302734375, 0.042491912841796875, 0.04595947265625, 0.049427032470703125, 0.05289459228515625, 0.056362152099609375, 0.0598297119140625, 0.06329727172851562, 0.06676483154296875, 0.07023239135742188, 0.073699951171875, 0.07716751098632812, 0.08063507080078125, 0.08410263061523438, 0.0875701904296875, 0.09103775024414062, 0.09450531005859375, 0.09797286987304688, 0.1014404296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 5.0, 5.0, 7.0, 6.0, 11.0, 14.0, 22.0, 17.0, 13.0, 37.0, 34.0, 57.0, 44.0, 43.0, 71.0, 83.0, 74.0, 64.0, 56.0, 59.0, 54.0, 48.0, 35.0, 27.0, 24.0, 15.0, 10.0, 11.0, 7.0, 7.0, 5.0, 5.0, 5.0, 4.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0831298828125, -0.08060836791992188, -0.07808685302734375, -0.07556533813476562, -0.0730438232421875, -0.07052230834960938, -0.06800079345703125, -0.06547927856445312, -0.062957763671875, -0.060436248779296875, -0.05791473388671875, -0.055393218994140625, -0.0528717041015625, -0.050350189208984375, -0.04782867431640625, -0.045307159423828125, -0.04278564453125, -0.040264129638671875, -0.03774261474609375, -0.035221099853515625, -0.0326995849609375, -0.030178070068359375, -0.02765655517578125, -0.025135040283203125, -0.022613525390625, -0.020092010498046875, -0.01757049560546875, -0.015048980712890625, -0.0125274658203125, -0.010005950927734375, -0.00748443603515625, -0.004962921142578125, -0.00244140625, 8.0108642578125e-05, 0.00260162353515625, 0.005123138427734375, 0.0076446533203125, 0.010166168212890625, 0.01268768310546875, 0.015209197998046875, 0.017730712890625, 0.020252227783203125, 0.02277374267578125, 0.025295257568359375, 0.0278167724609375, 0.030338287353515625, 0.03285980224609375, 0.035381317138671875, 0.03790283203125, 0.040424346923828125, 0.04294586181640625, 0.045467376708984375, 0.0479888916015625, 0.050510406494140625, 0.05303192138671875, 0.055553436279296875, 0.058074951171875, 0.060596466064453125, 0.06311798095703125, 0.06563949584960938, 0.0681610107421875, 0.07068252563476562, 0.07320404052734375, 0.07572555541992188, 0.0782470703125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 13.0, 15.0, 38.0, 70.0, 138.0, 257.0, 229.0, 111.0, 65.0, 19.0, 11.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2343032360076904, -2.1451523303985596, -2.0560014247894287, -1.9668503999710083, -1.877699375152588, -1.788548469543457, -1.6993975639343262, -1.6102465391159058, -1.5210955142974854, -1.4319446086883545, -1.342793583869934, -1.2536426782608032, -1.1644916534423828, -1.075340747833252, -0.9861897826194763, -0.8970388174057007, -0.8078879117965698, -0.7187369465827942, -0.6295859813690186, -0.5404350757598877, -0.4512840807437897, -0.36213311553001404, -0.2729821801185608, -0.18383121490478516, -0.09468024969100952, -0.005529291927814484, 0.08362166583538055, 0.172772616147995, 0.26192358136177063, 0.35107454657554626, 0.4402254819869995, 0.5293764472007751, 0.6185274124145508, 0.7076783776283264, 0.796829342842102, 0.8859802484512329, 0.9751312732696533, 1.0642821788787842, 1.153433084487915, 1.2425841093063354, 1.3317351341247559, 1.4208860397338867, 1.5100370645523071, 1.599187970161438, 1.6883389949798584, 1.7774899005889893, 1.8666408061981201, 1.9557918310165405, 2.044942855834961, 2.134093761444092, 2.2232446670532227, 2.3123958110809326, 2.4015467166900635, 2.4906976222991943, 2.579848527908325, 2.668999671936035, 2.758150339126587, 2.8473012447357178, 2.9364521503448486, 3.0256032943725586, 3.1147541999816895, 3.2039051055908203, 3.293056011199951, 3.382206916809082, 3.471358060836792]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 6.0, 7.0, 5.0, 4.0, 14.0, 5.0, 17.0, 10.0, 18.0, 16.0, 23.0, 24.0, 24.0, 26.0, 46.0, 28.0, 33.0, 69.0, 92.0, 90.0, 86.0, 60.0, 34.0, 35.0, 32.0, 29.0, 32.0, 23.0, 23.0, 13.0, 14.0, 16.0, 11.0, 6.0, 13.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16617488861084, -2.104649782180786, -2.0431246757507324, -1.9815996885299683, -1.9200745820999146, -1.8585494756698608, -1.7970243692398071, -1.735499382019043, -1.6739742755889893, -1.6124491691589355, -1.5509240627288818, -1.4893990755081177, -1.427873969078064, -1.3663488626480103, -1.3048237562179565, -1.2432987689971924, -1.1817736625671387, -1.120248556137085, -1.0587234497070312, -0.9971984028816223, -0.9356733560562134, -0.8741482496261597, -0.812623143196106, -0.751098096370697, -0.6895729303359985, -0.6280478239059448, -0.5665227770805359, -0.5049976706504822, -0.44347262382507324, -0.38194751739501953, -0.3204224407672882, -0.2588973641395569, -0.19737231731414795, -0.13584724068641663, -0.0743221566081047, -0.012797072529792786, 0.04872800409793854, 0.11025309562683105, 0.17177817225456238, 0.2333032488822937, 0.294828325510025, 0.35635340213775635, 0.41787847876548767, 0.479403555393219, 0.5409286618232727, 0.6024537086486816, 0.6639788150787354, 0.7255039215087891, 0.787028968334198, 0.8485540747642517, 0.9100791215896606, 0.9716042280197144, 1.033129334449768, 1.0946543216705322, 1.156179428100586, 1.2177045345306396, 1.2792296409606934, 1.340754747390747, 1.4022798538208008, 1.463804841041565, 1.5253299474716187, 1.5868550539016724, 1.648380160331726, 1.7099051475524902, 1.771430253982544]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 11.0, 11.0, 20.0, 21.0, 33.0, 37.0, 53.0, 86.0, 131.0, 189.0, 348.0, 619.0, 1124.0, 2253.0, 4946.0, 12618.0, 42724.0, 225258.0, 1439587.0, 2021849.0, 348848.0, 64338.0, 17175.0, 6314.0, 2708.0, 1295.0, 643.0, 402.0, 223.0, 128.0, 84.0, 68.0, 41.0, 31.0, 23.0, 5.0, 13.0, 6.0, 6.0, 3.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.129150390625, -0.1245574951171875, -0.119964599609375, -0.1153717041015625, -0.11077880859375, -0.1061859130859375, -0.101593017578125, -0.0970001220703125, -0.0924072265625, -0.0878143310546875, -0.083221435546875, -0.0786285400390625, -0.07403564453125, -0.0694427490234375, -0.064849853515625, -0.0602569580078125, -0.0556640625, -0.0510711669921875, -0.046478271484375, -0.0418853759765625, -0.03729248046875, -0.0326995849609375, -0.028106689453125, -0.0235137939453125, -0.0189208984375, -0.0143280029296875, -0.009735107421875, -0.0051422119140625, -0.00054931640625, 0.0040435791015625, 0.008636474609375, 0.0132293701171875, 0.017822265625, 0.0224151611328125, 0.027008056640625, 0.0316009521484375, 0.03619384765625, 0.0407867431640625, 0.045379638671875, 0.0499725341796875, 0.0545654296875, 0.0591583251953125, 0.063751220703125, 0.0683441162109375, 0.07293701171875, 0.0775299072265625, 0.082122802734375, 0.0867156982421875, 0.09130859375, 0.0959014892578125, 0.100494384765625, 0.1050872802734375, 0.10968017578125, 0.1142730712890625, 0.118865966796875, 0.1234588623046875, 0.1280517578125, 0.1326446533203125, 0.137237548828125, 0.1418304443359375, 0.14642333984375, 0.1510162353515625, 0.155609130859375, 0.1602020263671875, 0.164794921875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 10.0, 11.0, 6.0, 12.0, 12.0, 14.0, 19.0, 28.0, 22.0, 25.0, 32.0, 39.0, 37.0, 38.0, 37.0, 60.0, 48.0, 30.0, 49.0, 38.0, 49.0, 40.0, 35.0, 32.0, 39.0, 25.0, 23.0, 35.0, 27.0, 23.0, 17.0, 19.0, 17.0, 11.0, 3.0, 10.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12451171875, -0.120849609375, -0.1171875, -0.113525390625, -0.10986328125, -0.106201171875, -0.1025390625, -0.098876953125, -0.09521484375, -0.091552734375, -0.087890625, -0.084228515625, -0.08056640625, -0.076904296875, -0.0732421875, -0.069580078125, -0.06591796875, -0.062255859375, -0.05859375, -0.054931640625, -0.05126953125, -0.047607421875, -0.0439453125, -0.040283203125, -0.03662109375, -0.032958984375, -0.029296875, -0.025634765625, -0.02197265625, -0.018310546875, -0.0146484375, -0.010986328125, -0.00732421875, -0.003662109375, 0.0, 0.003662109375, 0.00732421875, 0.010986328125, 0.0146484375, 0.018310546875, 0.02197265625, 0.025634765625, 0.029296875, 0.032958984375, 0.03662109375, 0.040283203125, 0.0439453125, 0.047607421875, 0.05126953125, 0.054931640625, 0.05859375, 0.062255859375, 0.06591796875, 0.069580078125, 0.0732421875, 0.076904296875, 0.08056640625, 0.084228515625, 0.087890625, 0.091552734375, 0.09521484375, 0.098876953125, 0.1025390625, 0.106201171875, 0.10986328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 8.0, 5.0, 7.0, 10.0, 18.0, 17.0, 26.0, 47.0, 78.0, 168.0, 358.0, 1028.0, 3580.0, 17961.0, 214562.0, 3689323.0, 242875.0, 18579.0, 3728.0, 1083.0, 412.0, 181.0, 98.0, 47.0, 23.0, 9.0, 11.0, 11.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.350341796875, -0.3398895263671875, -0.329437255859375, -0.3189849853515625, -0.30853271484375, -0.2980804443359375, -0.287628173828125, -0.2771759033203125, -0.2667236328125, -0.2562713623046875, -0.245819091796875, -0.2353668212890625, -0.22491455078125, -0.2144622802734375, -0.204010009765625, -0.1935577392578125, -0.18310546875, -0.1726531982421875, -0.162200927734375, -0.1517486572265625, -0.14129638671875, -0.1308441162109375, -0.120391845703125, -0.1099395751953125, -0.0994873046875, -0.0890350341796875, -0.078582763671875, -0.0681304931640625, -0.05767822265625, -0.0472259521484375, -0.036773681640625, -0.0263214111328125, -0.015869140625, -0.0054168701171875, 0.005035400390625, 0.0154876708984375, 0.02593994140625, 0.0363922119140625, 0.046844482421875, 0.0572967529296875, 0.0677490234375, 0.0782012939453125, 0.088653564453125, 0.0991058349609375, 0.10955810546875, 0.1200103759765625, 0.130462646484375, 0.1409149169921875, 0.1513671875, 0.1618194580078125, 0.172271728515625, 0.1827239990234375, 0.19317626953125, 0.2036285400390625, 0.214080810546875, 0.2245330810546875, 0.2349853515625, 0.2454376220703125, 0.255889892578125, 0.2663421630859375, 0.27679443359375, 0.2872467041015625, 0.297698974609375, 0.3081512451171875, 0.318603515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 6.0, 6.0, 6.0, 7.0, 5.0, 22.0, 20.0, 38.0, 26.0, 37.0, 47.0, 74.0, 106.0, 151.0, 234.0, 331.0, 448.0, 544.0, 568.0, 428.0, 291.0, 201.0, 124.0, 94.0, 63.0, 60.0, 36.0, 19.0, 18.0, 5.0, 13.0, 8.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.189697265625, -0.18352890014648438, -0.17736053466796875, -0.17119216918945312, -0.1650238037109375, -0.15885543823242188, -0.15268707275390625, -0.14651870727539062, -0.140350341796875, -0.13418197631835938, -0.12801361083984375, -0.12184524536132812, -0.1156768798828125, -0.10950851440429688, -0.10334014892578125, -0.09717178344726562, -0.09100341796875, -0.08483505249023438, -0.07866668701171875, -0.07249832153320312, -0.0663299560546875, -0.060161590576171875, -0.05399322509765625, -0.047824859619140625, -0.041656494140625, -0.035488128662109375, -0.02931976318359375, -0.023151397705078125, -0.0169830322265625, -0.010814666748046875, -0.00464630126953125, 0.001522064208984375, 0.0076904296875, 0.013858795166015625, 0.02002716064453125, 0.026195526123046875, 0.0323638916015625, 0.038532257080078125, 0.04470062255859375, 0.050868988037109375, 0.057037353515625, 0.06320571899414062, 0.06937408447265625, 0.07554244995117188, 0.0817108154296875, 0.08787918090820312, 0.09404754638671875, 0.10021591186523438, 0.10638427734375, 0.11255264282226562, 0.11872100830078125, 0.12488937377929688, 0.1310577392578125, 0.13722610473632812, 0.14339447021484375, 0.14956283569335938, 0.155731201171875, 0.16189956665039062, 0.16806793212890625, 0.17423629760742188, 0.1804046630859375, 0.18657302856445312, 0.19274139404296875, 0.19890975952148438, 0.205078125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 13.0, 26.0, 34.0, 65.0, 113.0, 131.0, 178.0, 137.0, 117.0, 70.0, 41.0, 21.0, 7.0, 8.0, 12.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6722023487091064, -1.613752007484436, -1.555301547050476, -1.4968512058258057, -1.4384008646011353, -1.3799504041671753, -1.3215000629425049, -1.263049602508545, -1.2045992612838745, -1.146148920059204, -1.0876984596252441, -1.0292481184005737, -0.9707977175712585, -0.9123473167419434, -0.853896975517273, -0.7954465746879578, -0.7369962334632874, -0.6785458326339722, -0.6200954914093018, -0.5616450905799866, -0.5031946897506714, -0.4447443187236786, -0.3862939476966858, -0.3278435468673706, -0.2693931758403778, -0.21094278991222382, -0.15249240398406982, -0.09404203295707703, -0.035591647028923035, 0.022858738899230957, 0.08130910992622375, 0.13975951075553894, 0.19820988178253174, 0.25666025280952454, 0.3151106536388397, 0.3735610246658325, 0.4320114254951477, 0.4904617965221405, 0.5489121675491333, 0.6073625683784485, 0.6658129692077637, 0.7242633700370789, 0.7827137112617493, 0.8411641120910645, 0.8996145129203796, 0.9580649137496948, 1.0165152549743652, 1.0749657154083252, 1.133415937423706, 1.1918662786483765, 1.2503167390823364, 1.3087670803070068, 1.3672174215316772, 1.4256678819656372, 1.4841182231903076, 1.5425686836242676, 1.601019024848938, 1.6594693660736084, 1.7179198265075684, 1.7763701677322388, 1.8348205089569092, 1.8932709693908691, 1.9517213106155396, 2.01017165184021, 2.06862211227417]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 3.0, 9.0, 10.0, 12.0, 12.0, 11.0, 16.0, 12.0, 17.0, 16.0, 26.0, 29.0, 23.0, 46.0, 41.0, 36.0, 47.0, 58.0, 48.0, 60.0, 50.0, 54.0, 38.0, 33.0, 32.0, 40.0, 35.0, 29.0, 31.0, 16.0, 22.0, 17.0, 7.0, 13.0, 11.0, 6.0, 6.0, 5.0, 4.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0436985492706299, -1.0101770162582397, -0.9766553640365601, -0.9431338310241699, -0.909612238407135, -0.8760906457901001, -0.8425690531730652, -0.8090474605560303, -0.7755259275436401, -0.7420043349266052, -0.7084827423095703, -0.6749612092971802, -0.6414396166801453, -0.6079180240631104, -0.5743964314460754, -0.5408748388290405, -0.5073532462120056, -0.4738316535949707, -0.4403100907802582, -0.40678849816322327, -0.37326693534851074, -0.33974534273147583, -0.3062237501144409, -0.272702157497406, -0.23918059468269348, -0.20565901696681976, -0.17213743925094604, -0.13861584663391113, -0.10509426891803741, -0.0715726912021637, -0.038051098585128784, -0.004529520869255066, 0.028992056846618652, 0.06251363456249237, 0.09603521972894669, 0.129556804895401, 0.16307838261127472, 0.19659996032714844, 0.23012155294418335, 0.26364314556121826, 0.2971647083759308, 0.3306863009929657, 0.3642078638076782, 0.39772945642471313, 0.43125104904174805, 0.46477261185646057, 0.4982942044734955, 0.531815767288208, 0.5653373599052429, 0.5988589525222778, 0.6323805451393127, 0.6659021377563477, 0.6994236707687378, 0.7329452633857727, 0.7664668560028076, 0.7999884486198425, 0.8335100412368774, 0.8670316338539124, 0.9005532264709473, 0.9340747594833374, 0.9675963521003723, 1.0011179447174072, 1.034639596939087, 1.068161129951477, 1.1016826629638672]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 11.0, 12.0, 17.0, 22.0, 22.0, 44.0, 73.0, 107.0, 183.0, 345.0, 609.0, 1179.0, 2452.0, 5945.0, 15640.0, 44396.0, 145847.0, 420430.0, 282306.0, 84289.0, 27171.0, 9707.0, 4043.0, 1757.0, 813.0, 429.0, 257.0, 137.0, 100.0, 63.0, 52.0, 30.0, 19.0, 14.0, 12.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.2393798828125, -0.23287010192871094, -0.22636032104492188, -0.2198505401611328, -0.21334075927734375, -0.2068309783935547, -0.20032119750976562, -0.19381141662597656, -0.1873016357421875, -0.18079185485839844, -0.17428207397460938, -0.1677722930908203, -0.16126251220703125, -0.1547527313232422, -0.14824295043945312, -0.14173316955566406, -0.135223388671875, -0.12871360778808594, -0.12220382690429688, -0.11569404602050781, -0.10918426513671875, -0.10267448425292969, -0.09616470336914062, -0.08965492248535156, -0.0831451416015625, -0.07663536071777344, -0.07012557983398438, -0.06361579895019531, -0.05710601806640625, -0.05059623718261719, -0.044086456298828125, -0.03757667541503906, -0.03106689453125, -0.024557113647460938, -0.018047332763671875, -0.011537551879882812, -0.00502777099609375, 0.0014820098876953125, 0.007991790771484375, 0.014501571655273438, 0.0210113525390625, 0.027521133422851562, 0.034030914306640625, 0.04054069519042969, 0.04705047607421875, 0.05356025695800781, 0.060070037841796875, 0.06657981872558594, 0.073089599609375, 0.07959938049316406, 0.08610916137695312, 0.09261894226074219, 0.09912872314453125, 0.10563850402832031, 0.11214828491210938, 0.11865806579589844, 0.1251678466796875, 0.13167762756347656, 0.13818740844726562, 0.1446971893310547, 0.15120697021484375, 0.1577167510986328, 0.16422653198242188, 0.17073631286621094, 0.17724609375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 4.0, 5.0, 10.0, 13.0, 11.0, 13.0, 14.0, 11.0, 25.0, 29.0, 21.0, 19.0, 32.0, 33.0, 45.0, 42.0, 49.0, 42.0, 41.0, 37.0, 41.0, 39.0, 45.0, 40.0, 47.0, 48.0, 50.0, 21.0, 21.0, 24.0, 29.0, 14.0, 14.0, 18.0, 10.0, 7.0, 9.0, 4.0, 4.0, 7.0, 1.0, 1.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.125244140625, -0.12151622772216797, -0.11778831481933594, -0.1140604019165039, -0.11033248901367188, -0.10660457611083984, -0.10287666320800781, -0.09914875030517578, -0.09542083740234375, -0.09169292449951172, -0.08796501159667969, -0.08423709869384766, -0.08050918579101562, -0.0767812728881836, -0.07305335998535156, -0.06932544708251953, -0.0655975341796875, -0.06186962127685547, -0.05814170837402344, -0.054413795471191406, -0.050685882568359375, -0.046957969665527344, -0.04323005676269531, -0.03950214385986328, -0.03577423095703125, -0.03204631805419922, -0.028318405151367188, -0.024590492248535156, -0.020862579345703125, -0.017134666442871094, -0.013406753540039062, -0.009678840637207031, -0.005950927734375, -0.0022230148315429688, 0.0015048980712890625, 0.005232810974121094, 0.008960723876953125, 0.012688636779785156, 0.016416549682617188, 0.02014446258544922, 0.02387237548828125, 0.02760028839111328, 0.03132820129394531, 0.035056114196777344, 0.038784027099609375, 0.042511940002441406, 0.04623985290527344, 0.04996776580810547, 0.0536956787109375, 0.05742359161376953, 0.06115150451660156, 0.0648794174194336, 0.06860733032226562, 0.07233524322509766, 0.07606315612792969, 0.07979106903076172, 0.08351898193359375, 0.08724689483642578, 0.09097480773925781, 0.09470272064208984, 0.09843063354492188, 0.1021585464477539, 0.10588645935058594, 0.10961437225341797, 0.11334228515625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 8.0, 6.0, 2.0, 11.0, 9.0, 14.0, 21.0, 28.0, 51.0, 71.0, 91.0, 156.0, 209.0, 334.0, 418.0, 731.0, 1436.0, 3839.0, 15412.0, 103059.0, 762844.0, 133142.0, 18366.0, 4397.0, 1568.0, 782.0, 473.0, 331.0, 232.0, 157.0, 100.0, 73.0, 55.0, 41.0, 33.0, 11.0, 16.0, 13.0, 7.0, 8.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.40673828125, -0.3959083557128906, -0.38507843017578125, -0.3742485046386719, -0.3634185791015625, -0.3525886535644531, -0.34175872802734375, -0.3309288024902344, -0.320098876953125, -0.3092689514160156, -0.29843902587890625, -0.2876091003417969, -0.2767791748046875, -0.2659492492675781, -0.25511932373046875, -0.24428939819335938, -0.23345947265625, -0.22262954711914062, -0.21179962158203125, -0.20096969604492188, -0.1901397705078125, -0.17930984497070312, -0.16847991943359375, -0.15764999389648438, -0.146820068359375, -0.13599014282226562, -0.12516021728515625, -0.11433029174804688, -0.1035003662109375, -0.09267044067382812, -0.08184051513671875, -0.07101058959960938, -0.0601806640625, -0.049350738525390625, -0.03852081298828125, -0.027690887451171875, -0.0168609619140625, -0.006031036376953125, 0.00479888916015625, 0.015628814697265625, 0.026458740234375, 0.037288665771484375, 0.04811859130859375, 0.058948516845703125, 0.0697784423828125, 0.08060836791992188, 0.09143829345703125, 0.10226821899414062, 0.11309814453125, 0.12392807006835938, 0.13475799560546875, 0.14558792114257812, 0.1564178466796875, 0.16724777221679688, 0.17807769775390625, 0.18890762329101562, 0.199737548828125, 0.21056747436523438, 0.22139739990234375, 0.23222732543945312, 0.2430572509765625, 0.2538871765136719, 0.26471710205078125, 0.2755470275878906, 0.286376953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 11.0, 16.0, 12.0, 16.0, 20.0, 31.0, 23.0, 27.0, 34.0, 44.0, 54.0, 61.0, 49.0, 41.0, 65.0, 56.0, 60.0, 56.0, 49.0, 40.0, 59.0, 28.0, 26.0, 22.0, 25.0, 13.0, 9.0, 11.0, 9.0, 10.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.498291015625, -0.4828834533691406, -0.46747589111328125, -0.4520683288574219, -0.4366607666015625, -0.4212532043457031, -0.40584564208984375, -0.3904380798339844, -0.375030517578125, -0.3596229553222656, -0.34421539306640625, -0.3288078308105469, -0.3134002685546875, -0.2979927062988281, -0.28258514404296875, -0.2671775817871094, -0.25177001953125, -0.23636245727539062, -0.22095489501953125, -0.20554733276367188, -0.1901397705078125, -0.17473220825195312, -0.15932464599609375, -0.14391708374023438, -0.128509521484375, -0.11310195922851562, -0.09769439697265625, -0.08228683471679688, -0.0668792724609375, -0.051471710205078125, -0.03606414794921875, -0.020656585693359375, -0.0052490234375, 0.010158538818359375, 0.02556610107421875, 0.040973663330078125, 0.0563812255859375, 0.07178878784179688, 0.08719635009765625, 0.10260391235351562, 0.118011474609375, 0.13341903686523438, 0.14882659912109375, 0.16423416137695312, 0.1796417236328125, 0.19504928588867188, 0.21045684814453125, 0.22586441040039062, 0.24127197265625, 0.2566795349121094, 0.27208709716796875, 0.2874946594238281, 0.3029022216796875, 0.3183097839355469, 0.33371734619140625, 0.3491249084472656, 0.364532470703125, 0.3799400329589844, 0.39534759521484375, 0.4107551574707031, 0.4261627197265625, 0.4415702819824219, 0.45697784423828125, 0.4723854064941406, 0.48779296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 7.0, 6.0, 9.0, 23.0, 28.0, 41.0, 73.0, 89.0, 181.0, 303.0, 653.0, 1506.0, 4021.0, 13034.0, 55631.0, 615235.0, 296773.0, 44180.0, 10828.0, 3359.0, 1238.0, 582.0, 293.0, 156.0, 107.0, 61.0, 45.0, 21.0, 14.0, 18.0, 13.0, 6.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.083251953125, -0.08047008514404297, -0.07768821716308594, -0.0749063491821289, -0.07212448120117188, -0.06934261322021484, -0.06656074523925781, -0.06377887725830078, -0.06099700927734375, -0.05821514129638672, -0.05543327331542969, -0.052651405334472656, -0.049869537353515625, -0.047087669372558594, -0.04430580139160156, -0.04152393341064453, -0.0387420654296875, -0.03596019744873047, -0.03317832946777344, -0.030396461486816406, -0.027614593505859375, -0.024832725524902344, -0.022050857543945312, -0.01926898956298828, -0.01648712158203125, -0.013705253601074219, -0.010923385620117188, -0.008141517639160156, -0.005359649658203125, -0.0025777816772460938, 0.0002040863037109375, 0.0029859542846679688, 0.005767822265625, 0.008549690246582031, 0.011331558227539062, 0.014113426208496094, 0.016895294189453125, 0.019677162170410156, 0.022459030151367188, 0.02524089813232422, 0.02802276611328125, 0.03080463409423828, 0.03358650207519531, 0.036368370056152344, 0.039150238037109375, 0.041932106018066406, 0.04471397399902344, 0.04749584197998047, 0.0502777099609375, 0.05305957794189453, 0.05584144592285156, 0.058623313903808594, 0.061405181884765625, 0.06418704986572266, 0.06696891784667969, 0.06975078582763672, 0.07253265380859375, 0.07531452178955078, 0.07809638977050781, 0.08087825775146484, 0.08366012573242188, 0.0864419937133789, 0.08922386169433594, 0.09200572967529297, 0.09478759765625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 13.0, 9.0, 15.0, 20.0, 25.0, 34.0, 29.0, 49.0, 51.0, 84.0, 99.0, 98.0, 108.0, 81.0, 75.0, 46.0, 32.0, 29.0, 25.0, 16.0, 12.0, 10.0, 12.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1604042053222656e-05, -4.014279693365097e-05, -3.8681551814079285e-05, -3.72203066945076e-05, -3.575906157493591e-05, -3.429781645536423e-05, -3.283657133579254e-05, -3.1375326216220856e-05, -2.991408109664917e-05, -2.8452835977077484e-05, -2.69915908575058e-05, -2.5530345737934113e-05, -2.4069100618362427e-05, -2.260785549879074e-05, -2.1146610379219055e-05, -1.968536525964737e-05, -1.8224120140075684e-05, -1.6762875020503998e-05, -1.5301629900932312e-05, -1.3840384781360626e-05, -1.237913966178894e-05, -1.0917894542217255e-05, -9.456649422645569e-06, -7.995404303073883e-06, -6.534159183502197e-06, -5.0729140639305115e-06, -3.6116689443588257e-06, -2.15042382478714e-06, -6.891787052154541e-07, 7.720664143562317e-07, 2.2333115339279175e-06, 3.6945566534996033e-06, 5.155801773071289e-06, 6.617046892642975e-06, 8.07829201221466e-06, 9.539537131786346e-06, 1.1000782251358032e-05, 1.2462027370929718e-05, 1.3923272490501404e-05, 1.538451761007309e-05, 1.6845762729644775e-05, 1.830700784921646e-05, 1.9768252968788147e-05, 2.1229498088359833e-05, 2.269074320793152e-05, 2.4151988327503204e-05, 2.561323344707489e-05, 2.7074478566646576e-05, 2.8535723686218262e-05, 2.9996968805789948e-05, 3.145821392536163e-05, 3.291945904493332e-05, 3.4380704164505005e-05, 3.584194928407669e-05, 3.7303194403648376e-05, 3.876443952322006e-05, 4.022568464279175e-05, 4.1686929762363434e-05, 4.314817488193512e-05, 4.4609420001506805e-05, 4.607066512107849e-05, 4.753191024065018e-05, 4.899315536022186e-05, 5.045440047979355e-05, 5.1915645599365234e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 7.0, 6.0, 6.0, 8.0, 7.0, 14.0, 16.0, 23.0, 41.0, 38.0, 54.0, 94.0, 123.0, 201.0, 274.0, 503.0, 891.0, 1739.0, 3771.0, 9417.0, 27591.0, 103137.0, 644310.0, 188116.0, 44067.0, 13693.0, 5264.0, 2327.0, 1118.0, 646.0, 348.0, 217.0, 147.0, 95.0, 75.0, 48.0, 34.0, 24.0, 15.0, 19.0, 8.0, 8.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0], "bins": [-0.0816650390625, -0.07943916320800781, -0.07721328735351562, -0.07498741149902344, -0.07276153564453125, -0.07053565979003906, -0.06830978393554688, -0.06608390808105469, -0.0638580322265625, -0.06163215637207031, -0.059406280517578125, -0.05718040466308594, -0.05495452880859375, -0.05272865295410156, -0.050502777099609375, -0.04827690124511719, -0.046051025390625, -0.04382514953613281, -0.041599273681640625, -0.03937339782714844, -0.03714752197265625, -0.03492164611816406, -0.032695770263671875, -0.030469894409179688, -0.0282440185546875, -0.026018142700195312, -0.023792266845703125, -0.021566390991210938, -0.01934051513671875, -0.017114639282226562, -0.014888763427734375, -0.012662887573242188, -0.01043701171875, -0.008211135864257812, -0.005985260009765625, -0.0037593841552734375, -0.00153350830078125, 0.0006923675537109375, 0.002918243408203125, 0.0051441192626953125, 0.0073699951171875, 0.009595870971679688, 0.011821746826171875, 0.014047622680664062, 0.01627349853515625, 0.018499374389648438, 0.020725250244140625, 0.022951126098632812, 0.025177001953125, 0.027402877807617188, 0.029628753662109375, 0.03185462951660156, 0.03408050537109375, 0.03630638122558594, 0.038532257080078125, 0.04075813293457031, 0.0429840087890625, 0.04520988464355469, 0.047435760498046875, 0.04966163635253906, 0.05188751220703125, 0.05411338806152344, 0.056339263916015625, 0.05856513977050781, 0.060791015625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 8.0, 8.0, 11.0, 9.0, 16.0, 7.0, 17.0, 23.0, 16.0, 35.0, 49.0, 50.0, 68.0, 72.0, 91.0, 78.0, 68.0, 73.0, 60.0, 35.0, 35.0, 29.0, 27.0, 21.0, 13.0, 10.0, 9.0, 9.0, 8.0, 7.0, 4.0, 7.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07476806640625, -0.07243919372558594, -0.07011032104492188, -0.06778144836425781, -0.06545257568359375, -0.06312370300292969, -0.060794830322265625, -0.05846595764160156, -0.0561370849609375, -0.05380821228027344, -0.051479339599609375, -0.04915046691894531, -0.04682159423828125, -0.04449272155761719, -0.042163848876953125, -0.03983497619628906, -0.037506103515625, -0.03517723083496094, -0.032848358154296875, -0.030519485473632812, -0.02819061279296875, -0.025861740112304688, -0.023532867431640625, -0.021203994750976562, -0.0188751220703125, -0.016546249389648438, -0.014217376708984375, -0.011888504028320312, -0.00955963134765625, -0.0072307586669921875, -0.004901885986328125, -0.0025730133056640625, -0.000244140625, 0.0020847320556640625, 0.004413604736328125, 0.0067424774169921875, 0.00907135009765625, 0.011400222778320312, 0.013729095458984375, 0.016057968139648438, 0.0183868408203125, 0.020715713500976562, 0.023044586181640625, 0.025373458862304688, 0.02770233154296875, 0.030031204223632812, 0.032360076904296875, 0.03468894958496094, 0.037017822265625, 0.03934669494628906, 0.041675567626953125, 0.04400444030761719, 0.04633331298828125, 0.04866218566894531, 0.050991058349609375, 0.05331993103027344, 0.0556488037109375, 0.05797767639160156, 0.060306549072265625, 0.06263542175292969, 0.06496429443359375, 0.06729316711425781, 0.06962203979492188, 0.07195091247558594, 0.07427978515625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 16.0, 28.0, 56.0, 131.0, 197.0, 319.0, 122.0, 49.0, 27.0, 10.0, 11.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7548468112945557, -3.6754565238952637, -3.596066474914551, -3.516676187515259, -3.437285900115967, -3.357895851135254, -3.278505563735962, -3.19911527633667, -3.119725227355957, -3.040334939956665, -2.960944890975952, -2.88155460357666, -2.802164316177368, -2.722774028778076, -2.6433839797973633, -2.5639936923980713, -2.4846034049987793, -2.4052131175994873, -2.3258230686187744, -2.2464327812194824, -2.1670424938201904, -2.0876522064208984, -2.0082621574401855, -1.9288718700408936, -1.8494817018508911, -1.7700915336608887, -1.6907012462615967, -1.6113110780715942, -1.5319209098815918, -1.4525306224822998, -1.3731404542922974, -1.293750286102295, -1.2143598794937134, -1.134969711303711, -1.055579423904419, -0.9761892557144165, -0.8967990279197693, -0.8174088001251221, -0.7380186319351196, -0.6586284041404724, -0.5792381763458252, -0.499847948551178, -0.42045775055885315, -0.3410675525665283, -0.2616773247718811, -0.1822870969772339, -0.10289689898490906, -0.02350670099258423, 0.05588352680206299, 0.135273739695549, 0.21466395258903503, 0.29405415058135986, 0.3734443783760071, 0.4528346061706543, 0.5322247743606567, 0.611615002155304, 0.6910052299499512, 0.7703954577445984, 0.8497856855392456, 0.929175853729248, 1.00856614112854, 1.0879563093185425, 1.167346477508545, 1.246736764907837, 1.3261269330978394]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 8.0, 3.0, 4.0, 6.0, 10.0, 10.0, 15.0, 14.0, 13.0, 22.0, 23.0, 22.0, 25.0, 27.0, 26.0, 33.0, 32.0, 39.0, 48.0, 69.0, 82.0, 73.0, 68.0, 35.0, 32.0, 33.0, 25.0, 23.0, 28.0, 24.0, 20.0, 18.0, 15.0, 11.0, 15.0, 16.0, 6.0, 10.0, 3.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4711780548095703, -1.426309585571289, -1.3814411163330078, -1.3365726470947266, -1.2917041778564453, -1.2468358278274536, -1.2019673585891724, -1.1570988893508911, -1.1122304201126099, -1.0673619508743286, -1.0224934816360474, -0.9776250720024109, -0.9327566027641296, -0.8878881335258484, -0.8430197238922119, -0.7981512546539307, -0.7532827854156494, -0.7084143161773682, -0.6635458469390869, -0.6186774373054504, -0.5738089680671692, -0.5289404988288879, -0.4840720593929291, -0.4392036199569702, -0.39433515071868896, -0.3494666814804077, -0.30459824204444885, -0.25972980260849, -0.21486133337020874, -0.16999287903308868, -0.12512442469596863, -0.08025598526000977, -0.035387635231018066, 0.00948081910610199, 0.054349273443222046, 0.0992177277803421, 0.14408618211746216, 0.18895463645458221, 0.23382309079170227, 0.27869153022766113, 0.3235599994659424, 0.36842846870422363, 0.4132969081401825, 0.45816534757614136, 0.5030338168144226, 0.5479022860527039, 0.5927706956863403, 0.6376391649246216, 0.6825076341629028, 0.7273761034011841, 0.7722445726394653, 0.8171129822731018, 0.8619814515113831, 0.9068499207496643, 0.9517183303833008, 0.996586799621582, 1.0414552688598633, 1.0863237380981445, 1.1311922073364258, 1.176060676574707, 1.2209291458129883, 1.26579749584198, 1.3106659650802612, 1.3555344343185425, 1.4004029035568237]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 11.0, 11.0, 20.0, 27.0, 29.0, 71.0, 91.0, 166.0, 319.0, 587.0, 1317.0, 2996.0, 7863.0, 26676.0, 130377.0, 875849.0, 2441007.0, 585033.0, 89862.0, 20577.0, 6609.0, 2564.0, 1075.0, 511.0, 270.0, 152.0, 73.0, 57.0, 25.0, 29.0, 7.0, 2.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.1599445343017578, -0.15485000610351562, -0.14975547790527344, -0.14466094970703125, -0.13956642150878906, -0.13447189331054688, -0.1293773651123047, -0.1242828369140625, -0.11918830871582031, -0.11409378051757812, -0.10899925231933594, -0.10390472412109375, -0.09881019592285156, -0.09371566772460938, -0.08862113952636719, -0.083526611328125, -0.07843208312988281, -0.07333755493164062, -0.06824302673339844, -0.06314849853515625, -0.05805397033691406, -0.052959442138671875, -0.04786491394042969, -0.0427703857421875, -0.03767585754394531, -0.032581329345703125, -0.027486801147460938, -0.02239227294921875, -0.017297744750976562, -0.012203216552734375, -0.0071086883544921875, -0.00201416015625, 0.0030803680419921875, 0.008174896240234375, 0.013269424438476562, 0.01836395263671875, 0.023458480834960938, 0.028553009033203125, 0.03364753723144531, 0.0387420654296875, 0.04383659362792969, 0.048931121826171875, 0.05402565002441406, 0.05912017822265625, 0.06421470642089844, 0.06930923461914062, 0.07440376281738281, 0.079498291015625, 0.08459281921386719, 0.08968734741210938, 0.09478187561035156, 0.09987640380859375, 0.10497093200683594, 0.11006546020507812, 0.11515998840332031, 0.1202545166015625, 0.1253490447998047, 0.13044357299804688, 0.13553810119628906, 0.14063262939453125, 0.14572715759277344, 0.15082168579101562, 0.1559162139892578, 0.1610107421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 3.0, 6.0, 6.0, 4.0, 13.0, 19.0, 15.0, 19.0, 26.0, 33.0, 34.0, 31.0, 35.0, 52.0, 46.0, 42.0, 45.0, 40.0, 52.0, 48.0, 57.0, 49.0, 42.0, 38.0, 41.0, 40.0, 22.0, 14.0, 30.0, 25.0, 13.0, 15.0, 7.0, 16.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12139892578125, -0.11739826202392578, -0.11339759826660156, -0.10939693450927734, -0.10539627075195312, -0.1013956069946289, -0.09739494323730469, -0.09339427947998047, -0.08939361572265625, -0.08539295196533203, -0.08139228820800781, -0.0773916244506836, -0.07339096069335938, -0.06939029693603516, -0.06538963317871094, -0.06138896942138672, -0.0573883056640625, -0.05338764190673828, -0.04938697814941406, -0.045386314392089844, -0.041385650634765625, -0.037384986877441406, -0.03338432312011719, -0.02938365936279297, -0.02538299560546875, -0.02138233184814453, -0.017381668090820312, -0.013381004333496094, -0.009380340576171875, -0.005379676818847656, -0.0013790130615234375, 0.0026216506958007812, 0.006622314453125, 0.010622978210449219, 0.014623641967773438, 0.018624305725097656, 0.022624969482421875, 0.026625633239746094, 0.030626296997070312, 0.03462696075439453, 0.03862762451171875, 0.04262828826904297, 0.04662895202636719, 0.050629615783691406, 0.054630279541015625, 0.058630943298339844, 0.06263160705566406, 0.06663227081298828, 0.0706329345703125, 0.07463359832763672, 0.07863426208496094, 0.08263492584228516, 0.08663558959960938, 0.0906362533569336, 0.09463691711425781, 0.09863758087158203, 0.10263824462890625, 0.10663890838623047, 0.11063957214355469, 0.1146402359008789, 0.11864089965820312, 0.12264156341552734, 0.12664222717285156, 0.13064289093017578, 0.1346435546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 3.0, 9.0, 8.0, 11.0, 22.0, 16.0, 45.0, 72.0, 139.0, 263.0, 618.0, 2049.0, 10423.0, 169762.0, 3811780.0, 185194.0, 10683.0, 1900.0, 660.0, 271.0, 147.0, 68.0, 45.0, 41.0, 17.0, 11.0, 7.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3447265625, -0.33304595947265625, -0.3213653564453125, -0.30968475341796875, -0.298004150390625, -0.28632354736328125, -0.2746429443359375, -0.26296234130859375, -0.25128173828125, -0.23960113525390625, -0.2279205322265625, -0.21623992919921875, -0.204559326171875, -0.19287872314453125, -0.1811981201171875, -0.16951751708984375, -0.1578369140625, -0.14615631103515625, -0.1344757080078125, -0.12279510498046875, -0.111114501953125, -0.09943389892578125, -0.0877532958984375, -0.07607269287109375, -0.06439208984375, -0.05271148681640625, -0.0410308837890625, -0.02935028076171875, -0.017669677734375, -0.00598907470703125, 0.0056915283203125, 0.01737213134765625, 0.029052734375, 0.04073333740234375, 0.0524139404296875, 0.06409454345703125, 0.075775146484375, 0.08745574951171875, 0.0991363525390625, 0.11081695556640625, 0.12249755859375, 0.13417816162109375, 0.1458587646484375, 0.15753936767578125, 0.169219970703125, 0.18090057373046875, 0.1925811767578125, 0.20426177978515625, 0.2159423828125, 0.22762298583984375, 0.2393035888671875, 0.25098419189453125, 0.262664794921875, 0.27434539794921875, 0.2860260009765625, 0.29770660400390625, 0.30938720703125, 0.32106781005859375, 0.3327484130859375, 0.34442901611328125, 0.356109619140625, 0.36779022216796875, 0.3794708251953125, 0.39115142822265625, 0.40283203125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 12.0, 8.0, 12.0, 23.0, 18.0, 25.0, 41.0, 53.0, 77.0, 107.0, 167.0, 219.0, 346.0, 428.0, 559.0, 547.0, 447.0, 293.0, 187.0, 151.0, 106.0, 68.0, 50.0, 28.0, 29.0, 16.0, 13.0, 5.0, 5.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177978515625, -0.17136573791503906, -0.16475296020507812, -0.1581401824951172, -0.15152740478515625, -0.1449146270751953, -0.13830184936523438, -0.13168907165527344, -0.1250762939453125, -0.11846351623535156, -0.11185073852539062, -0.10523796081542969, -0.09862518310546875, -0.09201240539550781, -0.08539962768554688, -0.07878684997558594, -0.072174072265625, -0.06556129455566406, -0.058948516845703125, -0.05233573913574219, -0.04572296142578125, -0.03911018371582031, -0.032497406005859375, -0.025884628295898438, -0.0192718505859375, -0.012659072875976562, -0.006046295166015625, 0.0005664825439453125, 0.00717926025390625, 0.013792037963867188, 0.020404815673828125, 0.027017593383789062, 0.03363037109375, 0.04024314880371094, 0.046855926513671875, 0.05346870422363281, 0.06008148193359375, 0.06669425964355469, 0.07330703735351562, 0.07991981506347656, 0.0865325927734375, 0.09314537048339844, 0.09975814819335938, 0.10637092590332031, 0.11298370361328125, 0.11959648132324219, 0.12620925903320312, 0.13282203674316406, 0.139434814453125, 0.14604759216308594, 0.15266036987304688, 0.1592731475830078, 0.16588592529296875, 0.1724987030029297, 0.17911148071289062, 0.18572425842285156, 0.1923370361328125, 0.19894981384277344, 0.20556259155273438, 0.2121753692626953, 0.21878814697265625, 0.2254009246826172, 0.23201370239257812, 0.23862648010253906, 0.2452392578125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 10.0, 32.0, 88.0, 236.0, 311.0, 203.0, 67.0, 29.0, 9.0, 10.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.481540679931641, -6.35811710357666, -6.234694004058838, -6.111270427703857, -5.987846851348877, -5.864423751831055, -5.741000175476074, -5.617576599121094, -5.494153022766113, -5.370729446411133, -5.2473063468933105, -5.12388277053833, -5.00045919418335, -4.877036094665527, -4.753612518310547, -4.630188941955566, -4.506765842437744, -4.383342266082764, -4.259919166564941, -4.136495590209961, -4.0130720138549805, -3.889648675918579, -3.7662253379821777, -3.6428017616271973, -3.519378185272217, -3.3959548473358154, -3.272531270980835, -3.1491079330444336, -3.025684356689453, -2.9022610187530518, -2.7788376808166504, -2.65541410446167, -2.5319910049438477, -2.4085676670074463, -2.285144090652466, -2.1617207527160645, -2.038297176361084, -1.9148738384246826, -1.7914503812789917, -1.6680269241333008, -1.5446033477783203, -1.4211798906326294, -1.2977564334869385, -1.174333095550537, -1.0509096384048462, -0.9274861812591553, -0.8040627241134644, -0.6806393265724182, -0.5572159290313721, -0.43379250168800354, -0.310369074344635, -0.1869456171989441, -0.06352218985557556, 0.05990123748779297, 0.1833246946334839, 0.30674809217453003, 0.43017154932022095, 0.5535950064659119, 0.677018404006958, 0.8004418611526489, 0.9238653182983398, 1.0472886562347412, 1.1707122325897217, 1.294135570526123, 1.417559027671814]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 2.0, 2.0, 6.0, 6.0, 4.0, 7.0, 19.0, 13.0, 16.0, 25.0, 21.0, 23.0, 33.0, 36.0, 31.0, 32.0, 40.0, 54.0, 46.0, 38.0, 42.0, 43.0, 46.0, 59.0, 37.0, 35.0, 33.0, 20.0, 34.0, 19.0, 23.0, 26.0, 18.0, 20.0, 18.0, 12.0, 9.0, 8.0, 8.0, 7.0, 2.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0951546430587769, -1.0612988471984863, -1.0274431705474854, -0.9935874342918396, -0.9597316980361938, -0.9258759021759033, -0.8920201659202576, -0.8581644296646118, -0.8243086934089661, -0.7904529571533203, -0.7565972208976746, -0.7227414846420288, -0.6888856887817383, -0.6550300121307373, -0.6211742162704468, -0.587318480014801, -0.5534627437591553, -0.5196070075035095, -0.48575127124786377, -0.45189550518989563, -0.4180397689342499, -0.3841840326786041, -0.350328266620636, -0.31647253036499023, -0.2826167941093445, -0.24876105785369873, -0.21490530669689178, -0.18104955554008484, -0.1471938192844391, -0.11333808302879333, -0.07948233187198639, -0.04562658071517944, -0.011770963668823242, 0.022084780037403107, 0.055940523743629456, 0.0897962674498558, 0.12365201115608215, 0.1575077474117279, 0.19136349856853485, 0.2252192497253418, 0.25907498598098755, 0.2929307222366333, 0.32678645849227905, 0.3606422245502472, 0.39449796080589294, 0.4283536970615387, 0.46220946311950684, 0.4960651993751526, 0.5299209356307983, 0.5637766718864441, 0.5976324081420898, 0.6314881443977356, 0.6653438806533813, 0.6991996765136719, 0.7330554127693176, 0.7669111490249634, 0.8007668852806091, 0.8346226215362549, 0.8684783577919006, 0.9023340940475464, 0.9361898899078369, 0.9700455665588379, 1.0039013624191284, 1.037757158279419, 1.07161283493042]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 11.0, 17.0, 17.0, 23.0, 36.0, 60.0, 79.0, 128.0, 204.0, 310.0, 550.0, 920.0, 1756.0, 3378.0, 7144.0, 16516.0, 43323.0, 139122.0, 432123.0, 275467.0, 78529.0, 27158.0, 11053.0, 4987.0, 2499.0, 1293.0, 713.0, 405.0, 243.0, 170.0, 103.0, 69.0, 57.0, 22.0, 16.0, 14.0, 8.0, 12.0, 4.0, 4.0, 3.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19873046875, -0.19182205200195312, -0.18491363525390625, -0.17800521850585938, -0.1710968017578125, -0.16418838500976562, -0.15727996826171875, -0.15037155151367188, -0.143463134765625, -0.13655471801757812, -0.12964630126953125, -0.12273788452148438, -0.1158294677734375, -0.10892105102539062, -0.10201263427734375, -0.09510421752929688, -0.08819580078125, -0.08128738403320312, -0.07437896728515625, -0.06747055053710938, -0.0605621337890625, -0.053653717041015625, -0.04674530029296875, -0.039836883544921875, -0.032928466796875, -0.026020050048828125, -0.01911163330078125, -0.012203216552734375, -0.0052947998046875, 0.001613616943359375, 0.00852203369140625, 0.015430450439453125, 0.0223388671875, 0.029247283935546875, 0.03615570068359375, 0.043064117431640625, 0.0499725341796875, 0.056880950927734375, 0.06378936767578125, 0.07069778442382812, 0.077606201171875, 0.08451461791992188, 0.09142303466796875, 0.09833145141601562, 0.1052398681640625, 0.11214828491210938, 0.11905670166015625, 0.12596511840820312, 0.13287353515625, 0.13978195190429688, 0.14669036865234375, 0.15359878540039062, 0.1605072021484375, 0.16741561889648438, 0.17432403564453125, 0.18123245239257812, 0.188140869140625, 0.19504928588867188, 0.20195770263671875, 0.20886611938476562, 0.2157745361328125, 0.22268295288085938, 0.22959136962890625, 0.23649978637695312, 0.243408203125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 15.0, 12.0, 14.0, 19.0, 16.0, 27.0, 36.0, 41.0, 29.0, 53.0, 60.0, 58.0, 36.0, 40.0, 44.0, 46.0, 45.0, 50.0, 40.0, 48.0, 32.0, 51.0, 26.0, 28.0, 16.0, 19.0, 24.0, 14.0, 8.0, 10.0, 8.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1259765625, -0.12186050415039062, -0.11774444580078125, -0.11362838745117188, -0.1095123291015625, -0.10539627075195312, -0.10128021240234375, -0.09716415405273438, -0.093048095703125, -0.08893203735351562, -0.08481597900390625, -0.08069992065429688, -0.0765838623046875, -0.07246780395507812, -0.06835174560546875, -0.06423568725585938, -0.06011962890625, -0.056003570556640625, -0.05188751220703125, -0.047771453857421875, -0.0436553955078125, -0.039539337158203125, -0.03542327880859375, -0.031307220458984375, -0.027191162109375, -0.023075103759765625, -0.01895904541015625, -0.014842987060546875, -0.0107269287109375, -0.006610870361328125, -0.00249481201171875, 0.001621246337890625, 0.0057373046875, 0.009853363037109375, 0.01396942138671875, 0.018085479736328125, 0.0222015380859375, 0.026317596435546875, 0.03043365478515625, 0.034549713134765625, 0.038665771484375, 0.042781829833984375, 0.04689788818359375, 0.051013946533203125, 0.0551300048828125, 0.059246063232421875, 0.06336212158203125, 0.06747817993164062, 0.07159423828125, 0.07571029663085938, 0.07982635498046875, 0.08394241333007812, 0.0880584716796875, 0.09217453002929688, 0.09629058837890625, 0.10040664672851562, 0.104522705078125, 0.10863876342773438, 0.11275482177734375, 0.11687088012695312, 0.1209869384765625, 0.12510299682617188, 0.12921905517578125, 0.13333511352539062, 0.137451171875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 7.0, 8.0, 24.0, 18.0, 25.0, 30.0, 59.0, 85.0, 137.0, 188.0, 294.0, 446.0, 764.0, 1492.0, 3979.0, 23973.0, 824432.0, 176067.0, 10998.0, 2606.0, 1220.0, 575.0, 374.0, 255.0, 154.0, 116.0, 73.0, 49.0, 27.0, 24.0, 14.0, 8.0, 7.0, 9.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58544921875, -0.568634033203125, -0.55181884765625, -0.535003662109375, -0.5181884765625, -0.501373291015625, -0.48455810546875, -0.467742919921875, -0.450927734375, -0.434112548828125, -0.41729736328125, -0.400482177734375, -0.3836669921875, -0.366851806640625, -0.35003662109375, -0.333221435546875, -0.31640625, -0.299591064453125, -0.28277587890625, -0.265960693359375, -0.2491455078125, -0.232330322265625, -0.21551513671875, -0.198699951171875, -0.181884765625, -0.165069580078125, -0.14825439453125, -0.131439208984375, -0.1146240234375, -0.097808837890625, -0.08099365234375, -0.064178466796875, -0.04736328125, -0.030548095703125, -0.01373291015625, 0.003082275390625, 0.0198974609375, 0.036712646484375, 0.05352783203125, 0.070343017578125, 0.087158203125, 0.103973388671875, 0.12078857421875, 0.137603759765625, 0.1544189453125, 0.171234130859375, 0.18804931640625, 0.204864501953125, 0.2216796875, 0.238494873046875, 0.25531005859375, 0.272125244140625, 0.2889404296875, 0.305755615234375, 0.32257080078125, 0.339385986328125, 0.356201171875, 0.373016357421875, 0.38983154296875, 0.406646728515625, 0.4234619140625, 0.440277099609375, 0.45709228515625, 0.473907470703125, 0.49072265625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 1.0, 8.0, 11.0, 11.0, 24.0, 16.0, 24.0, 28.0, 42.0, 44.0, 69.0, 65.0, 84.0, 78.0, 80.0, 78.0, 64.0, 64.0, 40.0, 31.0, 32.0, 22.0, 31.0, 18.0, 6.0, 13.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6904296875, -0.6700286865234375, -0.649627685546875, -0.6292266845703125, -0.60882568359375, -0.5884246826171875, -0.568023681640625, -0.5476226806640625, -0.5272216796875, -0.5068206787109375, -0.486419677734375, -0.4660186767578125, -0.44561767578125, -0.4252166748046875, -0.404815673828125, -0.3844146728515625, -0.364013671875, -0.3436126708984375, -0.323211669921875, -0.3028106689453125, -0.28240966796875, -0.2620086669921875, -0.241607666015625, -0.2212066650390625, -0.2008056640625, -0.1804046630859375, -0.160003662109375, -0.1396026611328125, -0.11920166015625, -0.0988006591796875, -0.078399658203125, -0.0579986572265625, -0.03759765625, -0.0171966552734375, 0.003204345703125, 0.0236053466796875, 0.04400634765625, 0.0644073486328125, 0.084808349609375, 0.1052093505859375, 0.1256103515625, 0.1460113525390625, 0.166412353515625, 0.1868133544921875, 0.20721435546875, 0.2276153564453125, 0.248016357421875, 0.2684173583984375, 0.288818359375, 0.3092193603515625, 0.329620361328125, 0.3500213623046875, 0.37042236328125, 0.3908233642578125, 0.411224365234375, 0.4316253662109375, 0.4520263671875, 0.4724273681640625, 0.492828369140625, 0.5132293701171875, 0.53363037109375, 0.5540313720703125, 0.574432373046875, 0.5948333740234375, 0.615234375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 6.0, 7.0, 12.0, 12.0, 21.0, 9.0, 28.0, 32.0, 48.0, 49.0, 80.0, 104.0, 155.0, 272.0, 542.0, 1153.0, 2923.0, 8969.0, 47872.0, 833103.0, 129196.0, 16082.0, 4518.0, 1633.0, 686.0, 359.0, 208.0, 126.0, 103.0, 49.0, 48.0, 30.0, 21.0, 23.0, 9.0, 5.0, 8.0, 9.0, 5.0, 8.0, 8.0, 4.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.12200927734375, -0.11849308013916016, -0.11497688293457031, -0.11146068572998047, -0.10794448852539062, -0.10442829132080078, -0.10091209411621094, -0.0973958969116211, -0.09387969970703125, -0.0903635025024414, -0.08684730529785156, -0.08333110809326172, -0.07981491088867188, -0.07629871368408203, -0.07278251647949219, -0.06926631927490234, -0.0657501220703125, -0.062233924865722656, -0.05871772766113281, -0.05520153045654297, -0.051685333251953125, -0.04816913604736328, -0.04465293884277344, -0.041136741638183594, -0.03762054443359375, -0.034104347229003906, -0.030588150024414062, -0.02707195281982422, -0.023555755615234375, -0.02003955841064453, -0.016523361206054688, -0.013007164001464844, -0.009490966796875, -0.005974769592285156, -0.0024585723876953125, 0.0010576248168945312, 0.004573822021484375, 0.008090019226074219, 0.011606216430664062, 0.015122413635253906, 0.01863861083984375, 0.022154808044433594, 0.025671005249023438, 0.02918720245361328, 0.032703399658203125, 0.03621959686279297, 0.03973579406738281, 0.043251991271972656, 0.0467681884765625, 0.050284385681152344, 0.05380058288574219, 0.05731678009033203, 0.060832977294921875, 0.06434917449951172, 0.06786537170410156, 0.0713815689086914, 0.07489776611328125, 0.0784139633178711, 0.08193016052246094, 0.08544635772705078, 0.08896255493164062, 0.09247875213623047, 0.09599494934082031, 0.09951114654541016, 0.10302734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 11.0, 5.0, 9.0, 17.0, 9.0, 22.0, 30.0, 32.0, 39.0, 71.0, 76.0, 94.0, 101.0, 100.0, 82.0, 61.0, 55.0, 36.0, 22.0, 28.0, 15.0, 13.0, 14.0, 2.0, 7.0, 10.0, 4.0, 0.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.3272972106933594e-05, -4.1985884308815e-05, -4.069879651069641e-05, -3.941170871257782e-05, -3.812462091445923e-05, -3.683753311634064e-05, -3.5550445318222046e-05, -3.4263357520103455e-05, -3.297626972198486e-05, -3.168918192386627e-05, -3.040209412574768e-05, -2.911500632762909e-05, -2.7827918529510498e-05, -2.6540830731391907e-05, -2.5253742933273315e-05, -2.3966655135154724e-05, -2.2679567337036133e-05, -2.139247953891754e-05, -2.010539174079895e-05, -1.881830394268036e-05, -1.7531216144561768e-05, -1.6244128346443176e-05, -1.4957040548324585e-05, -1.3669952750205994e-05, -1.2382864952087402e-05, -1.1095777153968811e-05, -9.80868935585022e-06, -8.521601557731628e-06, -7.234513759613037e-06, -5.947425961494446e-06, -4.6603381633758545e-06, -3.373250365257263e-06, -2.086162567138672e-06, -7.990747690200806e-07, 4.880130290985107e-07, 1.775100827217102e-06, 3.0621886253356934e-06, 4.349276423454285e-06, 5.636364221572876e-06, 6.923452019691467e-06, 8.210539817810059e-06, 9.49762761592865e-06, 1.0784715414047241e-05, 1.2071803212165833e-05, 1.3358891010284424e-05, 1.4645978808403015e-05, 1.5933066606521606e-05, 1.7220154404640198e-05, 1.850724220275879e-05, 1.979433000087738e-05, 2.108141779899597e-05, 2.2368505597114563e-05, 2.3655593395233154e-05, 2.4942681193351746e-05, 2.6229768991470337e-05, 2.7516856789588928e-05, 2.880394458770752e-05, 3.009103238582611e-05, 3.13781201839447e-05, 3.2665207982063293e-05, 3.3952295780181885e-05, 3.5239383578300476e-05, 3.652647137641907e-05, 3.781355917453766e-05, 3.910064697265625e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 6.0, 9.0, 6.0, 16.0, 18.0, 28.0, 26.0, 41.0, 97.0, 135.0, 182.0, 281.0, 487.0, 849.0, 1697.0, 3846.0, 10209.0, 40918.0, 599272.0, 335547.0, 38014.0, 9588.0, 3607.0, 1572.0, 782.0, 451.0, 276.0, 190.0, 116.0, 71.0, 52.0, 32.0, 33.0, 26.0, 21.0, 8.0, 7.0, 7.0, 8.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07366943359375, -0.07103633880615234, -0.06840324401855469, -0.06577014923095703, -0.06313705444335938, -0.06050395965576172, -0.05787086486816406, -0.055237770080566406, -0.05260467529296875, -0.049971580505371094, -0.04733848571777344, -0.04470539093017578, -0.042072296142578125, -0.03943920135498047, -0.03680610656738281, -0.034173011779785156, -0.0315399169921875, -0.028906822204589844, -0.026273727416992188, -0.02364063262939453, -0.021007537841796875, -0.01837444305419922, -0.015741348266601562, -0.013108253479003906, -0.01047515869140625, -0.007842063903808594, -0.0052089691162109375, -0.0025758743286132812, 5.7220458984375e-05, 0.0026903152465820312, 0.0053234100341796875, 0.007956504821777344, 0.010589599609375, 0.013222694396972656, 0.015855789184570312, 0.01848888397216797, 0.021121978759765625, 0.02375507354736328, 0.026388168334960938, 0.029021263122558594, 0.03165435791015625, 0.034287452697753906, 0.03692054748535156, 0.03955364227294922, 0.042186737060546875, 0.04481983184814453, 0.04745292663574219, 0.050086021423339844, 0.0527191162109375, 0.055352210998535156, 0.05798530578613281, 0.06061840057373047, 0.06325149536132812, 0.06588459014892578, 0.06851768493652344, 0.0711507797241211, 0.07378387451171875, 0.0764169692993164, 0.07905006408691406, 0.08168315887451172, 0.08431625366210938, 0.08694934844970703, 0.08958244323730469, 0.09221553802490234, 0.0948486328125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 9.0, 2.0, 6.0, 10.0, 16.0, 19.0, 20.0, 27.0, 31.0, 34.0, 54.0, 58.0, 71.0, 91.0, 84.0, 82.0, 89.0, 59.0, 42.0, 39.0, 40.0, 17.0, 22.0, 15.0, 11.0, 9.0, 6.0, 5.0, 3.0, 6.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06292724609375, -0.060718536376953125, -0.05850982666015625, -0.056301116943359375, -0.0540924072265625, -0.051883697509765625, -0.04967498779296875, -0.047466278076171875, -0.045257568359375, -0.043048858642578125, -0.04084014892578125, -0.038631439208984375, -0.0364227294921875, -0.034214019775390625, -0.03200531005859375, -0.029796600341796875, -0.027587890625, -0.025379180908203125, -0.02317047119140625, -0.020961761474609375, -0.0187530517578125, -0.016544342041015625, -0.01433563232421875, -0.012126922607421875, -0.009918212890625, -0.007709503173828125, -0.00550079345703125, -0.003292083740234375, -0.0010833740234375, 0.001125335693359375, 0.00333404541015625, 0.005542755126953125, 0.00775146484375, 0.009960174560546875, 0.01216888427734375, 0.014377593994140625, 0.0165863037109375, 0.018795013427734375, 0.02100372314453125, 0.023212432861328125, 0.025421142578125, 0.027629852294921875, 0.02983856201171875, 0.032047271728515625, 0.0342559814453125, 0.036464691162109375, 0.03867340087890625, 0.040882110595703125, 0.0430908203125, 0.045299530029296875, 0.04750823974609375, 0.049716949462890625, 0.0519256591796875, 0.054134368896484375, 0.05634307861328125, 0.058551788330078125, 0.060760498046875, 0.06296920776367188, 0.06517791748046875, 0.06738662719726562, 0.0695953369140625, 0.07180404663085938, 0.07401275634765625, 0.07622146606445312, 0.07843017578125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 49.0, 264.0, 525.0, 100.0, 29.0, 20.0, 0.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.548857688903809, -8.359682083129883, -8.170506477355957, -7.981330871582031, -7.7921552658081055, -7.60297966003418, -7.413804054260254, -7.224628448486328, -7.035452842712402, -6.846277236938477, -6.657101631164551, -6.467926025390625, -6.278750419616699, -6.089574813842773, -5.900399208068848, -5.711223602294922, -5.522047996520996, -5.33287239074707, -5.1436967849731445, -4.954521179199219, -4.765345573425293, -4.576169967651367, -4.386994361877441, -4.197818756103516, -4.00864315032959, -3.819467544555664, -3.6302919387817383, -3.4411163330078125, -3.2519407272338867, -3.062765121459961, -2.873589515686035, -2.6844139099121094, -2.4952383041381836, -2.306062698364258, -2.116887092590332, -1.9277114868164062, -1.7385358810424805, -1.5493602752685547, -1.360184669494629, -1.1710090637207031, -0.9818334579467773, -0.7926578521728516, -0.6034822463989258, -0.414306640625, -0.22513103485107422, -0.03595542907714844, 0.15322017669677734, 0.3423957824707031, 0.5315713882446289, 0.7207469940185547, 0.9099225997924805, 1.0990982055664062, 1.288273811340332, 1.4774494171142578, 1.6666250228881836, 1.8558006286621094, 2.044976234436035, 2.234151840209961, 2.4233274459838867, 2.6125030517578125, 2.8016786575317383, 2.990854263305664, 3.18002986907959, 3.3692054748535156, 3.5583810806274414]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 3.0, 7.0, 11.0, 11.0, 13.0, 13.0, 17.0, 21.0, 22.0, 25.0, 22.0, 21.0, 27.0, 28.0, 45.0, 74.0, 118.0, 119.0, 53.0, 43.0, 41.0, 24.0, 28.0, 20.0, 25.0, 23.0, 21.0, 22.0, 15.0, 17.0, 8.0, 9.0, 3.0, 5.0, 9.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.342806339263916, -1.2965245246887207, -1.2502427101135254, -1.20396089553833, -1.1576792001724243, -1.111397385597229, -1.0651155710220337, -1.0188337564468384, -0.9725520014762878, -0.9262701869010925, -0.879988431930542, -0.8337066173553467, -0.7874248027801514, -0.7411430478096008, -0.6948612332344055, -0.648579478263855, -0.6022976636886597, -0.5560158491134644, -0.5097340941429138, -0.4634522795677185, -0.4171704947948456, -0.37088871002197266, -0.32460689544677734, -0.2783251106739044, -0.2320433259010315, -0.18576154112815857, -0.13947974145412445, -0.09319794178009033, -0.04691615700721741, -0.0006343722343444824, 0.04564744234085083, 0.09192922711372375, 0.13821089267730713, 0.18449267745018005, 0.23077447712421417, 0.2770562767982483, 0.3233380615711212, 0.36961984634399414, 0.41590166091918945, 0.4621834456920624, 0.5084652304649353, 0.5547470450401306, 0.6010288000106812, 0.6473106145858765, 0.6935924291610718, 0.7398741841316223, 0.7861559987068176, 0.8324377536773682, 0.8787195682525635, 0.9250013828277588, 0.9712831377983093, 1.0175650119781494, 1.0638467073440552, 1.1101285219192505, 1.1564103364944458, 1.2026921510696411, 1.2489738464355469, 1.2952556610107422, 1.3415374755859375, 1.3878192901611328, 1.4341009855270386, 1.4803828001022339, 1.5266646146774292, 1.5729464292526245, 1.6192282438278198]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 15.0, 19.0, 24.0, 33.0, 52.0, 86.0, 124.0, 183.0, 291.0, 438.0, 775.0, 1299.0, 2466.0, 4859.0, 11601.0, 35284.0, 149821.0, 702001.0, 1878421.0, 1071894.0, 248727.0, 55813.0, 16975.0, 6417.0, 2901.0, 1490.0, 889.0, 508.0, 323.0, 186.0, 118.0, 81.0, 41.0, 32.0, 26.0, 17.0, 11.0, 7.0, 2.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.18017578125, -0.17465972900390625, -0.1691436767578125, -0.16362762451171875, -0.158111572265625, -0.15259552001953125, -0.1470794677734375, -0.14156341552734375, -0.13604736328125, -0.13053131103515625, -0.1250152587890625, -0.11949920654296875, -0.113983154296875, -0.10846710205078125, -0.1029510498046875, -0.09743499755859375, -0.0919189453125, -0.08640289306640625, -0.0808868408203125, -0.07537078857421875, -0.069854736328125, -0.06433868408203125, -0.0588226318359375, -0.05330657958984375, -0.04779052734375, -0.04227447509765625, -0.0367584228515625, -0.03124237060546875, -0.025726318359375, -0.02021026611328125, -0.0146942138671875, -0.00917816162109375, -0.003662109375, 0.00185394287109375, 0.0073699951171875, 0.01288604736328125, 0.018402099609375, 0.02391815185546875, 0.0294342041015625, 0.03495025634765625, 0.04046630859375, 0.04598236083984375, 0.0514984130859375, 0.05701446533203125, 0.062530517578125, 0.06804656982421875, 0.0735626220703125, 0.07907867431640625, 0.0845947265625, 0.09011077880859375, 0.0956268310546875, 0.10114288330078125, 0.106658935546875, 0.11217498779296875, 0.1176910400390625, 0.12320709228515625, 0.12872314453125, 0.13423919677734375, 0.1397552490234375, 0.14527130126953125, 0.150787353515625, 0.15630340576171875, 0.1618194580078125, 0.16733551025390625, 0.1728515625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 6.0, 4.0, 4.0, 13.0, 10.0, 20.0, 18.0, 28.0, 23.0, 42.0, 46.0, 44.0, 49.0, 61.0, 47.0, 54.0, 41.0, 56.0, 45.0, 43.0, 46.0, 40.0, 38.0, 39.0, 25.0, 30.0, 24.0, 19.0, 22.0, 19.0, 5.0, 5.0, 9.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11883544921875, -0.11483097076416016, -0.11082649230957031, -0.10682201385498047, -0.10281753540039062, -0.09881305694580078, -0.09480857849121094, -0.0908041000366211, -0.08679962158203125, -0.0827951431274414, -0.07879066467285156, -0.07478618621826172, -0.07078170776367188, -0.06677722930908203, -0.06277275085449219, -0.058768272399902344, -0.0547637939453125, -0.050759315490722656, -0.04675483703613281, -0.04275035858154297, -0.038745880126953125, -0.03474140167236328, -0.030736923217773438, -0.026732444763183594, -0.02272796630859375, -0.018723487854003906, -0.014719009399414062, -0.010714530944824219, -0.006710052490234375, -0.0027055740356445312, 0.0012989044189453125, 0.005303382873535156, 0.009307861328125, 0.013312339782714844, 0.017316818237304688, 0.02132129669189453, 0.025325775146484375, 0.02933025360107422, 0.03333473205566406, 0.037339210510253906, 0.04134368896484375, 0.045348167419433594, 0.04935264587402344, 0.05335712432861328, 0.057361602783203125, 0.06136608123779297, 0.06537055969238281, 0.06937503814697266, 0.0733795166015625, 0.07738399505615234, 0.08138847351074219, 0.08539295196533203, 0.08939743041992188, 0.09340190887451172, 0.09740638732910156, 0.1014108657836914, 0.10541534423828125, 0.1094198226928711, 0.11342430114746094, 0.11742877960205078, 0.12143325805664062, 0.12543773651123047, 0.1294422149658203, 0.13344669342041016, 0.137451171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 4.0, 4.0, 11.0, 8.0, 26.0, 21.0, 46.0, 63.0, 114.0, 211.0, 436.0, 1145.0, 4553.0, 107607.0, 4049028.0, 26086.0, 3048.0, 950.0, 410.0, 190.0, 110.0, 71.0, 39.0, 20.0, 19.0, 16.0, 12.0, 6.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.1097259521484375, -1.080780029296875, -1.0518341064453125, -1.02288818359375, -0.9939422607421875, -0.964996337890625, -0.9360504150390625, -0.9071044921875, -0.8781585693359375, -0.849212646484375, -0.8202667236328125, -0.79132080078125, -0.7623748779296875, -0.733428955078125, -0.7044830322265625, -0.675537109375, -0.6465911865234375, -0.617645263671875, -0.5886993408203125, -0.55975341796875, -0.5308074951171875, -0.501861572265625, -0.4729156494140625, -0.4439697265625, -0.4150238037109375, -0.386077880859375, -0.3571319580078125, -0.32818603515625, -0.2992401123046875, -0.270294189453125, -0.2413482666015625, -0.21240234375, -0.1834564208984375, -0.154510498046875, -0.1255645751953125, -0.09661865234375, -0.0676727294921875, -0.038726806640625, -0.0097808837890625, 0.0191650390625, 0.0481109619140625, 0.077056884765625, 0.1060028076171875, 0.13494873046875, 0.1638946533203125, 0.192840576171875, 0.2217864990234375, 0.250732421875, 0.2796783447265625, 0.308624267578125, 0.3375701904296875, 0.36651611328125, 0.3954620361328125, 0.424407958984375, 0.4533538818359375, 0.4822998046875, 0.5112457275390625, 0.540191650390625, 0.5691375732421875, 0.59808349609375, 0.6270294189453125, 0.655975341796875, 0.6849212646484375, 0.7138671875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 6.0, 7.0, 15.0, 19.0, 27.0, 49.0, 73.0, 123.0, 179.0, 288.0, 414.0, 628.0, 700.0, 515.0, 365.0, 218.0, 142.0, 86.0, 66.0, 38.0, 28.0, 20.0, 17.0, 11.0, 7.0, 6.0, 5.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.33349609375, -0.3190460205078125, -0.304595947265625, -0.2901458740234375, -0.27569580078125, -0.2612457275390625, -0.246795654296875, -0.2323455810546875, -0.2178955078125, -0.2034454345703125, -0.188995361328125, -0.1745452880859375, -0.16009521484375, -0.1456451416015625, -0.131195068359375, -0.1167449951171875, -0.102294921875, -0.0878448486328125, -0.073394775390625, -0.0589447021484375, -0.04449462890625, -0.0300445556640625, -0.015594482421875, -0.0011444091796875, 0.0133056640625, 0.0277557373046875, 0.042205810546875, 0.0566558837890625, 0.07110595703125, 0.0855560302734375, 0.100006103515625, 0.1144561767578125, 0.12890625, 0.1433563232421875, 0.157806396484375, 0.1722564697265625, 0.18670654296875, 0.2011566162109375, 0.215606689453125, 0.2300567626953125, 0.2445068359375, 0.2589569091796875, 0.273406982421875, 0.2878570556640625, 0.30230712890625, 0.3167572021484375, 0.331207275390625, 0.3456573486328125, 0.360107421875, 0.3745574951171875, 0.389007568359375, 0.4034576416015625, 0.41790771484375, 0.4323577880859375, 0.446807861328125, 0.4612579345703125, 0.4757080078125, 0.4901580810546875, 0.504608154296875, 0.5190582275390625, 0.53350830078125, 0.5479583740234375, 0.562408447265625, 0.5768585205078125, 0.59130859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 6.0, 5.0, 15.0, 30.0, 108.0, 324.0, 259.0, 140.0, 57.0, 20.0, 19.0, 11.0, 2.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.773124694824219, -4.505444526672363, -4.23776388168335, -3.970083475112915, -3.7024030685424805, -3.434722661972046, -3.1670422554016113, -2.8993618488311768, -2.631681442260742, -2.3640010356903076, -2.096320629119873, -1.8286402225494385, -1.560959815979004, -1.2932794094085693, -1.0255990028381348, -0.7579185962677002, -0.4902381896972656, -0.22255778312683105, 0.045122623443603516, 0.3128030300140381, 0.5804834365844727, 0.8481638431549072, 1.1158442497253418, 1.3835246562957764, 1.651205062866211, 1.9188854694366455, 2.18656587600708, 2.4542462825775146, 2.721926689147949, 2.989607095718384, 3.2572875022888184, 3.524967908859253, 3.792649269104004, 4.060329437255859, 4.328010082244873, 4.595690727233887, 4.863370895385742, 5.131051063537598, 5.398731708526611, 5.666412353515625, 5.9340925216674805, 6.201772689819336, 6.46945333480835, 6.737133979797363, 7.004814147949219, 7.272494316101074, 7.540174961090088, 7.807855606079102, 8.075535774230957, 8.343215942382812, 8.610897064208984, 8.87857723236084, 9.146257400512695, 9.41393756866455, 9.681617736816406, 9.949298858642578, 10.216979026794434, 10.484659194946289, 10.752340316772461, 11.020020484924316, 11.287700653076172, 11.555380821228027, 11.823060989379883, 12.090742111206055, 12.35842227935791]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 1.0, 1.0, 5.0, 5.0, 7.0, 6.0, 8.0, 11.0, 12.0, 21.0, 18.0, 28.0, 34.0, 33.0, 46.0, 49.0, 62.0, 69.0, 58.0, 62.0, 70.0, 65.0, 64.0, 52.0, 41.0, 30.0, 35.0, 30.0, 28.0, 15.0, 16.0, 9.0, 2.0, 5.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7750701904296875, -2.673734188079834, -2.5723981857299805, -2.471062183380127, -2.3697259426116943, -2.268389940261841, -2.1670539379119873, -2.065717935562134, -1.9643819332122803, -1.8630459308624268, -1.7617098093032837, -1.6603738069534302, -1.5590378046035767, -1.4577016830444336, -1.35636568069458, -1.2550296783447266, -1.1536935567855835, -1.05235755443573, -0.9510214924812317, -0.8496854305267334, -0.7483494281768799, -0.6470133662223816, -0.5456773042678833, -0.4443413019180298, -0.3430052399635315, -0.2416692078113556, -0.1403331607580185, -0.038997113704681396, 0.06233891844749451, 0.1636749505996704, 0.2650110125541687, 0.3663470149040222, 0.4676830768585205, 0.5690191388130188, 0.6703551411628723, 0.7716912031173706, 0.8730272054672241, 0.9743632674217224, 1.0756993293762207, 1.1770353317260742, 1.2783713340759277, 1.3797073364257812, 1.4810434579849243, 1.5823794603347778, 1.6837154626846313, 1.7850515842437744, 1.886387586593628, 1.9877235889434814, 2.089059829711914, 2.1903958320617676, 2.291731834411621, 2.3930678367614746, 2.4944040775299072, 2.5957400798797607, 2.6970760822296143, 2.7984120845794678, 2.8997480869293213, 3.001084089279175, 3.1024200916290283, 3.203756332397461, 3.3050923347473145, 3.406428337097168, 3.5077643394470215, 3.609100341796875, 3.7104363441467285]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 12.0, 17.0, 14.0, 21.0, 59.0, 85.0, 183.0, 344.0, 829.0, 2028.0, 5830.0, 21717.0, 159863.0, 768380.0, 69683.0, 13030.0, 3858.0, 1389.0, 601.0, 264.0, 146.0, 74.0, 52.0, 27.0, 17.0, 9.0, 7.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2147216796875, -0.20510292053222656, -0.19548416137695312, -0.1858654022216797, -0.17624664306640625, -0.1666278839111328, -0.15700912475585938, -0.14739036560058594, -0.1377716064453125, -0.12815284729003906, -0.11853408813476562, -0.10891532897949219, -0.09929656982421875, -0.08967781066894531, -0.08005905151367188, -0.07044029235839844, -0.060821533203125, -0.05120277404785156, -0.041584014892578125, -0.03196525573730469, -0.02234649658203125, -0.012727737426757812, -0.003108978271484375, 0.0065097808837890625, 0.0161285400390625, 0.025747299194335938, 0.035366058349609375, 0.04498481750488281, 0.05460357666015625, 0.06422233581542969, 0.07384109497070312, 0.08345985412597656, 0.09307861328125, 0.10269737243652344, 0.11231613159179688, 0.12193489074707031, 0.13155364990234375, 0.1411724090576172, 0.15079116821289062, 0.16040992736816406, 0.1700286865234375, 0.17964744567871094, 0.18926620483398438, 0.1988849639892578, 0.20850372314453125, 0.2181224822998047, 0.22774124145507812, 0.23736000061035156, 0.246978759765625, 0.25659751892089844, 0.2662162780761719, 0.2758350372314453, 0.28545379638671875, 0.2950725555419922, 0.3046913146972656, 0.31431007385253906, 0.3239288330078125, 0.33354759216308594, 0.3431663513183594, 0.3527851104736328, 0.36240386962890625, 0.3720226287841797, 0.3816413879394531, 0.39126014709472656, 0.40087890625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 5.0, 11.0, 11.0, 15.0, 19.0, 29.0, 25.0, 48.0, 40.0, 41.0, 49.0, 55.0, 68.0, 48.0, 50.0, 76.0, 62.0, 66.0, 52.0, 52.0, 38.0, 34.0, 29.0, 17.0, 15.0, 7.0, 15.0, 4.0, 6.0, 7.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1302490234375, -0.1244049072265625, -0.118560791015625, -0.1127166748046875, -0.10687255859375, -0.1010284423828125, -0.095184326171875, -0.0893402099609375, -0.08349609375, -0.0776519775390625, -0.071807861328125, -0.0659637451171875, -0.06011962890625, -0.0542755126953125, -0.048431396484375, -0.0425872802734375, -0.0367431640625, -0.0308990478515625, -0.025054931640625, -0.0192108154296875, -0.01336669921875, -0.0075225830078125, -0.001678466796875, 0.0041656494140625, 0.010009765625, 0.0158538818359375, 0.021697998046875, 0.0275421142578125, 0.03338623046875, 0.0392303466796875, 0.045074462890625, 0.0509185791015625, 0.0567626953125, 0.0626068115234375, 0.068450927734375, 0.0742950439453125, 0.08013916015625, 0.0859832763671875, 0.091827392578125, 0.0976715087890625, 0.103515625, 0.1093597412109375, 0.115203857421875, 0.1210479736328125, 0.12689208984375, 0.1327362060546875, 0.138580322265625, 0.1444244384765625, 0.1502685546875, 0.1561126708984375, 0.161956787109375, 0.1678009033203125, 0.17364501953125, 0.1794891357421875, 0.185333251953125, 0.1911773681640625, 0.197021484375, 0.2028656005859375, 0.208709716796875, 0.2145538330078125, 0.22039794921875, 0.2262420654296875, 0.232086181640625, 0.2379302978515625, 0.2437744140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 5.0, 8.0, 3.0, 9.0, 11.0, 17.0, 27.0, 39.0, 55.0, 68.0, 108.0, 157.0, 259.0, 462.0, 965.0, 2669.0, 12098.0, 173777.0, 833615.0, 18211.0, 3465.0, 1174.0, 503.0, 268.0, 180.0, 133.0, 60.0, 43.0, 37.0, 24.0, 25.0, 23.0, 17.0, 8.0, 3.0, 3.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.36181640625, -0.3512077331542969, -0.34059906005859375, -0.3299903869628906, -0.3193817138671875, -0.3087730407714844, -0.29816436767578125, -0.2875556945800781, -0.276947021484375, -0.2663383483886719, -0.25572967529296875, -0.24512100219726562, -0.2345123291015625, -0.22390365600585938, -0.21329498291015625, -0.20268630981445312, -0.19207763671875, -0.18146896362304688, -0.17086029052734375, -0.16025161743164062, -0.1496429443359375, -0.13903427124023438, -0.12842559814453125, -0.11781692504882812, -0.107208251953125, -0.09659957885742188, -0.08599090576171875, -0.07538223266601562, -0.0647735595703125, -0.054164886474609375, -0.04355621337890625, -0.032947540283203125, -0.0223388671875, -0.011730194091796875, -0.00112152099609375, 0.009487152099609375, 0.0200958251953125, 0.030704498291015625, 0.04131317138671875, 0.051921844482421875, 0.062530517578125, 0.07313919067382812, 0.08374786376953125, 0.09435653686523438, 0.1049652099609375, 0.11557388305664062, 0.12618255615234375, 0.13679122924804688, 0.14739990234375, 0.15800857543945312, 0.16861724853515625, 0.17922592163085938, 0.1898345947265625, 0.20044326782226562, 0.21105194091796875, 0.22166061401367188, 0.232269287109375, 0.24287796020507812, 0.25348663330078125, 0.2640953063964844, 0.2747039794921875, 0.2853126525878906, 0.29592132568359375, 0.3065299987792969, 0.317138671875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 4.0, 6.0, 11.0, 15.0, 9.0, 12.0, 13.0, 20.0, 26.0, 29.0, 36.0, 39.0, 55.0, 76.0, 73.0, 89.0, 78.0, 63.0, 69.0, 47.0, 41.0, 38.0, 21.0, 16.0, 17.0, 14.0, 20.0, 9.0, 5.0, 7.0, 3.0, 3.0, 4.0, 3.0, 6.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55810546875, -0.538116455078125, -0.51812744140625, -0.498138427734375, -0.4781494140625, -0.458160400390625, -0.43817138671875, -0.418182373046875, -0.398193359375, -0.378204345703125, -0.35821533203125, -0.338226318359375, -0.3182373046875, -0.298248291015625, -0.27825927734375, -0.258270263671875, -0.23828125, -0.218292236328125, -0.19830322265625, -0.178314208984375, -0.1583251953125, -0.138336181640625, -0.11834716796875, -0.098358154296875, -0.078369140625, -0.058380126953125, -0.03839111328125, -0.018402099609375, 0.0015869140625, 0.021575927734375, 0.04156494140625, 0.061553955078125, 0.08154296875, 0.101531982421875, 0.12152099609375, 0.141510009765625, 0.1614990234375, 0.181488037109375, 0.20147705078125, 0.221466064453125, 0.241455078125, 0.261444091796875, 0.28143310546875, 0.301422119140625, 0.3214111328125, 0.341400146484375, 0.36138916015625, 0.381378173828125, 0.4013671875, 0.421356201171875, 0.44134521484375, 0.461334228515625, 0.4813232421875, 0.501312255859375, 0.52130126953125, 0.541290283203125, 0.561279296875, 0.581268310546875, 0.60125732421875, 0.621246337890625, 0.6412353515625, 0.661224365234375, 0.68121337890625, 0.701202392578125, 0.72119140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 12.0, 11.0, 10.0, 14.0, 13.0, 14.0, 27.0, 40.0, 36.0, 70.0, 132.0, 231.0, 408.0, 703.0, 1606.0, 4228.0, 15111.0, 87098.0, 866774.0, 54849.0, 11036.0, 3252.0, 1348.0, 637.0, 330.0, 180.0, 98.0, 62.0, 42.0, 36.0, 29.0, 18.0, 20.0, 11.0, 12.0, 4.0, 3.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.038848876953125, -0.03757047653198242, -0.036292076110839844, -0.035013675689697266, -0.03373527526855469, -0.03245687484741211, -0.03117847442626953, -0.029900074005126953, -0.028621673583984375, -0.027343273162841797, -0.02606487274169922, -0.02478647232055664, -0.023508071899414062, -0.022229671478271484, -0.020951271057128906, -0.019672870635986328, -0.01839447021484375, -0.017116069793701172, -0.015837669372558594, -0.014559268951416016, -0.013280868530273438, -0.01200246810913086, -0.010724067687988281, -0.009445667266845703, -0.008167266845703125, -0.006888866424560547, -0.005610466003417969, -0.004332065582275391, -0.0030536651611328125, -0.0017752647399902344, -0.0004968643188476562, 0.0007815361022949219, 0.0020599365234375, 0.003338336944580078, 0.004616737365722656, 0.005895137786865234, 0.0071735382080078125, 0.00845193862915039, 0.009730339050292969, 0.011008739471435547, 0.012287139892578125, 0.013565540313720703, 0.014843940734863281, 0.01612234115600586, 0.017400741577148438, 0.018679141998291016, 0.019957542419433594, 0.021235942840576172, 0.02251434326171875, 0.023792743682861328, 0.025071144104003906, 0.026349544525146484, 0.027627944946289062, 0.02890634536743164, 0.03018474578857422, 0.0314631462097168, 0.032741546630859375, 0.03401994705200195, 0.03529834747314453, 0.03657674789428711, 0.03785514831542969, 0.039133548736572266, 0.040411949157714844, 0.04169034957885742, 0.04296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 8.0, 5.0, 1.0, 7.0, 5.0, 8.0, 8.0, 22.0, 14.0, 20.0, 24.0, 28.0, 51.0, 70.0, 69.0, 72.0, 88.0, 83.0, 70.0, 62.0, 43.0, 41.0, 37.0, 32.0, 11.0, 18.0, 7.0, 8.0, 10.0, 5.0, 8.0, 12.0, 5.0, 7.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9458274841308594e-05, -3.8215890526771545e-05, -3.69735062122345e-05, -3.573112189769745e-05, -3.44887375831604e-05, -3.324635326862335e-05, -3.2003968954086304e-05, -3.0761584639549255e-05, -2.9519200325012207e-05, -2.827681601047516e-05, -2.703443169593811e-05, -2.5792047381401062e-05, -2.4549663066864014e-05, -2.3307278752326965e-05, -2.2064894437789917e-05, -2.082251012325287e-05, -1.958012580871582e-05, -1.8337741494178772e-05, -1.7095357179641724e-05, -1.5852972865104675e-05, -1.4610588550567627e-05, -1.3368204236030579e-05, -1.212581992149353e-05, -1.0883435606956482e-05, -9.641051292419434e-06, -8.398666977882385e-06, -7.156282663345337e-06, -5.9138983488082886e-06, -4.67151403427124e-06, -3.429129719734192e-06, -2.1867454051971436e-06, -9.443610906600952e-07, 2.980232238769531e-07, 1.5404075384140015e-06, 2.78279185295105e-06, 4.025176167488098e-06, 5.2675604820251465e-06, 6.509944796562195e-06, 7.752329111099243e-06, 8.994713425636292e-06, 1.023709774017334e-05, 1.1479482054710388e-05, 1.2721866369247437e-05, 1.3964250683784485e-05, 1.5206634998321533e-05, 1.644901931285858e-05, 1.769140362739563e-05, 1.8933787941932678e-05, 2.0176172256469727e-05, 2.1418556571006775e-05, 2.2660940885543823e-05, 2.390332520008087e-05, 2.514570951461792e-05, 2.6388093829154968e-05, 2.7630478143692017e-05, 2.8872862458229065e-05, 3.0115246772766113e-05, 3.135763108730316e-05, 3.260001540184021e-05, 3.384239971637726e-05, 3.508478403091431e-05, 3.6327168345451355e-05, 3.75695526599884e-05, 3.881193697452545e-05, 4.00543212890625e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 12.0, 17.0, 22.0, 27.0, 43.0, 54.0, 60.0, 109.0, 168.0, 256.0, 425.0, 648.0, 1158.0, 2017.0, 4204.0, 9048.0, 22837.0, 77846.0, 759835.0, 117598.0, 30240.0, 11151.0, 4877.0, 2416.0, 1319.0, 762.0, 469.0, 283.0, 216.0, 111.0, 82.0, 59.0, 50.0, 35.0, 24.0, 20.0, 10.0, 10.0, 4.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0222015380859375, -0.021425962448120117, -0.020650386810302734, -0.01987481117248535, -0.01909923553466797, -0.018323659896850586, -0.017548084259033203, -0.01677250862121582, -0.015996932983398438, -0.015221357345581055, -0.014445781707763672, -0.013670206069946289, -0.012894630432128906, -0.012119054794311523, -0.01134347915649414, -0.010567903518676758, -0.009792327880859375, -0.009016752243041992, -0.00824117660522461, -0.0074656009674072266, -0.006690025329589844, -0.005914449691772461, -0.005138874053955078, -0.004363298416137695, -0.0035877227783203125, -0.0028121471405029297, -0.002036571502685547, -0.001260995864868164, -0.00048542022705078125, 0.00029015541076660156, 0.0010657310485839844, 0.0018413066864013672, 0.00261688232421875, 0.003392457962036133, 0.004168033599853516, 0.0049436092376708984, 0.005719184875488281, 0.006494760513305664, 0.007270336151123047, 0.00804591178894043, 0.008821487426757812, 0.009597063064575195, 0.010372638702392578, 0.011148214340209961, 0.011923789978027344, 0.012699365615844727, 0.01347494125366211, 0.014250516891479492, 0.015026092529296875, 0.015801668167114258, 0.01657724380493164, 0.017352819442749023, 0.018128395080566406, 0.01890397071838379, 0.019679546356201172, 0.020455121994018555, 0.021230697631835938, 0.02200627326965332, 0.022781848907470703, 0.023557424545288086, 0.02433300018310547, 0.02510857582092285, 0.025884151458740234, 0.026659727096557617, 0.027435302734375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 17.0, 14.0, 28.0, 31.0, 36.0, 60.0, 76.0, 117.0, 131.0, 137.0, 97.0, 72.0, 39.0, 39.0, 35.0, 20.0, 16.0, 9.0, 9.0, 3.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05499267578125, -0.05294990539550781, -0.050907135009765625, -0.04886436462402344, -0.04682159423828125, -0.04477882385253906, -0.042736053466796875, -0.04069328308105469, -0.0386505126953125, -0.03660774230957031, -0.034564971923828125, -0.03252220153808594, -0.03047943115234375, -0.028436660766601562, -0.026393890380859375, -0.024351119995117188, -0.022308349609375, -0.020265579223632812, -0.018222808837890625, -0.016180038452148438, -0.01413726806640625, -0.012094497680664062, -0.010051727294921875, -0.008008956909179688, -0.0059661865234375, -0.0039234161376953125, -0.001880645751953125, 0.0001621246337890625, 0.00220489501953125, 0.0042476654052734375, 0.006290435791015625, 0.008333206176757812, 0.0103759765625, 0.012418746948242188, 0.014461517333984375, 0.016504287719726562, 0.01854705810546875, 0.020589828491210938, 0.022632598876953125, 0.024675369262695312, 0.0267181396484375, 0.028760910034179688, 0.030803680419921875, 0.03284645080566406, 0.03488922119140625, 0.03693199157714844, 0.038974761962890625, 0.04101753234863281, 0.043060302734375, 0.04510307312011719, 0.047145843505859375, 0.04918861389160156, 0.05123138427734375, 0.05327415466308594, 0.055316925048828125, 0.05735969543457031, 0.0594024658203125, 0.06144523620605469, 0.06348800659179688, 0.06553077697753906, 0.06757354736328125, 0.06961631774902344, 0.07165908813476562, 0.07370185852050781, 0.07574462890625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 9.0, 34.0, 296.0, 556.0, 78.0, 26.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4982683658599854, -1.312168836593628, -1.1260693073272705, -0.9399698376655579, -0.7538703083992004, -0.567770779132843, -0.38167130947113037, -0.19557178020477295, -0.009472250938415527, 0.1766272634267807, 0.36272677779197693, 0.548826277256012, 0.7349258065223694, 0.9210253357887268, 1.1071248054504395, 1.2932243347167969, 1.4793238639831543, 1.6654233932495117, 1.8515229225158691, 2.0376224517822266, 2.223721981048584, 2.4098215103149414, 2.595921039581299, 2.7820205688476562, 2.9681200981140137, 3.154219627380371, 3.3403191566467285, 3.526418685913086, 3.7125182151794434, 3.898617744445801, 4.084717273712158, 4.270816802978516, 4.456916332244873, 4.6430158615112305, 4.829115390777588, 5.015214920043945, 5.201314449310303, 5.38741397857666, 5.573513507843018, 5.759613037109375, 5.945712566375732, 6.13181209564209, 6.317911624908447, 6.504011154174805, 6.690110683441162, 6.8762102127075195, 7.062309741973877, 7.248409271240234, 7.434508323669434, 7.620607852935791, 7.806707382202148, 7.992806911468506, 8.178906440734863, 8.365005493164062, 8.551105499267578, 8.737204551696777, 8.923304557800293, 9.109403610229492, 9.295503616333008, 9.481602668762207, 9.667702674865723, 9.853801727294922, 10.039901733398438, 10.226000785827637, 10.412100791931152]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 5.0, 5.0, 2.0, 8.0, 3.0, 13.0, 15.0, 11.0, 13.0, 16.0, 23.0, 27.0, 27.0, 23.0, 29.0, 45.0, 148.0, 257.0, 95.0, 33.0, 22.0, 20.0, 25.0, 30.0, 15.0, 22.0, 7.0, 15.0, 6.0, 14.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6865689754486084, -1.632778286933899, -1.5789874792099, -1.5251967906951904, -1.4714059829711914, -1.417615294456482, -1.3638246059417725, -1.3100337982177734, -1.2562429904937744, -1.202452301979065, -1.148661494255066, -1.0948708057403564, -1.0410799980163574, -0.987289309501648, -0.9334985613822937, -0.8797078132629395, -0.82591712474823, -0.7721263766288757, -0.7183356285095215, -0.664544939994812, -0.610754132270813, -0.5569634437561035, -0.5031726956367493, -0.449381947517395, -0.39559119939804077, -0.3418004512786865, -0.2880097031593323, -0.23421898484230042, -0.18042823672294617, -0.12663748860359192, -0.07284677028656006, -0.01905602216720581, 0.03473472595214844, 0.08852546662092209, 0.14231620728969574, 0.1961069405078888, 0.24989768862724304, 0.3036884367465973, 0.35747915506362915, 0.4112699031829834, 0.46506065130233765, 0.5188513994216919, 0.5726421475410461, 0.6264328956604004, 0.6802235841751099, 0.7340143918991089, 0.7878050804138184, 0.8415958285331726, 0.8953865766525269, 0.9491773247718811, 1.0029680728912354, 1.0567587614059448, 1.1105495691299438, 1.1643402576446533, 1.2181310653686523, 1.2719217538833618, 1.3257124423980713, 1.3795031309127808, 1.4332939386367798, 1.4870846271514893, 1.5408754348754883, 1.5946661233901978, 1.6484568119049072, 1.7022476196289062, 1.7560384273529053]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 9.0, 4.0, 6.0, 4.0, 6.0, 7.0, 10.0, 9.0, 9.0, 15.0, 22.0, 18.0, 24.0, 22.0, 30.0, 28.0, 44.0, 101.0, 253.0, 72.0, 41.0, 21.0, 28.0, 20.0, 30.0, 25.0, 15.0, 18.0, 16.0, 18.0, 14.0, 13.0, 11.0, 7.0, 6.0, 3.0, 5.0, 7.0, 2.0, 6.0, 1.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1368408203125, -0.13297557830810547, -0.12911033630371094, -0.1252450942993164, -0.12137985229492188, -0.11751461029052734, -0.11364936828613281, -0.10978412628173828, -0.10591888427734375, -0.10205364227294922, -0.09818840026855469, -0.09432315826416016, -0.09045791625976562, -0.0865926742553711, -0.08272743225097656, -0.07886219024658203, -0.0749969482421875, -0.07113170623779297, -0.06726646423339844, -0.0634012222290039, -0.059535980224609375, -0.055670738220214844, -0.05180549621582031, -0.04794025421142578, -0.04407501220703125, -0.04020977020263672, -0.03634452819824219, -0.032479286193847656, -0.028614044189453125, -0.024748802185058594, -0.020883560180664062, -0.01701831817626953, -0.013153076171875, -0.009287834167480469, -0.0054225921630859375, -0.0015573501586914062, 0.002307891845703125, 0.006173133850097656, 0.010038375854492188, 0.013903617858886719, 0.01776885986328125, 0.02163410186767578, 0.025499343872070312, 0.029364585876464844, 0.033229827880859375, 0.037095069885253906, 0.04096031188964844, 0.04482555389404297, 0.0486907958984375, 0.05255603790283203, 0.05642127990722656, 0.060286521911621094, 0.06415176391601562, 0.06801700592041016, 0.07188224792480469, 0.07574748992919922, 0.07961273193359375, 0.08347797393798828, 0.08734321594238281, 0.09120845794677734, 0.09507369995117188, 0.0989389419555664, 0.10280418395996094, 0.10666942596435547, 0.11053466796875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 0.0, 6.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 5.0, 13.0, 12.0, 33.0, 49.0, 65.0, 154.0, 380.0, 1792.0, 20463.0, 8358076.0, 5985.0, 988.0, 239.0, 105.0, 76.0, 47.0, 26.0, 9.0, 4.0, 9.0, 12.0, 5.0, 4.0, 1.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0], "bins": [-2.059337854385376, -1.9890497922897339, -1.9187617301940918, -1.8484737873077393, -1.7781857252120972, -1.707897663116455, -1.6376097202301025, -1.5673216581344604, -1.4970335960388184, -1.4267455339431763, -1.3564574718475342, -1.2861695289611816, -1.2158814668655396, -1.1455934047698975, -1.075305461883545, -1.0050173997879028, -0.9347293376922607, -0.8644412755966187, -0.7941532731056213, -0.723865270614624, -0.6535772085189819, -0.5832891464233398, -0.5130011439323425, -0.4427131116390228, -0.3724250793457031, -0.3021370470523834, -0.23184901475906372, -0.16156098246574402, -0.09127295017242432, -0.020984917879104614, 0.04930311441421509, 0.11959114670753479, 0.1898794174194336, 0.2601674497127533, 0.330455482006073, 0.4007435142993927, 0.4710315465927124, 0.5413196086883545, 0.6116076111793518, 0.6818956136703491, 0.7521836757659912, 0.8224717378616333, 0.8927597403526306, 0.9630477428436279, 1.03333580493927, 1.103623867034912, 1.1739118099212646, 1.2441998720169067, 1.3144879341125488, 1.384775996208191, 1.455064058303833, 1.5253520011901855, 1.5956400632858276, 1.6659281253814697, 1.7362160682678223, 1.8065041303634644, 1.8767921924591064, 1.9470802545547485, 2.0173683166503906, 2.087656259536743, 2.1579442024230957, 2.2282323837280273, 2.29852032661438, 2.3688085079193115, 2.439096450805664]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 6.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 7.0, 3.0, 5.0, 5.0, 5.0, 3.0, 5.0, 5.0, 5.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.0644290447235107, -2.008401393890381, -1.9523738622665405, -1.8963463306427002, -1.8403187990188599, -1.7842912673950195, -1.7282636165618896, -1.6722360849380493, -1.616208553314209, -1.5601810216903687, -1.5041533708572388, -1.4481258392333984, -1.392098307609558, -1.3360707759857178, -1.280043125152588, -1.2240155935287476, -1.1679880619049072, -1.111960530281067, -1.055932879447937, -0.9999053478240967, -0.9438778162002563, -0.8878502249717712, -0.8318226337432861, -0.7757951021194458, -0.7197674512863159, -0.6637398600578308, -0.6077123284339905, -0.5516847372055054, -0.49565720558166504, -0.43962961435317993, -0.3836020529270172, -0.3275744915008545, -0.27154695987701416, -0.21551939845085144, -0.15949183702468872, -0.10346426069736481, -0.04743669927120209, 0.008590877056121826, 0.06461843848228455, 0.12064599990844727, 0.17667356133460999, 0.2327011227607727, 0.2887286841869354, 0.34475624561309814, 0.40078383684158325, 0.45681139826774597, 0.5128389596939087, 0.568866491317749, 0.6248940825462341, 0.6809216737747192, 0.7369492053985596, 0.7929767966270447, 0.849004328250885, 0.9050319194793701, 0.9610594511032104, 1.0170869827270508, 1.0731146335601807, 1.129142165184021, 1.1851698160171509, 1.2411973476409912, 1.2972248792648315, 1.3532524108886719, 1.4092800617218018, 1.465307593345642, 1.5213351249694824]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 12.0, 11.0, 26.0, 28.0, 33.0, 58.0, 97.0, 147.0, 221.0, 345.0, 698.0, 1632.0, 4239.0, 12970.0, 44768.0, 160013.0, 207398.0, 64162.0, 17939.0, 5584.0, 1984.0, 756.0, 369.0, 236.0, 148.0, 112.0, 65.0, 53.0, 48.0, 26.0, 18.0, 12.0, 12.0, 10.0, 7.0, 8.0, 0.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.01171875, -0.9730224609375, -0.934326171875, -0.8956298828125, -0.85693359375, -0.8182373046875, -0.779541015625, -0.7408447265625, -0.7021484375, -0.6634521484375, -0.624755859375, -0.5860595703125, -0.54736328125, -0.5086669921875, -0.469970703125, -0.4312744140625, -0.392578125, -0.3538818359375, -0.315185546875, -0.2764892578125, -0.23779296875, -0.1990966796875, -0.160400390625, -0.1217041015625, -0.0830078125, -0.0443115234375, -0.005615234375, 0.0330810546875, 0.07177734375, 0.1104736328125, 0.149169921875, 0.1878662109375, 0.2265625, 0.2652587890625, 0.303955078125, 0.3426513671875, 0.38134765625, 0.4200439453125, 0.458740234375, 0.4974365234375, 0.5361328125, 0.5748291015625, 0.613525390625, 0.6522216796875, 0.69091796875, 0.7296142578125, 0.768310546875, 0.8070068359375, 0.845703125, 0.8843994140625, 0.923095703125, 0.9617919921875, 1.00048828125, 1.0391845703125, 1.077880859375, 1.1165771484375, 1.1552734375, 1.1939697265625, 1.232666015625, 1.2713623046875, 1.31005859375, 1.3487548828125, 1.387451171875, 1.4261474609375, 1.46484375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 4.0, 2.0, 9.0, 14.0, 19.0, 16.0, 20.0, 30.0, 44.0, 44.0, 68.0, 72.0, 96.0, 91.0, 80.0, 75.0, 67.0, 41.0, 39.0, 45.0, 27.0, 25.0, 18.0, 10.0, 9.0, 8.0, 8.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1551513671875, -0.14869117736816406, -0.14223098754882812, -0.1357707977294922, -0.12931060791015625, -0.12285041809082031, -0.11639022827148438, -0.10993003845214844, -0.1034698486328125, -0.09700965881347656, -0.09054946899414062, -0.08408927917480469, -0.07762908935546875, -0.07116889953613281, -0.06470870971679688, -0.05824851989746094, -0.051788330078125, -0.04532814025878906, -0.038867950439453125, -0.03240776062011719, -0.02594757080078125, -0.019487380981445312, -0.013027191162109375, -0.0065670013427734375, -0.0001068115234375, 0.0063533782958984375, 0.012813568115234375, 0.019273757934570312, 0.02573394775390625, 0.03219413757324219, 0.038654327392578125, 0.04511451721191406, 0.05157470703125, 0.05803489685058594, 0.06449508666992188, 0.07095527648925781, 0.07741546630859375, 0.08387565612792969, 0.09033584594726562, 0.09679603576660156, 0.1032562255859375, 0.10971641540527344, 0.11617660522460938, 0.12263679504394531, 0.12909698486328125, 0.1355571746826172, 0.14201736450195312, 0.14847755432128906, 0.154937744140625, 0.16139793395996094, 0.16785812377929688, 0.1743183135986328, 0.18077850341796875, 0.1872386932373047, 0.19369888305664062, 0.20015907287597656, 0.2066192626953125, 0.21307945251464844, 0.21953964233398438, 0.2259998321533203, 0.23246002197265625, 0.2389202117919922, 0.24538040161132812, 0.25184059143066406, 0.25830078125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [5.0, 3.0, 9.0, 23.0, 46.0, 117.0, 106.0, 104.0, 32.0, 12.0, 10.0, 7.0, 6.0, 6.0, 2.0, 4.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3772463798522949, -0.31599223613739014, -0.25473809242248535, -0.19348397850990295, -0.13222983479499817, -0.07097569108009338, -0.009721577167510986, 0.0515325665473938, 0.11278671026229858, 0.17404085397720337, 0.23529498279094696, 0.29654911160469055, 0.35780325531959534, 0.4190573990345001, 0.4803115129470825, 0.5415656566619873, 0.6028198003768921, 0.6640739440917969, 0.7253280878067017, 0.7865822315216064, 0.8478363752365112, 0.909090518951416, 0.970344603061676, 1.0315988063812256, 1.0928528308868408, 1.1541069746017456, 1.2153611183166504, 1.2766152620315552, 1.33786940574646, 1.3991235494613647, 1.4603776931762695, 1.5216317176818848, 1.582885980606079, 1.6441401243209839, 1.7053942680358887, 1.7666484117507935, 1.8279025554656982, 1.889156699180603, 1.9504108428955078, 2.011664867401123, 2.0729191303253174, 2.1341731548309326, 2.195427417755127, 2.256681442260742, 2.3179357051849365, 2.3791897296905518, 2.440443992614746, 2.5016980171203613, 2.5629520416259766, 2.624206066131592, 2.685460329055786, 2.7467143535614014, 2.8079686164855957, 2.869222640991211, 2.9304769039154053, 2.9917309284210205, 3.052985191345215, 3.11423921585083, 3.1754934787750244, 3.2367475032806396, 3.298001766204834, 3.359255790710449, 3.4205100536346436, 3.481764078140259, 3.543018341064453]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 3.0, 6.0, 10.0, 14.0, 23.0, 22.0, 26.0, 24.0, 33.0, 41.0, 62.0, 42.0, 35.0, 32.0, 20.0, 18.0, 15.0, 11.0, 3.0, 6.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5427846312522888, -0.5188493132591248, -0.49491405487060547, -0.4709787368774414, -0.44704344868659973, -0.42310816049575806, -0.399172842502594, -0.3752375543117523, -0.35130226612091064, -0.32736697793006897, -0.3034316897392273, -0.27949637174606323, -0.25556108355522156, -0.23162579536437988, -0.20769049227237701, -0.18375518918037415, -0.15981990098953247, -0.1358846127986908, -0.11194930970668793, -0.08801401406526566, -0.06407871842384338, -0.04014342278242111, -0.01620812714099884, 0.007727175951004028, 0.0316624641418457, 0.055597759783267975, 0.07953305542469025, 0.10346835106611252, 0.1274036467075348, 0.15133893489837646, 0.17527423799037933, 0.1992095410823822, 0.22314482927322388, 0.24708011746406555, 0.2710154056549072, 0.2949507236480713, 0.31888601183891296, 0.34282130002975464, 0.3667566180229187, 0.3906919062137604, 0.41462719440460205, 0.4385624825954437, 0.4624977707862854, 0.48643308877944946, 0.5103683471679688, 0.5343036651611328, 0.5582389831542969, 0.5821743011474609, 0.6061095595359802, 0.6300448775291443, 0.6539801359176636, 0.6779154539108276, 0.7018507719039917, 0.725786030292511, 0.749721348285675, 0.7736566066741943, 0.7975919246673584, 0.8215272426605225, 0.8454625010490417, 0.8693978190422058, 0.8933330774307251, 0.9172683954238892, 0.9412037134170532, 0.9651390314102173, 0.9890742897987366]}, "eval/loss": 6.638564109802246, "eval/wer": 1.1671528067146855, "eval/runtime": 872.015, "eval/samples_per_second": 3.03, "eval/steps_per_second": 0.38} \ No newline at end of file