diff --git "a/wandb/run-20220302_215121-t49ehimo/files/wandb-summary.json" "b/wandb/run-20220302_215121-t49ehimo/files/wandb-summary.json" --- "a/wandb/run-20220302_215121-t49ehimo/files/wandb-summary.json" +++ "b/wandb/run-20220302_215121-t49ehimo/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.5204, "train/learning_rate": 5.780346820809249e-08, "train/epoch": 5.0, "train/global_step": 4460, "_runtime": 30356, "_timestamp": 1646288237, "_step": 4463, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 26.0, 74.0, 15.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 29845.0, 341.0, 77.0, 31.0, 17.0, 12.0, 11.0, 2.0, 8.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.0625, -95.99365234375, -93.9248046875, -91.85595703125, -89.787109375, -87.71826171875, -85.6494140625, -83.58056640625, -81.51171875, -79.44287109375, -77.3740234375, -75.30517578125, -73.236328125, -71.16748046875, -69.0986328125, -67.02978515625, -64.9609375, -62.89208984375, -60.8232421875, -58.75439453125, -56.685546875, -54.61669921875, -52.5478515625, -50.47900390625, -48.41015625, -46.34130859375, -44.2724609375, -42.20361328125, -40.134765625, -38.06591796875, -35.9970703125, -33.92822265625, -31.859375, -29.79052734375, -27.7216796875, -25.65283203125, -23.583984375, -21.51513671875, -19.4462890625, -17.37744140625, -15.30859375, -13.23974609375, -11.1708984375, -9.10205078125, -7.033203125, -4.96435546875, -2.8955078125, -0.82666015625, 1.2421875, 3.31103515625, 5.3798828125, 7.44873046875, 9.517578125, 11.58642578125, 13.6552734375, 15.72412109375, 17.79296875, 19.86181640625, 21.9306640625, 23.99951171875, 26.068359375, 28.13720703125, 30.2060546875, 32.27490234375, 34.34375]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 6.0, 8.0, 7.0, 7.0, 15.0, 13.0, 22.0, 20.0, 29.0, 26.0, 25.0, 42.0, 35.0, 45.0, 45.0, 55.0, 51.0, 55.0, 69.0, 56.0, 61.0, 48.0, 56.0, 31.0, 43.0, 33.0, 24.0, 14.0, 22.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-47.140663146972656, -46.067935943603516, -44.995208740234375, -43.922481536865234, -42.849754333496094, -41.77703094482422, -40.70430374145508, -39.63157653808594, -38.5588493347168, -37.486122131347656, -36.413394927978516, -35.340667724609375, -34.2679443359375, -33.19521713256836, -32.12248992919922, -31.049762725830078, -29.977035522460938, -28.904308319091797, -27.831581115722656, -26.75885581970215, -25.686128616333008, -24.613401412963867, -23.54067611694336, -22.46794891357422, -21.395221710205078, -20.322494506835938, -19.249767303466797, -18.17704200744629, -17.10431480407715, -16.031587600708008, -14.958861351013184, -13.88613510131836, -12.813411712646484, -11.740684509277344, -10.66795825958252, -9.595232009887695, -8.522504806518555, -7.449778079986572, -6.37705135345459, -5.304324626922607, -4.231597900390625, -3.1588711738586426, -2.08614444732666, -1.0134177207946777, 0.05930900573730469, 1.132035732269287, 2.2047624588012695, 3.277489185333252, 4.350215911865234, 5.422942638397217, 6.495669364929199, 7.568396091461182, 8.641122817993164, 9.713850021362305, 10.786576271057129, 11.859302520751953, 12.932029724121094, 14.004756927490234, 15.077483177185059, 16.150209426879883, 17.222936630249023, 18.295663833618164, 19.368389129638672, 20.441116333007812, 21.513843536376953]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 5.0, 11.0, 12.0, 13.0, 12.0, 17.0, 21.0, 21.0, 27.0, 23.0, 38.0, 30.0, 35.0, 38.0, 39.0, 41.0, 41.0, 29.0, 34.0, 43.0, 44.0, 41.0, 35.0, 34.0, 47.0, 36.0, 23.0, 32.0, 25.0, 25.0, 20.0, 23.0, 11.0, 10.0, 13.0, 8.0, 7.0, 5.0, 4.0, 5.0, 3.0, 7.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-27.810733795166016, -26.96071434020996, -26.110692977905273, -25.26067352294922, -24.41065216064453, -23.560632705688477, -22.710613250732422, -21.860591888427734, -21.010570526123047, -20.160551071166992, -19.310529708862305, -18.46051025390625, -17.610488891601562, -16.760469436645508, -15.910449028015137, -15.060428619384766, -14.210409164428711, -13.36038875579834, -12.510368347167969, -11.660348892211914, -10.810327529907227, -9.960308074951172, -9.1102876663208, -8.26026725769043, -7.410246849060059, -6.5602264404296875, -5.710206031799316, -4.8601861000061035, -4.010165691375732, -3.1601452827453613, -2.3101253509521484, -1.4601049423217773, -0.6100864410400391, 0.23993384838104248, 1.089954137802124, 1.939974308013916, 2.789994716644287, 3.640015125274658, 4.490035057067871, 5.340055465698242, 6.190075874328613, 7.040096282958984, 7.8901166915893555, 8.740137100219727, 9.590156555175781, 10.440177917480469, 11.290197372436523, 12.140217781066895, 12.990238189697266, 13.840258598327637, 14.690279006958008, 15.540298461914062, 16.39031982421875, 17.240339279174805, 18.09035873413086, 18.940380096435547, 19.790401458740234, 20.64042091369629, 21.490442276000977, 22.34046173095703, 23.19048309326172, 24.040502548217773, 24.890522003173828, 25.740543365478516, 26.59056282043457]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 10.0, 13.0, 23.0, 36.0, 47.0, 61.0, 97.0, 185.0, 279.0, 417.0, 699.0, 1105.0, 1899.0, 2858.0, 4604.0, 7230.0, 11395.0, 17506.0, 26139.0, 38377.0, 54357.0, 75168.0, 104453.0, 168303.0, 175372.0, 107937.0, 77328.0, 56011.0, 39384.0, 27044.0, 18022.0, 11798.0, 7626.0, 4813.0, 2994.0, 1853.0, 1114.0, 759.0, 447.0, 284.0, 176.0, 107.0, 66.0, 64.0, 33.0, 20.0, 17.0, 7.0, 10.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.8125, -66.595703125, -64.37890625, -62.162109375, -59.9453125, -57.728515625, -55.51171875, -53.294921875, -51.078125, -48.861328125, -46.64453125, -44.427734375, -42.2109375, -39.994140625, -37.77734375, -35.560546875, -33.34375, -31.126953125, -28.91015625, -26.693359375, -24.4765625, -22.259765625, -20.04296875, -17.826171875, -15.609375, -13.392578125, -11.17578125, -8.958984375, -6.7421875, -4.525390625, -2.30859375, -0.091796875, 2.125, 4.341796875, 6.55859375, 8.775390625, 10.9921875, 13.208984375, 15.42578125, 17.642578125, 19.859375, 22.076171875, 24.29296875, 26.509765625, 28.7265625, 30.943359375, 33.16015625, 35.376953125, 37.59375, 39.810546875, 42.02734375, 44.244140625, 46.4609375, 48.677734375, 50.89453125, 53.111328125, 55.328125, 57.544921875, 59.76171875, 61.978515625, 64.1953125, 66.412109375, 68.62890625, 70.845703125, 73.0625]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 11.0, 12.0, 7.0, 7.0, 10.0, 13.0, 15.0, 22.0, 11.0, 23.0, 38.0, 33.0, 28.0, 39.0, 45.0, 42.0, 69.0, 83.0, 72.0, 59.0, 56.0, 35.0, 44.0, 35.0, 24.0, 26.0, 24.0, 16.0, 14.0, 16.0, 18.0, 9.0, 9.0, 8.0, 7.0, 1.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.453125, -27.559326171875, -26.66552734375, -25.771728515625, -24.8779296875, -23.984130859375, -23.09033203125, -22.196533203125, -21.302734375, -20.408935546875, -19.51513671875, -18.621337890625, -17.7275390625, -16.833740234375, -15.93994140625, -15.046142578125, -14.15234375, -13.258544921875, -12.36474609375, -11.470947265625, -10.5771484375, -9.683349609375, -8.78955078125, -7.895751953125, -7.001953125, -6.108154296875, -5.21435546875, -4.320556640625, -3.4267578125, -2.532958984375, -1.63916015625, -0.745361328125, 0.1484375, 1.042236328125, 1.93603515625, 2.829833984375, 3.7236328125, 4.617431640625, 5.51123046875, 6.405029296875, 7.298828125, 8.192626953125, 9.08642578125, 9.980224609375, 10.8740234375, 11.767822265625, 12.66162109375, 13.555419921875, 14.44921875, 15.343017578125, 16.23681640625, 17.130615234375, 18.0244140625, 18.918212890625, 19.81201171875, 20.705810546875, 21.599609375, 22.493408203125, 23.38720703125, 24.281005859375, 25.1748046875, 26.068603515625, 26.96240234375, 27.856201171875, 28.75]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 6.0, 6.0, 8.0, 14.0, 12.0, 9.0, 20.0, 19.0, 32.0, 24.0, 34.0, 32.0, 31.0, 24.0, 35.0, 43.0, 49.0, 37.0, 50.0, 41.0, 41.0, 47.0, 49.0, 35.0, 40.0, 28.0, 34.0, 27.0, 25.0, 14.0, 23.0, 13.0, 19.0, 15.0, 14.0, 5.0, 8.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.58609676361084, -15.049652099609375, -14.51320743560791, -13.976762771606445, -13.440317153930664, -12.9038724899292, -12.367427825927734, -11.83098316192627, -11.294538497924805, -10.75809383392334, -10.221649169921875, -9.685203552246094, -9.148758888244629, -8.612314224243164, -8.0758695602417, -7.539424896240234, -7.002979278564453, -6.466534614562988, -5.930089473724365, -5.3936448097229, -4.857199668884277, -4.3207550048828125, -3.7843103408813477, -3.2478654384613037, -2.7114205360412598, -2.174975633621216, -1.6385308504104614, -1.102086067199707, -0.5656411647796631, -0.02919626235961914, 0.5072484016418457, 1.0436933040618896, 1.58013916015625, 2.116584062576294, 2.653028964996338, 3.1894736289978027, 3.7259185314178467, 4.262363433837891, 4.7988080978393555, 5.33525276184082, 5.871697902679443, 6.408142566680908, 6.944587707519531, 7.481032371520996, 8.017477035522461, 8.553922653198242, 9.09036636352539, 9.626811981201172, 10.163256645202637, 10.699701309204102, 11.236145973205566, 11.772590637207031, 12.309036254882812, 12.845480918884277, 13.381925582885742, 13.918370246887207, 14.454814910888672, 14.991259574890137, 15.527704238891602, 16.064149856567383, 16.60059356689453, 17.137039184570312, 17.673484802246094, 18.209928512573242, 18.746374130249023]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 8.0, 8.0, 3.0, 6.0, 9.0, 8.0, 12.0, 13.0, 25.0, 22.0, 25.0, 25.0, 22.0, 26.0, 22.0, 29.0, 43.0, 30.0, 43.0, 51.0, 44.0, 44.0, 49.0, 37.0, 34.0, 37.0, 35.0, 35.0, 26.0, 26.0, 29.0, 26.0, 27.0, 18.0, 22.0, 17.0, 13.0, 10.0, 9.0, 4.0, 6.0, 4.0, 1.0, 7.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-16.44671630859375, -15.948348045349121, -15.449978828430176, -14.951610565185547, -14.453241348266602, -13.954873085021973, -13.456504821777344, -12.958135604858398, -12.45976734161377, -11.96139907836914, -11.463029861450195, -10.964661598205566, -10.466293334960938, -9.967924118041992, -9.469555854797363, -8.971187591552734, -8.472818374633789, -7.974449634552002, -7.476080894470215, -6.977712631225586, -6.479343891143799, -5.980975151062012, -5.482606887817383, -4.984238147735596, -4.485869407653809, -3.9875006675720215, -3.4891321659088135, -2.9907636642456055, -2.4923949241638184, -1.9940261840820312, -1.4956576824188232, -0.9972891807556152, -0.4989204406738281, -0.0005518198013305664, 0.497816801071167, 0.9961854219436646, 1.494554042816162, 1.9929227828979492, 2.4912912845611572, 2.9896597862243652, 3.4880285263061523, 3.9863972663879395, 4.484766006469727, 4.9831342697143555, 5.481503009796143, 5.97987174987793, 6.478240013122559, 6.976608753204346, 7.474977493286133, 7.97334623336792, 8.471714973449707, 8.970083236694336, 9.468452453613281, 9.96682071685791, 10.465188980102539, 10.963558197021484, 11.461926460266113, 11.960294723510742, 12.458663940429688, 12.957032203674316, 13.455400466918945, 13.95376968383789, 14.45213794708252, 14.950506210327148, 15.448875427246094]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 2.0, 4.0, 8.0, 15.0, 12.0, 19.0, 25.0, 35.0, 66.0, 105.0, 185.0, 341.0, 567.0, 1158.0, 2227.0, 4543.0, 9617.0, 21755.0, 51677.0, 135006.0, 399320.0, 1160400.0, 1479153.0, 598464.0, 200068.0, 74061.0, 30175.0, 13092.0, 5989.0, 2871.0, 1504.0, 776.0, 412.0, 254.0, 138.0, 69.0, 60.0, 30.0, 31.0, 16.0, 8.0, 7.0, 5.0, 3.0, 3.0, 5.0, 2.0, 3.0], "bins": [-40.8125, -39.74365234375, -38.6748046875, -37.60595703125, -36.537109375, -35.46826171875, -34.3994140625, -33.33056640625, -32.26171875, -31.19287109375, -30.1240234375, -29.05517578125, -27.986328125, -26.91748046875, -25.8486328125, -24.77978515625, -23.7109375, -22.64208984375, -21.5732421875, -20.50439453125, -19.435546875, -18.36669921875, -17.2978515625, -16.22900390625, -15.16015625, -14.09130859375, -13.0224609375, -11.95361328125, -10.884765625, -9.81591796875, -8.7470703125, -7.67822265625, -6.609375, -5.54052734375, -4.4716796875, -3.40283203125, -2.333984375, -1.26513671875, -0.1962890625, 0.87255859375, 1.94140625, 3.01025390625, 4.0791015625, 5.14794921875, 6.216796875, 7.28564453125, 8.3544921875, 9.42333984375, 10.4921875, 11.56103515625, 12.6298828125, 13.69873046875, 14.767578125, 15.83642578125, 16.9052734375, 17.97412109375, 19.04296875, 20.11181640625, 21.1806640625, 22.24951171875, 23.318359375, 24.38720703125, 25.4560546875, 26.52490234375, 27.59375]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 1.0, 1.0, 5.0, 2.0, 4.0, 10.0, 7.0, 8.0, 5.0, 13.0, 18.0, 12.0, 17.0, 21.0, 24.0, 25.0, 23.0, 42.0, 36.0, 34.0, 31.0, 36.0, 39.0, 36.0, 48.0, 48.0, 52.0, 41.0, 30.0, 33.0, 33.0, 37.0, 29.0, 27.0, 26.0, 19.0, 28.0, 18.0, 15.0, 16.0, 13.0, 7.0, 6.0, 6.0, 7.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.265625, -13.8173828125, -13.369140625, -12.9208984375, -12.47265625, -12.0244140625, -11.576171875, -11.1279296875, -10.6796875, -10.2314453125, -9.783203125, -9.3349609375, -8.88671875, -8.4384765625, -7.990234375, -7.5419921875, -7.09375, -6.6455078125, -6.197265625, -5.7490234375, -5.30078125, -4.8525390625, -4.404296875, -3.9560546875, -3.5078125, -3.0595703125, -2.611328125, -2.1630859375, -1.71484375, -1.2666015625, -0.818359375, -0.3701171875, 0.078125, 0.5263671875, 0.974609375, 1.4228515625, 1.87109375, 2.3193359375, 2.767578125, 3.2158203125, 3.6640625, 4.1123046875, 4.560546875, 5.0087890625, 5.45703125, 5.9052734375, 6.353515625, 6.8017578125, 7.25, 7.6982421875, 8.146484375, 8.5947265625, 9.04296875, 9.4912109375, 9.939453125, 10.3876953125, 10.8359375, 11.2841796875, 11.732421875, 12.1806640625, 12.62890625, 13.0771484375, 13.525390625, 13.9736328125, 14.421875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 11.0, 10.0, 17.0, 27.0, 44.0, 47.0, 99.0, 148.0, 296.0, 467.0, 828.0, 1470.0, 2754.0, 5287.0, 10157.0, 21992.0, 48979.0, 115171.0, 281655.0, 692035.0, 1380355.0, 951061.0, 396105.0, 160315.0, 67318.0, 29282.0, 13749.0, 6752.0, 3433.0, 1849.0, 1026.0, 603.0, 370.0, 225.0, 141.0, 70.0, 53.0, 27.0, 19.0, 16.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-33.78125, -32.807373046875, -31.83349609375, -30.859619140625, -29.8857421875, -28.911865234375, -27.93798828125, -26.964111328125, -25.990234375, -25.016357421875, -24.04248046875, -23.068603515625, -22.0947265625, -21.120849609375, -20.14697265625, -19.173095703125, -18.19921875, -17.225341796875, -16.25146484375, -15.277587890625, -14.3037109375, -13.329833984375, -12.35595703125, -11.382080078125, -10.408203125, -9.434326171875, -8.46044921875, -7.486572265625, -6.5126953125, -5.538818359375, -4.56494140625, -3.591064453125, -2.6171875, -1.643310546875, -0.66943359375, 0.304443359375, 1.2783203125, 2.252197265625, 3.22607421875, 4.199951171875, 5.173828125, 6.147705078125, 7.12158203125, 8.095458984375, 9.0693359375, 10.043212890625, 11.01708984375, 11.990966796875, 12.96484375, 13.938720703125, 14.91259765625, 15.886474609375, 16.8603515625, 17.834228515625, 18.80810546875, 19.781982421875, 20.755859375, 21.729736328125, 22.70361328125, 23.677490234375, 24.6513671875, 25.625244140625, 26.59912109375, 27.572998046875, 28.546875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 13.0, 9.0, 16.0, 16.0, 16.0, 23.0, 30.0, 39.0, 45.0, 57.0, 67.0, 99.0, 115.0, 117.0, 171.0, 222.0, 257.0, 311.0, 319.0, 365.0, 344.0, 266.0, 255.0, 198.0, 158.0, 120.0, 108.0, 86.0, 55.0, 38.0, 32.0, 18.0, 23.0, 22.0, 13.0, 11.0, 7.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.661865234375, -7.39404296875, -7.126220703125, -6.8583984375, -6.590576171875, -6.32275390625, -6.054931640625, -5.787109375, -5.519287109375, -5.25146484375, -4.983642578125, -4.7158203125, -4.447998046875, -4.18017578125, -3.912353515625, -3.64453125, -3.376708984375, -3.10888671875, -2.841064453125, -2.5732421875, -2.305419921875, -2.03759765625, -1.769775390625, -1.501953125, -1.234130859375, -0.96630859375, -0.698486328125, -0.4306640625, -0.162841796875, 0.10498046875, 0.372802734375, 0.640625, 0.908447265625, 1.17626953125, 1.444091796875, 1.7119140625, 1.979736328125, 2.24755859375, 2.515380859375, 2.783203125, 3.051025390625, 3.31884765625, 3.586669921875, 3.8544921875, 4.122314453125, 4.39013671875, 4.657958984375, 4.92578125, 5.193603515625, 5.46142578125, 5.729248046875, 5.9970703125, 6.264892578125, 6.53271484375, 6.800537109375, 7.068359375, 7.336181640625, 7.60400390625, 7.871826171875, 8.1396484375, 8.407470703125, 8.67529296875, 8.943115234375, 9.2109375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 5.0, 7.0, 11.0, 8.0, 17.0, 19.0, 28.0, 32.0, 28.0, 44.0, 42.0, 55.0, 58.0, 55.0, 67.0, 49.0, 68.0, 50.0, 57.0, 50.0, 46.0, 36.0, 22.0, 27.0, 22.0, 20.0, 16.0, 10.0, 6.0, 7.0, 3.0, 4.0, 4.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.66727066040039, -15.98918342590332, -15.31109619140625, -14.63300895690918, -13.95492172241211, -13.276834487915039, -12.598746299743652, -11.920659065246582, -11.242571830749512, -10.564484596252441, -9.886397361755371, -9.208309173583984, -8.530221939086914, -7.852135181427002, -7.174047470092773, -6.495960235595703, -5.817873001098633, -5.1397857666015625, -4.461698532104492, -3.7836108207702637, -3.1055235862731934, -2.427436351776123, -1.7493486404418945, -1.0712614059448242, -0.3931741714477539, 0.28491318225860596, 0.9630005359649658, 1.6410880088806152, 2.3191752433776855, 2.997262477874756, 3.6753501892089844, 4.353437423706055, 5.031524658203125, 5.709611892700195, 6.387699127197266, 7.065786838531494, 7.7438740730285645, 8.421960830688477, 9.100049018859863, 9.778136253356934, 10.456223487854004, 11.134310722351074, 11.812397956848145, 12.490486145019531, 13.168573379516602, 13.846660614013672, 14.524747848510742, 15.202835083007812, 15.880922317504883, 16.559009552001953, 17.237096786499023, 17.915184020996094, 18.593271255493164, 19.271358489990234, 19.949447631835938, 20.627532958984375, 21.305622100830078, 21.98370933532715, 22.66179656982422, 23.33988380432129, 24.01797103881836, 24.69605827331543, 25.3741455078125, 26.052234649658203, 26.73031997680664]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 6.0, 4.0, 12.0, 6.0, 5.0, 12.0, 12.0, 12.0, 14.0, 23.0, 23.0, 16.0, 23.0, 34.0, 29.0, 29.0, 49.0, 50.0, 45.0, 46.0, 47.0, 46.0, 48.0, 46.0, 32.0, 28.0, 44.0, 32.0, 22.0, 31.0, 29.0, 26.0, 21.0, 18.0, 12.0, 9.0, 14.0, 9.0, 13.0, 5.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.349449157714844, -18.798690795898438, -18.247934341430664, -17.697175979614258, -17.14641761779785, -16.595661163330078, -16.044902801513672, -15.494144439697266, -14.943387031555176, -14.392629623413086, -13.84187126159668, -13.29111385345459, -12.7403564453125, -12.189598083496094, -11.638840675354004, -11.088083267211914, -10.537324905395508, -9.986567497253418, -9.435809135437012, -8.885051727294922, -8.334293365478516, -7.783535957336426, -7.232778549194336, -6.682020664215088, -6.13126277923584, -5.580504894256592, -5.029747009277344, -4.478989601135254, -3.928231716156006, -3.377473831176758, -2.826716184616089, -2.27595853805542, -1.7251996994018555, -1.174441933631897, -0.6236841678619385, -0.07292640209197998, 0.4778313636779785, 1.0285892486572266, 1.5793468952178955, 2.1301045417785645, 2.6808624267578125, 3.2316203117370605, 3.7823779582977295, 4.333135604858398, 4.8838934898376465, 5.4346513748168945, 5.985408782958984, 6.536166667938232, 7.0869245529174805, 7.6376824378967285, 8.188440322875977, 8.739197731018066, 9.289955139160156, 9.840713500976562, 10.391470909118652, 10.942228317260742, 11.492986679077148, 12.043744087219238, 12.594502449035645, 13.145259857177734, 13.69601821899414, 14.24677562713623, 14.79753303527832, 15.348291397094727, 15.899048805236816]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 7.0, 4.0, 21.0, 38.0, 42.0, 69.0, 80.0, 137.0, 239.0, 354.0, 553.0, 858.0, 1337.0, 2108.0, 3239.0, 5077.0, 7771.0, 11889.0, 17783.0, 26921.0, 39920.0, 57111.0, 81108.0, 108010.0, 132106.0, 137480.0, 118694.0, 91148.0, 65582.0, 46169.0, 31322.0, 21487.0, 13786.0, 9236.0, 5939.0, 3802.0, 2545.0, 1621.0, 1050.0, 683.0, 438.0, 274.0, 154.0, 130.0, 85.0, 45.0, 38.0, 23.0, 16.0, 6.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-32.125, -31.127197265625, -30.12939453125, -29.131591796875, -28.1337890625, -27.135986328125, -26.13818359375, -25.140380859375, -24.142578125, -23.144775390625, -22.14697265625, -21.149169921875, -20.1513671875, -19.153564453125, -18.15576171875, -17.157958984375, -16.16015625, -15.162353515625, -14.16455078125, -13.166748046875, -12.1689453125, -11.171142578125, -10.17333984375, -9.175537109375, -8.177734375, -7.179931640625, -6.18212890625, -5.184326171875, -4.1865234375, -3.188720703125, -2.19091796875, -1.193115234375, -0.1953125, 0.802490234375, 1.80029296875, 2.798095703125, 3.7958984375, 4.793701171875, 5.79150390625, 6.789306640625, 7.787109375, 8.784912109375, 9.78271484375, 10.780517578125, 11.7783203125, 12.776123046875, 13.77392578125, 14.771728515625, 15.76953125, 16.767333984375, 17.76513671875, 18.762939453125, 19.7607421875, 20.758544921875, 21.75634765625, 22.754150390625, 23.751953125, 24.749755859375, 25.74755859375, 26.745361328125, 27.7431640625, 28.740966796875, 29.73876953125, 30.736572265625, 31.734375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 0.0, 3.0, 6.0, 6.0, 4.0, 5.0, 10.0, 11.0, 13.0, 12.0, 11.0, 17.0, 20.0, 25.0, 29.0, 30.0, 33.0, 36.0, 40.0, 31.0, 51.0, 46.0, 56.0, 55.0, 56.0, 46.0, 41.0, 34.0, 39.0, 39.0, 27.0, 28.0, 27.0, 22.0, 18.0, 16.0, 12.0, 14.0, 6.0, 6.0, 7.0, 7.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.734375, -15.22509765625, -14.7158203125, -14.20654296875, -13.697265625, -13.18798828125, -12.6787109375, -12.16943359375, -11.66015625, -11.15087890625, -10.6416015625, -10.13232421875, -9.623046875, -9.11376953125, -8.6044921875, -8.09521484375, -7.5859375, -7.07666015625, -6.5673828125, -6.05810546875, -5.548828125, -5.03955078125, -4.5302734375, -4.02099609375, -3.51171875, -3.00244140625, -2.4931640625, -1.98388671875, -1.474609375, -0.96533203125, -0.4560546875, 0.05322265625, 0.5625, 1.07177734375, 1.5810546875, 2.09033203125, 2.599609375, 3.10888671875, 3.6181640625, 4.12744140625, 4.63671875, 5.14599609375, 5.6552734375, 6.16455078125, 6.673828125, 7.18310546875, 7.6923828125, 8.20166015625, 8.7109375, 9.22021484375, 9.7294921875, 10.23876953125, 10.748046875, 11.25732421875, 11.7666015625, 12.27587890625, 12.78515625, 13.29443359375, 13.8037109375, 14.31298828125, 14.822265625, 15.33154296875, 15.8408203125, 16.35009765625, 16.859375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 9.0, 28.0, 18.0, 34.0, 42.0, 73.0, 101.0, 130.0, 216.0, 276.0, 367.0, 514.0, 767.0, 1084.0, 1612.0, 2541.0, 4186.0, 7090.0, 12501.0, 25783.0, 65036.0, 218725.0, 438930.0, 166569.0, 52165.0, 21560.0, 11055.0, 6215.0, 3735.0, 2350.0, 1521.0, 961.0, 742.0, 476.0, 351.0, 211.0, 158.0, 115.0, 70.0, 73.0, 51.0, 37.0, 25.0, 22.0, 8.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.78125, -57.876953125, -55.97265625, -54.068359375, -52.1640625, -50.259765625, -48.35546875, -46.451171875, -44.546875, -42.642578125, -40.73828125, -38.833984375, -36.9296875, -35.025390625, -33.12109375, -31.216796875, -29.3125, -27.408203125, -25.50390625, -23.599609375, -21.6953125, -19.791015625, -17.88671875, -15.982421875, -14.078125, -12.173828125, -10.26953125, -8.365234375, -6.4609375, -4.556640625, -2.65234375, -0.748046875, 1.15625, 3.060546875, 4.96484375, 6.869140625, 8.7734375, 10.677734375, 12.58203125, 14.486328125, 16.390625, 18.294921875, 20.19921875, 22.103515625, 24.0078125, 25.912109375, 27.81640625, 29.720703125, 31.625, 33.529296875, 35.43359375, 37.337890625, 39.2421875, 41.146484375, 43.05078125, 44.955078125, 46.859375, 48.763671875, 50.66796875, 52.572265625, 54.4765625, 56.380859375, 58.28515625, 60.189453125, 62.09375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 6.0, 4.0, 12.0, 15.0, 15.0, 20.0, 24.0, 31.0, 25.0, 23.0, 31.0, 36.0, 39.0, 32.0, 39.0, 42.0, 50.0, 47.0, 41.0, 45.0, 52.0, 46.0, 35.0, 31.0, 39.0, 25.0, 22.0, 18.0, 12.0, 22.0, 24.0, 17.0, 7.0, 10.0, 10.0, 4.0, 7.0, 3.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5, -13.008056640625, -12.51611328125, -12.024169921875, -11.5322265625, -11.040283203125, -10.54833984375, -10.056396484375, -9.564453125, -9.072509765625, -8.58056640625, -8.088623046875, -7.5966796875, -7.104736328125, -6.61279296875, -6.120849609375, -5.62890625, -5.136962890625, -4.64501953125, -4.153076171875, -3.6611328125, -3.169189453125, -2.67724609375, -2.185302734375, -1.693359375, -1.201416015625, -0.70947265625, -0.217529296875, 0.2744140625, 0.766357421875, 1.25830078125, 1.750244140625, 2.2421875, 2.734130859375, 3.22607421875, 3.718017578125, 4.2099609375, 4.701904296875, 5.19384765625, 5.685791015625, 6.177734375, 6.669677734375, 7.16162109375, 7.653564453125, 8.1455078125, 8.637451171875, 9.12939453125, 9.621337890625, 10.11328125, 10.605224609375, 11.09716796875, 11.589111328125, 12.0810546875, 12.572998046875, 13.06494140625, 13.556884765625, 14.048828125, 14.540771484375, 15.03271484375, 15.524658203125, 16.0166015625, 16.508544921875, 17.00048828125, 17.492431640625, 17.984375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 5.0, 10.0, 6.0, 3.0, 12.0, 11.0, 19.0, 27.0, 21.0, 38.0, 72.0, 91.0, 150.0, 235.0, 371.0, 723.0, 1342.0, 2520.0, 5643.0, 16741.0, 76278.0, 756506.0, 148052.0, 25013.0, 7684.0, 3211.0, 1598.0, 840.0, 499.0, 299.0, 166.0, 101.0, 66.0, 51.0, 39.0, 26.0, 20.0, 16.0, 14.0, 9.0, 9.0, 3.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-259.0, -250.55078125, -242.1015625, -233.65234375, -225.203125, -216.75390625, -208.3046875, -199.85546875, -191.40625, -182.95703125, -174.5078125, -166.05859375, -157.609375, -149.16015625, -140.7109375, -132.26171875, -123.8125, -115.36328125, -106.9140625, -98.46484375, -90.015625, -81.56640625, -73.1171875, -64.66796875, -56.21875, -47.76953125, -39.3203125, -30.87109375, -22.421875, -13.97265625, -5.5234375, 2.92578125, 11.375, 19.82421875, 28.2734375, 36.72265625, 45.171875, 53.62109375, 62.0703125, 70.51953125, 78.96875, 87.41796875, 95.8671875, 104.31640625, 112.765625, 121.21484375, 129.6640625, 138.11328125, 146.5625, 155.01171875, 163.4609375, 171.91015625, 180.359375, 188.80859375, 197.2578125, 205.70703125, 214.15625, 222.60546875, 231.0546875, 239.50390625, 247.953125, 256.40234375, 264.8515625, 273.30078125, 281.75]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 6.0, 9.0, 12.0, 13.0, 24.0, 21.0, 29.0, 35.0, 44.0, 68.0, 104.0, 200.0, 110.0, 72.0, 61.0, 39.0, 39.0, 26.0, 17.0, 13.0, 13.0, 4.0, 11.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023284912109375, -0.022525787353515625, -0.02176666259765625, -0.021007537841796875, -0.0202484130859375, -0.019489288330078125, -0.01873016357421875, -0.017971038818359375, -0.0172119140625, -0.016452789306640625, -0.01569366455078125, -0.014934539794921875, -0.0141754150390625, -0.013416290283203125, -0.01265716552734375, -0.011898040771484375, -0.011138916015625, -0.010379791259765625, -0.00962066650390625, -0.008861541748046875, -0.0081024169921875, -0.007343292236328125, -0.00658416748046875, -0.005825042724609375, -0.00506591796875, -0.004306793212890625, -0.00354766845703125, -0.002788543701171875, -0.0020294189453125, -0.001270294189453125, -0.00051116943359375, 0.000247955322265625, 0.001007080078125, 0.001766204833984375, 0.00252532958984375, 0.003284454345703125, 0.0040435791015625, 0.004802703857421875, 0.00556182861328125, 0.006320953369140625, 0.007080078125, 0.007839202880859375, 0.00859832763671875, 0.009357452392578125, 0.0101165771484375, 0.010875701904296875, 0.01163482666015625, 0.012393951416015625, 0.013153076171875, 0.013912200927734375, 0.01467132568359375, 0.015430450439453125, 0.0161895751953125, 0.016948699951171875, 0.01770782470703125, 0.018466949462890625, 0.01922607421875, 0.019985198974609375, 0.02074432373046875, 0.021503448486328125, 0.0222625732421875, 0.023021697998046875, 0.02378082275390625, 0.024539947509765625, 0.025299072265625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 5.0, 5.0, 13.0, 11.0, 10.0, 24.0, 35.0, 45.0, 55.0, 73.0, 104.0, 147.0, 216.0, 342.0, 466.0, 710.0, 1041.0, 1525.0, 2415.0, 4081.0, 7097.0, 13551.0, 29046.0, 79767.0, 360085.0, 397983.0, 85587.0, 30762.0, 14198.0, 7448.0, 4193.0, 2527.0, 1682.0, 1044.0, 671.0, 484.0, 294.0, 219.0, 147.0, 120.0, 97.0, 70.0, 45.0, 29.0, 24.0, 21.0, 14.0, 10.0, 6.0, 8.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-62.0, -60.123046875, -58.24609375, -56.369140625, -54.4921875, -52.615234375, -50.73828125, -48.861328125, -46.984375, -45.107421875, -43.23046875, -41.353515625, -39.4765625, -37.599609375, -35.72265625, -33.845703125, -31.96875, -30.091796875, -28.21484375, -26.337890625, -24.4609375, -22.583984375, -20.70703125, -18.830078125, -16.953125, -15.076171875, -13.19921875, -11.322265625, -9.4453125, -7.568359375, -5.69140625, -3.814453125, -1.9375, -0.060546875, 1.81640625, 3.693359375, 5.5703125, 7.447265625, 9.32421875, 11.201171875, 13.078125, 14.955078125, 16.83203125, 18.708984375, 20.5859375, 22.462890625, 24.33984375, 26.216796875, 28.09375, 29.970703125, 31.84765625, 33.724609375, 35.6015625, 37.478515625, 39.35546875, 41.232421875, 43.109375, 44.986328125, 46.86328125, 48.740234375, 50.6171875, 52.494140625, 54.37109375, 56.248046875, 58.125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 0.0, 6.0, 5.0, 8.0, 10.0, 10.0, 12.0, 15.0, 14.0, 14.0, 28.0, 44.0, 34.0, 49.0, 40.0, 67.0, 92.0, 106.0, 82.0, 60.0, 49.0, 36.0, 42.0, 24.0, 29.0, 21.0, 23.0, 10.0, 8.0, 8.0, 8.0, 6.0, 10.0, 9.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-14.0859375, -13.6749267578125, -13.263916015625, -12.8529052734375, -12.44189453125, -12.0308837890625, -11.619873046875, -11.2088623046875, -10.7978515625, -10.3868408203125, -9.975830078125, -9.5648193359375, -9.15380859375, -8.7427978515625, -8.331787109375, -7.9207763671875, -7.509765625, -7.0987548828125, -6.687744140625, -6.2767333984375, -5.86572265625, -5.4547119140625, -5.043701171875, -4.6326904296875, -4.2216796875, -3.8106689453125, -3.399658203125, -2.9886474609375, -2.57763671875, -2.1666259765625, -1.755615234375, -1.3446044921875, -0.93359375, -0.5225830078125, -0.111572265625, 0.2994384765625, 0.71044921875, 1.1214599609375, 1.532470703125, 1.9434814453125, 2.3544921875, 2.7655029296875, 3.176513671875, 3.5875244140625, 3.99853515625, 4.4095458984375, 4.820556640625, 5.2315673828125, 5.642578125, 6.0535888671875, 6.464599609375, 6.8756103515625, 7.28662109375, 7.6976318359375, 8.108642578125, 8.5196533203125, 8.9306640625, 9.3416748046875, 9.752685546875, 10.1636962890625, 10.57470703125, 10.9857177734375, 11.396728515625, 11.8077392578125, 12.21875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 7.0, 1.0, 8.0, 7.0, 5.0, 11.0, 15.0, 16.0, 22.0, 24.0, 39.0, 39.0, 52.0, 91.0, 90.0, 104.0, 97.0, 82.0, 58.0, 45.0, 39.0, 34.0, 29.0, 18.0, 12.0, 10.0, 7.0, 6.0, 9.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-35.681339263916016, -34.799903869628906, -33.9184684753418, -33.03703308105469, -32.15559387207031, -31.274158477783203, -30.392723083496094, -29.511287689208984, -28.629850387573242, -27.748414993286133, -26.86697769165039, -25.98554229736328, -25.104106903076172, -24.22266960144043, -23.34123420715332, -22.459796905517578, -21.57836151123047, -20.69692611694336, -19.815488815307617, -18.934053421020508, -18.0526180267334, -17.171180725097656, -16.289745330810547, -15.408308982849121, -14.526874542236328, -13.645438194274902, -12.764002799987793, -11.882566452026367, -11.001130104064941, -10.119693756103516, -9.238258361816406, -8.35682201385498, -7.475385665893555, -6.593949794769287, -5.712513446807861, -4.831077575683594, -3.949641466140747, -3.0682053565979004, -2.186769485473633, -1.305333137512207, -0.42389726638793945, 0.45753878355026245, 1.3389748334884644, 2.2204108238220215, 3.101846933364868, 3.983283042907715, 4.864718914031982, 5.746155261993408, 6.627591133117676, 7.509027004241943, 8.390462875366211, 9.271899223327637, 10.153335571289062, 11.034770965576172, 11.916207313537598, 12.797643661499023, 13.679079055786133, 14.560515403747559, 15.441950798034668, 16.323387145996094, 17.204822540283203, 18.086259841918945, 18.967695236206055, 19.849132537841797, 20.730567932128906]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 9.0, 10.0, 8.0, 14.0, 19.0, 17.0, 17.0, 25.0, 19.0, 27.0, 21.0, 36.0, 30.0, 42.0, 29.0, 40.0, 33.0, 49.0, 46.0, 44.0, 47.0, 41.0, 38.0, 36.0, 42.0, 36.0, 24.0, 27.0, 24.0, 28.0, 17.0, 12.0, 20.0, 14.0, 15.0, 7.0, 11.0, 9.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.817935943603516, -22.118282318115234, -21.418628692626953, -20.718975067138672, -20.01932144165039, -19.31966781616211, -18.620014190673828, -17.920360565185547, -17.220706939697266, -16.521053314208984, -15.821399688720703, -15.121746063232422, -14.42209243774414, -13.72243881225586, -13.022786140441895, -12.323132514953613, -11.623479843139648, -10.923826217651367, -10.224172592163086, -9.524518966674805, -8.824865341186523, -8.125211715698242, -7.425559043884277, -6.725905418395996, -6.026251792907715, -5.326598167419434, -4.626944541931152, -3.9272913932800293, -3.227637767791748, -2.527984142303467, -1.8283309936523438, -1.1286773681640625, -0.42902374267578125, 0.27062976360321045, 0.9702832698822021, 1.6699366569519043, 2.3695902824401855, 3.069243907928467, 3.76889705657959, 4.468550682067871, 5.168204307556152, 5.867857933044434, 6.567511558532715, 7.267164707183838, 7.966818332672119, 8.666471481323242, 9.366125106811523, 10.065778732299805, 10.765432357788086, 11.465085983276367, 12.164739608764648, 12.86439323425293, 13.564046859741211, 14.263700485229492, 14.963353157043457, 15.663006782531738, 16.362659454345703, 17.062313079833984, 17.761966705322266, 18.461620330810547, 19.161273956298828, 19.86092758178711, 20.56058120727539, 21.260234832763672, 21.959888458251953]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 8.0, 6.0, 24.0, 22.0, 41.0, 48.0, 77.0, 85.0, 136.0, 204.0, 327.0, 490.0, 734.0, 1181.0, 1897.0, 3230.0, 5625.0, 10420.0, 21276.0, 46800.0, 118080.0, 301143.0, 314073.0, 125312.0, 49490.0, 22250.0, 10891.0, 5865.0, 3302.0, 1929.0, 1217.0, 812.0, 503.0, 337.0, 239.0, 132.0, 96.0, 70.0, 45.0, 30.0, 30.0, 10.0, 16.0, 7.0, 10.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-48.125, -46.62255859375, -45.1201171875, -43.61767578125, -42.115234375, -40.61279296875, -39.1103515625, -37.60791015625, -36.10546875, -34.60302734375, -33.1005859375, -31.59814453125, -30.095703125, -28.59326171875, -27.0908203125, -25.58837890625, -24.0859375, -22.58349609375, -21.0810546875, -19.57861328125, -18.076171875, -16.57373046875, -15.0712890625, -13.56884765625, -12.06640625, -10.56396484375, -9.0615234375, -7.55908203125, -6.056640625, -4.55419921875, -3.0517578125, -1.54931640625, -0.046875, 1.45556640625, 2.9580078125, 4.46044921875, 5.962890625, 7.46533203125, 8.9677734375, 10.47021484375, 11.97265625, 13.47509765625, 14.9775390625, 16.47998046875, 17.982421875, 19.48486328125, 20.9873046875, 22.48974609375, 23.9921875, 25.49462890625, 26.9970703125, 28.49951171875, 30.001953125, 31.50439453125, 33.0068359375, 34.50927734375, 36.01171875, 37.51416015625, 39.0166015625, 40.51904296875, 42.021484375, 43.52392578125, 45.0263671875, 46.52880859375, 48.03125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 10.0, 10.0, 9.0, 15.0, 14.0, 20.0, 18.0, 16.0, 22.0, 26.0, 29.0, 40.0, 32.0, 25.0, 52.0, 38.0, 42.0, 49.0, 51.0, 39.0, 54.0, 45.0, 29.0, 31.0, 34.0, 35.0, 31.0, 23.0, 21.0, 21.0, 18.0, 11.0, 19.0, 13.0, 11.0, 8.0, 10.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.984375, -13.5386962890625, -13.093017578125, -12.6473388671875, -12.20166015625, -11.7559814453125, -11.310302734375, -10.8646240234375, -10.4189453125, -9.9732666015625, -9.527587890625, -9.0819091796875, -8.63623046875, -8.1905517578125, -7.744873046875, -7.2991943359375, -6.853515625, -6.4078369140625, -5.962158203125, -5.5164794921875, -5.07080078125, -4.6251220703125, -4.179443359375, -3.7337646484375, -3.2880859375, -2.8424072265625, -2.396728515625, -1.9510498046875, -1.50537109375, -1.0596923828125, -0.614013671875, -0.1683349609375, 0.27734375, 0.7230224609375, 1.168701171875, 1.6143798828125, 2.06005859375, 2.5057373046875, 2.951416015625, 3.3970947265625, 3.8427734375, 4.2884521484375, 4.734130859375, 5.1798095703125, 5.62548828125, 6.0711669921875, 6.516845703125, 6.9625244140625, 7.408203125, 7.8538818359375, 8.299560546875, 8.7452392578125, 9.19091796875, 9.6365966796875, 10.082275390625, 10.5279541015625, 10.9736328125, 11.4193115234375, 11.864990234375, 12.3106689453125, 12.75634765625, 13.2020263671875, 13.647705078125, 14.0933837890625, 14.5390625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 8.0, 10.0, 5.0, 17.0, 17.0, 24.0, 32.0, 55.0, 60.0, 84.0, 102.0, 157.0, 228.0, 330.0, 498.0, 764.0, 1100.0, 2068.0, 3248.0, 6058.0, 12427.0, 28918.0, 85821.0, 403852.0, 368334.0, 80326.0, 27772.0, 11890.0, 5785.0, 3170.0, 1892.0, 1171.0, 703.0, 509.0, 357.0, 203.0, 143.0, 118.0, 72.0, 63.0, 53.0, 35.0, 17.0, 13.0, 10.0, 14.0, 5.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-76.6875, -74.12890625, -71.5703125, -69.01171875, -66.453125, -63.89453125, -61.3359375, -58.77734375, -56.21875, -53.66015625, -51.1015625, -48.54296875, -45.984375, -43.42578125, -40.8671875, -38.30859375, -35.75, -33.19140625, -30.6328125, -28.07421875, -25.515625, -22.95703125, -20.3984375, -17.83984375, -15.28125, -12.72265625, -10.1640625, -7.60546875, -5.046875, -2.48828125, 0.0703125, 2.62890625, 5.1875, 7.74609375, 10.3046875, 12.86328125, 15.421875, 17.98046875, 20.5390625, 23.09765625, 25.65625, 28.21484375, 30.7734375, 33.33203125, 35.890625, 38.44921875, 41.0078125, 43.56640625, 46.125, 48.68359375, 51.2421875, 53.80078125, 56.359375, 58.91796875, 61.4765625, 64.03515625, 66.59375, 69.15234375, 71.7109375, 74.26953125, 76.828125, 79.38671875, 81.9453125, 84.50390625, 87.0625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 2.0, 8.0, 3.0, 7.0, 8.0, 9.0, 8.0, 11.0, 10.0, 18.0, 22.0, 29.0, 32.0, 39.0, 57.0, 49.0, 66.0, 75.0, 74.0, 64.0, 62.0, 59.0, 62.0, 41.0, 44.0, 29.0, 18.0, 13.0, 14.0, 9.0, 7.0, 12.0, 9.0, 6.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.171875, -20.576171875, -19.98046875, -19.384765625, -18.7890625, -18.193359375, -17.59765625, -17.001953125, -16.40625, -15.810546875, -15.21484375, -14.619140625, -14.0234375, -13.427734375, -12.83203125, -12.236328125, -11.640625, -11.044921875, -10.44921875, -9.853515625, -9.2578125, -8.662109375, -8.06640625, -7.470703125, -6.875, -6.279296875, -5.68359375, -5.087890625, -4.4921875, -3.896484375, -3.30078125, -2.705078125, -2.109375, -1.513671875, -0.91796875, -0.322265625, 0.2734375, 0.869140625, 1.46484375, 2.060546875, 2.65625, 3.251953125, 3.84765625, 4.443359375, 5.0390625, 5.634765625, 6.23046875, 6.826171875, 7.421875, 8.017578125, 8.61328125, 9.208984375, 9.8046875, 10.400390625, 10.99609375, 11.591796875, 12.1875, 12.783203125, 13.37890625, 13.974609375, 14.5703125, 15.166015625, 15.76171875, 16.357421875, 16.953125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 3.0, 6.0, 4.0, 8.0, 3.0, 3.0, 17.0, 17.0, 15.0, 27.0, 38.0, 67.0, 87.0, 148.0, 181.0, 295.0, 527.0, 1023.0, 2145.0, 5267.0, 16578.0, 82798.0, 836639.0, 77005.0, 15861.0, 5270.0, 2106.0, 960.0, 540.0, 305.0, 170.0, 124.0, 86.0, 60.0, 40.0, 31.0, 18.0, 21.0, 13.0, 11.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-91.5, -88.59375, -85.6875, -82.78125, -79.875, -76.96875, -74.0625, -71.15625, -68.25, -65.34375, -62.4375, -59.53125, -56.625, -53.71875, -50.8125, -47.90625, -45.0, -42.09375, -39.1875, -36.28125, -33.375, -30.46875, -27.5625, -24.65625, -21.75, -18.84375, -15.9375, -13.03125, -10.125, -7.21875, -4.3125, -1.40625, 1.5, 4.40625, 7.3125, 10.21875, 13.125, 16.03125, 18.9375, 21.84375, 24.75, 27.65625, 30.5625, 33.46875, 36.375, 39.28125, 42.1875, 45.09375, 48.0, 50.90625, 53.8125, 56.71875, 59.625, 62.53125, 65.4375, 68.34375, 71.25, 74.15625, 77.0625, 79.96875, 82.875, 85.78125, 88.6875, 91.59375, 94.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 12.0, 11.0, 22.0, 44.0, 86.0, 301.0, 307.0, 109.0, 47.0, 30.0, 12.0, 5.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00382232666015625, -0.0036489367485046387, -0.0034755468368530273, -0.003302156925201416, -0.0031287670135498047, -0.0029553771018981934, -0.002781987190246582, -0.0026085972785949707, -0.0024352073669433594, -0.002261817455291748, -0.0020884275436401367, -0.0019150376319885254, -0.001741647720336914, -0.0015682578086853027, -0.0013948678970336914, -0.00122147798538208, -0.0010480880737304688, -0.0008746981620788574, -0.0007013082504272461, -0.0005279183387756348, -0.00035452842712402344, -0.0001811385154724121, -7.748603820800781e-06, 0.00016564130783081055, 0.0003390312194824219, 0.0005124211311340332, 0.0006858110427856445, 0.0008592009544372559, 0.0010325908660888672, 0.0012059807777404785, 0.0013793706893920898, 0.0015527606010437012, 0.0017261505126953125, 0.0018995404243469238, 0.002072930335998535, 0.0022463202476501465, 0.002419710159301758, 0.002593100070953369, 0.0027664899826049805, 0.002939879894256592, 0.003113269805908203, 0.0032866597175598145, 0.0034600496292114258, 0.003633439540863037, 0.0038068294525146484, 0.00398021936416626, 0.004153609275817871, 0.004326999187469482, 0.004500389099121094, 0.004673779010772705, 0.004847168922424316, 0.005020558834075928, 0.005193948745727539, 0.00536733865737915, 0.005540728569030762, 0.005714118480682373, 0.005887508392333984, 0.006060898303985596, 0.006234288215637207, 0.006407678127288818, 0.00658106803894043, 0.006754457950592041, 0.006927847862243652, 0.007101237773895264, 0.007274627685546875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 9.0, 9.0, 15.0, 22.0, 14.0, 26.0, 33.0, 48.0, 68.0, 79.0, 109.0, 141.0, 202.0, 285.0, 351.0, 554.0, 762.0, 1205.0, 2069.0, 4180.0, 10280.0, 42085.0, 820140.0, 132864.0, 18954.0, 6311.0, 2891.0, 1588.0, 961.0, 630.0, 466.0, 317.0, 219.0, 177.0, 118.0, 84.0, 66.0, 44.0, 43.0, 38.0, 24.0, 11.0, 12.0, 8.0, 16.0, 12.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-98.1875, -94.994140625, -91.80078125, -88.607421875, -85.4140625, -82.220703125, -79.02734375, -75.833984375, -72.640625, -69.447265625, -66.25390625, -63.060546875, -59.8671875, -56.673828125, -53.48046875, -50.287109375, -47.09375, -43.900390625, -40.70703125, -37.513671875, -34.3203125, -31.126953125, -27.93359375, -24.740234375, -21.546875, -18.353515625, -15.16015625, -11.966796875, -8.7734375, -5.580078125, -2.38671875, 0.806640625, 4.0, 7.193359375, 10.38671875, 13.580078125, 16.7734375, 19.966796875, 23.16015625, 26.353515625, 29.546875, 32.740234375, 35.93359375, 39.126953125, 42.3203125, 45.513671875, 48.70703125, 51.900390625, 55.09375, 58.287109375, 61.48046875, 64.673828125, 67.8671875, 71.060546875, 74.25390625, 77.447265625, 80.640625, 83.833984375, 87.02734375, 90.220703125, 93.4140625, 96.607421875, 99.80078125, 102.994140625, 106.1875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 13.0, 15.0, 17.0, 42.0, 70.0, 114.0, 352.0, 141.0, 64.0, 40.0, 35.0, 27.0, 8.0, 6.0, 8.0, 3.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.078125, -23.40234375, -22.7265625, -22.05078125, -21.375, -20.69921875, -20.0234375, -19.34765625, -18.671875, -17.99609375, -17.3203125, -16.64453125, -15.96875, -15.29296875, -14.6171875, -13.94140625, -13.265625, -12.58984375, -11.9140625, -11.23828125, -10.5625, -9.88671875, -9.2109375, -8.53515625, -7.859375, -7.18359375, -6.5078125, -5.83203125, -5.15625, -4.48046875, -3.8046875, -3.12890625, -2.453125, -1.77734375, -1.1015625, -0.42578125, 0.25, 0.92578125, 1.6015625, 2.27734375, 2.953125, 3.62890625, 4.3046875, 4.98046875, 5.65625, 6.33203125, 7.0078125, 7.68359375, 8.359375, 9.03515625, 9.7109375, 10.38671875, 11.0625, 11.73828125, 12.4140625, 13.08984375, 13.765625, 14.44140625, 15.1171875, 15.79296875, 16.46875, 17.14453125, 17.8203125, 18.49609375, 19.171875]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 6.0, 7.0, 22.0, 15.0, 16.0, 26.0, 55.0, 84.0, 124.0, 185.0, 154.0, 92.0, 53.0, 37.0, 23.0, 24.0, 19.0, 13.0, 9.0, 10.0, 5.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.8348388671875, -61.2921142578125, -59.7493896484375, -58.2066650390625, -56.6639404296875, -55.1212158203125, -53.5784912109375, -52.0357666015625, -50.4930419921875, -48.9503173828125, -47.4075927734375, -45.8648681640625, -44.3221435546875, -42.7794189453125, -41.2366943359375, -39.6939697265625, -38.151248931884766, -36.608524322509766, -35.065799713134766, -33.523075103759766, -31.980350494384766, -30.437625885009766, -28.8949031829834, -27.3521785736084, -25.8094539642334, -24.2667293548584, -22.7240047454834, -21.18128204345703, -19.63855743408203, -18.09583282470703, -16.55310821533203, -15.010383605957031, -13.467655181884766, -11.924930572509766, -10.382205963134766, -8.839482307434082, -7.296757698059082, -5.754033088684082, -4.211309432983398, -2.6685848236083984, -1.1258602142333984, 0.41686415672302246, 1.9595885276794434, 3.502312660217285, 5.045037269592285, 6.587761878967285, 8.130485534667969, 9.673210144042969, 11.215934753417969, 12.758659362792969, 14.301383972167969, 15.844107627868652, 17.38683319091797, 18.92955780029297, 20.472280502319336, 22.015005111694336, 23.557729721069336, 25.100454330444336, 26.643178939819336, 28.185901641845703, 29.728626251220703, 31.271350860595703, 32.8140754699707, 34.3568000793457, 35.8995246887207]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 10.0, 5.0, 6.0, 10.0, 14.0, 17.0, 14.0, 19.0, 23.0, 31.0, 31.0, 43.0, 35.0, 44.0, 38.0, 41.0, 42.0, 51.0, 42.0, 40.0, 35.0, 46.0, 23.0, 40.0, 43.0, 37.0, 25.0, 32.0, 27.0, 18.0, 19.0, 11.0, 11.0, 12.0, 8.0, 6.0, 7.0, 8.0, 4.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.94864273071289, -29.023019790649414, -28.097396850585938, -27.17177391052246, -26.246150970458984, -25.320528030395508, -24.39490509033203, -23.469282150268555, -22.543659210205078, -21.6180362701416, -20.692413330078125, -19.76679039001465, -18.841167449951172, -17.915544509887695, -16.98992156982422, -16.064298629760742, -15.138675689697266, -14.213052749633789, -13.287429809570312, -12.361806869506836, -11.43618392944336, -10.510560989379883, -9.584938049316406, -8.65931510925293, -7.733692169189453, -6.808069229125977, -5.8824462890625, -4.956823348999023, -4.031200408935547, -3.1055774688720703, -2.1799545288085938, -1.2543315887451172, -0.32871055603027344, 0.5969123840332031, 1.5225353240966797, 2.4481582641601562, 3.373781204223633, 4.299404144287109, 5.225027084350586, 6.1506500244140625, 7.076272964477539, 8.001895904541016, 8.927518844604492, 9.853141784667969, 10.778764724731445, 11.704387664794922, 12.630010604858398, 13.555633544921875, 14.481256484985352, 15.406879425048828, 16.332502365112305, 17.25812530517578, 18.183748245239258, 19.109371185302734, 20.03499412536621, 20.960617065429688, 21.886240005493164, 22.81186294555664, 23.737485885620117, 24.663108825683594, 25.58873176574707, 26.514354705810547, 27.439977645874023, 28.3656005859375, 29.291223526000977]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 7.0, 15.0, 17.0, 35.0, 34.0, 41.0, 81.0, 100.0, 128.0, 190.0, 280.0, 407.0, 597.0, 888.0, 1301.0, 2073.0, 3336.0, 5607.0, 9410.0, 17388.0, 34843.0, 97454.0, 993415.0, 2673438.0, 246290.0, 53482.0, 23930.0, 12440.0, 6866.0, 3856.0, 2288.0, 1419.0, 850.0, 589.0, 351.0, 281.0, 166.0, 102.0, 89.0, 59.0, 39.0, 27.0, 17.0, 20.0, 11.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.03125, -49.3974609375, -47.763671875, -46.1298828125, -44.49609375, -42.8623046875, -41.228515625, -39.5947265625, -37.9609375, -36.3271484375, -34.693359375, -33.0595703125, -31.42578125, -29.7919921875, -28.158203125, -26.5244140625, -24.890625, -23.2568359375, -21.623046875, -19.9892578125, -18.35546875, -16.7216796875, -15.087890625, -13.4541015625, -11.8203125, -10.1865234375, -8.552734375, -6.9189453125, -5.28515625, -3.6513671875, -2.017578125, -0.3837890625, 1.25, 2.8837890625, 4.517578125, 6.1513671875, 7.78515625, 9.4189453125, 11.052734375, 12.6865234375, 14.3203125, 15.9541015625, 17.587890625, 19.2216796875, 20.85546875, 22.4892578125, 24.123046875, 25.7568359375, 27.390625, 29.0244140625, 30.658203125, 32.2919921875, 33.92578125, 35.5595703125, 37.193359375, 38.8271484375, 40.4609375, 42.0947265625, 43.728515625, 45.3623046875, 46.99609375, 48.6298828125, 50.263671875, 51.8974609375, 53.53125]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 6.0, 8.0, 4.0, 8.0, 6.0, 6.0, 12.0, 10.0, 13.0, 13.0, 17.0, 23.0, 22.0, 30.0, 33.0, 27.0, 33.0, 40.0, 48.0, 36.0, 37.0, 49.0, 33.0, 43.0, 50.0, 41.0, 30.0, 41.0, 25.0, 46.0, 27.0, 34.0, 32.0, 21.0, 19.0, 17.0, 9.0, 12.0, 9.0, 8.0, 3.0, 5.0, 4.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.0859375, -14.620361328125, -14.15478515625, -13.689208984375, -13.2236328125, -12.758056640625, -12.29248046875, -11.826904296875, -11.361328125, -10.895751953125, -10.43017578125, -9.964599609375, -9.4990234375, -9.033447265625, -8.56787109375, -8.102294921875, -7.63671875, -7.171142578125, -6.70556640625, -6.239990234375, -5.7744140625, -5.308837890625, -4.84326171875, -4.377685546875, -3.912109375, -3.446533203125, -2.98095703125, -2.515380859375, -2.0498046875, -1.584228515625, -1.11865234375, -0.653076171875, -0.1875, 0.278076171875, 0.74365234375, 1.209228515625, 1.6748046875, 2.140380859375, 2.60595703125, 3.071533203125, 3.537109375, 4.002685546875, 4.46826171875, 4.933837890625, 5.3994140625, 5.864990234375, 6.33056640625, 6.796142578125, 7.26171875, 7.727294921875, 8.19287109375, 8.658447265625, 9.1240234375, 9.589599609375, 10.05517578125, 10.520751953125, 10.986328125, 11.451904296875, 11.91748046875, 12.383056640625, 12.8486328125, 13.314208984375, 13.77978515625, 14.245361328125, 14.7109375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 8.0, 3.0, 10.0, 7.0, 17.0, 14.0, 23.0, 30.0, 50.0, 71.0, 75.0, 113.0, 124.0, 155.0, 252.0, 319.0, 460.0, 637.0, 914.0, 1501.0, 2581.0, 4747.0, 9958.0, 25004.0, 113280.0, 3603013.0, 360517.0, 41511.0, 13941.0, 6234.0, 3121.0, 1808.0, 1069.0, 722.0, 510.0, 395.0, 259.0, 182.0, 133.0, 128.0, 94.0, 69.0, 67.0, 56.0, 23.0, 16.0, 10.0, 9.0, 9.0, 9.0, 6.0, 6.0, 5.0, 7.0, 1.0, 2.0, 2.0], "bins": [-141.5, -137.173828125, -132.84765625, -128.521484375, -124.1953125, -119.869140625, -115.54296875, -111.216796875, -106.890625, -102.564453125, -98.23828125, -93.912109375, -89.5859375, -85.259765625, -80.93359375, -76.607421875, -72.28125, -67.955078125, -63.62890625, -59.302734375, -54.9765625, -50.650390625, -46.32421875, -41.998046875, -37.671875, -33.345703125, -29.01953125, -24.693359375, -20.3671875, -16.041015625, -11.71484375, -7.388671875, -3.0625, 1.263671875, 5.58984375, 9.916015625, 14.2421875, 18.568359375, 22.89453125, 27.220703125, 31.546875, 35.873046875, 40.19921875, 44.525390625, 48.8515625, 53.177734375, 57.50390625, 61.830078125, 66.15625, 70.482421875, 74.80859375, 79.134765625, 83.4609375, 87.787109375, 92.11328125, 96.439453125, 100.765625, 105.091796875, 109.41796875, 113.744140625, 118.0703125, 122.396484375, 126.72265625, 131.048828125, 135.375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 8.0, 1.0, 7.0, 6.0, 2.0, 5.0, 12.0, 12.0, 14.0, 16.0, 17.0, 14.0, 27.0, 34.0, 43.0, 95.0, 149.0, 552.0, 1239.0, 867.0, 360.0, 180.0, 111.0, 95.0, 49.0, 40.0, 30.0, 13.0, 11.0, 14.0, 7.0, 7.0, 6.0, 6.0, 7.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.203125, -24.40869140625, -23.6142578125, -22.81982421875, -22.025390625, -21.23095703125, -20.4365234375, -19.64208984375, -18.84765625, -18.05322265625, -17.2587890625, -16.46435546875, -15.669921875, -14.87548828125, -14.0810546875, -13.28662109375, -12.4921875, -11.69775390625, -10.9033203125, -10.10888671875, -9.314453125, -8.52001953125, -7.7255859375, -6.93115234375, -6.13671875, -5.34228515625, -4.5478515625, -3.75341796875, -2.958984375, -2.16455078125, -1.3701171875, -0.57568359375, 0.21875, 1.01318359375, 1.8076171875, 2.60205078125, 3.396484375, 4.19091796875, 4.9853515625, 5.77978515625, 6.57421875, 7.36865234375, 8.1630859375, 8.95751953125, 9.751953125, 10.54638671875, 11.3408203125, 12.13525390625, 12.9296875, 13.72412109375, 14.5185546875, 15.31298828125, 16.107421875, 16.90185546875, 17.6962890625, 18.49072265625, 19.28515625, 20.07958984375, 20.8740234375, 21.66845703125, 22.462890625, 23.25732421875, 24.0517578125, 24.84619140625, 25.640625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 1.0, 13.0, 18.0, 9.0, 25.0, 117.0, 441.0, 145.0, 71.0, 53.0, 36.0, 19.0, 13.0, 11.0, 7.0, 1.0, 3.0, 0.0, 2.0], "bins": [-211.0430908203125, -206.93154907226562, -202.82000732421875, -198.70846557617188, -194.59690856933594, -190.48536682128906, -186.3738250732422, -182.2622833251953, -178.15074157714844, -174.03919982910156, -169.9276580810547, -165.81610107421875, -161.70455932617188, -157.593017578125, -153.48147583007812, -149.36993408203125, -145.25839233398438, -141.1468505859375, -137.03530883789062, -132.92376708984375, -128.8122100830078, -124.70066833496094, -120.58912658691406, -116.47758483886719, -112.36602783203125, -108.25448608398438, -104.14293670654297, -100.0313949584961, -95.91985321044922, -91.80830383300781, -87.69676208496094, -83.58522033691406, -79.47367095947266, -75.36212921142578, -71.25057983398438, -67.1390380859375, -63.027496337890625, -58.915950775146484, -54.804405212402344, -50.69286346435547, -46.58131790161133, -42.46977233886719, -38.35823059082031, -34.24668502807617, -30.135141372680664, -26.023597717285156, -21.912052154541016, -17.800508499145508, -13.68896484375, -9.577421188354492, -5.465876579284668, -1.3543319702148438, 2.757211685180664, 6.868755340576172, 10.980300903320312, 15.09184455871582, 19.203388214111328, 23.314931869506836, 27.426475524902344, 31.538021087646484, 35.649566650390625, 39.7611083984375, 43.87265396118164, 47.98419952392578, 52.095741271972656]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 7.0, 5.0, 9.0, 4.0, 8.0, 10.0, 13.0, 10.0, 13.0, 17.0, 13.0, 20.0, 17.0, 24.0, 28.0, 23.0, 25.0, 25.0, 47.0, 42.0, 44.0, 34.0, 55.0, 37.0, 42.0, 43.0, 23.0, 58.0, 37.0, 42.0, 33.0, 25.0, 13.0, 22.0, 16.0, 16.0, 15.0, 13.0, 11.0, 19.0, 7.0, 4.0, 7.0, 4.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-50.06481170654297, -48.45705032348633, -46.84928894042969, -45.24152755737305, -43.633766174316406, -42.02600860595703, -40.418243408203125, -38.81048583984375, -37.20272445678711, -35.59496307373047, -33.98720169067383, -32.37944030761719, -30.77168083190918, -29.16391944885254, -27.5561580657959, -25.94839859008789, -24.340635299682617, -22.732873916625977, -21.125112533569336, -19.517353057861328, -17.909591674804688, -16.301830291748047, -14.694068908691406, -13.086308479309082, -11.478547096252441, -9.8707857131958, -8.263025283813477, -6.655263900756836, -5.0475029945373535, -3.439742088317871, -1.8319807052612305, -0.22422027587890625, 1.3835411071777344, 2.991302013397217, 4.599062919616699, 6.20682430267334, 7.814585208892822, 9.422346115112305, 11.030107498168945, 12.63786792755127, 14.24562931060791, 15.85339069366455, 17.461151123046875, 19.068912506103516, 20.676673889160156, 22.284435272216797, 23.892196655273438, 25.499956130981445, 27.107717514038086, 28.715478897094727, 30.323240280151367, 31.930999755859375, 33.538761138916016, 35.146522521972656, 36.7542839050293, 38.36204528808594, 39.96980667114258, 41.57756805419922, 43.18532943725586, 44.7930908203125, 46.40085220336914, 48.00861358642578, 49.616371154785156, 51.2241325378418, 52.83189392089844]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 9.0, 11.0, 17.0, 29.0, 32.0, 51.0, 76.0, 89.0, 148.0, 212.0, 294.0, 430.0, 656.0, 984.0, 1683.0, 2737.0, 4685.0, 8943.0, 17755.0, 42029.0, 128166.0, 512651.0, 217387.0, 59875.0, 23561.0, 11304.0, 5895.0, 3207.0, 2075.0, 1164.0, 764.0, 536.0, 343.0, 227.0, 162.0, 110.0, 78.0, 47.0, 46.0, 19.0, 21.0, 14.0, 9.0, 14.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-78.3125, -75.759765625, -73.20703125, -70.654296875, -68.1015625, -65.548828125, -62.99609375, -60.443359375, -57.890625, -55.337890625, -52.78515625, -50.232421875, -47.6796875, -45.126953125, -42.57421875, -40.021484375, -37.46875, -34.916015625, -32.36328125, -29.810546875, -27.2578125, -24.705078125, -22.15234375, -19.599609375, -17.046875, -14.494140625, -11.94140625, -9.388671875, -6.8359375, -4.283203125, -1.73046875, 0.822265625, 3.375, 5.927734375, 8.48046875, 11.033203125, 13.5859375, 16.138671875, 18.69140625, 21.244140625, 23.796875, 26.349609375, 28.90234375, 31.455078125, 34.0078125, 36.560546875, 39.11328125, 41.666015625, 44.21875, 46.771484375, 49.32421875, 51.876953125, 54.4296875, 56.982421875, 59.53515625, 62.087890625, 64.640625, 67.193359375, 69.74609375, 72.298828125, 74.8515625, 77.404296875, 79.95703125, 82.509765625, 85.0625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 9.0, 0.0, 6.0, 7.0, 6.0, 5.0, 8.0, 10.0, 6.0, 9.0, 16.0, 14.0, 14.0, 15.0, 23.0, 23.0, 26.0, 30.0, 16.0, 22.0, 35.0, 51.0, 42.0, 38.0, 50.0, 42.0, 38.0, 38.0, 35.0, 44.0, 47.0, 33.0, 31.0, 29.0, 30.0, 17.0, 15.0, 20.0, 11.0, 20.0, 7.0, 15.0, 10.0, 8.0, 7.0, 4.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 8.0, 1.0, 3.0, 1.0], "bins": [-52.3125, -50.75341796875, -49.1943359375, -47.63525390625, -46.076171875, -44.51708984375, -42.9580078125, -41.39892578125, -39.83984375, -38.28076171875, -36.7216796875, -35.16259765625, -33.603515625, -32.04443359375, -30.4853515625, -28.92626953125, -27.3671875, -25.80810546875, -24.2490234375, -22.68994140625, -21.130859375, -19.57177734375, -18.0126953125, -16.45361328125, -14.89453125, -13.33544921875, -11.7763671875, -10.21728515625, -8.658203125, -7.09912109375, -5.5400390625, -3.98095703125, -2.421875, -0.86279296875, 0.6962890625, 2.25537109375, 3.814453125, 5.37353515625, 6.9326171875, 8.49169921875, 10.05078125, 11.60986328125, 13.1689453125, 14.72802734375, 16.287109375, 17.84619140625, 19.4052734375, 20.96435546875, 22.5234375, 24.08251953125, 25.6416015625, 27.20068359375, 28.759765625, 30.31884765625, 31.8779296875, 33.43701171875, 34.99609375, 36.55517578125, 38.1142578125, 39.67333984375, 41.232421875, 42.79150390625, 44.3505859375, 45.90966796875, 47.46875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 7.0, 23.0, 17.0, 21.0, 25.0, 60.0, 71.0, 127.0, 204.0, 326.0, 541.0, 949.0, 1833.0, 3793.0, 9842.0, 35695.0, 509547.0, 434051.0, 34168.0, 9368.0, 3774.0, 1715.0, 991.0, 528.0, 314.0, 198.0, 108.0, 91.0, 52.0, 40.0, 21.0, 12.0, 12.0, 9.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.25, -165.72265625, -160.1953125, -154.66796875, -149.140625, -143.61328125, -138.0859375, -132.55859375, -127.03125, -121.50390625, -115.9765625, -110.44921875, -104.921875, -99.39453125, -93.8671875, -88.33984375, -82.8125, -77.28515625, -71.7578125, -66.23046875, -60.703125, -55.17578125, -49.6484375, -44.12109375, -38.59375, -33.06640625, -27.5390625, -22.01171875, -16.484375, -10.95703125, -5.4296875, 0.09765625, 5.625, 11.15234375, 16.6796875, 22.20703125, 27.734375, 33.26171875, 38.7890625, 44.31640625, 49.84375, 55.37109375, 60.8984375, 66.42578125, 71.953125, 77.48046875, 83.0078125, 88.53515625, 94.0625, 99.58984375, 105.1171875, 110.64453125, 116.171875, 121.69921875, 127.2265625, 132.75390625, 138.28125, 143.80859375, 149.3359375, 154.86328125, 160.390625, 165.91796875, 171.4453125, 176.97265625, 182.5]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 7.0, 10.0, 5.0, 7.0, 12.0, 5.0, 19.0, 17.0, 32.0, 31.0, 61.0, 72.0, 77.0, 93.0, 111.0, 91.0, 64.0, 61.0, 44.0, 27.0, 27.0, 30.0, 12.0, 16.0, 9.0, 8.0, 10.0, 10.0, 5.0, 2.0, 5.0, 4.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.25, -52.3330078125, -50.416015625, -48.4990234375, -46.58203125, -44.6650390625, -42.748046875, -40.8310546875, -38.9140625, -36.9970703125, -35.080078125, -33.1630859375, -31.24609375, -29.3291015625, -27.412109375, -25.4951171875, -23.578125, -21.6611328125, -19.744140625, -17.8271484375, -15.91015625, -13.9931640625, -12.076171875, -10.1591796875, -8.2421875, -6.3251953125, -4.408203125, -2.4912109375, -0.57421875, 1.3427734375, 3.259765625, 5.1767578125, 7.09375, 9.0107421875, 10.927734375, 12.8447265625, 14.76171875, 16.6787109375, 18.595703125, 20.5126953125, 22.4296875, 24.3466796875, 26.263671875, 28.1806640625, 30.09765625, 32.0146484375, 33.931640625, 35.8486328125, 37.765625, 39.6826171875, 41.599609375, 43.5166015625, 45.43359375, 47.3505859375, 49.267578125, 51.1845703125, 53.1015625, 55.0185546875, 56.935546875, 58.8525390625, 60.76953125, 62.6865234375, 64.603515625, 66.5205078125, 68.4375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 4.0, 9.0, 5.0, 15.0, 4.0, 13.0, 13.0, 20.0, 27.0, 19.0, 45.0, 57.0, 110.0, 215.0, 416.0, 1044.0, 3062.0, 17382.0, 979756.0, 39489.0, 4321.0, 1361.0, 520.0, 256.0, 123.0, 83.0, 39.0, 29.0, 22.0, 20.0, 18.0, 10.0, 7.0, 11.0, 10.0, 6.0, 7.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-280.25, -271.390625, -262.53125, -253.671875, -244.8125, -235.953125, -227.09375, -218.234375, -209.375, -200.515625, -191.65625, -182.796875, -173.9375, -165.078125, -156.21875, -147.359375, -138.5, -129.640625, -120.78125, -111.921875, -103.0625, -94.203125, -85.34375, -76.484375, -67.625, -58.765625, -49.90625, -41.046875, -32.1875, -23.328125, -14.46875, -5.609375, 3.25, 12.109375, 20.96875, 29.828125, 38.6875, 47.546875, 56.40625, 65.265625, 74.125, 82.984375, 91.84375, 100.703125, 109.5625, 118.421875, 127.28125, 136.140625, 145.0, 153.859375, 162.71875, 171.578125, 180.4375, 189.296875, 198.15625, 207.015625, 215.875, 224.734375, 233.59375, 242.453125, 251.3125, 260.171875, 269.03125, 277.890625, 286.75]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 4.0, 6.0, 9.0, 8.0, 14.0, 8.0, 10.0, 23.0, 28.0, 67.0, 70.0, 148.0, 209.0, 119.0, 90.0, 55.0, 32.0, 24.0, 15.0, 14.0, 8.0, 9.0, 10.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0020923614501953125, -0.0020365864038467407, -0.001980811357498169, -0.0019250363111495972, -0.0018692612648010254, -0.0018134862184524536, -0.0017577111721038818, -0.00170193612575531, -0.0016461610794067383, -0.0015903860330581665, -0.0015346109867095947, -0.001478835940361023, -0.0014230608940124512, -0.0013672858476638794, -0.0013115108013153076, -0.0012557357549667358, -0.001199960708618164, -0.0011441856622695923, -0.0010884106159210205, -0.0010326355695724487, -0.000976860523223877, -0.0009210854768753052, -0.0008653104305267334, -0.0008095353841781616, -0.0007537603378295898, -0.0006979852914810181, -0.0006422102451324463, -0.0005864351987838745, -0.0005306601524353027, -0.00047488510608673096, -0.0004191100597381592, -0.0003633350133895874, -0.0003075599670410156, -0.00025178492069244385, -0.00019600987434387207, -0.0001402348279953003, -8.445978164672852e-05, -2.8684735298156738e-05, 2.709031105041504e-05, 8.286535739898682e-05, 0.0001386404037475586, 0.00019441545009613037, 0.00025019049644470215, 0.0003059655427932739, 0.0003617405891418457, 0.0004175156354904175, 0.00047329068183898926, 0.000529065728187561, 0.0005848407745361328, 0.0006406158208847046, 0.0006963908672332764, 0.0007521659135818481, 0.0008079409599304199, 0.0008637160062789917, 0.0009194910526275635, 0.0009752660989761353, 0.001031041145324707, 0.0010868161916732788, 0.0011425912380218506, 0.0011983662843704224, 0.0012541413307189941, 0.001309916377067566, 0.0013656914234161377, 0.0014214664697647095, 0.0014772415161132812]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 4.0, 5.0, 6.0, 4.0, 4.0, 7.0, 9.0, 7.0, 6.0, 13.0, 19.0, 26.0, 43.0, 58.0, 94.0, 164.0, 331.0, 817.0, 2449.0, 28474.0, 1004118.0, 9060.0, 1608.0, 549.0, 276.0, 134.0, 77.0, 55.0, 33.0, 21.0, 24.0, 16.0, 8.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-447.0, -432.73046875, -418.4609375, -404.19140625, -389.921875, -375.65234375, -361.3828125, -347.11328125, -332.84375, -318.57421875, -304.3046875, -290.03515625, -275.765625, -261.49609375, -247.2265625, -232.95703125, -218.6875, -204.41796875, -190.1484375, -175.87890625, -161.609375, -147.33984375, -133.0703125, -118.80078125, -104.53125, -90.26171875, -75.9921875, -61.72265625, -47.453125, -33.18359375, -18.9140625, -4.64453125, 9.625, 23.89453125, 38.1640625, 52.43359375, 66.703125, 80.97265625, 95.2421875, 109.51171875, 123.78125, 138.05078125, 152.3203125, 166.58984375, 180.859375, 195.12890625, 209.3984375, 223.66796875, 237.9375, 252.20703125, 266.4765625, 280.74609375, 295.015625, 309.28515625, 323.5546875, 337.82421875, 352.09375, 366.36328125, 380.6328125, 394.90234375, 409.171875, 423.44140625, 437.7109375, 451.98046875, 466.25]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 19.0, 54.0, 208.0, 550.0, 103.0, 26.0, 18.0, 11.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.4375, -83.0849609375, -80.732421875, -78.3798828125, -76.02734375, -73.6748046875, -71.322265625, -68.9697265625, -66.6171875, -64.2646484375, -61.912109375, -59.5595703125, -57.20703125, -54.8544921875, -52.501953125, -50.1494140625, -47.796875, -45.4443359375, -43.091796875, -40.7392578125, -38.38671875, -36.0341796875, -33.681640625, -31.3291015625, -28.9765625, -26.6240234375, -24.271484375, -21.9189453125, -19.56640625, -17.2138671875, -14.861328125, -12.5087890625, -10.15625, -7.8037109375, -5.451171875, -3.0986328125, -0.74609375, 1.6064453125, 3.958984375, 6.3115234375, 8.6640625, 11.0166015625, 13.369140625, 15.7216796875, 18.07421875, 20.4267578125, 22.779296875, 25.1318359375, 27.484375, 29.8369140625, 32.189453125, 34.5419921875, 36.89453125, 39.2470703125, 41.599609375, 43.9521484375, 46.3046875, 48.6572265625, 51.009765625, 53.3623046875, 55.71484375, 58.0673828125, 60.419921875, 62.7724609375, 65.125]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 15.0, 13.0, 23.0, 35.0, 152.0, 422.0, 139.0, 60.0, 44.0, 34.0, 15.0, 11.0, 3.0, 4.0, 1.0, 2.0], "bins": [-265.3590393066406, -260.35589599609375, -255.3527374267578, -250.34957885742188, -245.34642028808594, -240.34326171875, -235.34011840820312, -230.3369598388672, -225.33380126953125, -220.3306427001953, -215.32749938964844, -210.3243408203125, -205.32118225097656, -200.31802368164062, -195.31488037109375, -190.3117218017578, -185.30856323242188, -180.30540466308594, -175.30226135253906, -170.29910278320312, -165.2959442138672, -160.29278564453125, -155.28964233398438, -150.28648376464844, -145.28334045410156, -140.28018188476562, -135.27703857421875, -130.2738800048828, -125.27072143554688, -120.26757049560547, -115.26441955566406, -110.26126098632812, -105.25810241699219, -100.25495147705078, -95.25179290771484, -90.24864196777344, -85.2454833984375, -80.2423324584961, -75.23918151855469, -70.23602294921875, -65.23286437988281, -60.22970962524414, -55.22655487060547, -50.22340393066406, -45.220245361328125, -40.21709442138672, -35.21393966674805, -30.210784912109375, -25.20763397216797, -20.204479217529297, -15.201325416564941, -10.198171615600586, -5.195016860961914, -0.1918621063232422, 4.811290740966797, 9.814445495605469, 14.81760025024414, 19.820755004882812, 24.823909759521484, 29.827062606811523, 34.83021545410156, 39.8333740234375, 44.836524963378906, 49.83967971801758, 54.84283447265625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 4.0, 5.0, 3.0, 8.0, 11.0, 6.0, 8.0, 14.0, 11.0, 15.0, 20.0, 14.0, 22.0, 19.0, 22.0, 29.0, 27.0, 24.0, 39.0, 43.0, 43.0, 40.0, 50.0, 46.0, 39.0, 39.0, 41.0, 36.0, 30.0, 33.0, 39.0, 30.0, 31.0, 18.0, 17.0, 20.0, 19.0, 19.0, 8.0, 10.0, 12.0, 4.0, 5.0, 10.0, 6.0, 5.0, 2.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-55.125999450683594, -53.378211975097656, -51.63042449951172, -49.88263702392578, -48.134849548339844, -46.387062072753906, -44.63927459716797, -42.89148712158203, -41.143699645996094, -39.395912170410156, -37.64812469482422, -35.90033721923828, -34.152549743652344, -32.404762268066406, -30.656972885131836, -28.9091854095459, -27.161396026611328, -25.41360855102539, -23.665821075439453, -21.918033599853516, -20.170246124267578, -18.42245864868164, -16.67466926574707, -14.926881790161133, -13.179094314575195, -11.431306838989258, -9.68351936340332, -7.935730934143066, -6.187943458557129, -4.440155982971191, -2.6923675537109375, -0.944580078125, 0.8032035827636719, 2.5509912967681885, 4.298779010772705, 6.046566963195801, 7.794354438781738, 9.542141914367676, 11.28993034362793, 13.037717819213867, 14.785505294799805, 16.533292770385742, 18.28108024597168, 20.02886962890625, 21.776657104492188, 23.524444580078125, 25.272232055664062, 27.02001953125, 28.767807006835938, 30.515594482421875, 32.26338195800781, 34.01116943359375, 35.75895690917969, 37.506744384765625, 39.25453186035156, 41.0023193359375, 42.75010681152344, 44.497894287109375, 46.24568176269531, 47.99346923828125, 49.74125671386719, 51.489044189453125, 53.23683166503906, 54.984619140625, 56.7324104309082]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 11.0, 13.0, 28.0, 23.0, 36.0, 58.0, 79.0, 108.0, 165.0, 201.0, 286.0, 364.0, 557.0, 840.0, 1057.0, 1533.0, 2329.0, 3323.0, 5006.0, 7520.0, 12141.0, 20156.0, 36265.0, 80159.0, 319645.0, 373543.0, 86841.0, 38214.0, 20895.0, 12649.0, 7948.0, 5105.0, 3496.0, 2376.0, 1583.0, 1148.0, 781.0, 606.0, 413.0, 293.0, 215.0, 159.0, 115.0, 79.0, 51.0, 44.0, 30.0, 28.0, 12.0, 10.0, 3.0, 8.0, 2.0, 1.0, 0.0, 2.0], "bins": [-69.4375, -67.3359375, -65.234375, -63.1328125, -61.03125, -58.9296875, -56.828125, -54.7265625, -52.625, -50.5234375, -48.421875, -46.3203125, -44.21875, -42.1171875, -40.015625, -37.9140625, -35.8125, -33.7109375, -31.609375, -29.5078125, -27.40625, -25.3046875, -23.203125, -21.1015625, -19.0, -16.8984375, -14.796875, -12.6953125, -10.59375, -8.4921875, -6.390625, -4.2890625, -2.1875, -0.0859375, 2.015625, 4.1171875, 6.21875, 8.3203125, 10.421875, 12.5234375, 14.625, 16.7265625, 18.828125, 20.9296875, 23.03125, 25.1328125, 27.234375, 29.3359375, 31.4375, 33.5390625, 35.640625, 37.7421875, 39.84375, 41.9453125, 44.046875, 46.1484375, 48.25, 50.3515625, 52.453125, 54.5546875, 56.65625, 58.7578125, 60.859375, 62.9609375, 65.0625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 6.0, 4.0, 4.0, 11.0, 8.0, 10.0, 21.0, 16.0, 17.0, 9.0, 20.0, 29.0, 27.0, 28.0, 26.0, 31.0, 36.0, 46.0, 54.0, 47.0, 41.0, 49.0, 46.0, 41.0, 41.0, 37.0, 35.0, 31.0, 34.0, 28.0, 28.0, 16.0, 21.0, 13.0, 17.0, 12.0, 12.0, 6.0, 5.0, 5.0, 5.0, 6.0, 8.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.65625, -48.1015625, -46.546875, -44.9921875, -43.4375, -41.8828125, -40.328125, -38.7734375, -37.21875, -35.6640625, -34.109375, -32.5546875, -31.0, -29.4453125, -27.890625, -26.3359375, -24.78125, -23.2265625, -21.671875, -20.1171875, -18.5625, -17.0078125, -15.453125, -13.8984375, -12.34375, -10.7890625, -9.234375, -7.6796875, -6.125, -4.5703125, -3.015625, -1.4609375, 0.09375, 1.6484375, 3.203125, 4.7578125, 6.3125, 7.8671875, 9.421875, 10.9765625, 12.53125, 14.0859375, 15.640625, 17.1953125, 18.75, 20.3046875, 21.859375, 23.4140625, 24.96875, 26.5234375, 28.078125, 29.6328125, 31.1875, 32.7421875, 34.296875, 35.8515625, 37.40625, 38.9609375, 40.515625, 42.0703125, 43.625, 45.1796875, 46.734375, 48.2890625, 49.84375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 3.0, 5.0, 9.0, 14.0, 35.0, 28.0, 31.0, 44.0, 67.0, 74.0, 103.0, 144.0, 169.0, 233.0, 349.0, 391.0, 548.0, 734.0, 1101.0, 1527.0, 2257.0, 3790.0, 6729.0, 14596.0, 50394.0, 775509.0, 140797.0, 25136.0, 9535.0, 4821.0, 2856.0, 1767.0, 1229.0, 849.0, 649.0, 502.0, 322.0, 257.0, 237.0, 153.0, 142.0, 91.0, 84.0, 54.0, 48.0, 34.0, 24.0, 13.0, 21.0, 14.0, 14.0, 6.0, 3.0, 4.0, 5.0, 0.0, 1.0, 3.0], "bins": [-470.0, -455.1953125, -440.390625, -425.5859375, -410.78125, -395.9765625, -381.171875, -366.3671875, -351.5625, -336.7578125, -321.953125, -307.1484375, -292.34375, -277.5390625, -262.734375, -247.9296875, -233.125, -218.3203125, -203.515625, -188.7109375, -173.90625, -159.1015625, -144.296875, -129.4921875, -114.6875, -99.8828125, -85.078125, -70.2734375, -55.46875, -40.6640625, -25.859375, -11.0546875, 3.75, 18.5546875, 33.359375, 48.1640625, 62.96875, 77.7734375, 92.578125, 107.3828125, 122.1875, 136.9921875, 151.796875, 166.6015625, 181.40625, 196.2109375, 211.015625, 225.8203125, 240.625, 255.4296875, 270.234375, 285.0390625, 299.84375, 314.6484375, 329.453125, 344.2578125, 359.0625, 373.8671875, 388.671875, 403.4765625, 418.28125, 433.0859375, 447.890625, 462.6953125, 477.5]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 7.0, 4.0, 1.0, 5.0, 6.0, 13.0, 15.0, 13.0, 12.0, 8.0, 12.0, 16.0, 12.0, 19.0, 23.0, 11.0, 19.0, 25.0, 37.0, 37.0, 62.0, 114.0, 115.0, 69.0, 53.0, 37.0, 18.0, 30.0, 25.0, 24.0, 19.0, 23.0, 18.0, 15.0, 19.0, 9.0, 11.0, 9.0, 8.0, 5.0, 7.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-97.1875, -94.171875, -91.15625, -88.140625, -85.125, -82.109375, -79.09375, -76.078125, -73.0625, -70.046875, -67.03125, -64.015625, -61.0, -57.984375, -54.96875, -51.953125, -48.9375, -45.921875, -42.90625, -39.890625, -36.875, -33.859375, -30.84375, -27.828125, -24.8125, -21.796875, -18.78125, -15.765625, -12.75, -9.734375, -6.71875, -3.703125, -0.6875, 2.328125, 5.34375, 8.359375, 11.375, 14.390625, 17.40625, 20.421875, 23.4375, 26.453125, 29.46875, 32.484375, 35.5, 38.515625, 41.53125, 44.546875, 47.5625, 50.578125, 53.59375, 56.609375, 59.625, 62.640625, 65.65625, 68.671875, 71.6875, 74.703125, 77.71875, 80.734375, 83.75, 86.765625, 89.78125, 92.796875, 95.8125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 11.0, 7.0, 11.0, 10.0, 11.0, 22.0, 18.0, 31.0, 47.0, 48.0, 81.0, 94.0, 134.0, 174.0, 280.0, 387.0, 570.0, 944.0, 1631.0, 3429.0, 11686.0, 956621.0, 59789.0, 6277.0, 2476.0, 1300.0, 745.0, 484.0, 335.0, 226.0, 163.0, 124.0, 83.0, 62.0, 56.0, 31.0, 32.0, 30.0, 14.0, 22.0, 16.0, 8.0, 5.0, 6.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2070.0, -2008.75, -1947.5, -1886.25, -1825.0, -1763.75, -1702.5, -1641.25, -1580.0, -1518.75, -1457.5, -1396.25, -1335.0, -1273.75, -1212.5, -1151.25, -1090.0, -1028.75, -967.5, -906.25, -845.0, -783.75, -722.5, -661.25, -600.0, -538.75, -477.5, -416.25, -355.0, -293.75, -232.5, -171.25, -110.0, -48.75, 12.5, 73.75, 135.0, 196.25, 257.5, 318.75, 380.0, 441.25, 502.5, 563.75, 625.0, 686.25, 747.5, 808.75, 870.0, 931.25, 992.5, 1053.75, 1115.0, 1176.25, 1237.5, 1298.75, 1360.0, 1421.25, 1482.5, 1543.75, 1605.0, 1666.25, 1727.5, 1788.75, 1850.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 7.0, 8.0, 13.0, 44.0, 140.0, 378.0, 276.0, 82.0, 23.0, 9.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03228759765625, -0.030731201171875, -0.0291748046875, -0.027618408203125, -0.02606201171875, -0.024505615234375, -0.02294921875, -0.021392822265625, -0.01983642578125, -0.018280029296875, -0.0167236328125, -0.015167236328125, -0.01361083984375, -0.012054443359375, -0.010498046875, -0.008941650390625, -0.00738525390625, -0.005828857421875, -0.0042724609375, -0.002716064453125, -0.00115966796875, 0.000396728515625, 0.001953125, 0.003509521484375, 0.00506591796875, 0.006622314453125, 0.0081787109375, 0.009735107421875, 0.01129150390625, 0.012847900390625, 0.014404296875, 0.015960693359375, 0.01751708984375, 0.019073486328125, 0.0206298828125, 0.022186279296875, 0.02374267578125, 0.025299072265625, 0.02685546875, 0.028411865234375, 0.02996826171875, 0.031524658203125, 0.0330810546875, 0.034637451171875, 0.03619384765625, 0.037750244140625, 0.039306640625, 0.040863037109375, 0.04241943359375, 0.043975830078125, 0.0455322265625, 0.047088623046875, 0.04864501953125, 0.050201416015625, 0.0517578125, 0.053314208984375, 0.05487060546875, 0.056427001953125, 0.0579833984375, 0.059539794921875, 0.06109619140625, 0.062652587890625, 0.064208984375, 0.065765380859375, 0.06732177734375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 11.0, 6.0, 19.0, 9.0, 28.0, 26.0, 52.0, 48.0, 65.0, 102.0, 116.0, 174.0, 221.0, 352.0, 482.0, 857.0, 1719.0, 4787.0, 35775.0, 985387.0, 12057.0, 2817.0, 1262.0, 722.0, 415.0, 279.0, 186.0, 155.0, 91.0, 77.0, 63.0, 36.0, 24.0, 33.0, 14.0, 19.0, 16.0, 9.0, 9.0, 6.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2246.0, -2174.21875, -2102.4375, -2030.65625, -1958.875, -1887.09375, -1815.3125, -1743.53125, -1671.75, -1599.96875, -1528.1875, -1456.40625, -1384.625, -1312.84375, -1241.0625, -1169.28125, -1097.5, -1025.71875, -953.9375, -882.15625, -810.375, -738.59375, -666.8125, -595.03125, -523.25, -451.46875, -379.6875, -307.90625, -236.125, -164.34375, -92.5625, -20.78125, 51.0, 122.78125, 194.5625, 266.34375, 338.125, 409.90625, 481.6875, 553.46875, 625.25, 697.03125, 768.8125, 840.59375, 912.375, 984.15625, 1055.9375, 1127.71875, 1199.5, 1271.28125, 1343.0625, 1414.84375, 1486.625, 1558.40625, 1630.1875, 1701.96875, 1773.75, 1845.53125, 1917.3125, 1989.09375, 2060.875, 2132.65625, 2204.4375, 2276.21875, 2348.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 8.0, 10.0, 10.0, 11.0, 49.0, 166.0, 321.0, 233.0, 85.0, 37.0, 7.0, 6.0, 9.0, 5.0, 3.0, 3.0, 6.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-299.75, -289.6328125, -279.515625, -269.3984375, -259.28125, -249.1640625, -239.046875, -228.9296875, -218.8125, -208.6953125, -198.578125, -188.4609375, -178.34375, -168.2265625, -158.109375, -147.9921875, -137.875, -127.7578125, -117.640625, -107.5234375, -97.40625, -87.2890625, -77.171875, -67.0546875, -56.9375, -46.8203125, -36.703125, -26.5859375, -16.46875, -6.3515625, 3.765625, 13.8828125, 24.0, 34.1171875, 44.234375, 54.3515625, 64.46875, 74.5859375, 84.703125, 94.8203125, 104.9375, 115.0546875, 125.171875, 135.2890625, 145.40625, 155.5234375, 165.640625, 175.7578125, 185.875, 195.9921875, 206.109375, 216.2265625, 226.34375, 236.4609375, 246.578125, 256.6953125, 266.8125, 276.9296875, 287.046875, 297.1640625, 307.28125, 317.3984375, 327.515625, 337.6328125, 347.75]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 6.0, 5.0, 9.0, 8.0, 8.0, 3.0, 7.0, 10.0, 13.0, 14.0, 20.0, 27.0, 31.0, 38.0, 45.0, 49.0, 100.0, 138.0, 417.0, 31.0, 3.0], "bins": [-487.7496643066406, -479.8569641113281, -471.96429443359375, -464.07159423828125, -456.17889404296875, -448.2862243652344, -440.3935241699219, -432.5008544921875, -424.608154296875, -416.7154541015625, -408.8227844238281, -400.9300842285156, -393.03741455078125, -385.14471435546875, -377.25201416015625, -369.3593444824219, -361.4666442871094, -353.5739440917969, -345.6812744140625, -337.78857421875, -329.8958740234375, -322.0032043457031, -314.1105041503906, -306.21783447265625, -298.32513427734375, -290.43243408203125, -282.5397644042969, -274.6470642089844, -266.75439453125, -258.8616943359375, -250.968994140625, -243.07630920410156, -235.18360900878906, -227.29092407226562, -219.39822387695312, -211.5055389404297, -203.61285400390625, -195.7201690673828, -187.82748413085938, -179.93478393554688, -172.04209899902344, -164.1494140625, -156.2567138671875, -148.36402893066406, -140.47134399414062, -132.5786590576172, -124.68596649169922, -116.79327392578125, -108.90058898925781, -101.00790405273438, -93.1152114868164, -85.22251892089844, -77.329833984375, -69.43714904785156, -61.544456481933594, -53.65176773071289, -45.75907897949219, -37.866390228271484, -29.97370147705078, -22.081012725830078, -14.188323974609375, -6.295635223388672, 1.5970535278320312, 9.489742279052734, 17.382431030273438]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 6.0, 4.0, 4.0, 9.0, 8.0, 11.0, 12.0, 14.0, 16.0, 14.0, 15.0, 26.0, 22.0, 29.0, 30.0, 41.0, 33.0, 53.0, 57.0, 46.0, 52.0, 51.0, 47.0, 51.0, 52.0, 34.0, 40.0, 35.0, 28.0, 21.0, 19.0, 19.0, 21.0, 13.0, 14.0, 12.0, 11.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-113.3019027709961, -109.62720489501953, -105.95250701904297, -102.2778091430664, -98.60311126708984, -94.92840576171875, -91.25370788574219, -87.57901000976562, -83.90431213378906, -80.2296142578125, -76.55491638183594, -72.88021850585938, -69.20552062988281, -65.53082275390625, -61.85612106323242, -58.181419372558594, -54.5067253112793, -50.832027435302734, -47.15732955932617, -43.482627868652344, -39.80792999267578, -36.13323211669922, -32.458534240722656, -28.78383445739746, -25.1091365814209, -21.434438705444336, -17.75973892211914, -14.085041046142578, -10.4103422164917, -6.73564338684082, -3.060945510864258, 0.6137542724609375, 4.2884521484375, 7.963150978088379, 11.637849807739258, 15.31254768371582, 18.987247467041016, 22.661945343017578, 26.33664321899414, 30.011343002319336, 33.68604278564453, 37.360740661621094, 41.035438537597656, 44.71013641357422, 48.38483810424805, 52.05953598022461, 55.73423385620117, 59.408935546875, 63.0836296081543, 66.75833129882812, 70.43302917480469, 74.10772705078125, 77.78242492675781, 81.45712280273438, 85.13182067871094, 88.8065185546875, 92.48121643066406, 96.15591430664062, 99.83061218261719, 103.50531005859375, 107.18000793457031, 110.85470581054688, 114.52940368652344, 118.20410919189453, 121.8788070678711]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 10.0, 11.0, 11.0, 18.0, 31.0, 39.0, 49.0, 78.0, 132.0, 163.0, 216.0, 321.0, 461.0, 656.0, 966.0, 1310.0, 2040.0, 3047.0, 4903.0, 8224.0, 14585.0, 26989.0, 55106.0, 127880.0, 1066675.0, 2565366.0, 172143.0, 67401.0, 32774.0, 16997.0, 9475.0, 5613.0, 3384.0, 2170.0, 1411.0, 986.0, 670.0, 472.0, 347.0, 266.0, 200.0, 138.0, 123.0, 98.0, 69.0, 64.0, 57.0, 34.0, 28.0, 23.0, 20.0, 8.0, 9.0, 10.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0], "bins": [-70.75, -68.322265625, -65.89453125, -63.466796875, -61.0390625, -58.611328125, -56.18359375, -53.755859375, -51.328125, -48.900390625, -46.47265625, -44.044921875, -41.6171875, -39.189453125, -36.76171875, -34.333984375, -31.90625, -29.478515625, -27.05078125, -24.623046875, -22.1953125, -19.767578125, -17.33984375, -14.912109375, -12.484375, -10.056640625, -7.62890625, -5.201171875, -2.7734375, -0.345703125, 2.08203125, 4.509765625, 6.9375, 9.365234375, 11.79296875, 14.220703125, 16.6484375, 19.076171875, 21.50390625, 23.931640625, 26.359375, 28.787109375, 31.21484375, 33.642578125, 36.0703125, 38.498046875, 40.92578125, 43.353515625, 45.78125, 48.208984375, 50.63671875, 53.064453125, 55.4921875, 57.919921875, 60.34765625, 62.775390625, 65.203125, 67.630859375, 70.05859375, 72.486328125, 74.9140625, 77.341796875, 79.76953125, 82.197265625, 84.625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 7.0, 6.0, 8.0, 7.0, 12.0, 13.0, 11.0, 19.0, 25.0, 34.0, 25.0, 37.0, 42.0, 41.0, 42.0, 49.0, 57.0, 51.0, 45.0, 60.0, 44.0, 44.0, 41.0, 35.0, 40.0, 23.0, 27.0, 14.0, 19.0, 21.0, 23.0, 13.0, 5.0, 8.0, 7.0, 7.0, 3.0, 6.0, 1.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-15.3828125, -14.8883056640625, -14.393798828125, -13.8992919921875, -13.40478515625, -12.9102783203125, -12.415771484375, -11.9212646484375, -11.4267578125, -10.9322509765625, -10.437744140625, -9.9432373046875, -9.44873046875, -8.9542236328125, -8.459716796875, -7.9652099609375, -7.470703125, -6.9761962890625, -6.481689453125, -5.9871826171875, -5.49267578125, -4.9981689453125, -4.503662109375, -4.0091552734375, -3.5146484375, -3.0201416015625, -2.525634765625, -2.0311279296875, -1.53662109375, -1.0421142578125, -0.547607421875, -0.0531005859375, 0.44140625, 0.9359130859375, 1.430419921875, 1.9249267578125, 2.41943359375, 2.9139404296875, 3.408447265625, 3.9029541015625, 4.3974609375, 4.8919677734375, 5.386474609375, 5.8809814453125, 6.37548828125, 6.8699951171875, 7.364501953125, 7.8590087890625, 8.353515625, 8.8480224609375, 9.342529296875, 9.8370361328125, 10.33154296875, 10.8260498046875, 11.320556640625, 11.8150634765625, 12.3095703125, 12.8040771484375, 13.298583984375, 13.7930908203125, 14.28759765625, 14.7821044921875, 15.276611328125, 15.7711181640625, 16.265625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 8.0, 13.0, 29.0, 16.0, 47.0, 42.0, 68.0, 117.0, 141.0, 216.0, 292.0, 440.0, 607.0, 1075.0, 1630.0, 2727.0, 4952.0, 10132.0, 24595.0, 78437.0, 520568.0, 3247898.0, 217339.0, 47956.0, 17087.0, 7632.0, 4085.0, 2117.0, 1373.0, 811.0, 549.0, 394.0, 228.0, 185.0, 132.0, 96.0, 68.0, 58.0, 40.0, 26.0, 17.0, 10.0, 5.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-55.125, -53.4189453125, -51.712890625, -50.0068359375, -48.30078125, -46.5947265625, -44.888671875, -43.1826171875, -41.4765625, -39.7705078125, -38.064453125, -36.3583984375, -34.65234375, -32.9462890625, -31.240234375, -29.5341796875, -27.828125, -26.1220703125, -24.416015625, -22.7099609375, -21.00390625, -19.2978515625, -17.591796875, -15.8857421875, -14.1796875, -12.4736328125, -10.767578125, -9.0615234375, -7.35546875, -5.6494140625, -3.943359375, -2.2373046875, -0.53125, 1.1748046875, 2.880859375, 4.5869140625, 6.29296875, 7.9990234375, 9.705078125, 11.4111328125, 13.1171875, 14.8232421875, 16.529296875, 18.2353515625, 19.94140625, 21.6474609375, 23.353515625, 25.0595703125, 26.765625, 28.4716796875, 30.177734375, 31.8837890625, 33.58984375, 35.2958984375, 37.001953125, 38.7080078125, 40.4140625, 42.1201171875, 43.826171875, 45.5322265625, 47.23828125, 48.9443359375, 50.650390625, 52.3564453125, 54.0625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 10.0, 4.0, 9.0, 10.0, 18.0, 7.0, 14.0, 19.0, 14.0, 17.0, 24.0, 36.0, 45.0, 58.0, 62.0, 85.0, 112.0, 184.0, 260.0, 467.0, 714.0, 541.0, 354.0, 232.0, 163.0, 123.0, 113.0, 84.0, 66.0, 41.0, 34.0, 25.0, 33.0, 30.0, 18.0, 16.0, 7.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5703125, -10.29046630859375, -10.0106201171875, -9.73077392578125, -9.450927734375, -9.17108154296875, -8.8912353515625, -8.61138916015625, -8.33154296875, -8.05169677734375, -7.7718505859375, -7.49200439453125, -7.212158203125, -6.93231201171875, -6.6524658203125, -6.37261962890625, -6.0927734375, -5.81292724609375, -5.5330810546875, -5.25323486328125, -4.973388671875, -4.69354248046875, -4.4136962890625, -4.13385009765625, -3.85400390625, -3.57415771484375, -3.2943115234375, -3.01446533203125, -2.734619140625, -2.45477294921875, -2.1749267578125, -1.89508056640625, -1.615234375, -1.33538818359375, -1.0555419921875, -0.77569580078125, -0.495849609375, -0.21600341796875, 0.0638427734375, 0.34368896484375, 0.62353515625, 0.90338134765625, 1.1832275390625, 1.46307373046875, 1.742919921875, 2.02276611328125, 2.3026123046875, 2.58245849609375, 2.8623046875, 3.14215087890625, 3.4219970703125, 3.70184326171875, 3.981689453125, 4.26153564453125, 4.5413818359375, 4.82122802734375, 5.10107421875, 5.38092041015625, 5.6607666015625, 5.94061279296875, 6.220458984375, 6.50030517578125, 6.7801513671875, 7.05999755859375, 7.33984375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 11.0, 10.0, 16.0, 12.0, 31.0, 71.0, 130.0, 338.0, 274.0, 44.0, 24.0, 14.0, 2.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.86091995239258, -32.923831939697266, -30.98674201965332, -29.049652099609375, -27.112564086914062, -25.175474166870117, -23.238384246826172, -21.30129623413086, -19.364206314086914, -17.42711639404297, -15.490028381347656, -13.552938461303711, -11.615849494934082, -9.678760528564453, -7.741670608520508, -5.804581642150879, -3.86749267578125, -1.930403470993042, 0.006685733795166016, 1.9437751770019531, 3.880864143371582, 5.817953109741211, 7.755043029785156, 9.692131996154785, 11.629220962524414, 13.566309928894043, 15.503398895263672, 17.440488815307617, 19.377578735351562, 21.314666748046875, 23.25175666809082, 25.188846588134766, 27.125930786132812, 29.063020706176758, 31.00010871887207, 32.937198638916016, 34.87428665161133, 36.811378479003906, 38.74846649169922, 40.68555450439453, 42.622642517089844, 44.559730529785156, 46.496822357177734, 48.43391036987305, 50.37099838256836, 52.30809020996094, 54.24517822265625, 56.18226623535156, 58.11935806274414, 60.05644607543945, 61.99353790283203, 63.930625915527344, 65.86771392822266, 67.80480194091797, 69.74189758300781, 71.67898559570312, 73.61607360839844, 75.55316162109375, 77.49024963378906, 79.42733764648438, 81.36443328857422, 83.30152130126953, 85.23860931396484, 87.17569732666016, 89.11278533935547]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 4.0, 4.0, 9.0, 5.0, 5.0, 7.0, 11.0, 16.0, 12.0, 25.0, 29.0, 31.0, 36.0, 55.0, 44.0, 47.0, 39.0, 59.0, 54.0, 50.0, 59.0, 56.0, 39.0, 44.0, 46.0, 31.0, 36.0, 25.0, 19.0, 17.0, 22.0, 9.0, 12.0, 5.0, 6.0, 9.0, 9.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0], "bins": [-26.071685791015625, -25.326156616210938, -24.580629348754883, -23.835102081298828, -23.08957290649414, -22.344043731689453, -21.5985164642334, -20.852989196777344, -20.107460021972656, -19.36193084716797, -18.616403579711914, -17.87087631225586, -17.125347137451172, -16.379817962646484, -15.63429069519043, -14.888762474060059, -14.143234252929688, -13.397706031799316, -12.652177810668945, -11.906649589538574, -11.161121368408203, -10.415593147277832, -9.670064926147461, -8.92453670501709, -8.179008483886719, -7.433480262756348, -6.687952041625977, -5.9424238204956055, -5.196895599365234, -4.451367378234863, -3.705839157104492, -2.960310935974121, -2.214784622192383, -1.4692564010620117, -0.7237281799316406, 0.02180004119873047, 0.7673282623291016, 1.5128564834594727, 2.2583847045898438, 3.003912925720215, 3.749441146850586, 4.494969367980957, 5.240497589111328, 5.986025810241699, 6.73155403137207, 7.477082252502441, 8.222610473632812, 8.968138694763184, 9.713666915893555, 10.459195137023926, 11.204723358154297, 11.950251579284668, 12.695779800415039, 13.44130802154541, 14.186836242675781, 14.932364463806152, 15.677892684936523, 16.423419952392578, 17.168949127197266, 17.914478302001953, 18.660005569458008, 19.405532836914062, 20.15106201171875, 20.896591186523438, 21.642118453979492]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 7.0, 6.0, 10.0, 12.0, 16.0, 24.0, 37.0, 37.0, 52.0, 79.0, 102.0, 131.0, 188.0, 288.0, 412.0, 673.0, 1062.0, 1868.0, 3581.0, 7576.0, 19508.0, 67208.0, 356637.0, 462640.0, 85232.0, 23299.0, 8473.0, 3977.0, 2003.0, 1146.0, 709.0, 450.0, 298.0, 201.0, 157.0, 120.0, 83.0, 53.0, 51.0, 41.0, 24.0, 20.0, 18.0, 13.0, 9.0, 5.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-37.4375, -36.23291015625, -35.0283203125, -33.82373046875, -32.619140625, -31.41455078125, -30.2099609375, -29.00537109375, -27.80078125, -26.59619140625, -25.3916015625, -24.18701171875, -22.982421875, -21.77783203125, -20.5732421875, -19.36865234375, -18.1640625, -16.95947265625, -15.7548828125, -14.55029296875, -13.345703125, -12.14111328125, -10.9365234375, -9.73193359375, -8.52734375, -7.32275390625, -6.1181640625, -4.91357421875, -3.708984375, -2.50439453125, -1.2998046875, -0.09521484375, 1.109375, 2.31396484375, 3.5185546875, 4.72314453125, 5.927734375, 7.13232421875, 8.3369140625, 9.54150390625, 10.74609375, 11.95068359375, 13.1552734375, 14.35986328125, 15.564453125, 16.76904296875, 17.9736328125, 19.17822265625, 20.3828125, 21.58740234375, 22.7919921875, 23.99658203125, 25.201171875, 26.40576171875, 27.6103515625, 28.81494140625, 30.01953125, 31.22412109375, 32.4287109375, 33.63330078125, 34.837890625, 36.04248046875, 37.2470703125, 38.45166015625, 39.65625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 0.0, 7.0, 7.0, 11.0, 14.0, 9.0, 15.0, 22.0, 31.0, 27.0, 50.0, 39.0, 36.0, 46.0, 52.0, 43.0, 43.0, 48.0, 50.0, 47.0, 55.0, 51.0, 33.0, 38.0, 21.0, 28.0, 24.0, 17.0, 29.0, 18.0, 13.0, 12.0, 9.0, 5.0, 5.0, 5.0, 7.0, 5.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.78125, -17.200439453125, -16.61962890625, -16.038818359375, -15.4580078125, -14.877197265625, -14.29638671875, -13.715576171875, -13.134765625, -12.553955078125, -11.97314453125, -11.392333984375, -10.8115234375, -10.230712890625, -9.64990234375, -9.069091796875, -8.48828125, -7.907470703125, -7.32666015625, -6.745849609375, -6.1650390625, -5.584228515625, -5.00341796875, -4.422607421875, -3.841796875, -3.260986328125, -2.68017578125, -2.099365234375, -1.5185546875, -0.937744140625, -0.35693359375, 0.223876953125, 0.8046875, 1.385498046875, 1.96630859375, 2.547119140625, 3.1279296875, 3.708740234375, 4.28955078125, 4.870361328125, 5.451171875, 6.031982421875, 6.61279296875, 7.193603515625, 7.7744140625, 8.355224609375, 8.93603515625, 9.516845703125, 10.09765625, 10.678466796875, 11.25927734375, 11.840087890625, 12.4208984375, 13.001708984375, 13.58251953125, 14.163330078125, 14.744140625, 15.324951171875, 15.90576171875, 16.486572265625, 17.0673828125, 17.648193359375, 18.22900390625, 18.809814453125, 19.390625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 9.0, 14.0, 20.0, 27.0, 41.0, 76.0, 74.0, 104.0, 177.0, 214.0, 281.0, 411.0, 602.0, 796.0, 1211.0, 1723.0, 2640.0, 4296.0, 7580.0, 15995.0, 42290.0, 210479.0, 620713.0, 86153.0, 25387.0, 11006.0, 5715.0, 3429.0, 2214.0, 1473.0, 954.0, 713.0, 495.0, 379.0, 238.0, 199.0, 129.0, 81.0, 65.0, 44.0, 31.0, 23.0, 22.0, 10.0, 7.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.5625, -46.041015625, -44.51953125, -42.998046875, -41.4765625, -39.955078125, -38.43359375, -36.912109375, -35.390625, -33.869140625, -32.34765625, -30.826171875, -29.3046875, -27.783203125, -26.26171875, -24.740234375, -23.21875, -21.697265625, -20.17578125, -18.654296875, -17.1328125, -15.611328125, -14.08984375, -12.568359375, -11.046875, -9.525390625, -8.00390625, -6.482421875, -4.9609375, -3.439453125, -1.91796875, -0.396484375, 1.125, 2.646484375, 4.16796875, 5.689453125, 7.2109375, 8.732421875, 10.25390625, 11.775390625, 13.296875, 14.818359375, 16.33984375, 17.861328125, 19.3828125, 20.904296875, 22.42578125, 23.947265625, 25.46875, 26.990234375, 28.51171875, 30.033203125, 31.5546875, 33.076171875, 34.59765625, 36.119140625, 37.640625, 39.162109375, 40.68359375, 42.205078125, 43.7265625, 45.248046875, 46.76953125, 48.291015625, 49.8125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 6.0, 7.0, 7.0, 9.0, 9.0, 4.0, 11.0, 17.0, 23.0, 19.0, 23.0, 27.0, 23.0, 40.0, 36.0, 60.0, 79.0, 91.0, 77.0, 59.0, 60.0, 50.0, 42.0, 33.0, 29.0, 34.0, 21.0, 20.0, 14.0, 7.0, 12.0, 11.0, 11.0, 6.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.75, -25.970703125, -25.19140625, -24.412109375, -23.6328125, -22.853515625, -22.07421875, -21.294921875, -20.515625, -19.736328125, -18.95703125, -18.177734375, -17.3984375, -16.619140625, -15.83984375, -15.060546875, -14.28125, -13.501953125, -12.72265625, -11.943359375, -11.1640625, -10.384765625, -9.60546875, -8.826171875, -8.046875, -7.267578125, -6.48828125, -5.708984375, -4.9296875, -4.150390625, -3.37109375, -2.591796875, -1.8125, -1.033203125, -0.25390625, 0.525390625, 1.3046875, 2.083984375, 2.86328125, 3.642578125, 4.421875, 5.201171875, 5.98046875, 6.759765625, 7.5390625, 8.318359375, 9.09765625, 9.876953125, 10.65625, 11.435546875, 12.21484375, 12.994140625, 13.7734375, 14.552734375, 15.33203125, 16.111328125, 16.890625, 17.669921875, 18.44921875, 19.228515625, 20.0078125, 20.787109375, 21.56640625, 22.345703125, 23.125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 7.0, 15.0, 14.0, 14.0, 27.0, 30.0, 46.0, 86.0, 108.0, 152.0, 230.0, 327.0, 540.0, 938.0, 1568.0, 2893.0, 5905.0, 15428.0, 82126.0, 833286.0, 76935.0, 15205.0, 5815.0, 2777.0, 1594.0, 899.0, 534.0, 339.0, 216.0, 144.0, 105.0, 69.0, 58.0, 43.0, 18.0, 13.0, 16.0, 14.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-62.96875, -61.1943359375, -59.419921875, -57.6455078125, -55.87109375, -54.0966796875, -52.322265625, -50.5478515625, -48.7734375, -46.9990234375, -45.224609375, -43.4501953125, -41.67578125, -39.9013671875, -38.126953125, -36.3525390625, -34.578125, -32.8037109375, -31.029296875, -29.2548828125, -27.48046875, -25.7060546875, -23.931640625, -22.1572265625, -20.3828125, -18.6083984375, -16.833984375, -15.0595703125, -13.28515625, -11.5107421875, -9.736328125, -7.9619140625, -6.1875, -4.4130859375, -2.638671875, -0.8642578125, 0.91015625, 2.6845703125, 4.458984375, 6.2333984375, 8.0078125, 9.7822265625, 11.556640625, 13.3310546875, 15.10546875, 16.8798828125, 18.654296875, 20.4287109375, 22.203125, 23.9775390625, 25.751953125, 27.5263671875, 29.30078125, 31.0751953125, 32.849609375, 34.6240234375, 36.3984375, 38.1728515625, 39.947265625, 41.7216796875, 43.49609375, 45.2705078125, 47.044921875, 48.8193359375, 50.59375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 5.0, 4.0, 16.0, 9.0, 25.0, 31.0, 36.0, 62.0, 115.0, 207.0, 213.0, 89.0, 48.0, 42.0, 19.0, 24.0, 9.0, 11.0, 8.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0011777877807617188, -0.0011466816067695618, -0.0011155754327774048, -0.0010844692587852478, -0.0010533630847930908, -0.0010222569108009338, -0.0009911507368087769, -0.0009600445628166199, -0.0009289383888244629, -0.0008978322148323059, -0.0008667260408401489, -0.0008356198668479919, -0.000804513692855835, -0.000773407518863678, -0.000742301344871521, -0.000711195170879364, -0.000680088996887207, -0.00064898282289505, -0.0006178766489028931, -0.0005867704749107361, -0.0005556643009185791, -0.0005245581269264221, -0.0004934519529342651, -0.00046234577894210815, -0.00043123960494995117, -0.0004001334309577942, -0.0003690272569656372, -0.0003379210829734802, -0.00030681490898132324, -0.00027570873498916626, -0.0002446025609970093, -0.0002134963870048523, -0.0001823902130126953, -0.00015128403902053833, -0.00012017786502838135, -8.907169103622437e-05, -5.796551704406738e-05, -2.68593430519104e-05, 4.246830940246582e-06, 3.5353004932403564e-05, 6.645917892456055e-05, 9.756535291671753e-05, 0.0001286715269088745, 0.0001597777009010315, 0.00019088387489318848, 0.00022199004888534546, 0.00025309622287750244, 0.0002842023968696594, 0.0003153085708618164, 0.0003464147448539734, 0.00037752091884613037, 0.00040862709283828735, 0.00043973326683044434, 0.0004708394408226013, 0.0005019456148147583, 0.0005330517888069153, 0.0005641579627990723, 0.0005952641367912292, 0.0006263703107833862, 0.0006574764847755432, 0.0006885826587677002, 0.0007196888327598572, 0.0007507950067520142, 0.0007819011807441711, 0.0008130073547363281]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 4.0, 10.0, 11.0, 7.0, 16.0, 17.0, 19.0, 40.0, 48.0, 57.0, 86.0, 121.0, 168.0, 258.0, 402.0, 528.0, 928.0, 1625.0, 2857.0, 6357.0, 18209.0, 104595.0, 828471.0, 59046.0, 13377.0, 5041.0, 2385.0, 1357.0, 864.0, 513.0, 347.0, 247.0, 151.0, 121.0, 78.0, 46.0, 35.0, 38.0, 15.0, 21.0, 15.0, 6.0, 5.0, 4.0, 1.0, 8.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.84375, -52.12744140625, -50.4111328125, -48.69482421875, -46.978515625, -45.26220703125, -43.5458984375, -41.82958984375, -40.11328125, -38.39697265625, -36.6806640625, -34.96435546875, -33.248046875, -31.53173828125, -29.8154296875, -28.09912109375, -26.3828125, -24.66650390625, -22.9501953125, -21.23388671875, -19.517578125, -17.80126953125, -16.0849609375, -14.36865234375, -12.65234375, -10.93603515625, -9.2197265625, -7.50341796875, -5.787109375, -4.07080078125, -2.3544921875, -0.63818359375, 1.078125, 2.79443359375, 4.5107421875, 6.22705078125, 7.943359375, 9.65966796875, 11.3759765625, 13.09228515625, 14.80859375, 16.52490234375, 18.2412109375, 19.95751953125, 21.673828125, 23.39013671875, 25.1064453125, 26.82275390625, 28.5390625, 30.25537109375, 31.9716796875, 33.68798828125, 35.404296875, 37.12060546875, 38.8369140625, 40.55322265625, 42.26953125, 43.98583984375, 45.7021484375, 47.41845703125, 49.134765625, 50.85107421875, 52.5673828125, 54.28369140625, 56.0]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 5.0, 14.0, 9.0, 17.0, 23.0, 19.0, 22.0, 18.0, 41.0, 47.0, 68.0, 155.0, 211.0, 95.0, 53.0, 34.0, 30.0, 29.0, 20.0, 14.0, 17.0, 15.0, 4.0, 8.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.109375, -23.443359375, -22.77734375, -22.111328125, -21.4453125, -20.779296875, -20.11328125, -19.447265625, -18.78125, -18.115234375, -17.44921875, -16.783203125, -16.1171875, -15.451171875, -14.78515625, -14.119140625, -13.453125, -12.787109375, -12.12109375, -11.455078125, -10.7890625, -10.123046875, -9.45703125, -8.791015625, -8.125, -7.458984375, -6.79296875, -6.126953125, -5.4609375, -4.794921875, -4.12890625, -3.462890625, -2.796875, -2.130859375, -1.46484375, -0.798828125, -0.1328125, 0.533203125, 1.19921875, 1.865234375, 2.53125, 3.197265625, 3.86328125, 4.529296875, 5.1953125, 5.861328125, 6.52734375, 7.193359375, 7.859375, 8.525390625, 9.19140625, 9.857421875, 10.5234375, 11.189453125, 11.85546875, 12.521484375, 13.1875, 13.853515625, 14.51953125, 15.185546875, 15.8515625, 16.517578125, 17.18359375, 17.849609375, 18.515625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 9.0, 8.0, 18.0, 33.0, 72.0, 214.0, 508.0, 77.0, 24.0, 9.0, 8.0, 5.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.509647369384766, -23.459304809570312, -21.40896224975586, -19.358617782592773, -17.30827522277832, -15.257932662963867, -13.207589149475098, -11.157245635986328, -9.106903076171875, -7.056560039520264, -5.006217002868652, -2.955873966217041, -0.9055309295654297, 1.1448116302490234, 3.195155143737793, 5.2454986572265625, 7.295841217041016, 9.346183776855469, 11.396527290344238, 13.446870803833008, 15.497213363647461, 17.547555923461914, 19.597900390625, 21.648242950439453, 23.698585510253906, 25.74892807006836, 27.799270629882812, 29.8496150970459, 31.89995765686035, 33.95030212402344, 36.00064468383789, 38.050987243652344, 40.10133361816406, 42.151676177978516, 44.20201873779297, 46.25236129760742, 48.302703857421875, 50.353050231933594, 52.40339279174805, 54.4537353515625, 56.50407791137695, 58.554420471191406, 60.60476303100586, 62.65510559082031, 64.70545196533203, 66.75579071044922, 68.80613708496094, 70.85647583007812, 72.90682220458984, 74.95716857910156, 77.00750732421875, 79.05785369873047, 81.10819244384766, 83.15853881835938, 85.20887756347656, 87.25922393798828, 89.3095703125, 91.35991668701172, 93.4102554321289, 95.46060180664062, 97.51094055175781, 99.56128692626953, 101.61162567138672, 103.66197204589844, 105.71231079101562]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 10.0, 5.0, 6.0, 12.0, 10.0, 26.0, 21.0, 20.0, 36.0, 39.0, 58.0, 58.0, 56.0, 68.0, 72.0, 69.0, 58.0, 68.0, 62.0, 41.0, 40.0, 41.0, 25.0, 17.0, 21.0, 13.0, 8.0, 10.0, 6.0, 6.0, 2.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-29.521896362304688, -28.74603843688965, -27.97018051147461, -27.19432258605957, -26.41846466064453, -25.642606735229492, -24.866748809814453, -24.090892791748047, -23.315032958984375, -22.539175033569336, -21.763317108154297, -20.987459182739258, -20.21160125732422, -19.43574333190918, -18.65988540649414, -17.884029388427734, -17.108171463012695, -16.332313537597656, -15.556455612182617, -14.780597686767578, -14.004739761352539, -13.2288818359375, -12.453024864196777, -11.677166938781738, -10.9013090133667, -10.12545108795166, -9.349593162536621, -8.573736190795898, -7.797877788543701, -7.022019863128662, -6.246162414550781, -5.470304489135742, -4.694446563720703, -3.918588638305664, -3.142730951309204, -2.366873264312744, -1.591015338897705, -0.815157413482666, -0.039299964904785156, 0.7365579605102539, 1.512415885925293, 2.288273811340332, 3.064131498336792, 3.839989185333252, 4.615847110748291, 5.39170503616333, 6.167562484741211, 6.94342041015625, 7.719278335571289, 8.495136260986328, 9.270994186401367, 10.046852111816406, 10.822710037231445, 11.598567962646484, 12.374424934387207, 13.150282859802246, 13.926140785217285, 14.701998710632324, 15.477856636047363, 16.253713607788086, 17.029571533203125, 17.805429458618164, 18.581287384033203, 19.357145309448242, 20.13300323486328]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 10.0, 12.0, 12.0, 25.0, 19.0, 21.0, 54.0, 75.0, 94.0, 165.0, 307.0, 492.0, 940.0, 2062.0, 5258.0, 14508.0, 49145.0, 222098.0, 567363.0, 134302.0, 33546.0, 10583.0, 3889.0, 1637.0, 804.0, 432.0, 216.0, 158.0, 97.0, 56.0, 45.0, 28.0, 19.0, 21.0, 11.0, 12.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.65625, -45.16796875, -43.6796875, -42.19140625, -40.703125, -39.21484375, -37.7265625, -36.23828125, -34.75, -33.26171875, -31.7734375, -30.28515625, -28.796875, -27.30859375, -25.8203125, -24.33203125, -22.84375, -21.35546875, -19.8671875, -18.37890625, -16.890625, -15.40234375, -13.9140625, -12.42578125, -10.9375, -9.44921875, -7.9609375, -6.47265625, -4.984375, -3.49609375, -2.0078125, -0.51953125, 0.96875, 2.45703125, 3.9453125, 5.43359375, 6.921875, 8.41015625, 9.8984375, 11.38671875, 12.875, 14.36328125, 15.8515625, 17.33984375, 18.828125, 20.31640625, 21.8046875, 23.29296875, 24.78125, 26.26953125, 27.7578125, 29.24609375, 30.734375, 32.22265625, 33.7109375, 35.19921875, 36.6875, 38.17578125, 39.6640625, 41.15234375, 42.640625, 44.12890625, 45.6171875, 47.10546875, 48.59375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 13.0, 16.0, 22.0, 18.0, 35.0, 34.0, 54.0, 70.0, 76.0, 73.0, 100.0, 67.0, 72.0, 74.0, 62.0, 46.0, 28.0, 36.0, 27.0, 7.0, 14.0, 11.0, 8.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.515625, -17.0528564453125, -16.590087890625, -16.1273193359375, -15.66455078125, -15.2017822265625, -14.739013671875, -14.2762451171875, -13.8134765625, -13.3507080078125, -12.887939453125, -12.4251708984375, -11.96240234375, -11.4996337890625, -11.036865234375, -10.5740966796875, -10.111328125, -9.6485595703125, -9.185791015625, -8.7230224609375, -8.26025390625, -7.7974853515625, -7.334716796875, -6.8719482421875, -6.4091796875, -5.9464111328125, -5.483642578125, -5.0208740234375, -4.55810546875, -4.0953369140625, -3.632568359375, -3.1697998046875, -2.70703125, -2.2442626953125, -1.781494140625, -1.3187255859375, -0.85595703125, -0.3931884765625, 0.069580078125, 0.5323486328125, 0.9951171875, 1.4578857421875, 1.920654296875, 2.3834228515625, 2.84619140625, 3.3089599609375, 3.771728515625, 4.2344970703125, 4.697265625, 5.1600341796875, 5.622802734375, 6.0855712890625, 6.54833984375, 7.0111083984375, 7.473876953125, 7.9366455078125, 8.3994140625, 8.8621826171875, 9.324951171875, 9.7877197265625, 10.25048828125, 10.7132568359375, 11.176025390625, 11.6387939453125, 12.1015625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 5.0, 10.0, 20.0, 27.0, 30.0, 43.0, 66.0, 70.0, 105.0, 148.0, 228.0, 289.0, 406.0, 626.0, 854.0, 1271.0, 1913.0, 3042.0, 5189.0, 9080.0, 16776.0, 36337.0, 97883.0, 515457.0, 238181.0, 62466.0, 25995.0, 12946.0, 7071.0, 4190.0, 2529.0, 1667.0, 1125.0, 732.0, 505.0, 330.0, 272.0, 185.0, 147.0, 71.0, 72.0, 50.0, 42.0, 30.0, 21.0, 15.0, 12.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-33.46875, -32.4482421875, -31.427734375, -30.4072265625, -29.38671875, -28.3662109375, -27.345703125, -26.3251953125, -25.3046875, -24.2841796875, -23.263671875, -22.2431640625, -21.22265625, -20.2021484375, -19.181640625, -18.1611328125, -17.140625, -16.1201171875, -15.099609375, -14.0791015625, -13.05859375, -12.0380859375, -11.017578125, -9.9970703125, -8.9765625, -7.9560546875, -6.935546875, -5.9150390625, -4.89453125, -3.8740234375, -2.853515625, -1.8330078125, -0.8125, 0.2080078125, 1.228515625, 2.2490234375, 3.26953125, 4.2900390625, 5.310546875, 6.3310546875, 7.3515625, 8.3720703125, 9.392578125, 10.4130859375, 11.43359375, 12.4541015625, 13.474609375, 14.4951171875, 15.515625, 16.5361328125, 17.556640625, 18.5771484375, 19.59765625, 20.6181640625, 21.638671875, 22.6591796875, 23.6796875, 24.7001953125, 25.720703125, 26.7412109375, 27.76171875, 28.7822265625, 29.802734375, 30.8232421875, 31.84375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 9.0, 4.0, 6.0, 7.0, 5.0, 5.0, 15.0, 9.0, 21.0, 17.0, 18.0, 21.0, 23.0, 22.0, 35.0, 30.0, 36.0, 45.0, 42.0, 50.0, 55.0, 51.0, 36.0, 45.0, 39.0, 46.0, 32.0, 29.0, 31.0, 17.0, 21.0, 25.0, 27.0, 21.0, 12.0, 15.0, 10.0, 12.0, 10.0, 10.0, 9.0, 6.0, 2.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.21875, -9.8831787109375, -9.547607421875, -9.2120361328125, -8.87646484375, -8.5408935546875, -8.205322265625, -7.8697509765625, -7.5341796875, -7.1986083984375, -6.863037109375, -6.5274658203125, -6.19189453125, -5.8563232421875, -5.520751953125, -5.1851806640625, -4.849609375, -4.5140380859375, -4.178466796875, -3.8428955078125, -3.50732421875, -3.1717529296875, -2.836181640625, -2.5006103515625, -2.1650390625, -1.8294677734375, -1.493896484375, -1.1583251953125, -0.82275390625, -0.4871826171875, -0.151611328125, 0.1839599609375, 0.51953125, 0.8551025390625, 1.190673828125, 1.5262451171875, 1.86181640625, 2.1973876953125, 2.532958984375, 2.8685302734375, 3.2041015625, 3.5396728515625, 3.875244140625, 4.2108154296875, 4.54638671875, 4.8819580078125, 5.217529296875, 5.5531005859375, 5.888671875, 6.2242431640625, 6.559814453125, 6.8953857421875, 7.23095703125, 7.5665283203125, 7.902099609375, 8.2376708984375, 8.5732421875, 8.9088134765625, 9.244384765625, 9.5799560546875, 9.91552734375, 10.2510986328125, 10.586669921875, 10.9222412109375, 11.2578125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 11.0, 10.0, 20.0, 17.0, 21.0, 29.0, 30.0, 46.0, 62.0, 76.0, 121.0, 198.0, 233.0, 346.0, 588.0, 1133.0, 2506.0, 10685.0, 973460.0, 50257.0, 4739.0, 1639.0, 751.0, 476.0, 330.0, 207.0, 143.0, 100.0, 76.0, 49.0, 43.0, 33.0, 21.0, 13.0, 16.0, 12.0, 11.0, 7.0, 10.0, 3.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-315.5, -306.15625, -296.8125, -287.46875, -278.125, -268.78125, -259.4375, -250.09375, -240.75, -231.40625, -222.0625, -212.71875, -203.375, -194.03125, -184.6875, -175.34375, -166.0, -156.65625, -147.3125, -137.96875, -128.625, -119.28125, -109.9375, -100.59375, -91.25, -81.90625, -72.5625, -63.21875, -53.875, -44.53125, -35.1875, -25.84375, -16.5, -7.15625, 2.1875, 11.53125, 20.875, 30.21875, 39.5625, 48.90625, 58.25, 67.59375, 76.9375, 86.28125, 95.625, 104.96875, 114.3125, 123.65625, 133.0, 142.34375, 151.6875, 161.03125, 170.375, 179.71875, 189.0625, 198.40625, 207.75, 217.09375, 226.4375, 235.78125, 245.125, 254.46875, 263.8125, 273.15625, 282.5]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 12.0, 23.0, 56.0, 238.0, 469.0, 144.0, 38.0, 14.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006443023681640625, -0.006222784519195557, -0.006002545356750488, -0.00578230619430542, -0.0055620670318603516, -0.005341827869415283, -0.005121588706970215, -0.0049013495445251465, -0.004681110382080078, -0.00446087121963501, -0.004240632057189941, -0.004020392894744873, -0.0038001537322998047, -0.0035799145698547363, -0.003359675407409668, -0.0031394362449645996, -0.0029191970825195312, -0.002698957920074463, -0.0024787187576293945, -0.002258479595184326, -0.002038240432739258, -0.0018180012702941895, -0.001597762107849121, -0.0013775229454040527, -0.0011572837829589844, -0.000937044620513916, -0.0007168054580688477, -0.0004965662956237793, -0.00027632713317871094, -5.608797073364258e-05, 0.00016415119171142578, 0.00038439035415649414, 0.0006046295166015625, 0.0008248686790466309, 0.0010451078414916992, 0.0012653470039367676, 0.001485586166381836, 0.0017058253288269043, 0.0019260644912719727, 0.002146303653717041, 0.0023665428161621094, 0.0025867819786071777, 0.002807021141052246, 0.0030272603034973145, 0.003247499465942383, 0.003467738628387451, 0.0036879777908325195, 0.003908216953277588, 0.004128456115722656, 0.004348695278167725, 0.004568934440612793, 0.004789173603057861, 0.00500941276550293, 0.005229651927947998, 0.005449891090393066, 0.005670130252838135, 0.005890369415283203, 0.0061106085777282715, 0.00633084774017334, 0.006551086902618408, 0.0067713260650634766, 0.006991565227508545, 0.007211804389953613, 0.007432043552398682, 0.00765228271484375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 6.0, 14.0, 13.0, 15.0, 22.0, 18.0, 33.0, 37.0, 52.0, 92.0, 128.0, 193.0, 285.0, 432.0, 908.0, 2325.0, 11223.0, 987276.0, 38403.0, 4034.0, 1382.0, 582.0, 340.0, 220.0, 148.0, 107.0, 69.0, 48.0, 31.0, 24.0, 23.0, 17.0, 8.0, 7.0, 8.0, 6.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-329.75, -318.65234375, -307.5546875, -296.45703125, -285.359375, -274.26171875, -263.1640625, -252.06640625, -240.96875, -229.87109375, -218.7734375, -207.67578125, -196.578125, -185.48046875, -174.3828125, -163.28515625, -152.1875, -141.08984375, -129.9921875, -118.89453125, -107.796875, -96.69921875, -85.6015625, -74.50390625, -63.40625, -52.30859375, -41.2109375, -30.11328125, -19.015625, -7.91796875, 3.1796875, 14.27734375, 25.375, 36.47265625, 47.5703125, 58.66796875, 69.765625, 80.86328125, 91.9609375, 103.05859375, 114.15625, 125.25390625, 136.3515625, 147.44921875, 158.546875, 169.64453125, 180.7421875, 191.83984375, 202.9375, 214.03515625, 225.1328125, 236.23046875, 247.328125, 258.42578125, 269.5234375, 280.62109375, 291.71875, 302.81640625, 313.9140625, 325.01171875, 336.109375, 347.20703125, 358.3046875, 369.40234375, 380.5]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 3.0, 14.0, 36.0, 85.0, 186.0, 345.0, 173.0, 80.0, 28.0, 10.0, 8.0, 5.0, 2.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-53.34375, -51.7939453125, -50.244140625, -48.6943359375, -47.14453125, -45.5947265625, -44.044921875, -42.4951171875, -40.9453125, -39.3955078125, -37.845703125, -36.2958984375, -34.74609375, -33.1962890625, -31.646484375, -30.0966796875, -28.546875, -26.9970703125, -25.447265625, -23.8974609375, -22.34765625, -20.7978515625, -19.248046875, -17.6982421875, -16.1484375, -14.5986328125, -13.048828125, -11.4990234375, -9.94921875, -8.3994140625, -6.849609375, -5.2998046875, -3.75, -2.2001953125, -0.650390625, 0.8994140625, 2.44921875, 3.9990234375, 5.548828125, 7.0986328125, 8.6484375, 10.1982421875, 11.748046875, 13.2978515625, 14.84765625, 16.3974609375, 17.947265625, 19.4970703125, 21.046875, 22.5966796875, 24.146484375, 25.6962890625, 27.24609375, 28.7958984375, 30.345703125, 31.8955078125, 33.4453125, 34.9951171875, 36.544921875, 38.0947265625, 39.64453125, 41.1943359375, 42.744140625, 44.2939453125, 45.84375]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 7.0, 4.0, 2.0, 5.0, 7.0, 9.0, 3.0, 7.0, 7.0, 7.0, 15.0, 22.0, 13.0, 15.0, 32.0, 31.0, 73.0, 106.0, 208.0, 343.0, 51.0, 10.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.80369567871094, -41.900936126708984, -40.9981803894043, -40.095420837402344, -39.192665100097656, -38.2899055480957, -37.38714599609375, -36.48439025878906, -35.58163070678711, -34.678871154785156, -33.77611541748047, -32.873355865478516, -31.970598220825195, -31.067840576171875, -30.165082931518555, -29.262325286865234, -28.359567642211914, -27.456809997558594, -26.554052352905273, -25.651294708251953, -24.74853515625, -23.84577751159668, -22.94301986694336, -22.04026222229004, -21.13750457763672, -20.2347469329834, -19.331989288330078, -18.429229736328125, -17.526472091674805, -16.623714447021484, -15.720956802368164, -14.818199157714844, -13.915441513061523, -13.012683868408203, -12.109925270080566, -11.207167625427246, -10.30440902709961, -9.401651382446289, -8.498893737792969, -7.59613561630249, -6.693377494812012, -5.790619373321533, -4.887861251831055, -3.9851036071777344, -3.082345485687256, -2.1795873641967773, -1.276829719543457, -0.3740715980529785, 0.5286865234375, 1.431444525718689, 2.334202527999878, 3.2369604110717773, 4.139718532562256, 5.042476654052734, 5.945234298706055, 6.847992420196533, 7.750750541687012, 8.653508186340332, 9.556266784667969, 10.459024429321289, 11.36178207397461, 12.264540672302246, 13.167298316955566, 14.070056915283203, 14.972814559936523]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 7.0, 5.0, 4.0, 7.0, 12.0, 11.0, 10.0, 14.0, 31.0, 22.0, 39.0, 42.0, 55.0, 48.0, 63.0, 81.0, 86.0, 67.0, 74.0, 67.0, 49.0, 47.0, 37.0, 24.0, 21.0, 23.0, 13.0, 10.0, 6.0, 9.0, 4.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.38955307006836, -16.737333297729492, -16.085115432739258, -15.43289566040039, -14.780675888061523, -14.128457069396973, -13.476238250732422, -12.824018478393555, -12.171798706054688, -11.519579887390137, -10.86736011505127, -10.215141296386719, -9.562921524047852, -8.9107027053833, -8.25848388671875, -7.606264114379883, -6.954045295715332, -6.301826000213623, -5.649606704711914, -4.997387886047363, -4.345168113708496, -3.692949056625366, -3.0407299995422363, -2.3885107040405273, -1.7362914085388184, -1.0840721130371094, -0.43185293674468994, 0.2203662395477295, 0.8725855350494385, 1.5248048305511475, 2.1770238876342773, 2.8292431831359863, 3.4814624786376953, 4.133681774139404, 4.785901069641113, 5.438119888305664, 6.090339660644531, 6.742558479309082, 7.394777774810791, 8.0469970703125, 8.699216842651367, 9.351435661315918, 10.003655433654785, 10.655874252319336, 11.308094024658203, 11.960312843322754, 12.612531661987305, 13.264751434326172, 13.916970252990723, 14.569189071655273, 15.22140884399414, 15.873627662658691, 16.525846481323242, 17.17806625366211, 17.830286026000977, 18.482505798339844, 19.134723663330078, 19.786943435668945, 20.43916130065918, 21.091381072998047, 21.743600845336914, 22.39582061767578, 23.048038482666016, 23.700258255004883, 24.35247802734375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 9.0, 12.0, 17.0, 28.0, 41.0, 50.0, 84.0, 115.0, 140.0, 208.0, 285.0, 386.0, 603.0, 872.0, 1307.0, 2076.0, 3076.0, 4962.0, 8097.0, 13095.0, 23229.0, 43873.0, 91683.0, 234814.0, 2168860.0, 1246298.0, 185771.0, 76904.0, 37351.0, 19941.0, 11166.0, 6656.0, 4310.0, 2753.0, 1670.0, 1138.0, 769.0, 500.0, 351.0, 240.0, 173.0, 120.0, 86.0, 49.0, 36.0, 20.0, 15.0, 14.0, 12.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.4375, -10.1102294921875, -9.782958984375, -9.4556884765625, -9.12841796875, -8.8011474609375, -8.473876953125, -8.1466064453125, -7.8193359375, -7.4920654296875, -7.164794921875, -6.8375244140625, -6.51025390625, -6.1829833984375, -5.855712890625, -5.5284423828125, -5.201171875, -4.8739013671875, -4.546630859375, -4.2193603515625, -3.89208984375, -3.5648193359375, -3.237548828125, -2.9102783203125, -2.5830078125, -2.2557373046875, -1.928466796875, -1.6011962890625, -1.27392578125, -0.9466552734375, -0.619384765625, -0.2921142578125, 0.03515625, 0.3624267578125, 0.689697265625, 1.0169677734375, 1.34423828125, 1.6715087890625, 1.998779296875, 2.3260498046875, 2.6533203125, 2.9805908203125, 3.307861328125, 3.6351318359375, 3.96240234375, 4.2896728515625, 4.616943359375, 4.9442138671875, 5.271484375, 5.5987548828125, 5.926025390625, 6.2532958984375, 6.58056640625, 6.9078369140625, 7.235107421875, 7.5623779296875, 7.8896484375, 8.2169189453125, 8.544189453125, 8.8714599609375, 9.19873046875, 9.5260009765625, 9.853271484375, 10.1805419921875, 10.5078125]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 7.0, 6.0, 10.0, 11.0, 11.0, 19.0, 15.0, 26.0, 33.0, 26.0, 41.0, 44.0, 42.0, 47.0, 51.0, 52.0, 62.0, 59.0, 70.0, 53.0, 58.0, 41.0, 43.0, 29.0, 35.0, 24.0, 21.0, 17.0, 9.0, 6.0, 12.0, 8.0, 4.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462890625, -2.379730224609375, -2.29656982421875, -2.213409423828125, -2.1302490234375, -2.047088623046875, -1.96392822265625, -1.880767822265625, -1.797607421875, -1.714447021484375, -1.63128662109375, -1.548126220703125, -1.4649658203125, -1.381805419921875, -1.29864501953125, -1.215484619140625, -1.13232421875, -1.049163818359375, -0.96600341796875, -0.882843017578125, -0.7996826171875, -0.716522216796875, -0.63336181640625, -0.550201416015625, -0.467041015625, -0.383880615234375, -0.30072021484375, -0.217559814453125, -0.1343994140625, -0.051239013671875, 0.03192138671875, 0.115081787109375, 0.1982421875, 0.281402587890625, 0.36456298828125, 0.447723388671875, 0.5308837890625, 0.614044189453125, 0.69720458984375, 0.780364990234375, 0.863525390625, 0.946685791015625, 1.02984619140625, 1.113006591796875, 1.1961669921875, 1.279327392578125, 1.36248779296875, 1.445648193359375, 1.52880859375, 1.611968994140625, 1.69512939453125, 1.778289794921875, 1.8614501953125, 1.944610595703125, 2.02777099609375, 2.110931396484375, 2.194091796875, 2.277252197265625, 2.36041259765625, 2.443572998046875, 2.5267333984375, 2.609893798828125, 2.69305419921875, 2.776214599609375, 2.859375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 12.0, 14.0, 17.0, 26.0, 34.0, 49.0, 83.0, 128.0, 177.0, 260.0, 384.0, 681.0, 1088.0, 1848.0, 3540.0, 7318.0, 16981.0, 49304.0, 216789.0, 2578011.0, 1123768.0, 132321.0, 35140.0, 13109.0, 6093.0, 2930.0, 1605.0, 922.0, 585.0, 336.0, 218.0, 170.0, 88.0, 73.0, 43.0, 39.0, 28.0, 16.0, 14.0, 8.0, 8.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.31640625, -7.07928466796875, -6.8421630859375, -6.60504150390625, -6.367919921875, -6.13079833984375, -5.8936767578125, -5.65655517578125, -5.41943359375, -5.18231201171875, -4.9451904296875, -4.70806884765625, -4.470947265625, -4.23382568359375, -3.9967041015625, -3.75958251953125, -3.5224609375, -3.28533935546875, -3.0482177734375, -2.81109619140625, -2.573974609375, -2.33685302734375, -2.0997314453125, -1.86260986328125, -1.62548828125, -1.38836669921875, -1.1512451171875, -0.91412353515625, -0.677001953125, -0.43988037109375, -0.2027587890625, 0.03436279296875, 0.271484375, 0.50860595703125, 0.7457275390625, 0.98284912109375, 1.219970703125, 1.45709228515625, 1.6942138671875, 1.93133544921875, 2.16845703125, 2.40557861328125, 2.6427001953125, 2.87982177734375, 3.116943359375, 3.35406494140625, 3.5911865234375, 3.82830810546875, 4.0654296875, 4.30255126953125, 4.5396728515625, 4.77679443359375, 5.013916015625, 5.25103759765625, 5.4881591796875, 5.72528076171875, 5.96240234375, 6.19952392578125, 6.4366455078125, 6.67376708984375, 6.910888671875, 7.14801025390625, 7.3851318359375, 7.62225341796875, 7.859375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 5.0, 6.0, 3.0, 6.0, 10.0, 12.0, 8.0, 22.0, 31.0, 28.0, 51.0, 48.0, 56.0, 60.0, 86.0, 84.0, 143.0, 176.0, 247.0, 304.0, 356.0, 402.0, 374.0, 337.0, 238.0, 227.0, 186.0, 125.0, 110.0, 87.0, 68.0, 47.0, 35.0, 30.0, 21.0, 9.0, 13.0, 7.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3291015625, -1.2925567626953125, -1.256011962890625, -1.2194671630859375, -1.18292236328125, -1.1463775634765625, -1.109832763671875, -1.0732879638671875, -1.0367431640625, -1.0001983642578125, -0.963653564453125, -0.9271087646484375, -0.89056396484375, -0.8540191650390625, -0.817474365234375, -0.7809295654296875, -0.744384765625, -0.7078399658203125, -0.671295166015625, -0.6347503662109375, -0.59820556640625, -0.5616607666015625, -0.525115966796875, -0.4885711669921875, -0.4520263671875, -0.4154815673828125, -0.378936767578125, -0.3423919677734375, -0.30584716796875, -0.2693023681640625, -0.232757568359375, -0.1962127685546875, -0.15966796875, -0.1231231689453125, -0.086578369140625, -0.0500335693359375, -0.01348876953125, 0.0230560302734375, 0.059600830078125, 0.0961456298828125, 0.1326904296875, 0.1692352294921875, 0.205780029296875, 0.2423248291015625, 0.27886962890625, 0.3154144287109375, 0.351959228515625, 0.3885040283203125, 0.425048828125, 0.4615936279296875, 0.498138427734375, 0.5346832275390625, 0.57122802734375, 0.6077728271484375, 0.644317626953125, 0.6808624267578125, 0.7174072265625, 0.7539520263671875, 0.790496826171875, 0.8270416259765625, 0.86358642578125, 0.9001312255859375, 0.936676025390625, 0.9732208251953125, 1.009765625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 8.0, 11.0, 16.0, 20.0, 66.0, 192.0, 457.0, 151.0, 40.0, 16.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.987723350524902, -8.636414527893066, -8.28510570526123, -7.933796405792236, -7.582487106323242, -7.231178283691406, -6.87986946105957, -6.528560638427734, -6.17725133895874, -5.825942516326904, -5.47463321685791, -5.123324394226074, -4.772015571594238, -4.420706272125244, -4.069397449493408, -3.718088388442993, -3.366779327392578, -3.015470266342163, -2.664161205291748, -2.312852382659912, -1.961543321609497, -1.610234260559082, -1.258925437927246, -0.907616376876831, -0.556307315826416, -0.20499831438064575, 0.1463106870651245, 0.49761962890625, 0.848928689956665, 1.20023775100708, 1.551546573638916, 1.902855634689331, 2.2541656494140625, 2.6054747104644775, 2.9567837715148926, 3.3080925941467285, 3.6594016551971436, 4.010710716247559, 4.3620195388793945, 4.7133283615112305, 5.064637660980225, 5.4159464836120605, 5.767255783081055, 6.118564605712891, 6.469873428344727, 6.821182727813721, 7.172491550445557, 7.523800849914551, 7.875109672546387, 8.226418495178223, 8.577727317810059, 8.929037094116211, 9.280345916748047, 9.631654739379883, 9.982963562011719, 10.334272384643555, 10.68558120727539, 11.036890029907227, 11.388198852539062, 11.739507675170898, 12.09081745147705, 12.442126274108887, 12.793435096740723, 13.144743919372559, 13.496053695678711]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 9.0, 8.0, 12.0, 8.0, 14.0, 13.0, 22.0, 18.0, 36.0, 37.0, 31.0, 39.0, 40.0, 54.0, 51.0, 55.0, 39.0, 75.0, 55.0, 44.0, 50.0, 39.0, 45.0, 33.0, 23.0, 28.0, 13.0, 16.0, 18.0, 15.0, 12.0, 5.0, 13.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8062503337860107, -2.7200124263763428, -2.6337742805480957, -2.5475363731384277, -2.4612984657287598, -2.375060558319092, -2.2888224124908447, -2.2025845050811768, -2.1163463592529297, -2.0301084518432617, -1.9438704252243042, -1.8576323986053467, -1.7713944911956787, -1.6851564645767212, -1.5989184379577637, -1.5126805305480957, -1.4264426231384277, -1.3402045965194702, -1.2539666891098022, -1.1677286624908447, -1.0814907550811768, -0.9952527284622192, -0.9090147018432617, -0.822776734828949, -0.7365387678146362, -0.6503008008003235, -0.5640628337860107, -0.4778248071670532, -0.3915868401527405, -0.30534887313842773, -0.21911084651947021, -0.13287287950515747, -0.04663515090942383, 0.03960283100605011, 0.12584081292152405, 0.21207880973815918, 0.2983167767524719, 0.38455474376678467, 0.4707927703857422, 0.5570307374000549, 0.6432687044143677, 0.7295066714286804, 0.8157446384429932, 0.9019826650619507, 0.9882206320762634, 1.0744585990905762, 1.1606966257095337, 1.2469346523284912, 1.3331725597381592, 1.4194105863571167, 1.5056484937667847, 1.5918865203857422, 1.6781244277954102, 1.7643624544143677, 1.8506004810333252, 1.9368383884429932, 2.0230765342712402, 2.109314441680908, 2.1955525875091553, 2.2817904949188232, 2.368028402328491, 2.4542665481567383, 2.5405044555664062, 2.626742362976074, 2.712980270385742]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 14.0, 18.0, 21.0, 27.0, 38.0, 62.0, 88.0, 104.0, 156.0, 260.0, 413.0, 675.0, 1051.0, 1678.0, 2942.0, 5701.0, 12958.0, 37895.0, 204951.0, 627763.0, 105593.0, 25570.0, 9709.0, 4504.0, 2468.0, 1414.0, 854.0, 564.0, 323.0, 230.0, 155.0, 93.0, 56.0, 50.0, 33.0, 31.0, 19.0, 13.0, 9.0, 4.0, 9.0, 6.0, 7.0, 1.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0], "bins": [-4.87890625, -4.7325439453125, -4.586181640625, -4.4398193359375, -4.29345703125, -4.1470947265625, -4.000732421875, -3.8543701171875, -3.7080078125, -3.5616455078125, -3.415283203125, -3.2689208984375, -3.12255859375, -2.9761962890625, -2.829833984375, -2.6834716796875, -2.537109375, -2.3907470703125, -2.244384765625, -2.0980224609375, -1.95166015625, -1.8052978515625, -1.658935546875, -1.5125732421875, -1.3662109375, -1.2198486328125, -1.073486328125, -0.9271240234375, -0.78076171875, -0.6343994140625, -0.488037109375, -0.3416748046875, -0.1953125, -0.0489501953125, 0.097412109375, 0.2437744140625, 0.39013671875, 0.5364990234375, 0.682861328125, 0.8292236328125, 0.9755859375, 1.1219482421875, 1.268310546875, 1.4146728515625, 1.56103515625, 1.7073974609375, 1.853759765625, 2.0001220703125, 2.146484375, 2.2928466796875, 2.439208984375, 2.5855712890625, 2.73193359375, 2.8782958984375, 3.024658203125, 3.1710205078125, 3.3173828125, 3.4637451171875, 3.610107421875, 3.7564697265625, 3.90283203125, 4.0491943359375, 4.195556640625, 4.3419189453125, 4.48828125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 7.0, 6.0, 7.0, 7.0, 18.0, 11.0, 20.0, 31.0, 24.0, 26.0, 40.0, 28.0, 54.0, 51.0, 40.0, 44.0, 52.0, 56.0, 60.0, 57.0, 45.0, 55.0, 34.0, 33.0, 28.0, 24.0, 22.0, 16.0, 17.0, 12.0, 11.0, 14.0, 12.0, 9.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.330078125, -2.257171630859375, -2.18426513671875, -2.111358642578125, -2.0384521484375, -1.965545654296875, -1.89263916015625, -1.819732666015625, -1.746826171875, -1.673919677734375, -1.60101318359375, -1.528106689453125, -1.4552001953125, -1.382293701171875, -1.30938720703125, -1.236480712890625, -1.16357421875, -1.090667724609375, -1.01776123046875, -0.944854736328125, -0.8719482421875, -0.799041748046875, -0.72613525390625, -0.653228759765625, -0.580322265625, -0.507415771484375, -0.43450927734375, -0.361602783203125, -0.2886962890625, -0.215789794921875, -0.14288330078125, -0.069976806640625, 0.0029296875, 0.075836181640625, 0.14874267578125, 0.221649169921875, 0.2945556640625, 0.367462158203125, 0.44036865234375, 0.513275146484375, 0.586181640625, 0.659088134765625, 0.73199462890625, 0.804901123046875, 0.8778076171875, 0.950714111328125, 1.02362060546875, 1.096527099609375, 1.16943359375, 1.242340087890625, 1.31524658203125, 1.388153076171875, 1.4610595703125, 1.533966064453125, 1.60687255859375, 1.679779052734375, 1.752685546875, 1.825592041015625, 1.89849853515625, 1.971405029296875, 2.0443115234375, 2.117218017578125, 2.19012451171875, 2.263031005859375, 2.3359375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 9.0, 4.0, 5.0, 10.0, 10.0, 21.0, 24.0, 46.0, 76.0, 75.0, 134.0, 206.0, 268.0, 401.0, 648.0, 996.0, 1829.0, 3116.0, 6301.0, 16181.0, 70663.0, 704999.0, 195628.0, 27907.0, 9163.0, 4094.0, 2168.0, 1239.0, 804.0, 513.0, 330.0, 207.0, 128.0, 111.0, 79.0, 44.0, 38.0, 23.0, 21.0, 12.0, 13.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3671875, -5.1802978515625, -4.993408203125, -4.8065185546875, -4.61962890625, -4.4327392578125, -4.245849609375, -4.0589599609375, -3.8720703125, -3.6851806640625, -3.498291015625, -3.3114013671875, -3.12451171875, -2.9376220703125, -2.750732421875, -2.5638427734375, -2.376953125, -2.1900634765625, -2.003173828125, -1.8162841796875, -1.62939453125, -1.4425048828125, -1.255615234375, -1.0687255859375, -0.8818359375, -0.6949462890625, -0.508056640625, -0.3211669921875, -0.13427734375, 0.0526123046875, 0.239501953125, 0.4263916015625, 0.61328125, 0.8001708984375, 0.987060546875, 1.1739501953125, 1.36083984375, 1.5477294921875, 1.734619140625, 1.9215087890625, 2.1083984375, 2.2952880859375, 2.482177734375, 2.6690673828125, 2.85595703125, 3.0428466796875, 3.229736328125, 3.4166259765625, 3.603515625, 3.7904052734375, 3.977294921875, 4.1641845703125, 4.35107421875, 4.5379638671875, 4.724853515625, 4.9117431640625, 5.0986328125, 5.2855224609375, 5.472412109375, 5.6593017578125, 5.84619140625, 6.0330810546875, 6.219970703125, 6.4068603515625, 6.59375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 6.0, 9.0, 12.0, 7.0, 12.0, 7.0, 30.0, 32.0, 22.0, 41.0, 34.0, 49.0, 41.0, 41.0, 32.0, 46.0, 52.0, 56.0, 53.0, 53.0, 43.0, 51.0, 45.0, 31.0, 26.0, 28.0, 23.0, 15.0, 11.0, 15.0, 13.0, 15.0, 10.0, 4.0, 9.0, 5.0, 2.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-1.7587890625, -1.708892822265625, -1.65899658203125, -1.609100341796875, -1.5592041015625, -1.509307861328125, -1.45941162109375, -1.409515380859375, -1.359619140625, -1.309722900390625, -1.25982666015625, -1.209930419921875, -1.1600341796875, -1.110137939453125, -1.06024169921875, -1.010345458984375, -0.96044921875, -0.910552978515625, -0.86065673828125, -0.810760498046875, -0.7608642578125, -0.710968017578125, -0.66107177734375, -0.611175537109375, -0.561279296875, -0.511383056640625, -0.46148681640625, -0.411590576171875, -0.3616943359375, -0.311798095703125, -0.26190185546875, -0.212005615234375, -0.162109375, -0.112213134765625, -0.06231689453125, -0.012420654296875, 0.0374755859375, 0.087371826171875, 0.13726806640625, 0.187164306640625, 0.237060546875, 0.286956787109375, 0.33685302734375, 0.386749267578125, 0.4366455078125, 0.486541748046875, 0.53643798828125, 0.586334228515625, 0.63623046875, 0.686126708984375, 0.73602294921875, 0.785919189453125, 0.8358154296875, 0.885711669921875, 0.93560791015625, 0.985504150390625, 1.035400390625, 1.085296630859375, 1.13519287109375, 1.185089111328125, 1.2349853515625, 1.284881591796875, 1.33477783203125, 1.384674072265625, 1.4345703125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 4.0, 8.0, 11.0, 22.0, 15.0, 42.0, 34.0, 63.0, 101.0, 156.0, 223.0, 366.0, 740.0, 1513.0, 3917.0, 12537.0, 83806.0, 864943.0, 62656.0, 10850.0, 3468.0, 1387.0, 690.0, 333.0, 209.0, 145.0, 81.0, 62.0, 36.0, 28.0, 22.0, 14.0, 15.0, 9.0, 12.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.671875, -2.5841064453125, -2.496337890625, -2.4085693359375, -2.32080078125, -2.2330322265625, -2.145263671875, -2.0574951171875, -1.9697265625, -1.8819580078125, -1.794189453125, -1.7064208984375, -1.61865234375, -1.5308837890625, -1.443115234375, -1.3553466796875, -1.267578125, -1.1798095703125, -1.092041015625, -1.0042724609375, -0.91650390625, -0.8287353515625, -0.740966796875, -0.6531982421875, -0.5654296875, -0.4776611328125, -0.389892578125, -0.3021240234375, -0.21435546875, -0.1265869140625, -0.038818359375, 0.0489501953125, 0.13671875, 0.2244873046875, 0.312255859375, 0.4000244140625, 0.48779296875, 0.5755615234375, 0.663330078125, 0.7510986328125, 0.8388671875, 0.9266357421875, 1.014404296875, 1.1021728515625, 1.18994140625, 1.2777099609375, 1.365478515625, 1.4532470703125, 1.541015625, 1.6287841796875, 1.716552734375, 1.8043212890625, 1.89208984375, 1.9798583984375, 2.067626953125, 2.1553955078125, 2.2431640625, 2.3309326171875, 2.418701171875, 2.5064697265625, 2.59423828125, 2.6820068359375, 2.769775390625, 2.8575439453125, 2.9453125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 2.0, 2.0, 8.0, 10.0, 12.0, 17.0, 64.0, 231.0, 456.0, 94.0, 38.0, 17.0, 9.0, 4.0, 6.0, 3.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013494491577148438, -0.00013033486902713776, -0.00012572482228279114, -0.00012111477553844452, -0.0001165047287940979, -0.00011189468204975128, -0.00010728463530540466, -0.00010267458856105804, -9.806454181671143e-05, -9.345449507236481e-05, -8.884444832801819e-05, -8.423440158367157e-05, -7.962435483932495e-05, -7.501430809497833e-05, -7.040426135063171e-05, -6.57942146062851e-05, -6.118416786193848e-05, -5.657412111759186e-05, -5.196407437324524e-05, -4.735402762889862e-05, -4.2743980884552e-05, -3.813393414020538e-05, -3.3523887395858765e-05, -2.8913840651512146e-05, -2.4303793907165527e-05, -1.969374716281891e-05, -1.508370041847229e-05, -1.0473653674125671e-05, -5.863606929779053e-06, -1.253560185432434e-06, 3.3564865589141846e-06, 7.966533303260803e-06, 1.2576580047607422e-05, 1.718662679195404e-05, 2.179667353630066e-05, 2.6406720280647278e-05, 3.1016767024993896e-05, 3.5626813769340515e-05, 4.0236860513687134e-05, 4.484690725803375e-05, 4.945695400238037e-05, 5.406700074672699e-05, 5.867704749107361e-05, 6.328709423542023e-05, 6.789714097976685e-05, 7.250718772411346e-05, 7.711723446846008e-05, 8.17272812128067e-05, 8.633732795715332e-05, 9.094737470149994e-05, 9.555742144584656e-05, 0.00010016746819019318, 0.0001047775149345398, 0.00010938756167888641, 0.00011399760842323303, 0.00011860765516757965, 0.00012321770191192627, 0.0001278277486562729, 0.0001324377954006195, 0.00013704784214496613, 0.00014165788888931274, 0.00014626793563365936, 0.00015087798237800598, 0.0001554880291223526, 0.00016009807586669922]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 9.0, 7.0, 7.0, 7.0, 14.0, 23.0, 20.0, 39.0, 37.0, 80.0, 130.0, 178.0, 307.0, 540.0, 1098.0, 2580.0, 8799.0, 54963.0, 891288.0, 72697.0, 10012.0, 2985.0, 1220.0, 589.0, 292.0, 199.0, 135.0, 92.0, 47.0, 48.0, 31.0, 19.0, 12.0, 13.0, 8.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8359375, -1.771636962890625, -1.70733642578125, -1.643035888671875, -1.5787353515625, -1.514434814453125, -1.45013427734375, -1.385833740234375, -1.321533203125, -1.257232666015625, -1.19293212890625, -1.128631591796875, -1.0643310546875, -1.000030517578125, -0.93572998046875, -0.871429443359375, -0.80712890625, -0.742828369140625, -0.67852783203125, -0.614227294921875, -0.5499267578125, -0.485626220703125, -0.42132568359375, -0.357025146484375, -0.292724609375, -0.228424072265625, -0.16412353515625, -0.099822998046875, -0.0355224609375, 0.028778076171875, 0.09307861328125, 0.157379150390625, 0.2216796875, 0.285980224609375, 0.35028076171875, 0.414581298828125, 0.4788818359375, 0.543182373046875, 0.60748291015625, 0.671783447265625, 0.736083984375, 0.800384521484375, 0.86468505859375, 0.928985595703125, 0.9932861328125, 1.057586669921875, 1.12188720703125, 1.186187744140625, 1.25048828125, 1.314788818359375, 1.37908935546875, 1.443389892578125, 1.5076904296875, 1.571990966796875, 1.63629150390625, 1.700592041015625, 1.764892578125, 1.829193115234375, 1.89349365234375, 1.957794189453125, 2.0220947265625, 2.086395263671875, 2.15069580078125, 2.214996337890625, 2.279296875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 12.0, 12.0, 24.0, 67.0, 166.0, 343.0, 212.0, 70.0, 47.0, 19.0, 9.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7060546875, -0.6749114990234375, -0.643768310546875, -0.6126251220703125, -0.58148193359375, -0.5503387451171875, -0.519195556640625, -0.4880523681640625, -0.4569091796875, -0.4257659912109375, -0.394622802734375, -0.3634796142578125, -0.33233642578125, -0.3011932373046875, -0.270050048828125, -0.2389068603515625, -0.207763671875, -0.1766204833984375, -0.145477294921875, -0.1143341064453125, -0.08319091796875, -0.0520477294921875, -0.020904541015625, 0.0102386474609375, 0.0413818359375, 0.0725250244140625, 0.103668212890625, 0.1348114013671875, 0.16595458984375, 0.1970977783203125, 0.228240966796875, 0.2593841552734375, 0.29052734375, 0.3216705322265625, 0.352813720703125, 0.3839569091796875, 0.41510009765625, 0.4462432861328125, 0.477386474609375, 0.5085296630859375, 0.5396728515625, 0.5708160400390625, 0.601959228515625, 0.6331024169921875, 0.66424560546875, 0.6953887939453125, 0.726531982421875, 0.7576751708984375, 0.788818359375, 0.8199615478515625, 0.851104736328125, 0.8822479248046875, 0.91339111328125, 0.9445343017578125, 0.975677490234375, 1.0068206787109375, 1.0379638671875, 1.0691070556640625, 1.100250244140625, 1.1313934326171875, 1.16253662109375, 1.1936798095703125, 1.224822998046875, 1.2559661865234375, 1.287109375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 15.0, 23.0, 24.0, 116.0, 426.0, 264.0, 63.0, 30.0, 11.0, 7.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.598084449768066, -5.284798622131348, -4.971512794494629, -4.658227443695068, -4.34494161605835, -4.031655788421631, -3.718370199203491, -3.4050846099853516, -3.091798782348633, -2.778512954711914, -2.4652273654937744, -2.1519417762756348, -1.838655948638916, -1.5253702402114868, -1.2120845317840576, -0.898798942565918, -0.5855131149291992, -0.27222740650177, 0.04105830192565918, 0.3543440103530884, 0.6676297187805176, 0.9809154272079468, 1.294201135635376, 1.6074867248535156, 1.9207725524902344, 2.234058380126953, 2.5473439693450928, 2.8606295585632324, 3.173915386199951, 3.48720121383667, 3.8004868030548096, 4.113772392272949, 4.427057266235352, 4.74034309387207, 5.053628921508789, 5.36691427230835, 5.680200099945068, 5.993485927581787, 6.306771278381348, 6.620057106018066, 6.933342933654785, 7.246628761291504, 7.559914588928223, 7.873199939727783, 8.186485290527344, 8.499771118164062, 8.813056945800781, 9.1263427734375, 9.439628601074219, 9.752914428710938, 10.066200256347656, 10.379486083984375, 10.692771911621094, 11.006056785583496, 11.319342613220215, 11.632628440856934, 11.945914268493652, 12.259200096130371, 12.57248592376709, 12.885771751403809, 13.199056625366211, 13.51234245300293, 13.825628280639648, 14.138914108276367, 14.452199935913086]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 6.0, 9.0, 10.0, 12.0, 9.0, 11.0, 16.0, 23.0, 28.0, 35.0, 39.0, 33.0, 30.0, 48.0, 41.0, 51.0, 54.0, 60.0, 62.0, 51.0, 45.0, 41.0, 50.0, 34.0, 30.0, 24.0, 28.0, 17.0, 14.0, 15.0, 15.0, 12.0, 8.0, 10.0, 10.0, 5.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.364989995956421, -2.291995048522949, -2.2190001010894775, -2.146005153656006, -2.073010206222534, -2.0000152587890625, -1.9270203113555908, -1.8540253639221191, -1.7810304164886475, -1.7080354690551758, -1.635040521621704, -1.5620455741882324, -1.4890506267547607, -1.416055679321289, -1.3430607318878174, -1.2700657844543457, -1.197070837020874, -1.1240758895874023, -1.0510809421539307, -0.978085994720459, -0.9050910472869873, -0.8320960998535156, -0.759101152420044, -0.6861062049865723, -0.6131112575531006, -0.5401163101196289, -0.4671213626861572, -0.39412641525268555, -0.32113146781921387, -0.2481365203857422, -0.1751415729522705, -0.10214662551879883, -0.02915191650390625, 0.04384303092956543, 0.11683797836303711, 0.1898329257965088, 0.26282787322998047, 0.33582282066345215, 0.40881776809692383, 0.4818127155303955, 0.5548076629638672, 0.6278026103973389, 0.7007975578308105, 0.7737925052642822, 0.8467874526977539, 0.9197824001312256, 0.9927773475646973, 1.065772294998169, 1.1387672424316406, 1.2117621898651123, 1.284757137298584, 1.3577520847320557, 1.4307470321655273, 1.503741979598999, 1.5767369270324707, 1.6497318744659424, 1.722726821899414, 1.7957217693328857, 1.8687167167663574, 1.941711664199829, 2.014706611633301, 2.0877015590667725, 2.160696506500244, 2.233691453933716, 2.3066864013671875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 2.0, 9.0, 12.0, 8.0, 23.0, 31.0, 44.0, 45.0, 71.0, 107.0, 144.0, 250.0, 397.0, 712.0, 1299.0, 2384.0, 4733.0, 9652.0, 21086.0, 48355.0, 122887.0, 347408.0, 302472.0, 106997.0, 42501.0, 18814.0, 8692.0, 4370.0, 2083.0, 1185.0, 641.0, 381.0, 269.0, 142.0, 105.0, 81.0, 51.0, 31.0, 23.0, 21.0, 8.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32421875, -4.18878173828125, -4.0533447265625, -3.91790771484375, -3.782470703125, -3.64703369140625, -3.5115966796875, -3.37615966796875, -3.24072265625, -3.10528564453125, -2.9698486328125, -2.83441162109375, -2.698974609375, -2.56353759765625, -2.4281005859375, -2.29266357421875, -2.1572265625, -2.02178955078125, -1.8863525390625, -1.75091552734375, -1.615478515625, -1.48004150390625, -1.3446044921875, -1.20916748046875, -1.07373046875, -0.93829345703125, -0.8028564453125, -0.66741943359375, -0.531982421875, -0.39654541015625, -0.2611083984375, -0.12567138671875, 0.009765625, 0.14520263671875, 0.2806396484375, 0.41607666015625, 0.551513671875, 0.68695068359375, 0.8223876953125, 0.95782470703125, 1.09326171875, 1.22869873046875, 1.3641357421875, 1.49957275390625, 1.635009765625, 1.77044677734375, 1.9058837890625, 2.04132080078125, 2.1767578125, 2.31219482421875, 2.4476318359375, 2.58306884765625, 2.718505859375, 2.85394287109375, 2.9893798828125, 3.12481689453125, 3.26025390625, 3.39569091796875, 3.5311279296875, 3.66656494140625, 3.802001953125, 3.93743896484375, 4.0728759765625, 4.20831298828125, 4.34375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 8.0, 6.0, 10.0, 18.0, 15.0, 9.0, 9.0, 24.0, 26.0, 26.0, 40.0, 31.0, 48.0, 43.0, 45.0, 55.0, 58.0, 61.0, 46.0, 54.0, 48.0, 33.0, 43.0, 40.0, 29.0, 29.0, 23.0, 15.0, 15.0, 14.0, 16.0, 8.0, 7.0, 11.0, 5.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.416015625, -1.3734130859375, -1.330810546875, -1.2882080078125, -1.24560546875, -1.2030029296875, -1.160400390625, -1.1177978515625, -1.0751953125, -1.0325927734375, -0.989990234375, -0.9473876953125, -0.90478515625, -0.8621826171875, -0.819580078125, -0.7769775390625, -0.734375, -0.6917724609375, -0.649169921875, -0.6065673828125, -0.56396484375, -0.5213623046875, -0.478759765625, -0.4361572265625, -0.3935546875, -0.3509521484375, -0.308349609375, -0.2657470703125, -0.22314453125, -0.1805419921875, -0.137939453125, -0.0953369140625, -0.052734375, -0.0101318359375, 0.032470703125, 0.0750732421875, 0.11767578125, 0.1602783203125, 0.202880859375, 0.2454833984375, 0.2880859375, 0.3306884765625, 0.373291015625, 0.4158935546875, 0.45849609375, 0.5010986328125, 0.543701171875, 0.5863037109375, 0.62890625, 0.6715087890625, 0.714111328125, 0.7567138671875, 0.79931640625, 0.8419189453125, 0.884521484375, 0.9271240234375, 0.9697265625, 1.0123291015625, 1.054931640625, 1.0975341796875, 1.14013671875, 1.1827392578125, 1.225341796875, 1.2679443359375, 1.310546875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 4.0, 11.0, 10.0, 20.0, 25.0, 39.0, 47.0, 74.0, 133.0, 210.0, 263.0, 461.0, 672.0, 1084.0, 1929.0, 3360.0, 6395.0, 13184.0, 29153.0, 78095.0, 319410.0, 430293.0, 97096.0, 34878.0, 15049.0, 7371.0, 3813.0, 2164.0, 1193.0, 765.0, 477.0, 286.0, 199.0, 125.0, 83.0, 72.0, 44.0, 21.0, 15.0, 10.0, 11.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.4296875, -4.303466796875, -4.17724609375, -4.051025390625, -3.9248046875, -3.798583984375, -3.67236328125, -3.546142578125, -3.419921875, -3.293701171875, -3.16748046875, -3.041259765625, -2.9150390625, -2.788818359375, -2.66259765625, -2.536376953125, -2.41015625, -2.283935546875, -2.15771484375, -2.031494140625, -1.9052734375, -1.779052734375, -1.65283203125, -1.526611328125, -1.400390625, -1.274169921875, -1.14794921875, -1.021728515625, -0.8955078125, -0.769287109375, -0.64306640625, -0.516845703125, -0.390625, -0.264404296875, -0.13818359375, -0.011962890625, 0.1142578125, 0.240478515625, 0.36669921875, 0.492919921875, 0.619140625, 0.745361328125, 0.87158203125, 0.997802734375, 1.1240234375, 1.250244140625, 1.37646484375, 1.502685546875, 1.62890625, 1.755126953125, 1.88134765625, 2.007568359375, 2.1337890625, 2.260009765625, 2.38623046875, 2.512451171875, 2.638671875, 2.764892578125, 2.89111328125, 3.017333984375, 3.1435546875, 3.269775390625, 3.39599609375, 3.522216796875, 3.6484375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 9.0, 6.0, 7.0, 8.0, 8.0, 15.0, 14.0, 14.0, 25.0, 24.0, 27.0, 28.0, 29.0, 33.0, 38.0, 40.0, 34.0, 42.0, 41.0, 39.0, 45.0, 52.0, 39.0, 49.0, 39.0, 32.0, 36.0, 30.0, 27.0, 24.0, 18.0, 24.0, 13.0, 10.0, 13.0, 14.0, 7.0, 9.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.009765625, -0.9783477783203125, -0.946929931640625, -0.9155120849609375, -0.88409423828125, -0.8526763916015625, -0.821258544921875, -0.7898406982421875, -0.7584228515625, -0.7270050048828125, -0.695587158203125, -0.6641693115234375, -0.63275146484375, -0.6013336181640625, -0.569915771484375, -0.5384979248046875, -0.507080078125, -0.4756622314453125, -0.444244384765625, -0.4128265380859375, -0.38140869140625, -0.3499908447265625, -0.318572998046875, -0.2871551513671875, -0.2557373046875, -0.2243194580078125, -0.192901611328125, -0.1614837646484375, -0.13006591796875, -0.0986480712890625, -0.067230224609375, -0.0358123779296875, -0.00439453125, 0.0270233154296875, 0.058441162109375, 0.0898590087890625, 0.12127685546875, 0.1526947021484375, 0.184112548828125, 0.2155303955078125, 0.2469482421875, 0.2783660888671875, 0.309783935546875, 0.3412017822265625, 0.37261962890625, 0.4040374755859375, 0.435455322265625, 0.4668731689453125, 0.498291015625, 0.5297088623046875, 0.561126708984375, 0.5925445556640625, 0.62396240234375, 0.6553802490234375, 0.686798095703125, 0.7182159423828125, 0.7496337890625, 0.7810516357421875, 0.812469482421875, 0.8438873291015625, 0.87530517578125, 0.9067230224609375, 0.938140869140625, 0.9695587158203125, 1.0009765625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 7.0, 17.0, 17.0, 26.0, 20.0, 18.0, 52.0, 85.0, 116.0, 180.0, 240.0, 433.0, 1040.0, 2792.0, 14009.0, 944225.0, 75271.0, 6628.0, 1632.0, 714.0, 399.0, 208.0, 125.0, 82.0, 75.0, 52.0, 30.0, 22.0, 8.0, 7.0, 5.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -15.0643310546875, -14.480224609375, -13.8961181640625, -13.31201171875, -12.7279052734375, -12.143798828125, -11.5596923828125, -10.9755859375, -10.3914794921875, -9.807373046875, -9.2232666015625, -8.63916015625, -8.0550537109375, -7.470947265625, -6.8868408203125, -6.302734375, -5.7186279296875, -5.134521484375, -4.5504150390625, -3.96630859375, -3.3822021484375, -2.798095703125, -2.2139892578125, -1.6298828125, -1.0457763671875, -0.461669921875, 0.1224365234375, 0.70654296875, 1.2906494140625, 1.874755859375, 2.4588623046875, 3.04296875, 3.6270751953125, 4.211181640625, 4.7952880859375, 5.37939453125, 5.9635009765625, 6.547607421875, 7.1317138671875, 7.7158203125, 8.2999267578125, 8.884033203125, 9.4681396484375, 10.05224609375, 10.6363525390625, 11.220458984375, 11.8045654296875, 12.388671875, 12.9727783203125, 13.556884765625, 14.1409912109375, 14.72509765625, 15.3092041015625, 15.893310546875, 16.4774169921875, 17.0615234375, 17.6456298828125, 18.229736328125, 18.8138427734375, 19.39794921875, 19.9820556640625, 20.566162109375, 21.1502685546875, 21.734375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 8.0, 10.0, 19.0, 27.0, 29.0, 53.0, 77.0, 122.0, 290.0, 124.0, 66.0, 62.0, 40.0, 20.0, 14.0, 10.0, 6.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017023086547851562, -0.00016425922513008118, -0.00015828758478164673, -0.00015231594443321228, -0.00014634430408477783, -0.00014037266373634338, -0.00013440102338790894, -0.0001284293830394745, -0.00012245774269104004, -0.00011648610234260559, -0.00011051446199417114, -0.0001045428216457367, -9.857118129730225e-05, -9.25995409488678e-05, -8.662790060043335e-05, -8.06562602519989e-05, -7.468461990356445e-05, -6.871297955513e-05, -6.274133920669556e-05, -5.676969885826111e-05, -5.079805850982666e-05, -4.482641816139221e-05, -3.8854777812957764e-05, -3.2883137464523315e-05, -2.6911497116088867e-05, -2.093985676765442e-05, -1.496821641921997e-05, -8.996576070785522e-06, -3.0249357223510742e-06, 2.946704626083374e-06, 8.918344974517822e-06, 1.488998532295227e-05, 2.086162567138672e-05, 2.6833266019821167e-05, 3.2804906368255615e-05, 3.8776546716690063e-05, 4.474818706512451e-05, 5.071982741355896e-05, 5.669146776199341e-05, 6.266310811042786e-05, 6.86347484588623e-05, 7.460638880729675e-05, 8.05780291557312e-05, 8.654966950416565e-05, 9.25213098526001e-05, 9.849295020103455e-05, 0.000104464590549469, 0.00011043623089790344, 0.00011640787124633789, 0.00012237951159477234, 0.0001283511519432068, 0.00013432279229164124, 0.00014029443264007568, 0.00014626607298851013, 0.00015223771333694458, 0.00015820935368537903, 0.00016418099403381348, 0.00017015263438224792, 0.00017612427473068237, 0.00018209591507911682, 0.00018806755542755127, 0.00019403919577598572, 0.00020001083612442017, 0.00020598247647285461, 0.00021195411682128906]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 5.0, 12.0, 9.0, 15.0, 17.0, 26.0, 31.0, 42.0, 61.0, 88.0, 120.0, 164.0, 236.0, 367.0, 724.0, 1529.0, 3875.0, 18154.0, 936072.0, 74263.0, 7820.0, 2331.0, 1016.0, 538.0, 316.0, 210.0, 136.0, 79.0, 74.0, 48.0, 31.0, 33.0, 20.0, 14.0, 17.0, 13.0, 6.0, 8.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -14.072509765625, -13.62939453125, -13.186279296875, -12.7431640625, -12.300048828125, -11.85693359375, -11.413818359375, -10.970703125, -10.527587890625, -10.08447265625, -9.641357421875, -9.1982421875, -8.755126953125, -8.31201171875, -7.868896484375, -7.42578125, -6.982666015625, -6.53955078125, -6.096435546875, -5.6533203125, -5.210205078125, -4.76708984375, -4.323974609375, -3.880859375, -3.437744140625, -2.99462890625, -2.551513671875, -2.1083984375, -1.665283203125, -1.22216796875, -0.779052734375, -0.3359375, 0.107177734375, 0.55029296875, 0.993408203125, 1.4365234375, 1.879638671875, 2.32275390625, 2.765869140625, 3.208984375, 3.652099609375, 4.09521484375, 4.538330078125, 4.9814453125, 5.424560546875, 5.86767578125, 6.310791015625, 6.75390625, 7.197021484375, 7.64013671875, 8.083251953125, 8.5263671875, 8.969482421875, 9.41259765625, 9.855712890625, 10.298828125, 10.741943359375, 11.18505859375, 11.628173828125, 12.0712890625, 12.514404296875, 12.95751953125, 13.400634765625, 13.84375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 13.0, 18.0, 40.0, 63.0, 120.0, 394.0, 155.0, 78.0, 41.0, 26.0, 16.0, 12.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9072265625, -1.8359222412109375, -1.764617919921875, -1.6933135986328125, -1.62200927734375, -1.5507049560546875, -1.479400634765625, -1.4080963134765625, -1.3367919921875, -1.2654876708984375, -1.194183349609375, -1.1228790283203125, -1.05157470703125, -0.9802703857421875, -0.908966064453125, -0.8376617431640625, -0.766357421875, -0.6950531005859375, -0.623748779296875, -0.5524444580078125, -0.48114013671875, -0.4098358154296875, -0.338531494140625, -0.2672271728515625, -0.1959228515625, -0.1246185302734375, -0.053314208984375, 0.0179901123046875, 0.08929443359375, 0.1605987548828125, 0.231903076171875, 0.3032073974609375, 0.37451171875, 0.4458160400390625, 0.517120361328125, 0.5884246826171875, 0.65972900390625, 0.7310333251953125, 0.802337646484375, 0.8736419677734375, 0.9449462890625, 1.0162506103515625, 1.087554931640625, 1.1588592529296875, 1.23016357421875, 1.3014678955078125, 1.372772216796875, 1.4440765380859375, 1.515380859375, 1.5866851806640625, 1.657989501953125, 1.7292938232421875, 1.80059814453125, 1.8719024658203125, 1.943206787109375, 2.0145111083984375, 2.0858154296875, 2.1571197509765625, 2.228424072265625, 2.2997283935546875, 2.37103271484375, 2.4423370361328125, 2.513641357421875, 2.5849456787109375, 2.65625]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 3.0, 3.0, 8.0, 10.0, 17.0, 25.0, 33.0, 67.0, 110.0, 254.0, 306.0, 85.0, 34.0, 15.0, 7.0, 10.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.084416389465332, -4.951287269592285, -4.818158149719238, -4.685028553009033, -4.551899433135986, -4.4187703132629395, -4.285640716552734, -4.1525115966796875, -4.019382476806641, -3.8862533569335938, -3.7531239986419678, -3.619994640350342, -3.486865520477295, -3.353736400604248, -3.220607042312622, -3.087477684020996, -2.954348564147949, -2.8212194442749023, -2.6880900859832764, -2.5549607276916504, -2.4218316078186035, -2.2887024879455566, -2.1555731296539307, -2.0224437713623047, -1.8893146514892578, -1.7561854124069214, -1.623056173324585, -1.4899269342422485, -1.356797695159912, -1.2236684560775757, -1.0905392169952393, -0.9574099779129028, -0.8242802619934082, -0.6911510229110718, -0.5580217838287354, -0.4248925447463989, -0.2917633056640625, -0.15863406658172607, -0.02550482749938965, 0.10762441158294678, 0.2407536506652832, 0.37388288974761963, 0.507012128829956, 0.6401413679122925, 0.7732706069946289, 0.9063998460769653, 1.0395290851593018, 1.1726583242416382, 1.3057875633239746, 1.438916802406311, 1.5720460414886475, 1.7051752805709839, 1.8383045196533203, 1.9714337587356567, 2.104562997817993, 2.237692356109619, 2.370821475982666, 2.503950595855713, 2.637079954147339, 2.770209312438965, 2.9033384323120117, 3.0364675521850586, 3.1695969104766846, 3.3027262687683105, 3.4358553886413574]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 4.0, 7.0, 3.0, 4.0, 13.0, 13.0, 15.0, 19.0, 20.0, 23.0, 36.0, 39.0, 43.0, 37.0, 38.0, 39.0, 52.0, 61.0, 53.0, 60.0, 39.0, 43.0, 46.0, 48.0, 33.0, 32.0, 21.0, 24.0, 25.0, 17.0, 13.0, 16.0, 14.0, 9.0, 9.0, 7.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6580816507339478, -1.609861969947815, -1.5616422891616821, -1.5134227275848389, -1.465203046798706, -1.4169833660125732, -1.3687636852264404, -1.3205440044403076, -1.2723243236541748, -1.224104642868042, -1.1758849620819092, -1.1276652812957764, -1.079445719718933, -1.0312260389328003, -0.9830063581466675, -0.9347866773605347, -0.8865671157836914, -0.8383474349975586, -0.7901278138160706, -0.7419081330299377, -0.6936885118484497, -0.6454688310623169, -0.5972491502761841, -0.5490294694900513, -0.5008098483085632, -0.4525901973247528, -0.4043705463409424, -0.35615086555480957, -0.30793121457099915, -0.2597115635871887, -0.2114918828010559, -0.16327223181724548, -0.11505258083343506, -0.06683292239904404, -0.018613263964653015, 0.029606401920318604, 0.07782605290412903, 0.12604570388793945, 0.17426538467407227, 0.2224850356578827, 0.2707046866416931, 0.31892433762550354, 0.36714398860931396, 0.4153636693954468, 0.4635833203792572, 0.5118029713630676, 0.5600226521492004, 0.6082422733306885, 0.6564619541168213, 0.7046816349029541, 0.7529012560844421, 0.801120936870575, 0.849340558052063, 0.8975602388381958, 0.9457799196243286, 0.9939996004104614, 1.0422191619873047, 1.0904388427734375, 1.1386585235595703, 1.1868782043457031, 1.2350977659225464, 1.2833174467086792, 1.331537127494812, 1.3797568082809448, 1.4279764890670776]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 5.0, 9.0, 13.0, 25.0, 30.0, 54.0, 63.0, 89.0, 122.0, 166.0, 211.0, 314.0, 439.0, 693.0, 1022.0, 1447.0, 2225.0, 3210.0, 4610.0, 7269.0, 11258.0, 18586.0, 32066.0, 57810.0, 117948.0, 320073.0, 1978831.0, 1198185.0, 226102.0, 93254.0, 47908.0, 27166.0, 16045.0, 9762.0, 6184.0, 3957.0, 2593.0, 1634.0, 977.0, 664.0, 413.0, 275.0, 204.0, 133.0, 89.0, 62.0, 37.0, 26.0, 12.0, 9.0, 8.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.580078125, -1.5347442626953125, -1.489410400390625, -1.4440765380859375, -1.39874267578125, -1.3534088134765625, -1.308074951171875, -1.2627410888671875, -1.2174072265625, -1.1720733642578125, -1.126739501953125, -1.0814056396484375, -1.03607177734375, -0.9907379150390625, -0.945404052734375, -0.9000701904296875, -0.854736328125, -0.8094024658203125, -0.764068603515625, -0.7187347412109375, -0.67340087890625, -0.6280670166015625, -0.582733154296875, -0.5373992919921875, -0.4920654296875, -0.4467315673828125, -0.401397705078125, -0.3560638427734375, -0.31072998046875, -0.2653961181640625, -0.220062255859375, -0.1747283935546875, -0.12939453125, -0.0840606689453125, -0.038726806640625, 0.0066070556640625, 0.05194091796875, 0.0972747802734375, 0.142608642578125, 0.1879425048828125, 0.2332763671875, 0.2786102294921875, 0.323944091796875, 0.3692779541015625, 0.41461181640625, 0.4599456787109375, 0.505279541015625, 0.5506134033203125, 0.595947265625, 0.6412811279296875, 0.686614990234375, 0.7319488525390625, 0.77728271484375, 0.8226165771484375, 0.867950439453125, 0.9132843017578125, 0.9586181640625, 1.0039520263671875, 1.049285888671875, 1.0946197509765625, 1.13995361328125, 1.1852874755859375, 1.230621337890625, 1.2759552001953125, 1.3212890625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 6.0, 9.0, 4.0, 5.0, 8.0, 9.0, 11.0, 14.0, 14.0, 19.0, 32.0, 38.0, 27.0, 29.0, 39.0, 42.0, 38.0, 45.0, 50.0, 44.0, 56.0, 49.0, 43.0, 45.0, 44.0, 41.0, 30.0, 36.0, 23.0, 15.0, 20.0, 18.0, 13.0, 16.0, 15.0, 17.0, 6.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.482666015625, -0.46929168701171875, -0.4559173583984375, -0.44254302978515625, -0.429168701171875, -0.41579437255859375, -0.4024200439453125, -0.38904571533203125, -0.37567138671875, -0.36229705810546875, -0.3489227294921875, -0.33554840087890625, -0.322174072265625, -0.30879974365234375, -0.2954254150390625, -0.28205108642578125, -0.2686767578125, -0.25530242919921875, -0.2419281005859375, -0.22855377197265625, -0.215179443359375, -0.20180511474609375, -0.1884307861328125, -0.17505645751953125, -0.16168212890625, -0.14830780029296875, -0.1349334716796875, -0.12155914306640625, -0.108184814453125, -0.09481048583984375, -0.0814361572265625, -0.06806182861328125, -0.0546875, -0.04131317138671875, -0.0279388427734375, -0.01456451416015625, -0.001190185546875, 0.01218414306640625, 0.0255584716796875, 0.03893280029296875, 0.05230712890625, 0.06568145751953125, 0.0790557861328125, 0.09243011474609375, 0.105804443359375, 0.11917877197265625, 0.1325531005859375, 0.14592742919921875, 0.1593017578125, 0.17267608642578125, 0.1860504150390625, 0.19942474365234375, 0.212799072265625, 0.22617340087890625, 0.2395477294921875, 0.25292205810546875, 0.26629638671875, 0.27967071533203125, 0.2930450439453125, 0.30641937255859375, 0.319793701171875, 0.33316802978515625, 0.3465423583984375, 0.35991668701171875, 0.373291015625]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 13.0, 12.0, 20.0, 27.0, 45.0, 50.0, 101.0, 142.0, 210.0, 301.0, 464.0, 764.0, 1239.0, 2088.0, 4015.0, 7823.0, 15954.0, 38019.0, 114528.0, 529882.0, 2720487.0, 564383.0, 120221.0, 39331.0, 16455.0, 7779.0, 4155.0, 2248.0, 1329.0, 795.0, 472.0, 327.0, 205.0, 129.0, 92.0, 54.0, 36.0, 25.0, 17.0, 15.0, 9.0, 3.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2861328125, -1.243988037109375, -1.20184326171875, -1.159698486328125, -1.1175537109375, -1.075408935546875, -1.03326416015625, -0.991119384765625, -0.948974609375, -0.906829833984375, -0.86468505859375, -0.822540283203125, -0.7803955078125, -0.738250732421875, -0.69610595703125, -0.653961181640625, -0.61181640625, -0.569671630859375, -0.52752685546875, -0.485382080078125, -0.4432373046875, -0.401092529296875, -0.35894775390625, -0.316802978515625, -0.274658203125, -0.232513427734375, -0.19036865234375, -0.148223876953125, -0.1060791015625, -0.063934326171875, -0.02178955078125, 0.020355224609375, 0.0625, 0.104644775390625, 0.14678955078125, 0.188934326171875, 0.2310791015625, 0.273223876953125, 0.31536865234375, 0.357513427734375, 0.399658203125, 0.441802978515625, 0.48394775390625, 0.526092529296875, 0.5682373046875, 0.610382080078125, 0.65252685546875, 0.694671630859375, 0.73681640625, 0.778961181640625, 0.82110595703125, 0.863250732421875, 0.9053955078125, 0.947540283203125, 0.98968505859375, 1.031829833984375, 1.073974609375, 1.116119384765625, 1.15826416015625, 1.200408935546875, 1.2425537109375, 1.284698486328125, 1.32684326171875, 1.368988037109375, 1.4111328125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 3.0, 4.0, 7.0, 8.0, 11.0, 18.0, 13.0, 19.0, 19.0, 33.0, 33.0, 34.0, 46.0, 47.0, 62.0, 72.0, 111.0, 143.0, 186.0, 237.0, 281.0, 339.0, 423.0, 393.0, 297.0, 285.0, 193.0, 158.0, 140.0, 102.0, 81.0, 68.0, 48.0, 37.0, 37.0, 18.0, 23.0, 10.0, 10.0, 9.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.275634765625, -0.26827239990234375, -0.2609100341796875, -0.25354766845703125, -0.246185302734375, -0.23882293701171875, -0.2314605712890625, -0.22409820556640625, -0.21673583984375, -0.20937347412109375, -0.2020111083984375, -0.19464874267578125, -0.187286376953125, -0.17992401123046875, -0.1725616455078125, -0.16519927978515625, -0.1578369140625, -0.15047454833984375, -0.1431121826171875, -0.13574981689453125, -0.128387451171875, -0.12102508544921875, -0.1136627197265625, -0.10630035400390625, -0.09893798828125, -0.09157562255859375, -0.0842132568359375, -0.07685089111328125, -0.069488525390625, -0.06212615966796875, -0.0547637939453125, -0.04740142822265625, -0.0400390625, -0.03267669677734375, -0.0253143310546875, -0.01795196533203125, -0.010589599609375, -0.00322723388671875, 0.0041351318359375, 0.01149749755859375, 0.01885986328125, 0.02622222900390625, 0.0335845947265625, 0.04094696044921875, 0.048309326171875, 0.05567169189453125, 0.0630340576171875, 0.07039642333984375, 0.0777587890625, 0.08512115478515625, 0.0924835205078125, 0.09984588623046875, 0.107208251953125, 0.11457061767578125, 0.1219329833984375, 0.12929534912109375, 0.13665771484375, 0.14402008056640625, 0.1513824462890625, 0.15874481201171875, 0.166107177734375, 0.17346954345703125, 0.1808319091796875, 0.18819427490234375, 0.195556640625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 20.0, 21.0, 24.0, 37.0, 73.0, 136.0, 228.0, 233.0, 101.0, 41.0, 17.0, 18.0, 10.0, 6.0, 7.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3627512454986572, -1.3213934898376465, -1.2800357341766357, -1.238677978515625, -1.1973202228546143, -1.1559624671936035, -1.1146047115325928, -1.073246955871582, -1.0318892002105713, -0.9905314445495605, -0.9491736888885498, -0.9078159332275391, -0.8664581775665283, -0.8251004219055176, -0.7837427258491516, -0.7423849701881409, -0.7010272741317749, -0.6596695184707642, -0.6183117628097534, -0.5769540071487427, -0.5355962514877319, -0.4942385256290436, -0.4528807997703552, -0.4115230441093445, -0.37016528844833374, -0.328807532787323, -0.28744977712631226, -0.2460920512676239, -0.20473429560661316, -0.16337653994560242, -0.12201879918575287, -0.08066105842590332, -0.03930318355560303, 0.002054564654827118, 0.04341231286525726, 0.08477006107568741, 0.12612780928611755, 0.1674855649471283, 0.20884330570697784, 0.2502010464668274, 0.29155880212783813, 0.3329165577888489, 0.3742743134498596, 0.415632039308548, 0.4569897949695587, 0.49834755063056946, 0.5397052764892578, 0.5810630321502686, 0.6224207878112793, 0.66377854347229, 0.7051362991333008, 0.7464940547943115, 0.7878518104553223, 0.829209566116333, 0.870567262172699, 0.9119250178337097, 0.9532827734947205, 0.9946405291557312, 1.0359982252120972, 1.077355980873108, 1.1187137365341187, 1.1600714921951294, 1.2014292478561401, 1.2427870035171509, 1.2841447591781616]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 3.0, 6.0, 5.0, 4.0, 8.0, 15.0, 11.0, 16.0, 11.0, 18.0, 17.0, 35.0, 27.0, 32.0, 37.0, 42.0, 45.0, 49.0, 43.0, 34.0, 48.0, 42.0, 48.0, 43.0, 52.0, 38.0, 29.0, 38.0, 26.0, 30.0, 17.0, 19.0, 21.0, 17.0, 15.0, 10.0, 12.0, 5.0, 10.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47232919931411743, -0.45789918303489685, -0.44346919655799866, -0.4290391802787781, -0.4146091639995575, -0.4001791477203369, -0.3857491612434387, -0.37131914496421814, -0.35688912868499756, -0.342459112405777, -0.3280291259288788, -0.3135991096496582, -0.2991690933704376, -0.28473907709121704, -0.27030909061431885, -0.25587907433509827, -0.24144907295703888, -0.2270190715789795, -0.2125890552997589, -0.19815905392169952, -0.18372903764247894, -0.16929903626441956, -0.15486901998519897, -0.1404390186071396, -0.1260090172290802, -0.11157900840044022, -0.09714899957180023, -0.08271899819374084, -0.06828898191452026, -0.053858980536460876, -0.03942897170782089, -0.024998962879180908, -0.010568946599960327, 0.0038610612973570824, 0.018291069194674492, 0.03272107616066933, 0.04715108498930931, 0.061581090092659, 0.07601109892129898, 0.09044110774993896, 0.10487111657857895, 0.11930112540721893, 0.13373112678527832, 0.1481611430644989, 0.1625911444425583, 0.17702114582061768, 0.19145116209983826, 0.20588117837905884, 0.22031117975711823, 0.2347411811351776, 0.2491711974143982, 0.2636012136936188, 0.27803120017051697, 0.29246121644973755, 0.30689123272895813, 0.3213212490081787, 0.3357512354850769, 0.3501812517642975, 0.3646112382411957, 0.37904125452041626, 0.39347127079963684, 0.4079012870788574, 0.4223312735557556, 0.4367612898349762, 0.4511913061141968]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 0.0, 5.0, 6.0, 4.0, 7.0, 13.0, 15.0, 22.0, 29.0, 57.0, 75.0, 106.0, 155.0, 243.0, 362.0, 556.0, 768.0, 1356.0, 1973.0, 3069.0, 5074.0, 8739.0, 17036.0, 42510.0, 155481.0, 538423.0, 182697.0, 47338.0, 18752.0, 9313.0, 5248.0, 3213.0, 2022.0, 1298.0, 834.0, 602.0, 397.0, 258.0, 159.0, 105.0, 86.0, 49.0, 35.0, 21.0, 17.0, 10.0, 10.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68310546875, -0.6599884033203125, -0.636871337890625, -0.6137542724609375, -0.59063720703125, -0.5675201416015625, -0.544403076171875, -0.5212860107421875, -0.4981689453125, -0.4750518798828125, -0.451934814453125, -0.4288177490234375, -0.40570068359375, -0.3825836181640625, -0.359466552734375, -0.3363494873046875, -0.313232421875, -0.2901153564453125, -0.266998291015625, -0.2438812255859375, -0.22076416015625, -0.1976470947265625, -0.174530029296875, -0.1514129638671875, -0.1282958984375, -0.1051788330078125, -0.082061767578125, -0.0589447021484375, -0.03582763671875, -0.0127105712890625, 0.010406494140625, 0.0335235595703125, 0.056640625, 0.0797576904296875, 0.102874755859375, 0.1259918212890625, 0.14910888671875, 0.1722259521484375, 0.195343017578125, 0.2184600830078125, 0.2415771484375, 0.2646942138671875, 0.287811279296875, 0.3109283447265625, 0.33404541015625, 0.3571624755859375, 0.380279541015625, 0.4033966064453125, 0.426513671875, 0.4496307373046875, 0.472747802734375, 0.4958648681640625, 0.51898193359375, 0.5420989990234375, 0.565216064453125, 0.5883331298828125, 0.6114501953125, 0.6345672607421875, 0.657684326171875, 0.6808013916015625, 0.70391845703125, 0.7270355224609375, 0.750152587890625, 0.7732696533203125, 0.79638671875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 8.0, 8.0, 12.0, 8.0, 13.0, 14.0, 17.0, 19.0, 23.0, 18.0, 39.0, 25.0, 38.0, 41.0, 35.0, 46.0, 42.0, 37.0, 49.0, 43.0, 30.0, 46.0, 36.0, 38.0, 45.0, 42.0, 29.0, 32.0, 20.0, 20.0, 17.0, 18.0, 13.0, 14.0, 9.0, 12.0, 10.0, 7.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.388916015625, -0.37705230712890625, -0.3651885986328125, -0.35332489013671875, -0.341461181640625, -0.32959747314453125, -0.3177337646484375, -0.30587005615234375, -0.29400634765625, -0.28214263916015625, -0.2702789306640625, -0.25841522216796875, -0.246551513671875, -0.23468780517578125, -0.2228240966796875, -0.21096038818359375, -0.1990966796875, -0.18723297119140625, -0.1753692626953125, -0.16350555419921875, -0.151641845703125, -0.13977813720703125, -0.1279144287109375, -0.11605072021484375, -0.10418701171875, -0.09232330322265625, -0.0804595947265625, -0.06859588623046875, -0.056732177734375, -0.04486846923828125, -0.0330047607421875, -0.02114105224609375, -0.00927734375, 0.00258636474609375, 0.0144500732421875, 0.02631378173828125, 0.038177490234375, 0.05004119873046875, 0.0619049072265625, 0.07376861572265625, 0.08563232421875, 0.09749603271484375, 0.1093597412109375, 0.12122344970703125, 0.133087158203125, 0.14495086669921875, 0.1568145751953125, 0.16867828369140625, 0.1805419921875, 0.19240570068359375, 0.2042694091796875, 0.21613311767578125, 0.227996826171875, 0.23986053466796875, 0.2517242431640625, 0.26358795166015625, 0.27545166015625, 0.28731536865234375, 0.2991790771484375, 0.31104278564453125, 0.322906494140625, 0.33477020263671875, 0.3466339111328125, 0.35849761962890625, 0.370361328125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 9.0, 8.0, 12.0, 24.0, 34.0, 38.0, 62.0, 157.0, 244.0, 473.0, 1092.0, 2652.0, 8359.0, 48749.0, 894044.0, 76728.0, 10278.0, 3115.0, 1281.0, 538.0, 267.0, 138.0, 87.0, 58.0, 32.0, 17.0, 15.0, 8.0, 7.0, 6.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9921875, -1.919952392578125, -1.84771728515625, -1.775482177734375, -1.7032470703125, -1.631011962890625, -1.55877685546875, -1.486541748046875, -1.414306640625, -1.342071533203125, -1.26983642578125, -1.197601318359375, -1.1253662109375, -1.053131103515625, -0.98089599609375, -0.908660888671875, -0.83642578125, -0.764190673828125, -0.69195556640625, -0.619720458984375, -0.5474853515625, -0.475250244140625, -0.40301513671875, -0.330780029296875, -0.258544921875, -0.186309814453125, -0.11407470703125, -0.041839599609375, 0.0303955078125, 0.102630615234375, 0.17486572265625, 0.247100830078125, 0.3193359375, 0.391571044921875, 0.46380615234375, 0.536041259765625, 0.6082763671875, 0.680511474609375, 0.75274658203125, 0.824981689453125, 0.897216796875, 0.969451904296875, 1.04168701171875, 1.113922119140625, 1.1861572265625, 1.258392333984375, 1.33062744140625, 1.402862548828125, 1.47509765625, 1.547332763671875, 1.61956787109375, 1.691802978515625, 1.7640380859375, 1.836273193359375, 1.90850830078125, 1.980743408203125, 2.052978515625, 2.125213623046875, 2.19744873046875, 2.269683837890625, 2.3419189453125, 2.414154052734375, 2.48638916015625, 2.558624267578125, 2.630859375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 6.0, 9.0, 11.0, 11.0, 19.0, 27.0, 26.0, 29.0, 31.0, 37.0, 37.0, 48.0, 42.0, 50.0, 52.0, 49.0, 41.0, 30.0, 48.0, 41.0, 44.0, 41.0, 31.0, 43.0, 33.0, 37.0, 24.0, 17.0, 17.0, 16.0, 12.0, 7.0, 8.0, 6.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.304443359375, -0.29537200927734375, -0.2863006591796875, -0.27722930908203125, -0.268157958984375, -0.25908660888671875, -0.2500152587890625, -0.24094390869140625, -0.23187255859375, -0.22280120849609375, -0.2137298583984375, -0.20465850830078125, -0.195587158203125, -0.18651580810546875, -0.1774444580078125, -0.16837310791015625, -0.1593017578125, -0.15023040771484375, -0.1411590576171875, -0.13208770751953125, -0.123016357421875, -0.11394500732421875, -0.1048736572265625, -0.09580230712890625, -0.08673095703125, -0.07765960693359375, -0.0685882568359375, -0.05951690673828125, -0.050445556640625, -0.04137420654296875, -0.0323028564453125, -0.02323150634765625, -0.01416015625, -0.00508880615234375, 0.0039825439453125, 0.01305389404296875, 0.022125244140625, 0.03119659423828125, 0.0402679443359375, 0.04933929443359375, 0.05841064453125, 0.06748199462890625, 0.0765533447265625, 0.08562469482421875, 0.094696044921875, 0.10376739501953125, 0.1128387451171875, 0.12191009521484375, 0.1309814453125, 0.14005279541015625, 0.1491241455078125, 0.15819549560546875, 0.167266845703125, 0.17633819580078125, 0.1854095458984375, 0.19448089599609375, 0.20355224609375, 0.21262359619140625, 0.2216949462890625, 0.23076629638671875, 0.239837646484375, 0.24890899658203125, 0.2579803466796875, 0.26705169677734375, 0.276123046875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 3.0, 5.0, 10.0, 20.0, 22.0, 41.0, 37.0, 51.0, 66.0, 91.0, 126.0, 221.0, 338.0, 512.0, 799.0, 1313.0, 2403.0, 4999.0, 11120.0, 31322.0, 137046.0, 671395.0, 133589.0, 30926.0, 11099.0, 4884.0, 2453.0, 1307.0, 803.0, 482.0, 318.0, 229.0, 160.0, 101.0, 69.0, 43.0, 35.0, 21.0, 27.0, 21.0, 7.0, 10.0, 5.0, 2.0, 4.0, 5.0, 3.0, 4.0], "bins": [-0.28076171875, -0.2732734680175781, -0.26578521728515625, -0.2582969665527344, -0.2508087158203125, -0.24332046508789062, -0.23583221435546875, -0.22834396362304688, -0.220855712890625, -0.21336746215820312, -0.20587921142578125, -0.19839096069335938, -0.1909027099609375, -0.18341445922851562, -0.17592620849609375, -0.16843795776367188, -0.16094970703125, -0.15346145629882812, -0.14597320556640625, -0.13848495483398438, -0.1309967041015625, -0.12350845336914062, -0.11602020263671875, -0.10853195190429688, -0.101043701171875, -0.09355545043945312, -0.08606719970703125, -0.07857894897460938, -0.0710906982421875, -0.06360244750976562, -0.05611419677734375, -0.048625946044921875, -0.0411376953125, -0.033649444580078125, -0.02616119384765625, -0.018672943115234375, -0.0111846923828125, -0.003696441650390625, 0.00379180908203125, 0.011280059814453125, 0.018768310546875, 0.026256561279296875, 0.03374481201171875, 0.041233062744140625, 0.0487213134765625, 0.056209564208984375, 0.06369781494140625, 0.07118606567382812, 0.07867431640625, 0.08616256713867188, 0.09365081787109375, 0.10113906860351562, 0.1086273193359375, 0.11611557006835938, 0.12360382080078125, 0.13109207153320312, 0.138580322265625, 0.14606857299804688, 0.15355682373046875, 0.16104507446289062, 0.1685333251953125, 0.17602157592773438, 0.18350982666015625, 0.19099807739257812, 0.198486328125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 8.0, 14.0, 21.0, 30.0, 44.0, 75.0, 104.0, 196.0, 195.0, 114.0, 48.0, 42.0, 15.0, 17.0, 13.0, 7.0, 9.0, 11.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2292137145996094e-05, -2.1548941731452942e-05, -2.080574631690979e-05, -2.0062550902366638e-05, -1.9319355487823486e-05, -1.8576160073280334e-05, -1.7832964658737183e-05, -1.708976924419403e-05, -1.634657382965088e-05, -1.5603378415107727e-05, -1.4860183000564575e-05, -1.4116987586021423e-05, -1.3373792171478271e-05, -1.263059675693512e-05, -1.1887401342391968e-05, -1.1144205927848816e-05, -1.0401010513305664e-05, -9.657815098762512e-06, -8.91461968421936e-06, -8.171424269676208e-06, -7.428228855133057e-06, -6.685033440589905e-06, -5.941838026046753e-06, -5.198642611503601e-06, -4.455447196960449e-06, -3.7122517824172974e-06, -2.9690563678741455e-06, -2.2258609533309937e-06, -1.4826655387878418e-06, -7.394701242446899e-07, 3.725290298461914e-09, 7.469207048416138e-07, 1.4901161193847656e-06, 2.2333115339279175e-06, 2.9765069484710693e-06, 3.719702363014221e-06, 4.462897777557373e-06, 5.206093192100525e-06, 5.949288606643677e-06, 6.692484021186829e-06, 7.4356794357299805e-06, 8.178874850273132e-06, 8.922070264816284e-06, 9.665265679359436e-06, 1.0408461093902588e-05, 1.115165650844574e-05, 1.1894851922988892e-05, 1.2638047337532043e-05, 1.3381242752075195e-05, 1.4124438166618347e-05, 1.4867633581161499e-05, 1.561082899570465e-05, 1.6354024410247803e-05, 1.7097219824790955e-05, 1.7840415239334106e-05, 1.8583610653877258e-05, 1.932680606842041e-05, 2.0070001482963562e-05, 2.0813196897506714e-05, 2.1556392312049866e-05, 2.2299587726593018e-05, 2.304278314113617e-05, 2.378597855567932e-05, 2.4529173970222473e-05, 2.5272369384765625e-05]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 10.0, 10.0, 7.0, 19.0, 30.0, 47.0, 49.0, 74.0, 116.0, 173.0, 300.0, 439.0, 732.0, 1343.0, 2502.0, 5189.0, 12308.0, 36116.0, 158768.0, 652617.0, 125659.0, 31061.0, 10872.0, 4724.0, 2222.0, 1223.0, 712.0, 422.0, 260.0, 176.0, 112.0, 69.0, 52.0, 38.0, 32.0, 20.0, 8.0, 11.0, 6.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1846923828125, -0.17932891845703125, -0.1739654541015625, -0.16860198974609375, -0.163238525390625, -0.15787506103515625, -0.1525115966796875, -0.14714813232421875, -0.14178466796875, -0.13642120361328125, -0.1310577392578125, -0.12569427490234375, -0.120330810546875, -0.11496734619140625, -0.1096038818359375, -0.10424041748046875, -0.098876953125, -0.09351348876953125, -0.0881500244140625, -0.08278656005859375, -0.077423095703125, -0.07205963134765625, -0.0666961669921875, -0.06133270263671875, -0.05596923828125, -0.05060577392578125, -0.0452423095703125, -0.03987884521484375, -0.034515380859375, -0.02915191650390625, -0.0237884521484375, -0.01842498779296875, -0.0130615234375, -0.00769805908203125, -0.0023345947265625, 0.00302886962890625, 0.008392333984375, 0.01375579833984375, 0.0191192626953125, 0.02448272705078125, 0.02984619140625, 0.03520965576171875, 0.0405731201171875, 0.04593658447265625, 0.051300048828125, 0.05666351318359375, 0.0620269775390625, 0.06739044189453125, 0.07275390625, 0.07811737060546875, 0.0834808349609375, 0.08884429931640625, 0.094207763671875, 0.09957122802734375, 0.1049346923828125, 0.11029815673828125, 0.11566162109375, 0.12102508544921875, 0.1263885498046875, 0.13175201416015625, 0.137115478515625, 0.14247894287109375, 0.1478424072265625, 0.15320587158203125, 0.1585693359375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 6.0, 11.0, 6.0, 15.0, 26.0, 25.0, 24.0, 30.0, 62.0, 47.0, 73.0, 84.0, 94.0, 86.0, 105.0, 61.0, 62.0, 34.0, 34.0, 27.0, 31.0, 15.0, 12.0, 12.0, 5.0, 6.0, 3.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05218505859375, -0.0507659912109375, -0.049346923828125, -0.0479278564453125, -0.0465087890625, -0.0450897216796875, -0.043670654296875, -0.0422515869140625, -0.04083251953125, -0.0394134521484375, -0.037994384765625, -0.0365753173828125, -0.03515625, -0.0337371826171875, -0.032318115234375, -0.0308990478515625, -0.02947998046875, -0.0280609130859375, -0.026641845703125, -0.0252227783203125, -0.0238037109375, -0.0223846435546875, -0.020965576171875, -0.0195465087890625, -0.01812744140625, -0.0167083740234375, -0.015289306640625, -0.0138702392578125, -0.012451171875, -0.0110321044921875, -0.009613037109375, -0.0081939697265625, -0.00677490234375, -0.0053558349609375, -0.003936767578125, -0.0025177001953125, -0.0010986328125, 0.0003204345703125, 0.001739501953125, 0.0031585693359375, 0.00457763671875, 0.0059967041015625, 0.007415771484375, 0.0088348388671875, 0.01025390625, 0.0116729736328125, 0.013092041015625, 0.0145111083984375, 0.01593017578125, 0.0173492431640625, 0.018768310546875, 0.0201873779296875, 0.0216064453125, 0.0230255126953125, 0.024444580078125, 0.0258636474609375, 0.02728271484375, 0.0287017822265625, 0.030120849609375, 0.0315399169921875, 0.032958984375, 0.0343780517578125, 0.035797119140625, 0.0372161865234375, 0.03863525390625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 6.0, 13.0, 24.0, 19.0, 31.0, 60.0, 113.0, 210.0, 221.0, 124.0, 67.0, 33.0, 17.0, 9.0, 12.0, 5.0, 7.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.934408962726593, -0.9022752046585083, -0.8701415061950684, -0.8380078077316284, -0.8058740496635437, -0.773740291595459, -0.741606593132019, -0.7094728946685791, -0.6773391366004944, -0.6452053785324097, -0.6130716800689697, -0.5809379816055298, -0.5488042235374451, -0.5166704654693604, -0.4845367670059204, -0.4524030387401581, -0.42026931047439575, -0.3881355822086334, -0.3560018539428711, -0.32386812567710876, -0.29173439741134644, -0.2596006691455841, -0.22746694087982178, -0.19533321261405945, -0.16319948434829712, -0.1310657560825348, -0.09893202781677246, -0.06679829955101013, -0.0346645712852478, -0.0025308430194854736, 0.029602885246276855, 0.061736613512039185, 0.09387028217315674, 0.12600401043891907, 0.1581377387046814, 0.19027146697044373, 0.22240519523620605, 0.2545389235019684, 0.2866726517677307, 0.31880638003349304, 0.35094010829925537, 0.3830738365650177, 0.41520756483078003, 0.44734129309654236, 0.4794750213623047, 0.5116087198257446, 0.5437424778938293, 0.5758762359619141, 0.608009934425354, 0.640143632888794, 0.6722773909568787, 0.7044111490249634, 0.7365448474884033, 0.7686785459518433, 0.800812304019928, 0.8329460620880127, 0.8650797605514526, 0.8972134590148926, 0.9293472170829773, 0.961480975151062, 0.993614673614502, 1.025748372077942, 1.0578820705413818, 1.0900158882141113, 1.1221495866775513]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 4.0, 3.0, 10.0, 14.0, 8.0, 15.0, 13.0, 16.0, 18.0, 27.0, 35.0, 32.0, 38.0, 33.0, 43.0, 55.0, 40.0, 49.0, 48.0, 38.0, 41.0, 47.0, 59.0, 29.0, 41.0, 35.0, 29.0, 25.0, 19.0, 17.0, 26.0, 16.0, 12.0, 14.0, 6.0, 6.0, 11.0, 11.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4165615141391754, -0.4038724899291992, -0.3911834955215454, -0.3784944713115692, -0.365805447101593, -0.3531164228916168, -0.3404273986816406, -0.3277384042739868, -0.3150493800640106, -0.3023603558540344, -0.2896713614463806, -0.2769823372364044, -0.2642933130264282, -0.251604288816452, -0.23891527950763702, -0.22622627019882202, -0.21353724598884583, -0.20084822177886963, -0.18815921247005463, -0.17547020316123962, -0.16278117895126343, -0.15009215474128723, -0.13740314543247223, -0.12471412867307663, -0.11202511191368103, -0.09933609515428543, -0.08664707839488983, -0.07395806163549423, -0.06126904487609863, -0.04858002811670303, -0.035891011357307434, -0.023201994597911835, -0.010512977838516235, 0.002176038920879364, 0.014865055680274963, 0.027554072439670563, 0.04024308919906616, 0.05293210595846176, 0.06562112271785736, 0.07831013947725296, 0.09099915623664856, 0.10368817299604416, 0.11637718975543976, 0.12906619906425476, 0.14175522327423096, 0.15444424748420715, 0.16713325679302216, 0.17982226610183716, 0.19251129031181335, 0.20520031452178955, 0.21788932383060455, 0.23057833313941956, 0.24326735734939575, 0.25595638155937195, 0.26864540576934814, 0.28133440017700195, 0.29402342438697815, 0.30671244859695435, 0.31940144300460815, 0.33209046721458435, 0.34477949142456055, 0.35746851563453674, 0.37015753984451294, 0.38284653425216675, 0.39553555846214294]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 9.0, 15.0, 28.0, 30.0, 50.0, 79.0, 109.0, 202.0, 314.0, 486.0, 896.0, 1694.0, 3402.0, 7193.0, 15394.0, 33385.0, 78188.0, 196161.0, 376150.0, 194369.0, 77436.0, 33265.0, 15181.0, 7108.0, 3471.0, 1670.0, 928.0, 500.0, 289.0, 194.0, 117.0, 81.0, 42.0, 40.0, 26.0, 20.0, 5.0, 8.0, 6.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9462890625, -0.9180374145507812, -0.8897857666015625, -0.8615341186523438, -0.833282470703125, -0.8050308227539062, -0.7767791748046875, -0.7485275268554688, -0.72027587890625, -0.6920242309570312, -0.6637725830078125, -0.6355209350585938, -0.607269287109375, -0.5790176391601562, -0.5507659912109375, -0.5225143432617188, -0.4942626953125, -0.46601104736328125, -0.4377593994140625, -0.40950775146484375, -0.381256103515625, -0.35300445556640625, -0.3247528076171875, -0.29650115966796875, -0.26824951171875, -0.23999786376953125, -0.2117462158203125, -0.18349456787109375, -0.155242919921875, -0.12699127197265625, -0.0987396240234375, -0.07048797607421875, -0.042236328125, -0.01398468017578125, 0.0142669677734375, 0.04251861572265625, 0.070770263671875, 0.09902191162109375, 0.1272735595703125, 0.15552520751953125, 0.18377685546875, 0.21202850341796875, 0.2402801513671875, 0.26853179931640625, 0.296783447265625, 0.32503509521484375, 0.3532867431640625, 0.38153839111328125, 0.4097900390625, 0.43804168701171875, 0.4662933349609375, 0.49454498291015625, 0.522796630859375, 0.5510482788085938, 0.5792999267578125, 0.6075515747070312, 0.63580322265625, 0.6640548706054688, 0.6923065185546875, 0.7205581665039062, 0.748809814453125, 0.7770614624023438, 0.8053131103515625, 0.8335647583007812, 0.86181640625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 6.0, 9.0, 6.0, 8.0, 12.0, 17.0, 5.0, 13.0, 15.0, 18.0, 30.0, 26.0, 38.0, 32.0, 31.0, 42.0, 41.0, 40.0, 34.0, 45.0, 40.0, 42.0, 34.0, 37.0, 40.0, 41.0, 35.0, 25.0, 27.0, 28.0, 22.0, 16.0, 13.0, 24.0, 14.0, 20.0, 8.0, 10.0, 5.0, 6.0, 6.0, 9.0, 7.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.2802734375, -0.2721080780029297, -0.2639427185058594, -0.25577735900878906, -0.24761199951171875, -0.23944664001464844, -0.23128128051757812, -0.2231159210205078, -0.2149505615234375, -0.2067852020263672, -0.19861984252929688, -0.19045448303222656, -0.18228912353515625, -0.17412376403808594, -0.16595840454101562, -0.1577930450439453, -0.149627685546875, -0.1414623260498047, -0.13329696655273438, -0.12513160705566406, -0.11696624755859375, -0.10880088806152344, -0.10063552856445312, -0.09247016906738281, -0.0843048095703125, -0.07613945007324219, -0.06797409057617188, -0.05980873107910156, -0.05164337158203125, -0.04347801208496094, -0.035312652587890625, -0.027147293090820312, -0.01898193359375, -0.010816574096679688, -0.002651214599609375, 0.0055141448974609375, 0.01367950439453125, 0.021844863891601562, 0.030010223388671875, 0.03817558288574219, 0.0463409423828125, 0.05450630187988281, 0.06267166137695312, 0.07083702087402344, 0.07900238037109375, 0.08716773986816406, 0.09533309936523438, 0.10349845886230469, 0.111663818359375, 0.11982917785644531, 0.12799453735351562, 0.13615989685058594, 0.14432525634765625, 0.15249061584472656, 0.16065597534179688, 0.1688213348388672, 0.1769866943359375, 0.1851520538330078, 0.19331741333007812, 0.20148277282714844, 0.20964813232421875, 0.21781349182128906, 0.22597885131835938, 0.2341442108154297, 0.2423095703125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 8.0, 4.0, 14.0, 11.0, 23.0, 27.0, 44.0, 67.0, 87.0, 141.0, 199.0, 368.0, 641.0, 1194.0, 2292.0, 4688.0, 10266.0, 24455.0, 68467.0, 254179.0, 482491.0, 128419.0, 40806.0, 15541.0, 7062.0, 3264.0, 1635.0, 889.0, 475.0, 284.0, 177.0, 95.0, 70.0, 53.0, 38.0, 22.0, 24.0, 10.0, 10.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.0087890625, -0.9775161743164062, -0.9462432861328125, -0.9149703979492188, -0.883697509765625, -0.8524246215820312, -0.8211517333984375, -0.7898788452148438, -0.75860595703125, -0.7273330688476562, -0.6960601806640625, -0.6647872924804688, -0.633514404296875, -0.6022415161132812, -0.5709686279296875, -0.5396957397460938, -0.5084228515625, -0.47714996337890625, -0.4458770751953125, -0.41460418701171875, -0.383331298828125, -0.35205841064453125, -0.3207855224609375, -0.28951263427734375, -0.25823974609375, -0.22696685791015625, -0.1956939697265625, -0.16442108154296875, -0.133148193359375, -0.10187530517578125, -0.0706024169921875, -0.03932952880859375, -0.008056640625, 0.02321624755859375, 0.0544891357421875, 0.08576202392578125, 0.117034912109375, 0.14830780029296875, 0.1795806884765625, 0.21085357666015625, 0.24212646484375, 0.27339935302734375, 0.3046722412109375, 0.33594512939453125, 0.367218017578125, 0.39849090576171875, 0.4297637939453125, 0.46103668212890625, 0.4923095703125, 0.5235824584960938, 0.5548553466796875, 0.5861282348632812, 0.617401123046875, 0.6486740112304688, 0.6799468994140625, 0.7112197875976562, 0.74249267578125, 0.7737655639648438, 0.8050384521484375, 0.8363113403320312, 0.867584228515625, 0.8988571166992188, 0.9301300048828125, 0.9614028930664062, 0.99267578125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 7.0, 6.0, 7.0, 9.0, 13.0, 17.0, 21.0, 14.0, 18.0, 24.0, 25.0, 21.0, 20.0, 36.0, 34.0, 34.0, 34.0, 39.0, 31.0, 35.0, 35.0, 37.0, 40.0, 44.0, 41.0, 42.0, 29.0, 26.0, 28.0, 28.0, 25.0, 33.0, 21.0, 18.0, 17.0, 9.0, 9.0, 12.0, 10.0, 7.0, 8.0, 5.0, 5.0, 1.0, 5.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1759033203125, -0.17000389099121094, -0.16410446166992188, -0.1582050323486328, -0.15230560302734375, -0.1464061737060547, -0.14050674438476562, -0.13460731506347656, -0.1287078857421875, -0.12280845642089844, -0.11690902709960938, -0.11100959777832031, -0.10511016845703125, -0.09921073913574219, -0.09331130981445312, -0.08741188049316406, -0.081512451171875, -0.07561302185058594, -0.06971359252929688, -0.06381416320800781, -0.05791473388671875, -0.05201530456542969, -0.046115875244140625, -0.04021644592285156, -0.0343170166015625, -0.028417587280273438, -0.022518157958984375, -0.016618728637695312, -0.01071929931640625, -0.0048198699951171875, 0.001079559326171875, 0.0069789886474609375, 0.01287841796875, 0.018777847290039062, 0.024677276611328125, 0.030576705932617188, 0.03647613525390625, 0.04237556457519531, 0.048274993896484375, 0.05417442321777344, 0.0600738525390625, 0.06597328186035156, 0.07187271118164062, 0.07777214050292969, 0.08367156982421875, 0.08957099914550781, 0.09547042846679688, 0.10136985778808594, 0.107269287109375, 0.11316871643066406, 0.11906814575195312, 0.12496757507324219, 0.13086700439453125, 0.1367664337158203, 0.14266586303710938, 0.14856529235839844, 0.1544647216796875, 0.16036415100097656, 0.16626358032226562, 0.1721630096435547, 0.17806243896484375, 0.1839618682861328, 0.18986129760742188, 0.19576072692871094, 0.20166015625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 13.0, 10.0, 18.0, 26.0, 42.0, 46.0, 66.0, 102.0, 150.0, 246.0, 390.0, 718.0, 1421.0, 3278.0, 10085.0, 57480.0, 914423.0, 45147.0, 8858.0, 2964.0, 1315.0, 677.0, 387.0, 230.0, 152.0, 108.0, 57.0, 47.0, 28.0, 18.0, 16.0, 16.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.3984375, -2.330780029296875, -2.26312255859375, -2.195465087890625, -2.1278076171875, -2.060150146484375, -1.99249267578125, -1.924835205078125, -1.857177734375, -1.789520263671875, -1.72186279296875, -1.654205322265625, -1.5865478515625, -1.518890380859375, -1.45123291015625, -1.383575439453125, -1.31591796875, -1.248260498046875, -1.18060302734375, -1.112945556640625, -1.0452880859375, -0.977630615234375, -0.90997314453125, -0.842315673828125, -0.774658203125, -0.707000732421875, -0.63934326171875, -0.571685791015625, -0.5040283203125, -0.436370849609375, -0.36871337890625, -0.301055908203125, -0.2333984375, -0.165740966796875, -0.09808349609375, -0.030426025390625, 0.0372314453125, 0.104888916015625, 0.17254638671875, 0.240203857421875, 0.307861328125, 0.375518798828125, 0.44317626953125, 0.510833740234375, 0.5784912109375, 0.646148681640625, 0.71380615234375, 0.781463623046875, 0.84912109375, 0.916778564453125, 0.98443603515625, 1.052093505859375, 1.1197509765625, 1.187408447265625, 1.25506591796875, 1.322723388671875, 1.390380859375, 1.458038330078125, 1.52569580078125, 1.593353271484375, 1.6610107421875, 1.728668212890625, 1.79632568359375, 1.863983154296875, 1.931640625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 8.0, 9.0, 7.0, 25.0, 54.0, 112.0, 278.0, 310.0, 105.0, 49.0, 21.0, 7.0, 11.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.301568984985352e-05, -7.123500108718872e-05, -6.945431232452393e-05, -6.767362356185913e-05, -6.589293479919434e-05, -6.411224603652954e-05, -6.233155727386475e-05, -6.055086851119995e-05, -5.8770179748535156e-05, -5.698949098587036e-05, -5.5208802223205566e-05, -5.342811346054077e-05, -5.1647424697875977e-05, -4.986673593521118e-05, -4.808604717254639e-05, -4.630535840988159e-05, -4.45246696472168e-05, -4.2743980884552e-05, -4.096329212188721e-05, -3.918260335922241e-05, -3.740191459655762e-05, -3.562122583389282e-05, -3.384053707122803e-05, -3.205984830856323e-05, -3.0279159545898438e-05, -2.8498470783233643e-05, -2.6717782020568848e-05, -2.4937093257904053e-05, -2.3156404495239258e-05, -2.1375715732574463e-05, -1.9595026969909668e-05, -1.7814338207244873e-05, -1.6033649444580078e-05, -1.4252960681915283e-05, -1.2472271919250488e-05, -1.0691583156585693e-05, -8.910894393920898e-06, -7.1302056312561035e-06, -5.349516868591309e-06, -3.5688281059265137e-06, -1.7881393432617188e-06, -7.450580596923828e-09, 1.773238182067871e-06, 3.553926944732666e-06, 5.334615707397461e-06, 7.115304470062256e-06, 8.89599323272705e-06, 1.0676681995391846e-05, 1.245737075805664e-05, 1.4238059520721436e-05, 1.601874828338623e-05, 1.7799437046051025e-05, 1.958012580871582e-05, 2.1360814571380615e-05, 2.314150333404541e-05, 2.4922192096710205e-05, 2.6702880859375e-05, 2.8483569622039795e-05, 3.026425838470459e-05, 3.2044947147369385e-05, 3.382563591003418e-05, 3.5606324672698975e-05, 3.738701343536377e-05, 3.9167702198028564e-05, 4.094839096069336e-05]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 9.0, 10.0, 8.0, 15.0, 20.0, 27.0, 28.0, 49.0, 73.0, 85.0, 118.0, 192.0, 236.0, 423.0, 676.0, 1164.0, 2273.0, 5248.0, 16051.0, 92265.0, 864301.0, 46121.0, 10706.0, 3970.0, 1810.0, 971.0, 573.0, 334.0, 219.0, 153.0, 103.0, 76.0, 53.0, 50.0, 28.0, 24.0, 24.0, 17.0, 10.0, 9.0, 6.0, 9.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6669921875, -1.613800048828125, -1.56060791015625, -1.507415771484375, -1.4542236328125, -1.401031494140625, -1.34783935546875, -1.294647216796875, -1.241455078125, -1.188262939453125, -1.13507080078125, -1.081878662109375, -1.0286865234375, -0.975494384765625, -0.92230224609375, -0.869110107421875, -0.81591796875, -0.762725830078125, -0.70953369140625, -0.656341552734375, -0.6031494140625, -0.549957275390625, -0.49676513671875, -0.443572998046875, -0.390380859375, -0.337188720703125, -0.28399658203125, -0.230804443359375, -0.1776123046875, -0.124420166015625, -0.07122802734375, -0.018035888671875, 0.03515625, 0.088348388671875, 0.14154052734375, 0.194732666015625, 0.2479248046875, 0.301116943359375, 0.35430908203125, 0.407501220703125, 0.460693359375, 0.513885498046875, 0.56707763671875, 0.620269775390625, 0.6734619140625, 0.726654052734375, 0.77984619140625, 0.833038330078125, 0.88623046875, 0.939422607421875, 0.99261474609375, 1.045806884765625, 1.0989990234375, 1.152191162109375, 1.20538330078125, 1.258575439453125, 1.311767578125, 1.364959716796875, 1.41815185546875, 1.471343994140625, 1.5245361328125, 1.577728271484375, 1.63092041015625, 1.684112548828125, 1.7373046875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 8.0, 4.0, 10.0, 16.0, 23.0, 39.0, 61.0, 90.0, 117.0, 368.0, 82.0, 56.0, 43.0, 33.0, 15.0, 8.0, 8.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36865234375, -0.35753631591796875, -0.3464202880859375, -0.33530426025390625, -0.324188232421875, -0.31307220458984375, -0.3019561767578125, -0.29084014892578125, -0.27972412109375, -0.26860809326171875, -0.2574920654296875, -0.24637603759765625, -0.235260009765625, -0.22414398193359375, -0.2130279541015625, -0.20191192626953125, -0.1907958984375, -0.17967987060546875, -0.1685638427734375, -0.15744781494140625, -0.146331787109375, -0.13521575927734375, -0.1240997314453125, -0.11298370361328125, -0.10186767578125, -0.09075164794921875, -0.0796356201171875, -0.06851959228515625, -0.057403564453125, -0.04628753662109375, -0.0351715087890625, -0.02405548095703125, -0.012939453125, -0.00182342529296875, 0.0092926025390625, 0.02040863037109375, 0.031524658203125, 0.04264068603515625, 0.0537567138671875, 0.06487274169921875, 0.07598876953125, 0.08710479736328125, 0.0982208251953125, 0.10933685302734375, 0.120452880859375, 0.13156890869140625, 0.1426849365234375, 0.15380096435546875, 0.1649169921875, 0.17603302001953125, 0.1871490478515625, 0.19826507568359375, 0.209381103515625, 0.22049713134765625, 0.2316131591796875, 0.24272918701171875, 0.25384521484375, 0.26496124267578125, 0.2760772705078125, 0.28719329833984375, 0.298309326171875, 0.30942535400390625, 0.3205413818359375, 0.33165740966796875, 0.3427734375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 7.0, 8.0, 13.0, 32.0, 44.0, 64.0, 111.0, 222.0, 271.0, 104.0, 44.0, 17.0, 11.0, 13.0, 6.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.845899760723114, -0.8180158138275146, -0.7901318669319153, -0.7622479796409607, -0.7343640327453613, -0.706480085849762, -0.6785961389541626, -0.650712251663208, -0.6228283047676086, -0.5949443578720093, -0.5670604109764099, -0.5391765236854553, -0.511292576789856, -0.4834086298942566, -0.4555246829986572, -0.42764076590538025, -0.3997568190097809, -0.3718728721141815, -0.34398895502090454, -0.3161050081253052, -0.2882210910320282, -0.26033714413642883, -0.23245321214199066, -0.2045692801475525, -0.17668534815311432, -0.14880141615867615, -0.12091748416423798, -0.09303354471921921, -0.06514961272478104, -0.03726567327976227, -0.009381741285324097, 0.018502190709114075, 0.046386122703552246, 0.07427005469799042, 0.10215398669242859, 0.13003793358802795, 0.15792185068130493, 0.1858057975769043, 0.21368972957134247, 0.24157366156578064, 0.2694575786590576, 0.297341525554657, 0.32522544264793396, 0.3531093895435333, 0.3809933066368103, 0.40887725353240967, 0.43676120042800903, 0.464645117521286, 0.4925290644168854, 0.5204129815101624, 0.5482969284057617, 0.5761808753013611, 0.6040648221969604, 0.631948709487915, 0.6598326563835144, 0.6877166032791138, 0.7156005501747131, 0.7434844970703125, 0.7713684439659119, 0.7992523312568665, 0.8271362781524658, 0.8550202250480652, 0.8829041719436646, 0.9107880592346191, 0.9386720061302185]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 2.0, 5.0, 3.0, 3.0, 6.0, 13.0, 12.0, 12.0, 14.0, 19.0, 22.0, 21.0, 31.0, 29.0, 37.0, 32.0, 38.0, 45.0, 50.0, 46.0, 47.0, 57.0, 64.0, 40.0, 37.0, 28.0, 37.0, 34.0, 36.0, 25.0, 24.0, 23.0, 21.0, 17.0, 9.0, 10.0, 15.0, 17.0, 9.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3324841856956482, -0.3221283555030823, -0.31177252531051636, -0.30141669511795044, -0.2910608649253845, -0.2807050347328186, -0.2703492045402527, -0.25999337434768677, -0.24963755905628204, -0.23928172886371613, -0.2289258986711502, -0.2185700684785843, -0.20821425318717957, -0.19785842299461365, -0.18750259280204773, -0.1771467626094818, -0.1667909324169159, -0.15643510222434998, -0.14607927203178406, -0.13572344183921814, -0.12536761164665222, -0.1150117889046669, -0.10465596616268158, -0.09430013597011566, -0.08394430577754974, -0.07358847558498383, -0.06323264539241791, -0.05287682265043259, -0.04252099245786667, -0.03216516226530075, -0.02180933579802513, -0.011453509330749512, -0.0010976791381835938, 0.009258149191737175, 0.019613977521657944, 0.029969805851578712, 0.04032563418149948, 0.0506814643740654, 0.06103729084134102, 0.07139311730861664, 0.08174894750118256, 0.09210477769374847, 0.10246060788631439, 0.11281643062829971, 0.12317226082086563, 0.13352808356285095, 0.14388391375541687, 0.1542397439479828, 0.1645955741405487, 0.17495140433311462, 0.18530723452568054, 0.19566306471824646, 0.20601889491081238, 0.2163747251033783, 0.22673054039478302, 0.23708637058734894, 0.24744220077991486, 0.2577980160713196, 0.2681538462638855, 0.2785096764564514, 0.28886550664901733, 0.29922133684158325, 0.30957716703414917, 0.3199329972267151, 0.330288827419281]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 7.0, 7.0, 10.0, 11.0, 22.0, 23.0, 43.0, 61.0, 87.0, 97.0, 165.0, 200.0, 308.0, 377.0, 577.0, 724.0, 1011.0, 1473.0, 2130.0, 3100.0, 4318.0, 6486.0, 9655.0, 14627.0, 23541.0, 38180.0, 65992.0, 126241.0, 312031.0, 1324007.0, 1576523.0, 360394.0, 136828.0, 71103.0, 40975.0, 25044.0, 15561.0, 10318.0, 6706.0, 4502.0, 3186.0, 2160.0, 1598.0, 1106.0, 793.0, 534.0, 379.0, 273.0, 212.0, 157.0, 128.0, 87.0, 74.0, 52.0, 35.0, 26.0, 16.0, 11.0, 3.0, 2.0], "bins": [-0.35205078125, -0.3417167663574219, -0.33138275146484375, -0.3210487365722656, -0.3107147216796875, -0.3003807067871094, -0.29004669189453125, -0.2797126770019531, -0.269378662109375, -0.2590446472167969, -0.24871063232421875, -0.23837661743164062, -0.2280426025390625, -0.21770858764648438, -0.20737457275390625, -0.19704055786132812, -0.18670654296875, -0.17637252807617188, -0.16603851318359375, -0.15570449829101562, -0.1453704833984375, -0.13503646850585938, -0.12470245361328125, -0.11436843872070312, -0.104034423828125, -0.09370040893554688, -0.08336639404296875, -0.07303237915039062, -0.0626983642578125, -0.052364349365234375, -0.04203033447265625, -0.031696319580078125, -0.0213623046875, -0.011028289794921875, -0.00069427490234375, 0.009639739990234375, 0.0199737548828125, 0.030307769775390625, 0.04064178466796875, 0.050975799560546875, 0.061309814453125, 0.07164382934570312, 0.08197784423828125, 0.09231185913085938, 0.1026458740234375, 0.11297988891601562, 0.12331390380859375, 0.13364791870117188, 0.14398193359375, 0.15431594848632812, 0.16464996337890625, 0.17498397827148438, 0.1853179931640625, 0.19565200805664062, 0.20598602294921875, 0.21632003784179688, 0.226654052734375, 0.23698806762695312, 0.24732208251953125, 0.2576560974121094, 0.2679901123046875, 0.2783241271972656, 0.28865814208984375, 0.2989921569824219, 0.309326171875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 5.0, 12.0, 13.0, 6.0, 17.0, 19.0, 22.0, 25.0, 27.0, 35.0, 43.0, 27.0, 48.0, 40.0, 51.0, 65.0, 41.0, 46.0, 45.0, 42.0, 37.0, 40.0, 34.0, 41.0, 37.0, 26.0, 23.0, 17.0, 24.0, 18.0, 8.0, 13.0, 12.0, 5.0, 6.0, 7.0, 7.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14501953125, -0.14050865173339844, -0.13599777221679688, -0.1314868927001953, -0.12697601318359375, -0.12246513366699219, -0.11795425415039062, -0.11344337463378906, -0.1089324951171875, -0.10442161560058594, -0.09991073608398438, -0.09539985656738281, -0.09088897705078125, -0.08637809753417969, -0.08186721801757812, -0.07735633850097656, -0.072845458984375, -0.06833457946777344, -0.06382369995117188, -0.05931282043457031, -0.05480194091796875, -0.05029106140136719, -0.045780181884765625, -0.04126930236816406, -0.0367584228515625, -0.03224754333496094, -0.027736663818359375, -0.023225784301757812, -0.01871490478515625, -0.014204025268554688, -0.009693145751953125, -0.0051822662353515625, -0.00067138671875, 0.0038394927978515625, 0.008350372314453125, 0.012861251831054688, 0.01737213134765625, 0.021883010864257812, 0.026393890380859375, 0.030904769897460938, 0.0354156494140625, 0.03992652893066406, 0.044437408447265625, 0.04894828796386719, 0.05345916748046875, 0.05797004699707031, 0.062480926513671875, 0.06699180603027344, 0.071502685546875, 0.07601356506347656, 0.08052444458007812, 0.08503532409667969, 0.08954620361328125, 0.09405708312988281, 0.09856796264648438, 0.10307884216308594, 0.1075897216796875, 0.11210060119628906, 0.11661148071289062, 0.12112236022949219, 0.12563323974609375, 0.1301441192626953, 0.13465499877929688, 0.13916587829589844, 0.1436767578125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 11.0, 4.0, 10.0, 14.0, 24.0, 36.0, 52.0, 72.0, 150.0, 226.0, 364.0, 544.0, 924.0, 1522.0, 2680.0, 4795.0, 9276.0, 18576.0, 43364.0, 118259.0, 445689.0, 2439100.0, 819276.0, 179185.0, 59932.0, 24723.0, 11555.0, 5914.0, 3225.0, 1913.0, 1138.0, 649.0, 396.0, 261.0, 162.0, 87.0, 58.0, 28.0, 33.0, 23.0, 12.0, 4.0, 10.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.42724609375, -0.41455841064453125, -0.4018707275390625, -0.38918304443359375, -0.376495361328125, -0.36380767822265625, -0.3511199951171875, -0.33843231201171875, -0.32574462890625, -0.31305694580078125, -0.3003692626953125, -0.28768157958984375, -0.274993896484375, -0.26230621337890625, -0.2496185302734375, -0.23693084716796875, -0.2242431640625, -0.21155548095703125, -0.1988677978515625, -0.18618011474609375, -0.173492431640625, -0.16080474853515625, -0.1481170654296875, -0.13542938232421875, -0.12274169921875, -0.11005401611328125, -0.0973663330078125, -0.08467864990234375, -0.071990966796875, -0.05930328369140625, -0.0466156005859375, -0.03392791748046875, -0.021240234375, -0.00855255126953125, 0.0041351318359375, 0.01682281494140625, 0.029510498046875, 0.04219818115234375, 0.0548858642578125, 0.06757354736328125, 0.08026123046875, 0.09294891357421875, 0.1056365966796875, 0.11832427978515625, 0.131011962890625, 0.14369964599609375, 0.1563873291015625, 0.16907501220703125, 0.1817626953125, 0.19445037841796875, 0.2071380615234375, 0.21982574462890625, 0.232513427734375, 0.24520111083984375, 0.2578887939453125, 0.27057647705078125, 0.28326416015625, 0.29595184326171875, 0.3086395263671875, 0.32132720947265625, 0.334014892578125, 0.34670257568359375, 0.3593902587890625, 0.37207794189453125, 0.384765625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 6.0, 7.0, 14.0, 24.0, 19.0, 36.0, 31.0, 48.0, 64.0, 83.0, 103.0, 124.0, 176.0, 230.0, 272.0, 359.0, 484.0, 427.0, 348.0, 305.0, 224.0, 160.0, 136.0, 108.0, 82.0, 45.0, 39.0, 41.0, 23.0, 15.0, 7.0, 8.0, 6.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097412109375, -0.0945281982421875, -0.091644287109375, -0.0887603759765625, -0.08587646484375, -0.0829925537109375, -0.080108642578125, -0.0772247314453125, -0.0743408203125, -0.0714569091796875, -0.068572998046875, -0.0656890869140625, -0.06280517578125, -0.0599212646484375, -0.057037353515625, -0.0541534423828125, -0.05126953125, -0.0483856201171875, -0.045501708984375, -0.0426177978515625, -0.03973388671875, -0.0368499755859375, -0.033966064453125, -0.0310821533203125, -0.0281982421875, -0.0253143310546875, -0.022430419921875, -0.0195465087890625, -0.01666259765625, -0.0137786865234375, -0.010894775390625, -0.0080108642578125, -0.005126953125, -0.0022430419921875, 0.000640869140625, 0.0035247802734375, 0.00640869140625, 0.0092926025390625, 0.012176513671875, 0.0150604248046875, 0.0179443359375, 0.0208282470703125, 0.023712158203125, 0.0265960693359375, 0.02947998046875, 0.0323638916015625, 0.035247802734375, 0.0381317138671875, 0.041015625, 0.0438995361328125, 0.046783447265625, 0.0496673583984375, 0.05255126953125, 0.0554351806640625, 0.058319091796875, 0.0612030029296875, 0.0640869140625, 0.0669708251953125, 0.069854736328125, 0.0727386474609375, 0.07562255859375, 0.0785064697265625, 0.081390380859375, 0.0842742919921875, 0.087158203125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 4.0, 4.0, 13.0, 15.0, 27.0, 27.0, 45.0, 74.0, 136.0, 199.0, 194.0, 95.0, 56.0, 34.0, 23.0, 7.0, 6.0, 8.0, 6.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22267018258571625, -0.21153748035430908, -0.20040477812290192, -0.18927207589149475, -0.1781393587589264, -0.16700665652751923, -0.15587395429611206, -0.1447412371635437, -0.13360854983329773, -0.12247584760189056, -0.1113431379199028, -0.10021043568849564, -0.08907772600650787, -0.07794502377510071, -0.06681232154369354, -0.05567961186170578, -0.04454690217971802, -0.033414196223020554, -0.02228149212896824, -0.011148788034915924, -1.6082078218460083e-05, 0.011116623878479004, 0.02224932610988617, 0.03338203579187393, 0.0445147380232811, 0.05564744397997856, 0.06678014993667603, 0.07791285216808319, 0.08904555439949036, 0.10017826408147812, 0.11131096631288528, 0.12244367599487305, 0.1335763931274414, 0.14470909535884857, 0.15584179759025574, 0.1669745147228241, 0.17810721695423126, 0.18923991918563843, 0.2003726214170456, 0.21150532364845276, 0.22263804078102112, 0.23377074301242828, 0.24490344524383545, 0.2560361623764038, 0.2671688497066498, 0.27830156683921814, 0.2894342541694641, 0.30056697130203247, 0.31169968843460083, 0.3228324055671692, 0.33396509289741516, 0.3450978100299835, 0.3562304973602295, 0.36736321449279785, 0.3784959316253662, 0.3896286189556122, 0.40076130628585815, 0.4118940234184265, 0.4230267107486725, 0.43415942788124084, 0.4452921152114868, 0.4564248323440552, 0.46755754947662354, 0.4786902368068695, 0.48982295393943787]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 2.0, 9.0, 13.0, 11.0, 15.0, 11.0, 15.0, 23.0, 19.0, 20.0, 41.0, 30.0, 38.0, 44.0, 47.0, 39.0, 49.0, 40.0, 50.0, 53.0, 52.0, 40.0, 40.0, 26.0, 35.0, 35.0, 29.0, 23.0, 24.0, 19.0, 16.0, 14.0, 13.0, 18.0, 11.0, 6.0, 6.0, 6.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.15669216215610504, -0.1520506590604782, -0.14740917086601257, -0.14276766777038574, -0.1381261646747589, -0.13348466157913208, -0.12884317338466644, -0.12420167028903961, -0.11956017464399338, -0.11491867899894714, -0.11027717590332031, -0.10563568025827408, -0.10099418461322784, -0.09635268151760101, -0.09171118587255478, -0.08706969022750854, -0.08242818713188171, -0.07778669148683548, -0.07314518839120865, -0.06850369274616241, -0.06386218965053558, -0.05922069400548935, -0.054579198360443115, -0.04993769899010658, -0.04529619961977005, -0.04065470024943352, -0.036013200879096985, -0.03137170523405075, -0.026730205863714218, -0.022088706493377686, -0.017447208985686302, -0.012805711477994919, -0.008164197206497192, -0.0035226987674832344, 0.0011187996715307236, 0.0057602981105446815, 0.01040179654955864, 0.015043295919895172, 0.019684793427586555, 0.02432629093527794, 0.02896779030561447, 0.033609289675951004, 0.03825078904628754, 0.04289228469133377, 0.0475337840616703, 0.052175283432006836, 0.05681677907705307, 0.0614582784473896, 0.06609977781772614, 0.07074127346277237, 0.0753827765583992, 0.08002427220344543, 0.08466577529907227, 0.0893072709441185, 0.09394876658916473, 0.09859026968479156, 0.1032317653298378, 0.10787326097488403, 0.11251476407051086, 0.1171562597155571, 0.12179775536060333, 0.12643925845623016, 0.131080761551857, 0.13572224974632263, 0.14036375284194946]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 9.0, 11.0, 14.0, 17.0, 23.0, 42.0, 60.0, 84.0, 136.0, 189.0, 293.0, 485.0, 734.0, 1183.0, 1781.0, 3072.0, 5108.0, 9979.0, 22804.0, 74360.0, 485625.0, 345537.0, 57012.0, 19056.0, 8745.0, 4754.0, 2732.0, 1632.0, 1043.0, 704.0, 444.0, 282.0, 205.0, 119.0, 98.0, 58.0, 38.0, 29.0, 28.0, 14.0, 6.0, 3.0, 3.0, 6.0, 2.0, 1.0], "bins": [-0.42626953125, -0.415313720703125, -0.40435791015625, -0.393402099609375, -0.3824462890625, -0.371490478515625, -0.36053466796875, -0.349578857421875, -0.338623046875, -0.327667236328125, -0.31671142578125, -0.305755615234375, -0.2947998046875, -0.283843994140625, -0.27288818359375, -0.261932373046875, -0.2509765625, -0.240020751953125, -0.22906494140625, -0.218109130859375, -0.2071533203125, -0.196197509765625, -0.18524169921875, -0.174285888671875, -0.163330078125, -0.152374267578125, -0.14141845703125, -0.130462646484375, -0.1195068359375, -0.108551025390625, -0.09759521484375, -0.086639404296875, -0.07568359375, -0.064727783203125, -0.05377197265625, -0.042816162109375, -0.0318603515625, -0.020904541015625, -0.00994873046875, 0.001007080078125, 0.011962890625, 0.022918701171875, 0.03387451171875, 0.044830322265625, 0.0557861328125, 0.066741943359375, 0.07769775390625, 0.088653564453125, 0.099609375, 0.110565185546875, 0.12152099609375, 0.132476806640625, 0.1434326171875, 0.154388427734375, 0.16534423828125, 0.176300048828125, 0.187255859375, 0.198211669921875, 0.20916748046875, 0.220123291015625, 0.2310791015625, 0.242034912109375, 0.25299072265625, 0.263946533203125, 0.27490234375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 3.0, 10.0, 9.0, 9.0, 10.0, 23.0, 21.0, 22.0, 23.0, 27.0, 35.0, 38.0, 36.0, 50.0, 50.0, 43.0, 44.0, 57.0, 48.0, 55.0, 47.0, 46.0, 29.0, 31.0, 35.0, 29.0, 21.0, 22.0, 30.0, 16.0, 7.0, 11.0, 15.0, 9.0, 6.0, 8.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1365966796875, -0.13245201110839844, -0.12830734252929688, -0.12416267395019531, -0.12001800537109375, -0.11587333679199219, -0.11172866821289062, -0.10758399963378906, -0.1034393310546875, -0.09929466247558594, -0.09514999389648438, -0.09100532531738281, -0.08686065673828125, -0.08271598815917969, -0.07857131958007812, -0.07442665100097656, -0.070281982421875, -0.06613731384277344, -0.061992645263671875, -0.05784797668457031, -0.05370330810546875, -0.04955863952636719, -0.045413970947265625, -0.04126930236816406, -0.0371246337890625, -0.03297996520996094, -0.028835296630859375, -0.024690628051757812, -0.02054595947265625, -0.016401290893554688, -0.012256622314453125, -0.008111953735351562, -0.00396728515625, 0.0001773834228515625, 0.004322052001953125, 0.008466720581054688, 0.01261138916015625, 0.016756057739257812, 0.020900726318359375, 0.025045394897460938, 0.0291900634765625, 0.03333473205566406, 0.037479400634765625, 0.04162406921386719, 0.04576873779296875, 0.04991340637207031, 0.054058074951171875, 0.05820274353027344, 0.062347412109375, 0.06649208068847656, 0.07063674926757812, 0.07478141784667969, 0.07892608642578125, 0.08307075500488281, 0.08721542358398438, 0.09136009216308594, 0.0955047607421875, 0.09964942932128906, 0.10379409790039062, 0.10793876647949219, 0.11208343505859375, 0.11622810363769531, 0.12037277221679688, 0.12451744079589844, 0.128662109375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 1.0, 4.0, 8.0, 14.0, 21.0, 22.0, 38.0, 49.0, 80.0, 132.0, 209.0, 318.0, 569.0, 1117.0, 2186.0, 4988.0, 17172.0, 545860.0, 449965.0, 16170.0, 4945.0, 2152.0, 1069.0, 581.0, 298.0, 225.0, 114.0, 80.0, 45.0, 37.0, 32.0, 20.0, 15.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0166015625, -0.989837646484375, -0.96307373046875, -0.936309814453125, -0.9095458984375, -0.882781982421875, -0.85601806640625, -0.829254150390625, -0.802490234375, -0.775726318359375, -0.74896240234375, -0.722198486328125, -0.6954345703125, -0.668670654296875, -0.64190673828125, -0.615142822265625, -0.58837890625, -0.561614990234375, -0.53485107421875, -0.508087158203125, -0.4813232421875, -0.454559326171875, -0.42779541015625, -0.401031494140625, -0.374267578125, -0.347503662109375, -0.32073974609375, -0.293975830078125, -0.2672119140625, -0.240447998046875, -0.21368408203125, -0.186920166015625, -0.16015625, -0.133392333984375, -0.10662841796875, -0.079864501953125, -0.0531005859375, -0.026336669921875, 0.00042724609375, 0.027191162109375, 0.053955078125, 0.080718994140625, 0.10748291015625, 0.134246826171875, 0.1610107421875, 0.187774658203125, 0.21453857421875, 0.241302490234375, 0.26806640625, 0.294830322265625, 0.32159423828125, 0.348358154296875, 0.3751220703125, 0.401885986328125, 0.42864990234375, 0.455413818359375, 0.482177734375, 0.508941650390625, 0.53570556640625, 0.562469482421875, 0.5892333984375, 0.615997314453125, 0.64276123046875, 0.669525146484375, 0.6962890625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 3.0, 8.0, 4.0, 4.0, 10.0, 9.0, 14.0, 19.0, 15.0, 18.0, 29.0, 32.0, 26.0, 35.0, 36.0, 41.0, 40.0, 61.0, 52.0, 54.0, 41.0, 50.0, 48.0, 47.0, 42.0, 42.0, 27.0, 33.0, 23.0, 25.0, 23.0, 19.0, 9.0, 13.0, 9.0, 10.0, 9.0, 6.0, 5.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0848388671875, -0.08195018768310547, -0.07906150817871094, -0.0761728286743164, -0.07328414916992188, -0.07039546966552734, -0.06750679016113281, -0.06461811065673828, -0.06172943115234375, -0.05884075164794922, -0.05595207214355469, -0.053063392639160156, -0.050174713134765625, -0.047286033630371094, -0.04439735412597656, -0.04150867462158203, -0.0386199951171875, -0.03573131561279297, -0.03284263610839844, -0.029953956604003906, -0.027065277099609375, -0.024176597595214844, -0.021287918090820312, -0.01839923858642578, -0.01551055908203125, -0.012621879577636719, -0.009733200073242188, -0.006844520568847656, -0.003955841064453125, -0.0010671615600585938, 0.0018215179443359375, 0.004710197448730469, 0.007598876953125, 0.010487556457519531, 0.013376235961914062, 0.016264915466308594, 0.019153594970703125, 0.022042274475097656, 0.024930953979492188, 0.02781963348388672, 0.03070831298828125, 0.03359699249267578, 0.03648567199707031, 0.039374351501464844, 0.042263031005859375, 0.045151710510253906, 0.04804039001464844, 0.05092906951904297, 0.0538177490234375, 0.05670642852783203, 0.05959510803222656, 0.062483787536621094, 0.06537246704101562, 0.06826114654541016, 0.07114982604980469, 0.07403850555419922, 0.07692718505859375, 0.07981586456298828, 0.08270454406738281, 0.08559322357177734, 0.08848190307617188, 0.0913705825805664, 0.09425926208496094, 0.09714794158935547, 0.10003662109375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 9.0, 7.0, 17.0, 24.0, 26.0, 61.0, 82.0, 123.0, 180.0, 253.0, 394.0, 691.0, 1264.0, 2041.0, 3815.0, 7703.0, 17788.0, 50344.0, 208627.0, 576238.0, 118838.0, 33717.0, 13001.0, 5987.0, 3079.0, 1585.0, 992.0, 603.0, 355.0, 244.0, 159.0, 97.0, 64.0, 56.0, 27.0, 23.0, 17.0, 5.0, 8.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046356201171875, -0.04477548599243164, -0.04319477081298828, -0.04161405563354492, -0.04003334045410156, -0.0384526252746582, -0.036871910095214844, -0.035291194915771484, -0.033710479736328125, -0.032129764556884766, -0.030549049377441406, -0.028968334197998047, -0.027387619018554688, -0.025806903839111328, -0.02422618865966797, -0.02264547348022461, -0.02106475830078125, -0.01948404312133789, -0.01790332794189453, -0.016322612762451172, -0.014741897583007812, -0.013161182403564453, -0.011580467224121094, -0.009999752044677734, -0.008419036865234375, -0.006838321685791016, -0.005257606506347656, -0.003676891326904297, -0.0020961761474609375, -0.0005154609680175781, 0.0010652542114257812, 0.0026459693908691406, 0.0042266845703125, 0.005807399749755859, 0.007388114929199219, 0.008968830108642578, 0.010549545288085938, 0.012130260467529297, 0.013710975646972656, 0.015291690826416016, 0.016872406005859375, 0.018453121185302734, 0.020033836364746094, 0.021614551544189453, 0.023195266723632812, 0.024775981903076172, 0.02635669708251953, 0.02793741226196289, 0.02951812744140625, 0.03109884262084961, 0.03267955780029297, 0.03426027297973633, 0.03584098815917969, 0.03742170333862305, 0.039002418518066406, 0.040583133697509766, 0.042163848876953125, 0.043744564056396484, 0.045325279235839844, 0.0469059944152832, 0.04848670959472656, 0.05006742477416992, 0.05164813995361328, 0.05322885513305664, 0.0548095703125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 1.0, 7.0, 9.0, 14.0, 16.0, 25.0, 25.0, 41.0, 42.0, 61.0, 83.0, 100.0, 102.0, 77.0, 71.0, 108.0, 54.0, 41.0, 28.0, 28.0, 15.0, 15.0, 10.0, 9.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1861324310302734e-05, -1.1548399925231934e-05, -1.1235475540161133e-05, -1.0922551155090332e-05, -1.0609626770019531e-05, -1.029670238494873e-05, -9.98377799987793e-06, -9.670853614807129e-06, -9.357929229736328e-06, -9.045004844665527e-06, -8.732080459594727e-06, -8.419156074523926e-06, -8.106231689453125e-06, -7.793307304382324e-06, -7.4803829193115234e-06, -7.167458534240723e-06, -6.854534149169922e-06, -6.541609764099121e-06, -6.22868537902832e-06, -5.9157609939575195e-06, -5.602836608886719e-06, -5.289912223815918e-06, -4.976987838745117e-06, -4.664063453674316e-06, -4.351139068603516e-06, -4.038214683532715e-06, -3.725290298461914e-06, -3.4123659133911133e-06, -3.0994415283203125e-06, -2.7865171432495117e-06, -2.473592758178711e-06, -2.16066837310791e-06, -1.8477439880371094e-06, -1.5348196029663086e-06, -1.2218952178955078e-06, -9.08970832824707e-07, -5.960464477539062e-07, -2.8312206268310547e-07, 2.9802322387695312e-08, 3.427267074584961e-07, 6.556510925292969e-07, 9.685754776000977e-07, 1.2814998626708984e-06, 1.5944242477416992e-06, 1.9073486328125e-06, 2.2202730178833008e-06, 2.5331974029541016e-06, 2.8461217880249023e-06, 3.159046173095703e-06, 3.471970558166504e-06, 3.7848949432373047e-06, 4.0978193283081055e-06, 4.410743713378906e-06, 4.723668098449707e-06, 5.036592483520508e-06, 5.349516868591309e-06, 5.662441253662109e-06, 5.97536563873291e-06, 6.288290023803711e-06, 6.601214408874512e-06, 6.9141387939453125e-06, 7.227063179016113e-06, 7.539987564086914e-06, 7.852911949157715e-06, 8.165836334228516e-06]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 10.0, 12.0, 19.0, 21.0, 29.0, 35.0, 52.0, 70.0, 122.0, 154.0, 233.0, 332.0, 545.0, 948.0, 1875.0, 4261.0, 11263.0, 42002.0, 325894.0, 574396.0, 61509.0, 14534.0, 5094.0, 2154.0, 1135.0, 608.0, 406.0, 233.0, 187.0, 131.0, 83.0, 58.0, 46.0, 22.0, 16.0, 15.0, 16.0, 10.0, 4.0, 7.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0560302734375, -0.054285526275634766, -0.05254077911376953, -0.0507960319519043, -0.04905128479003906, -0.04730653762817383, -0.045561790466308594, -0.04381704330444336, -0.042072296142578125, -0.04032754898071289, -0.038582801818847656, -0.03683805465698242, -0.03509330749511719, -0.03334856033325195, -0.03160381317138672, -0.029859066009521484, -0.02811431884765625, -0.026369571685791016, -0.02462482452392578, -0.022880077362060547, -0.021135330200195312, -0.019390583038330078, -0.017645835876464844, -0.01590108871459961, -0.014156341552734375, -0.01241159439086914, -0.010666847229003906, -0.008922100067138672, -0.0071773529052734375, -0.005432605743408203, -0.0036878585815429688, -0.0019431114196777344, -0.0001983642578125, 0.0015463829040527344, 0.0032911300659179688, 0.005035877227783203, 0.0067806243896484375, 0.008525371551513672, 0.010270118713378906, 0.01201486587524414, 0.013759613037109375, 0.01550436019897461, 0.017249107360839844, 0.018993854522705078, 0.020738601684570312, 0.022483348846435547, 0.02422809600830078, 0.025972843170166016, 0.02771759033203125, 0.029462337493896484, 0.03120708465576172, 0.03295183181762695, 0.03469657897949219, 0.03644132614135742, 0.038186073303222656, 0.03993082046508789, 0.041675567626953125, 0.04342031478881836, 0.045165061950683594, 0.04690980911254883, 0.04865455627441406, 0.0503993034362793, 0.05214405059814453, 0.053888797760009766, 0.055633544921875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 1.0, 4.0, 9.0, 4.0, 13.0, 24.0, 29.0, 34.0, 47.0, 63.0, 84.0, 103.0, 121.0, 103.0, 82.0, 68.0, 52.0, 45.0, 25.0, 17.0, 12.0, 14.0, 12.0, 9.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01035308837890625, -0.010013818740844727, -0.009674549102783203, -0.00933527946472168, -0.008996009826660156, -0.008656740188598633, -0.00831747055053711, -0.007978200912475586, -0.0076389312744140625, -0.007299661636352539, -0.006960391998291016, -0.006621122360229492, -0.006281852722167969, -0.005942583084106445, -0.005603313446044922, -0.0052640438079833984, -0.004924774169921875, -0.0045855045318603516, -0.004246234893798828, -0.003906965255737305, -0.0035676956176757812, -0.003228425979614258, -0.0028891563415527344, -0.002549886703491211, -0.0022106170654296875, -0.001871347427368164, -0.0015320777893066406, -0.0011928081512451172, -0.0008535385131835938, -0.0005142688751220703, -0.00017499923706054688, 0.00016427040100097656, 0.0005035400390625, 0.0008428096771240234, 0.0011820793151855469, 0.0015213489532470703, 0.0018606185913085938, 0.002199888229370117, 0.0025391578674316406, 0.002878427505493164, 0.0032176971435546875, 0.003556966781616211, 0.0038962364196777344, 0.004235506057739258, 0.004574775695800781, 0.004914045333862305, 0.005253314971923828, 0.0055925846099853516, 0.005931854248046875, 0.0062711238861083984, 0.006610393524169922, 0.006949663162231445, 0.007288932800292969, 0.007628202438354492, 0.007967472076416016, 0.008306741714477539, 0.008646011352539062, 0.008985280990600586, 0.00932455062866211, 0.009663820266723633, 0.010003089904785156, 0.01034235954284668, 0.010681629180908203, 0.011020898818969727, 0.01136016845703125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 5.0, 8.0, 9.0, 16.0, 23.0, 38.0, 65.0, 99.0, 178.0, 217.0, 128.0, 86.0, 36.0, 27.0, 10.0, 14.0, 11.0, 3.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1730543076992035, -0.16308629512786865, -0.15311826765537262, -0.1431502401828766, -0.13318222761154175, -0.12321420758962631, -0.11324618756771088, -0.10327816754579544, -0.09331014752388, -0.08334212750196457, -0.07337410748004913, -0.0634060874581337, -0.05343806743621826, -0.043470047414302826, -0.03350202739238739, -0.023534007370471954, -0.013565987348556519, -0.0035979673266410828, 0.006370052695274353, 0.01633807271718979, 0.026306092739105225, 0.03627411276102066, 0.046242132782936096, 0.05621015280485153, 0.06617817282676697, 0.0761461928486824, 0.08611421287059784, 0.09608223289251328, 0.10605025291442871, 0.11601827293634415, 0.12598629295825958, 0.13595432043075562, 0.14592236280441284, 0.15589037537574768, 0.1658584028482437, 0.17582643032073975, 0.18579444289207458, 0.19576245546340942, 0.20573048293590546, 0.2156985104084015, 0.22566652297973633, 0.23563453555107117, 0.2456025630235672, 0.25557059049606323, 0.26553860306739807, 0.2755066156387329, 0.28547465801239014, 0.295442670583725, 0.3054106831550598, 0.31537869572639465, 0.3253467082977295, 0.3353147506713867, 0.34528276324272156, 0.3552507758140564, 0.3652188181877136, 0.37518683075904846, 0.3851548433303833, 0.39512285590171814, 0.405090868473053, 0.4150589108467102, 0.42502692341804504, 0.4349949359893799, 0.4449629783630371, 0.45493099093437195, 0.4648990035057068]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 6.0, 3.0, 6.0, 11.0, 10.0, 13.0, 13.0, 10.0, 24.0, 15.0, 23.0, 27.0, 35.0, 36.0, 42.0, 41.0, 40.0, 44.0, 50.0, 38.0, 56.0, 48.0, 47.0, 45.0, 37.0, 30.0, 35.0, 30.0, 27.0, 22.0, 26.0, 16.0, 14.0, 10.0, 18.0, 14.0, 13.0, 8.0, 4.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.13098222017288208, -0.12706336379051208, -0.1231444925069809, -0.1192256286740303, -0.11530676484107971, -0.11138790100812912, -0.10746903717517853, -0.10355018079280853, -0.09963130950927734, -0.09571244567632675, -0.09179358184337616, -0.08787471801042557, -0.08395585417747498, -0.08003699034452438, -0.07611812651157379, -0.0721992701292038, -0.0682804062962532, -0.06436154246330261, -0.06044267863035202, -0.05652381479740143, -0.052604950964450836, -0.048686087131500244, -0.04476722702383995, -0.04084836319088936, -0.036929499357938766, -0.033010635524988174, -0.029091771692037582, -0.02517290972173214, -0.021254045888781548, -0.017335182055830956, -0.013416320085525513, -0.00949745625257492, -0.005578592419624329, -0.0016597290523350239, 0.002259134314954281, 0.006177997216582298, 0.01009686104953289, 0.014015724882483482, 0.017934586852788925, 0.021853450685739517, 0.02577231451869011, 0.0296911783516407, 0.03361004218459129, 0.03752890229225159, 0.04144776612520218, 0.04536662995815277, 0.04928549379110336, 0.053204357624053955, 0.05712322145700455, 0.06104208528995514, 0.06496094912290573, 0.06887981295585632, 0.07279867678880692, 0.07671754062175751, 0.0806363970041275, 0.08455526828765869, 0.08847412467002869, 0.09239298850297928, 0.09631185233592987, 0.10023071616888046, 0.10414958000183105, 0.10806844383478165, 0.11198730766773224, 0.11590616405010223, 0.11982503533363342]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 14.0, 6.0, 18.0, 24.0, 26.0, 50.0, 83.0, 130.0, 223.0, 368.0, 571.0, 960.0, 1541.0, 2632.0, 4196.0, 7303.0, 12561.0, 22610.0, 41752.0, 80500.0, 165379.0, 296533.0, 201864.0, 97094.0, 49723.0, 26827.0, 14816.0, 8307.0, 4919.0, 2937.0, 1779.0, 1089.0, 661.0, 394.0, 222.0, 141.0, 102.0, 74.0, 45.0, 20.0, 19.0, 13.0, 3.0, 10.0, 3.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.2435302734375, -0.23583221435546875, -0.2281341552734375, -0.22043609619140625, -0.212738037109375, -0.20503997802734375, -0.1973419189453125, -0.18964385986328125, -0.18194580078125, -0.17424774169921875, -0.1665496826171875, -0.15885162353515625, -0.151153564453125, -0.14345550537109375, -0.1357574462890625, -0.12805938720703125, -0.120361328125, -0.11266326904296875, -0.1049652099609375, -0.09726715087890625, -0.089569091796875, -0.08187103271484375, -0.0741729736328125, -0.06647491455078125, -0.05877685546875, -0.05107879638671875, -0.0433807373046875, -0.03568267822265625, -0.027984619140625, -0.02028656005859375, -0.0125885009765625, -0.00489044189453125, 0.0028076171875, 0.01050567626953125, 0.0182037353515625, 0.02590179443359375, 0.033599853515625, 0.04129791259765625, 0.0489959716796875, 0.05669403076171875, 0.06439208984375, 0.07209014892578125, 0.0797882080078125, 0.08748626708984375, 0.095184326171875, 0.10288238525390625, 0.1105804443359375, 0.11827850341796875, 0.1259765625, 0.13367462158203125, 0.1413726806640625, 0.14907073974609375, 0.156768798828125, 0.16446685791015625, 0.1721649169921875, 0.17986297607421875, 0.18756103515625, 0.19525909423828125, 0.2029571533203125, 0.21065521240234375, 0.218353271484375, 0.22605133056640625, 0.2337493896484375, 0.24144744873046875, 0.2491455078125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 5.0, 9.0, 7.0, 12.0, 17.0, 14.0, 12.0, 21.0, 25.0, 25.0, 22.0, 22.0, 26.0, 35.0, 45.0, 43.0, 41.0, 44.0, 41.0, 45.0, 43.0, 45.0, 44.0, 35.0, 37.0, 26.0, 33.0, 32.0, 18.0, 26.0, 21.0, 20.0, 16.0, 12.0, 7.0, 12.0, 15.0, 8.0, 7.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.09686279296875, -0.09391307830810547, -0.09096336364746094, -0.0880136489868164, -0.08506393432617188, -0.08211421966552734, -0.07916450500488281, -0.07621479034423828, -0.07326507568359375, -0.07031536102294922, -0.06736564636230469, -0.06441593170166016, -0.061466217041015625, -0.058516502380371094, -0.05556678771972656, -0.05261707305908203, -0.0496673583984375, -0.04671764373779297, -0.04376792907714844, -0.040818214416503906, -0.037868499755859375, -0.034918785095214844, -0.03196907043457031, -0.02901935577392578, -0.02606964111328125, -0.02311992645263672, -0.020170211791992188, -0.017220497131347656, -0.014270782470703125, -0.011321067810058594, -0.008371353149414062, -0.005421638488769531, -0.002471923828125, 0.00047779083251953125, 0.0034275054931640625, 0.006377220153808594, 0.009326934814453125, 0.012276649475097656, 0.015226364135742188, 0.01817607879638672, 0.02112579345703125, 0.02407550811767578, 0.027025222778320312, 0.029974937438964844, 0.032924652099609375, 0.035874366760253906, 0.03882408142089844, 0.04177379608154297, 0.0447235107421875, 0.04767322540283203, 0.05062294006347656, 0.053572654724121094, 0.056522369384765625, 0.059472084045410156, 0.06242179870605469, 0.06537151336669922, 0.06832122802734375, 0.07127094268798828, 0.07422065734863281, 0.07717037200927734, 0.08012008666992188, 0.0830698013305664, 0.08601951599121094, 0.08896923065185547, 0.0919189453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 9.0, 9.0, 12.0, 15.0, 24.0, 29.0, 49.0, 92.0, 143.0, 187.0, 316.0, 522.0, 840.0, 1445.0, 2428.0, 4561.0, 8738.0, 18649.0, 42881.0, 111277.0, 352946.0, 324110.0, 102963.0, 40277.0, 17521.0, 8406.0, 4149.0, 2444.0, 1366.0, 803.0, 504.0, 284.0, 200.0, 129.0, 77.0, 50.0, 36.0, 27.0, 13.0, 10.0, 5.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.297119140625, -0.2881050109863281, -0.27909088134765625, -0.2700767517089844, -0.2610626220703125, -0.2520484924316406, -0.24303436279296875, -0.23402023315429688, -0.225006103515625, -0.21599197387695312, -0.20697784423828125, -0.19796371459960938, -0.1889495849609375, -0.17993545532226562, -0.17092132568359375, -0.16190719604492188, -0.15289306640625, -0.14387893676757812, -0.13486480712890625, -0.12585067749023438, -0.1168365478515625, -0.10782241821289062, -0.09880828857421875, -0.08979415893554688, -0.080780029296875, -0.07176589965820312, -0.06275177001953125, -0.053737640380859375, -0.0447235107421875, -0.035709381103515625, -0.02669525146484375, -0.017681121826171875, -0.0086669921875, 0.000347137451171875, 0.00936126708984375, 0.018375396728515625, 0.0273895263671875, 0.036403656005859375, 0.04541778564453125, 0.054431915283203125, 0.063446044921875, 0.07246017456054688, 0.08147430419921875, 0.09048843383789062, 0.0995025634765625, 0.10851669311523438, 0.11753082275390625, 0.12654495239257812, 0.13555908203125, 0.14457321166992188, 0.15358734130859375, 0.16260147094726562, 0.1716156005859375, 0.18062973022460938, 0.18964385986328125, 0.19865798950195312, 0.207672119140625, 0.21668624877929688, 0.22570037841796875, 0.23471450805664062, 0.2437286376953125, 0.2527427673339844, 0.26175689697265625, 0.2707710266113281, 0.27978515625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 10.0, 9.0, 6.0, 4.0, 17.0, 13.0, 12.0, 20.0, 33.0, 22.0, 22.0, 21.0, 26.0, 35.0, 31.0, 38.0, 42.0, 33.0, 46.0, 52.0, 32.0, 44.0, 36.0, 34.0, 33.0, 48.0, 27.0, 39.0, 30.0, 33.0, 20.0, 24.0, 20.0, 20.0, 19.0, 9.0, 9.0, 7.0, 4.0, 3.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05987548828125, -0.057913780212402344, -0.05595207214355469, -0.05399036407470703, -0.052028656005859375, -0.05006694793701172, -0.04810523986816406, -0.046143531799316406, -0.04418182373046875, -0.042220115661621094, -0.04025840759277344, -0.03829669952392578, -0.036334991455078125, -0.03437328338623047, -0.03241157531738281, -0.030449867248535156, -0.0284881591796875, -0.026526451110839844, -0.024564743041992188, -0.02260303497314453, -0.020641326904296875, -0.01867961883544922, -0.016717910766601562, -0.014756202697753906, -0.01279449462890625, -0.010832786560058594, -0.008871078491210938, -0.006909370422363281, -0.004947662353515625, -0.0029859542846679688, -0.0010242462158203125, 0.0009374618530273438, 0.002899169921875, 0.004860877990722656, 0.0068225860595703125, 0.008784294128417969, 0.010746002197265625, 0.012707710266113281, 0.014669418334960938, 0.016631126403808594, 0.01859283447265625, 0.020554542541503906, 0.022516250610351562, 0.02447795867919922, 0.026439666748046875, 0.02840137481689453, 0.030363082885742188, 0.032324790954589844, 0.0342864990234375, 0.036248207092285156, 0.03820991516113281, 0.04017162322998047, 0.042133331298828125, 0.04409503936767578, 0.04605674743652344, 0.048018455505371094, 0.04998016357421875, 0.051941871643066406, 0.05390357971191406, 0.05586528778076172, 0.057826995849609375, 0.05978870391845703, 0.06175041198730469, 0.06371212005615234, 0.065673828125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 9.0, 17.0, 20.0, 33.0, 35.0, 56.0, 75.0, 98.0, 158.0, 239.0, 381.0, 550.0, 842.0, 1358.0, 2416.0, 4253.0, 8059.0, 17861.0, 51322.0, 729134.0, 167121.0, 35246.0, 13820.0, 6548.0, 3475.0, 2014.0, 1188.0, 763.0, 459.0, 328.0, 210.0, 154.0, 97.0, 56.0, 45.0, 31.0, 13.0, 19.0, 12.0, 13.0, 8.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.259033203125, -0.2511463165283203, -0.24325942993164062, -0.23537254333496094, -0.22748565673828125, -0.21959877014160156, -0.21171188354492188, -0.2038249969482422, -0.1959381103515625, -0.1880512237548828, -0.18016433715820312, -0.17227745056152344, -0.16439056396484375, -0.15650367736816406, -0.14861679077148438, -0.1407299041748047, -0.132843017578125, -0.12495613098144531, -0.11706924438476562, -0.10918235778808594, -0.10129547119140625, -0.09340858459472656, -0.08552169799804688, -0.07763481140136719, -0.0697479248046875, -0.06186103820800781, -0.053974151611328125, -0.04608726501464844, -0.03820037841796875, -0.030313491821289062, -0.022426605224609375, -0.014539718627929688, -0.00665283203125, 0.0012340545654296875, 0.009120941162109375, 0.017007827758789062, 0.02489471435546875, 0.03278160095214844, 0.040668487548828125, 0.04855537414550781, 0.0564422607421875, 0.06432914733886719, 0.07221603393554688, 0.08010292053222656, 0.08798980712890625, 0.09587669372558594, 0.10376358032226562, 0.11165046691894531, 0.119537353515625, 0.1274242401123047, 0.13531112670898438, 0.14319801330566406, 0.15108489990234375, 0.15897178649902344, 0.16685867309570312, 0.1747455596923828, 0.1826324462890625, 0.1905193328857422, 0.19840621948242188, 0.20629310607910156, 0.21417999267578125, 0.22206687927246094, 0.22995376586914062, 0.2378406524658203, 0.2457275390625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 8.0, 9.0, 7.0, 11.0, 7.0, 20.0, 32.0, 44.0, 47.0, 97.0, 138.0, 155.0, 125.0, 76.0, 57.0, 31.0, 24.0, 18.0, 13.0, 11.0, 9.0, 10.0, 7.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-7.748603820800781e-06, -7.5232237577438354e-06, -7.29784369468689e-06, -7.072463631629944e-06, -6.847083568572998e-06, -6.621703505516052e-06, -6.3963234424591064e-06, -6.170943379402161e-06, -5.945563316345215e-06, -5.720183253288269e-06, -5.494803190231323e-06, -5.2694231271743774e-06, -5.044043064117432e-06, -4.818663001060486e-06, -4.59328293800354e-06, -4.367902874946594e-06, -4.1425228118896484e-06, -3.917142748832703e-06, -3.691762685775757e-06, -3.466382622718811e-06, -3.2410025596618652e-06, -3.0156224966049194e-06, -2.7902424335479736e-06, -2.564862370491028e-06, -2.339482307434082e-06, -2.1141022443771362e-06, -1.8887221813201904e-06, -1.6633421182632446e-06, -1.4379620552062988e-06, -1.212581992149353e-06, -9.872019290924072e-07, -7.618218660354614e-07, -5.364418029785156e-07, -3.110617399215698e-07, -8.568167686462402e-08, 1.3969838619232178e-07, 3.650784492492676e-07, 5.904585123062134e-07, 8.158385753631592e-07, 1.041218638420105e-06, 1.2665987014770508e-06, 1.4919787645339966e-06, 1.7173588275909424e-06, 1.942738890647888e-06, 2.168118953704834e-06, 2.3934990167617798e-06, 2.6188790798187256e-06, 2.8442591428756714e-06, 3.069639205932617e-06, 3.295019268989563e-06, 3.520399332046509e-06, 3.7457793951034546e-06, 3.9711594581604e-06, 4.196539521217346e-06, 4.421919584274292e-06, 4.647299647331238e-06, 4.872679710388184e-06, 5.098059773445129e-06, 5.323439836502075e-06, 5.548819899559021e-06, 5.774199962615967e-06, 5.999580025672913e-06, 6.224960088729858e-06, 6.450340151786804e-06, 6.67572021484375e-06]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 5.0, 7.0, 10.0, 12.0, 17.0, 27.0, 31.0, 48.0, 73.0, 114.0, 161.0, 224.0, 341.0, 547.0, 830.0, 1294.0, 2114.0, 3743.0, 7037.0, 14653.0, 37403.0, 169565.0, 718598.0, 52923.0, 18928.0, 8538.0, 4616.0, 2522.0, 1500.0, 885.0, 563.0, 420.0, 242.0, 195.0, 97.0, 83.0, 60.0, 38.0, 36.0, 16.0, 14.0, 10.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.242919921875, -0.23559188842773438, -0.22826385498046875, -0.22093582153320312, -0.2136077880859375, -0.20627975463867188, -0.19895172119140625, -0.19162368774414062, -0.184295654296875, -0.17696762084960938, -0.16963958740234375, -0.16231155395507812, -0.1549835205078125, -0.14765548706054688, -0.14032745361328125, -0.13299942016601562, -0.12567138671875, -0.11834335327148438, -0.11101531982421875, -0.10368728637695312, -0.0963592529296875, -0.08903121948242188, -0.08170318603515625, -0.07437515258789062, -0.067047119140625, -0.059719085693359375, -0.05239105224609375, -0.045063018798828125, -0.0377349853515625, -0.030406951904296875, -0.02307891845703125, -0.015750885009765625, -0.0084228515625, -0.001094818115234375, 0.00623321533203125, 0.013561248779296875, 0.0208892822265625, 0.028217315673828125, 0.03554534912109375, 0.042873382568359375, 0.050201416015625, 0.057529449462890625, 0.06485748291015625, 0.07218551635742188, 0.0795135498046875, 0.08684158325195312, 0.09416961669921875, 0.10149765014648438, 0.10882568359375, 0.11615371704101562, 0.12348175048828125, 0.13080978393554688, 0.1381378173828125, 0.14546585083007812, 0.15279388427734375, 0.16012191772460938, 0.167449951171875, 0.17477798461914062, 0.18210601806640625, 0.18943405151367188, 0.1967620849609375, 0.20409011840820312, 0.21141815185546875, 0.21874618530273438, 0.22607421875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 2.0, 7.0, 8.0, 12.0, 19.0, 9.0, 22.0, 28.0, 24.0, 33.0, 34.0, 47.0, 86.0, 353.0, 55.0, 34.0, 41.0, 41.0, 25.0, 21.0, 16.0, 17.0, 4.0, 7.0, 9.0, 7.0, 4.0, 4.0, 1.0, 6.0, 7.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.04931640625, -0.04783058166503906, -0.046344757080078125, -0.04485893249511719, -0.04337310791015625, -0.04188728332519531, -0.040401458740234375, -0.03891563415527344, -0.0374298095703125, -0.03594398498535156, -0.034458160400390625, -0.03297233581542969, -0.03148651123046875, -0.030000686645507812, -0.028514862060546875, -0.027029037475585938, -0.025543212890625, -0.024057388305664062, -0.022571563720703125, -0.021085739135742188, -0.01959991455078125, -0.018114089965820312, -0.016628265380859375, -0.015142440795898438, -0.0136566162109375, -0.012170791625976562, -0.010684967041015625, -0.009199142456054688, -0.00771331787109375, -0.0062274932861328125, -0.004741668701171875, -0.0032558441162109375, -0.00177001953125, -0.0002841949462890625, 0.001201629638671875, 0.0026874542236328125, 0.00417327880859375, 0.0056591033935546875, 0.007144927978515625, 0.008630752563476562, 0.0101165771484375, 0.011602401733398438, 0.013088226318359375, 0.014574050903320312, 0.01605987548828125, 0.017545700073242188, 0.019031524658203125, 0.020517349243164062, 0.022003173828125, 0.023488998413085938, 0.024974822998046875, 0.026460647583007812, 0.02794647216796875, 0.029432296752929688, 0.030918121337890625, 0.03240394592285156, 0.0338897705078125, 0.03537559509277344, 0.036861419677734375, 0.03834724426269531, 0.03983306884765625, 0.04131889343261719, 0.042804718017578125, 0.04429054260253906, 0.0457763671875]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 9.0, 10.0, 15.0, 27.0, 39.0, 49.0, 93.0, 129.0, 210.0, 195.0, 89.0, 51.0, 16.0, 15.0, 12.0, 4.0, 14.0, 1.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17663122713565826, -0.16863369941711426, -0.16063618659973145, -0.15263865888118744, -0.14464113116264343, -0.13664360344409943, -0.12864607572555542, -0.12064856290817261, -0.1126510351896286, -0.1046535074710846, -0.09665598720312119, -0.08865846693515778, -0.08066093921661377, -0.07266341149806976, -0.06466589123010635, -0.056668367236852646, -0.04867084324359894, -0.04067331925034523, -0.03267579525709152, -0.024678271263837814, -0.016680747270584106, -0.008683223277330399, -0.0006856992840766907, 0.007311824709177017, 0.015309348702430725, 0.023306872695684433, 0.03130439668893814, 0.03930192068219185, 0.04729944467544556, 0.055296968668699265, 0.06329449266195297, 0.07129201292991638, 0.07928955554962158, 0.08728708326816559, 0.095284603536129, 0.10328212380409241, 0.11127965152263641, 0.11927717924118042, 0.12727469205856323, 0.13527221977710724, 0.14326974749565125, 0.15126727521419525, 0.15926480293273926, 0.16726231575012207, 0.17525984346866608, 0.18325737118721008, 0.1912548840045929, 0.1992524117231369, 0.2072499394416809, 0.21524746716022491, 0.22324499487876892, 0.23124250769615173, 0.23924003541469574, 0.24723756313323975, 0.25523507595062256, 0.26323261857032776, 0.27123013138771057, 0.2792276442050934, 0.2872251868247986, 0.2952226996421814, 0.3032202124595642, 0.3112177550792694, 0.3192152678966522, 0.3272128105163574, 0.33521032333374023]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 9.0, 6.0, 10.0, 8.0, 14.0, 11.0, 14.0, 21.0, 22.0, 31.0, 33.0, 35.0, 41.0, 32.0, 43.0, 50.0, 41.0, 45.0, 53.0, 49.0, 41.0, 40.0, 50.0, 28.0, 37.0, 41.0, 26.0, 22.0, 25.0, 16.0, 24.0, 20.0, 18.0, 9.0, 10.0, 6.0, 8.0, 5.0, 1.0, 2.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11947879195213318, -0.11584986001253128, -0.11222092807292938, -0.10859199613332748, -0.10496306419372559, -0.10133413225412369, -0.09770520031452179, -0.09407627582550049, -0.090447336435318, -0.0868184044957161, -0.0831894725561142, -0.0795605406165123, -0.0759316086769104, -0.0723026767373085, -0.0686737447977066, -0.0650448203086853, -0.061415888369083405, -0.057786956429481506, -0.05415802448987961, -0.05052909255027771, -0.04690016061067581, -0.043271228671073914, -0.039642300456762314, -0.036013368517160416, -0.03238443657755852, -0.02875550463795662, -0.02512657269835472, -0.021497642621397972, -0.017868710681796074, -0.014239778742194176, -0.010610848665237427, -0.0069819167256355286, -0.0033529847860336304, 0.0002759466879069805, 0.0039048781618475914, 0.007533809170126915, 0.011162741109728813, 0.014791673049330711, 0.01842060312628746, 0.02204953506588936, 0.025678467005491257, 0.029307398945093155, 0.03293633088469505, 0.03656525909900665, 0.04019419103860855, 0.04382312297821045, 0.04745205491781235, 0.051080986857414246, 0.054709918797016144, 0.05833885073661804, 0.06196778267621994, 0.06559671461582184, 0.06922564655542374, 0.07285457849502563, 0.07648350298404694, 0.08011244237422943, 0.08374136686325073, 0.08737029880285263, 0.09099923074245453, 0.09462816268205643, 0.09825709462165833, 0.10188602656126022, 0.10551495850086212, 0.10914388298988342, 0.11277282238006592]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 14.0, 12.0, 14.0, 36.0, 43.0, 65.0, 92.0, 130.0, 202.0, 300.0, 436.0, 695.0, 1043.0, 1699.0, 2616.0, 4143.0, 6931.0, 11076.0, 18364.0, 31367.0, 55396.0, 107569.0, 243939.0, 963414.0, 1920040.0, 475295.0, 162214.0, 78347.0, 43018.0, 24729.0, 14786.0, 9139.0, 5754.0, 3760.0, 2500.0, 1644.0, 1110.0, 799.0, 524.0, 342.0, 233.0, 152.0, 97.0, 74.0, 37.0, 36.0, 17.0, 17.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1474609375, -0.1431598663330078, -0.13885879516601562, -0.13455772399902344, -0.13025665283203125, -0.12595558166503906, -0.12165451049804688, -0.11735343933105469, -0.1130523681640625, -0.10875129699707031, -0.10445022583007812, -0.10014915466308594, -0.09584808349609375, -0.09154701232910156, -0.08724594116210938, -0.08294486999511719, -0.078643798828125, -0.07434272766113281, -0.07004165649414062, -0.06574058532714844, -0.06143951416015625, -0.05713844299316406, -0.052837371826171875, -0.04853630065917969, -0.0442352294921875, -0.03993415832519531, -0.035633087158203125, -0.03133201599121094, -0.02703094482421875, -0.022729873657226562, -0.018428802490234375, -0.014127731323242188, -0.00982666015625, -0.0055255889892578125, -0.001224517822265625, 0.0030765533447265625, 0.00737762451171875, 0.011678695678710938, 0.015979766845703125, 0.020280838012695312, 0.0245819091796875, 0.028882980346679688, 0.033184051513671875, 0.03748512268066406, 0.04178619384765625, 0.04608726501464844, 0.050388336181640625, 0.05468940734863281, 0.058990478515625, 0.06329154968261719, 0.06759262084960938, 0.07189369201660156, 0.07619476318359375, 0.08049583435058594, 0.08479690551757812, 0.08909797668457031, 0.0933990478515625, 0.09770011901855469, 0.10200119018554688, 0.10630226135253906, 0.11060333251953125, 0.11490440368652344, 0.11920547485351562, 0.12350654602050781, 0.1278076171875]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 8.0, 8.0, 7.0, 6.0, 12.0, 11.0, 26.0, 26.0, 22.0, 38.0, 43.0, 35.0, 36.0, 46.0, 50.0, 48.0, 32.0, 43.0, 62.0, 38.0, 37.0, 37.0, 41.0, 39.0, 39.0, 23.0, 24.0, 26.0, 21.0, 20.0, 24.0, 14.0, 21.0, 4.0, 4.0, 8.0, 6.0, 2.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05633544921875, -0.05450773239135742, -0.052680015563964844, -0.050852298736572266, -0.04902458190917969, -0.04719686508178711, -0.04536914825439453, -0.04354143142700195, -0.041713714599609375, -0.0398859977722168, -0.03805828094482422, -0.03623056411743164, -0.03440284729003906, -0.032575130462646484, -0.030747413635253906, -0.028919696807861328, -0.02709197998046875, -0.025264263153076172, -0.023436546325683594, -0.021608829498291016, -0.019781112670898438, -0.01795339584350586, -0.01612567901611328, -0.014297962188720703, -0.012470245361328125, -0.010642528533935547, -0.008814811706542969, -0.006987094879150391, -0.0051593780517578125, -0.0033316612243652344, -0.0015039443969726562, 0.0003237724304199219, 0.0021514892578125, 0.003979206085205078, 0.005806922912597656, 0.007634639739990234, 0.009462356567382812, 0.01129007339477539, 0.013117790222167969, 0.014945507049560547, 0.016773223876953125, 0.018600940704345703, 0.02042865753173828, 0.02225637435913086, 0.024084091186523438, 0.025911808013916016, 0.027739524841308594, 0.029567241668701172, 0.03139495849609375, 0.03322267532348633, 0.035050392150878906, 0.036878108978271484, 0.03870582580566406, 0.04053354263305664, 0.04236125946044922, 0.0441889762878418, 0.046016693115234375, 0.04784440994262695, 0.04967212677001953, 0.05149984359741211, 0.05332756042480469, 0.055155277252197266, 0.056982994079589844, 0.05881071090698242, 0.060638427734375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 14.0, 18.0, 17.0, 31.0, 59.0, 67.0, 99.0, 139.0, 207.0, 331.0, 504.0, 816.0, 1217.0, 2023.0, 3215.0, 5612.0, 10077.0, 18008.0, 35167.0, 75651.0, 190772.0, 640347.0, 2169339.0, 682941.0, 199842.0, 78750.0, 35966.0, 18515.0, 9838.0, 5578.0, 3400.0, 2015.0, 1276.0, 807.0, 545.0, 350.0, 247.0, 160.0, 99.0, 84.0, 57.0, 19.0, 18.0, 9.0, 10.0, 9.0, 5.0, 7.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.1385498046875, -0.1344165802001953, -0.13028335571289062, -0.12615013122558594, -0.12201690673828125, -0.11788368225097656, -0.11375045776367188, -0.10961723327636719, -0.1054840087890625, -0.10135078430175781, -0.09721755981445312, -0.09308433532714844, -0.08895111083984375, -0.08481788635253906, -0.08068466186523438, -0.07655143737792969, -0.072418212890625, -0.06828498840332031, -0.06415176391601562, -0.06001853942871094, -0.05588531494140625, -0.05175209045410156, -0.047618865966796875, -0.04348564147949219, -0.0393524169921875, -0.03521919250488281, -0.031085968017578125, -0.026952743530273438, -0.02281951904296875, -0.018686294555664062, -0.014553070068359375, -0.010419845581054688, -0.00628662109375, -0.0021533966064453125, 0.001979827880859375, 0.0061130523681640625, 0.01024627685546875, 0.014379501342773438, 0.018512725830078125, 0.022645950317382812, 0.0267791748046875, 0.030912399291992188, 0.035045623779296875, 0.03917884826660156, 0.04331207275390625, 0.04744529724121094, 0.051578521728515625, 0.05571174621582031, 0.059844970703125, 0.06397819519042969, 0.06811141967773438, 0.07224464416503906, 0.07637786865234375, 0.08051109313964844, 0.08464431762695312, 0.08877754211425781, 0.0929107666015625, 0.09704399108886719, 0.10117721557617188, 0.10531044006347656, 0.10944366455078125, 0.11357688903808594, 0.11771011352539062, 0.12184333801269531, 0.1259765625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 4.0, 5.0, 4.0, 11.0, 8.0, 12.0, 14.0, 24.0, 30.0, 30.0, 37.0, 58.0, 77.0, 74.0, 99.0, 123.0, 141.0, 190.0, 230.0, 258.0, 366.0, 372.0, 337.0, 293.0, 267.0, 190.0, 194.0, 120.0, 118.0, 98.0, 55.0, 53.0, 43.0, 35.0, 27.0, 24.0, 16.0, 10.0, 7.0, 3.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0316162109375, -0.030617237091064453, -0.029618263244628906, -0.02861928939819336, -0.027620315551757812, -0.026621341705322266, -0.02562236785888672, -0.024623394012451172, -0.023624420166015625, -0.022625446319580078, -0.02162647247314453, -0.020627498626708984, -0.019628524780273438, -0.01862955093383789, -0.017630577087402344, -0.016631603240966797, -0.01563262939453125, -0.014633655548095703, -0.013634681701660156, -0.01263570785522461, -0.011636734008789062, -0.010637760162353516, -0.009638786315917969, -0.008639812469482422, -0.007640838623046875, -0.006641864776611328, -0.005642890930175781, -0.004643917083740234, -0.0036449432373046875, -0.0026459693908691406, -0.0016469955444335938, -0.0006480216979980469, 0.0003509521484375, 0.0013499259948730469, 0.0023488998413085938, 0.0033478736877441406, 0.0043468475341796875, 0.005345821380615234, 0.006344795227050781, 0.007343769073486328, 0.008342742919921875, 0.009341716766357422, 0.010340690612792969, 0.011339664459228516, 0.012338638305664062, 0.01333761215209961, 0.014336585998535156, 0.015335559844970703, 0.01633453369140625, 0.017333507537841797, 0.018332481384277344, 0.01933145523071289, 0.020330429077148438, 0.021329402923583984, 0.02232837677001953, 0.023327350616455078, 0.024326324462890625, 0.025325298309326172, 0.02632427215576172, 0.027323246002197266, 0.028322219848632812, 0.02932119369506836, 0.030320167541503906, 0.03131914138793945, 0.032318115234375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 11.0, 17.0, 13.0, 17.0, 32.0, 45.0, 68.0, 103.0, 162.0, 169.0, 136.0, 80.0, 48.0, 25.0, 12.0, 13.0, 8.0, 6.0, 6.0, 5.0, 1.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09861345589160919, -0.09456570446491241, -0.09051796048879623, -0.08647021651268005, -0.08242246508598328, -0.0783747136592865, -0.07432696968317032, -0.07027922570705414, -0.06623147428035736, -0.06218372657895088, -0.0581359788775444, -0.054088231176137924, -0.050040483474731445, -0.045992735773324966, -0.04194498807191849, -0.03789724037051201, -0.03384949266910553, -0.02980174496769905, -0.025753997266292572, -0.021706249564886093, -0.017658501863479614, -0.013610754162073135, -0.009563006460666656, -0.005515258759260178, -0.0014675110578536987, 0.00258023664355278, 0.006627984344959259, 0.010675732046365738, 0.014723479747772217, 0.018771227449178696, 0.022818975150585175, 0.026866722851991653, 0.030914485454559326, 0.034962233155965805, 0.039009980857372284, 0.04305772855877876, 0.04710547626018524, 0.05115322396159172, 0.0552009716629982, 0.05924871936440468, 0.06329646706581116, 0.06734421849250793, 0.07139196246862411, 0.0754397064447403, 0.07948745787143707, 0.08353520929813385, 0.08758295327425003, 0.09163069725036621, 0.09567844867706299, 0.09972620010375977, 0.10377394407987595, 0.10782168805599213, 0.1118694394826889, 0.11591719090938568, 0.11996493488550186, 0.12401267886161804, 0.12806043028831482, 0.1321081817150116, 0.13615593314170837, 0.14020366966724396, 0.14425142109394073, 0.1482991725206375, 0.1523469090461731, 0.15639466047286987, 0.16044241189956665]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 12.0, 16.0, 6.0, 23.0, 14.0, 26.0, 29.0, 28.0, 44.0, 46.0, 42.0, 42.0, 57.0, 51.0, 50.0, 52.0, 58.0, 37.0, 34.0, 51.0, 39.0, 41.0, 28.0, 27.0, 26.0, 22.0, 17.0, 17.0, 10.0, 7.0, 9.0, 6.0, 9.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07376483827829361, -0.07160855829715729, -0.06945228576660156, -0.06729600578546524, -0.06513972580432892, -0.0629834532737732, -0.06082717329263687, -0.05867089331150055, -0.056514617055654526, -0.0543583407998085, -0.05220206081867218, -0.05004578456282616, -0.04788950830698013, -0.04573322832584381, -0.04357695206999779, -0.041420675814151764, -0.03926439583301544, -0.03710811957716942, -0.034951839596033096, -0.03279556334018707, -0.0306392852216959, -0.028483007103204727, -0.026326730847358704, -0.02417045272886753, -0.022014174610376358, -0.019857896491885185, -0.017701618373394012, -0.015545342117547989, -0.013389063999056816, -0.011232785880565643, -0.009076508693397045, -0.006920231506228447, -0.004763945937156677, -0.0026076682843267918, -0.0004513906314969063, 0.0017048870213329792, 0.0038611646741628647, 0.0060174427926540375, 0.008173719979822636, 0.010329997166991234, 0.012486275285482407, 0.01464255340397358, 0.016798831522464752, 0.018955107778310776, 0.02111138589680195, 0.02326766401529312, 0.025423940271139145, 0.027580218389630318, 0.02973649650812149, 0.031892772763967514, 0.034049052745103836, 0.03620532900094986, 0.03836160898208618, 0.040517885237932205, 0.04267416149377823, 0.04483044147491455, 0.046986717730760574, 0.0491429939866066, 0.05129927396774292, 0.053455550223588943, 0.05561182647943497, 0.05776810646057129, 0.05992438271641731, 0.062080658972263336, 0.06423693895339966]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 9.0, 12.0, 17.0, 26.0, 28.0, 41.0, 91.0, 99.0, 132.0, 213.0, 289.0, 437.0, 648.0, 977.0, 1581.0, 2402.0, 3912.0, 6948.0, 13210.0, 27688.0, 68403.0, 201170.0, 411462.0, 187838.0, 64630.0, 26261.0, 12596.0, 6765.0, 3968.0, 2221.0, 1498.0, 956.0, 652.0, 396.0, 296.0, 201.0, 156.0, 96.0, 64.0, 50.0, 33.0, 29.0, 19.0, 11.0, 4.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0760498046875, -0.07363319396972656, -0.07121658325195312, -0.06879997253417969, -0.06638336181640625, -0.06396675109863281, -0.061550140380859375, -0.05913352966308594, -0.0567169189453125, -0.05430030822753906, -0.051883697509765625, -0.04946708679199219, -0.04705047607421875, -0.04463386535644531, -0.042217254638671875, -0.03980064392089844, -0.037384033203125, -0.03496742248535156, -0.032550811767578125, -0.030134201049804688, -0.02771759033203125, -0.025300979614257812, -0.022884368896484375, -0.020467758178710938, -0.0180511474609375, -0.015634536743164062, -0.013217926025390625, -0.010801315307617188, -0.00838470458984375, -0.0059680938720703125, -0.003551483154296875, -0.0011348724365234375, 0.00128173828125, 0.0036983489990234375, 0.006114959716796875, 0.008531570434570312, 0.01094818115234375, 0.013364791870117188, 0.015781402587890625, 0.018198013305664062, 0.0206146240234375, 0.023031234741210938, 0.025447845458984375, 0.027864456176757812, 0.03028106689453125, 0.03269767761230469, 0.035114288330078125, 0.03753089904785156, 0.039947509765625, 0.04236412048339844, 0.044780731201171875, 0.04719734191894531, 0.04961395263671875, 0.05203056335449219, 0.054447174072265625, 0.05686378479003906, 0.0592803955078125, 0.06169700622558594, 0.06411361694335938, 0.06653022766113281, 0.06894683837890625, 0.07136344909667969, 0.07378005981445312, 0.07619667053222656, 0.07861328125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 13.0, 10.0, 9.0, 10.0, 17.0, 27.0, 21.0, 25.0, 32.0, 20.0, 45.0, 26.0, 29.0, 46.0, 39.0, 49.0, 51.0, 48.0, 42.0, 51.0, 38.0, 29.0, 41.0, 44.0, 34.0, 30.0, 23.0, 22.0, 22.0, 22.0, 13.0, 5.0, 14.0, 9.0, 5.0, 9.0, 9.0, 6.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0640869140625, -0.062285423278808594, -0.06048393249511719, -0.05868244171142578, -0.056880950927734375, -0.05507946014404297, -0.05327796936035156, -0.051476478576660156, -0.04967498779296875, -0.047873497009277344, -0.04607200622558594, -0.04427051544189453, -0.042469024658203125, -0.04066753387451172, -0.03886604309082031, -0.037064552307128906, -0.0352630615234375, -0.033461570739746094, -0.03166007995605469, -0.02985858917236328, -0.028057098388671875, -0.02625560760498047, -0.024454116821289062, -0.022652626037597656, -0.02085113525390625, -0.019049644470214844, -0.017248153686523438, -0.015446662902832031, -0.013645172119140625, -0.011843681335449219, -0.010042190551757812, -0.008240699768066406, -0.006439208984375, -0.004637718200683594, -0.0028362274169921875, -0.0010347366333007812, 0.000766754150390625, 0.0025682449340820312, 0.0043697357177734375, 0.006171226501464844, 0.00797271728515625, 0.009774208068847656, 0.011575698852539062, 0.013377189636230469, 0.015178680419921875, 0.01698017120361328, 0.018781661987304688, 0.020583152770996094, 0.0223846435546875, 0.024186134338378906, 0.025987625122070312, 0.02778911590576172, 0.029590606689453125, 0.03139209747314453, 0.03319358825683594, 0.034995079040527344, 0.03679656982421875, 0.038598060607910156, 0.04039955139160156, 0.04220104217529297, 0.044002532958984375, 0.04580402374267578, 0.04760551452636719, 0.049407005310058594, 0.05120849609375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 9.0, 13.0, 19.0, 24.0, 36.0, 48.0, 126.0, 193.0, 350.0, 648.0, 1406.0, 3153.0, 8142.0, 28161.0, 159129.0, 695851.0, 116334.0, 22665.0, 6887.0, 2764.0, 1246.0, 572.0, 327.0, 173.0, 119.0, 51.0, 25.0, 25.0, 17.0, 13.0, 8.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.112548828125, -0.10812187194824219, -0.10369491577148438, -0.09926795959472656, -0.09484100341796875, -0.09041404724121094, -0.08598709106445312, -0.08156013488769531, -0.0771331787109375, -0.07270622253417969, -0.06827926635742188, -0.06385231018066406, -0.05942535400390625, -0.05499839782714844, -0.050571441650390625, -0.04614448547363281, -0.041717529296875, -0.03729057312011719, -0.032863616943359375, -0.028436660766601562, -0.02400970458984375, -0.019582748413085938, -0.015155792236328125, -0.010728836059570312, -0.0063018798828125, -0.0018749237060546875, 0.002552032470703125, 0.0069789886474609375, 0.01140594482421875, 0.015832901000976562, 0.020259857177734375, 0.024686813354492188, 0.02911376953125, 0.03354072570800781, 0.037967681884765625, 0.04239463806152344, 0.04682159423828125, 0.05124855041503906, 0.055675506591796875, 0.06010246276855469, 0.0645294189453125, 0.06895637512207031, 0.07338333129882812, 0.07781028747558594, 0.08223724365234375, 0.08666419982910156, 0.09109115600585938, 0.09551811218261719, 0.099945068359375, 0.10437202453613281, 0.10879898071289062, 0.11322593688964844, 0.11765289306640625, 0.12207984924316406, 0.12650680541992188, 0.1309337615966797, 0.1353607177734375, 0.1397876739501953, 0.14421463012695312, 0.14864158630371094, 0.15306854248046875, 0.15749549865722656, 0.16192245483398438, 0.1663494110107422, 0.1707763671875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 4.0, 8.0, 9.0, 8.0, 12.0, 16.0, 17.0, 20.0, 25.0, 12.0, 23.0, 40.0, 32.0, 40.0, 35.0, 39.0, 36.0, 53.0, 41.0, 46.0, 49.0, 39.0, 37.0, 39.0, 39.0, 31.0, 37.0, 15.0, 36.0, 29.0, 24.0, 20.0, 15.0, 11.0, 11.0, 8.0, 15.0, 4.0, 2.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033111572265625, -0.03195333480834961, -0.03079509735107422, -0.029636859893798828, -0.028478622436523438, -0.027320384979248047, -0.026162147521972656, -0.025003910064697266, -0.023845672607421875, -0.022687435150146484, -0.021529197692871094, -0.020370960235595703, -0.019212722778320312, -0.018054485321044922, -0.01689624786376953, -0.01573801040649414, -0.01457977294921875, -0.01342153549194336, -0.012263298034667969, -0.011105060577392578, -0.009946823120117188, -0.008788585662841797, -0.007630348205566406, -0.006472110748291016, -0.005313873291015625, -0.004155635833740234, -0.0029973983764648438, -0.0018391609191894531, -0.0006809234619140625, 0.0004773139953613281, 0.0016355514526367188, 0.0027937889099121094, 0.0039520263671875, 0.005110263824462891, 0.006268501281738281, 0.007426738739013672, 0.008584976196289062, 0.009743213653564453, 0.010901451110839844, 0.012059688568115234, 0.013217926025390625, 0.014376163482666016, 0.015534400939941406, 0.016692638397216797, 0.017850875854492188, 0.019009113311767578, 0.02016735076904297, 0.02132558822631836, 0.02248382568359375, 0.02364206314086914, 0.02480030059814453, 0.025958538055419922, 0.027116775512695312, 0.028275012969970703, 0.029433250427246094, 0.030591487884521484, 0.031749725341796875, 0.032907962799072266, 0.034066200256347656, 0.03522443771362305, 0.03638267517089844, 0.03754091262817383, 0.03869915008544922, 0.03985738754272461, 0.041015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 12.0, 16.0, 17.0, 32.0, 53.0, 66.0, 107.0, 150.0, 185.0, 305.0, 428.0, 675.0, 1048.0, 1541.0, 2378.0, 3739.0, 6614.0, 11445.0, 23100.0, 56916.0, 228253.0, 532147.0, 105162.0, 35431.0, 16308.0, 8654.0, 5035.0, 3059.0, 1919.0, 1226.0, 819.0, 532.0, 339.0, 270.0, 179.0, 132.0, 91.0, 58.0, 30.0, 23.0, 18.0, 14.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01934814453125, -0.01870870590209961, -0.01806926727294922, -0.017429828643798828, -0.016790390014648438, -0.016150951385498047, -0.015511512756347656, -0.014872074127197266, -0.014232635498046875, -0.013593196868896484, -0.012953758239746094, -0.012314319610595703, -0.011674880981445312, -0.011035442352294922, -0.010396003723144531, -0.00975656509399414, -0.00911712646484375, -0.00847768783569336, -0.007838249206542969, -0.007198810577392578, -0.0065593719482421875, -0.005919933319091797, -0.005280494689941406, -0.004641056060791016, -0.004001617431640625, -0.0033621788024902344, -0.0027227401733398438, -0.002083301544189453, -0.0014438629150390625, -0.0008044242858886719, -0.00016498565673828125, 0.0004744529724121094, 0.0011138916015625, 0.0017533302307128906, 0.0023927688598632812, 0.003032207489013672, 0.0036716461181640625, 0.004311084747314453, 0.004950523376464844, 0.005589962005615234, 0.006229400634765625, 0.006868839263916016, 0.007508277893066406, 0.008147716522216797, 0.008787155151367188, 0.009426593780517578, 0.010066032409667969, 0.01070547103881836, 0.01134490966796875, 0.01198434829711914, 0.012623786926269531, 0.013263225555419922, 0.013902664184570312, 0.014542102813720703, 0.015181541442871094, 0.015820980072021484, 0.016460418701171875, 0.017099857330322266, 0.017739295959472656, 0.018378734588623047, 0.019018173217773438, 0.019657611846923828, 0.02029705047607422, 0.02093648910522461, 0.021575927734375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 8.0, 2.0, 2.0, 2.0, 9.0, 8.0, 6.0, 11.0, 17.0, 10.0, 19.0, 27.0, 43.0, 99.0, 176.0, 212.0, 135.0, 52.0, 28.0, 23.0, 15.0, 12.0, 12.0, 9.0, 6.0, 10.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0], "bins": [-2.0742416381835938e-05, -2.0137056708335876e-05, -1.9531697034835815e-05, -1.8926337361335754e-05, -1.8320977687835693e-05, -1.7715618014335632e-05, -1.711025834083557e-05, -1.650489866733551e-05, -1.589953899383545e-05, -1.5294179320335388e-05, -1.4688819646835327e-05, -1.4083459973335266e-05, -1.3478100299835205e-05, -1.2872740626335144e-05, -1.2267380952835083e-05, -1.1662021279335022e-05, -1.1056661605834961e-05, -1.04513019323349e-05, -9.845942258834839e-06, -9.240582585334778e-06, -8.635222911834717e-06, -8.029863238334656e-06, -7.424503564834595e-06, -6.819143891334534e-06, -6.213784217834473e-06, -5.608424544334412e-06, -5.003064870834351e-06, -4.3977051973342896e-06, -3.7923455238342285e-06, -3.1869858503341675e-06, -2.5816261768341064e-06, -1.9762665033340454e-06, -1.3709068298339844e-06, -7.655471563339233e-07, -1.601874828338623e-07, 4.4517219066619873e-07, 1.0505318641662598e-06, 1.6558915376663208e-06, 2.261251211166382e-06, 2.866610884666443e-06, 3.471970558166504e-06, 4.077330231666565e-06, 4.682689905166626e-06, 5.288049578666687e-06, 5.893409252166748e-06, 6.498768925666809e-06, 7.10412859916687e-06, 7.709488272666931e-06, 8.314847946166992e-06, 8.920207619667053e-06, 9.525567293167114e-06, 1.0130926966667175e-05, 1.0736286640167236e-05, 1.1341646313667297e-05, 1.1947005987167358e-05, 1.255236566066742e-05, 1.315772533416748e-05, 1.3763085007667542e-05, 1.4368444681167603e-05, 1.4973804354667664e-05, 1.5579164028167725e-05, 1.6184523701667786e-05, 1.6789883375167847e-05, 1.7395243048667908e-05, 1.800060272216797e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 7.0, 9.0, 18.0, 17.0, 27.0, 24.0, 38.0, 56.0, 77.0, 113.0, 173.0, 249.0, 399.0, 651.0, 1088.0, 1965.0, 3753.0, 7522.0, 17010.0, 42900.0, 144181.0, 543333.0, 193294.0, 52994.0, 20022.0, 8930.0, 4243.0, 2139.0, 1249.0, 683.0, 428.0, 269.0, 215.0, 123.0, 104.0, 58.0, 51.0, 33.0, 30.0, 24.0, 10.0, 12.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01415252685546875, -0.013674378395080566, -0.013196229934692383, -0.0127180814743042, -0.012239933013916016, -0.011761784553527832, -0.011283636093139648, -0.010805487632751465, -0.010327339172363281, -0.009849190711975098, -0.009371042251586914, -0.00889289379119873, -0.008414745330810547, -0.007936596870422363, -0.00745844841003418, -0.006980299949645996, -0.0065021514892578125, -0.006024003028869629, -0.005545854568481445, -0.005067706108093262, -0.004589557647705078, -0.0041114091873168945, -0.003633260726928711, -0.0031551122665405273, -0.0026769638061523438, -0.00219881534576416, -0.0017206668853759766, -0.001242518424987793, -0.0007643699645996094, -0.0002862215042114258, 0.0001919269561767578, 0.0006700754165649414, 0.001148223876953125, 0.0016263723373413086, 0.002104520797729492, 0.0025826692581176758, 0.0030608177185058594, 0.003538966178894043, 0.0040171146392822266, 0.00449526309967041, 0.004973411560058594, 0.005451560020446777, 0.005929708480834961, 0.0064078569412231445, 0.006886005401611328, 0.007364153861999512, 0.007842302322387695, 0.008320450782775879, 0.008798599243164062, 0.009276747703552246, 0.00975489616394043, 0.010233044624328613, 0.010711193084716797, 0.01118934154510498, 0.011667490005493164, 0.012145638465881348, 0.012623786926269531, 0.013101935386657715, 0.013580083847045898, 0.014058232307434082, 0.014536380767822266, 0.01501452922821045, 0.015492677688598633, 0.015970826148986816, 0.016448974609375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 7.0, 0.0, 6.0, 11.0, 10.0, 9.0, 13.0, 10.0, 20.0, 24.0, 29.0, 28.0, 49.0, 43.0, 69.0, 78.0, 78.0, 67.0, 71.0, 75.0, 50.0, 46.0, 31.0, 37.0, 26.0, 14.0, 22.0, 14.0, 16.0, 8.0, 8.0, 7.0, 9.0, 8.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.003814697265625, -0.003693819046020508, -0.0035729408264160156, -0.0034520626068115234, -0.0033311843872070312, -0.003210306167602539, -0.003089427947998047, -0.0029685497283935547, -0.0028476715087890625, -0.0027267932891845703, -0.002605915069580078, -0.002485036849975586, -0.0023641586303710938, -0.0022432804107666016, -0.0021224021911621094, -0.002001523971557617, -0.001880645751953125, -0.0017597675323486328, -0.0016388893127441406, -0.0015180110931396484, -0.0013971328735351562, -0.001276254653930664, -0.0011553764343261719, -0.0010344982147216797, -0.0009136199951171875, -0.0007927417755126953, -0.0006718635559082031, -0.0005509853363037109, -0.00043010711669921875, -0.00030922889709472656, -0.00018835067749023438, -6.747245788574219e-05, 5.340576171875e-05, 0.0001742839813232422, 0.0002951622009277344, 0.00041604042053222656, 0.0005369186401367188, 0.0006577968597412109, 0.0007786750793457031, 0.0008995532989501953, 0.0010204315185546875, 0.0011413097381591797, 0.0012621879577636719, 0.001383066177368164, 0.0015039443969726562, 0.0016248226165771484, 0.0017457008361816406, 0.0018665790557861328, 0.001987457275390625, 0.002108335494995117, 0.0022292137145996094, 0.0023500919342041016, 0.0024709701538085938, 0.002591848373413086, 0.002712726593017578, 0.0028336048126220703, 0.0029544830322265625, 0.0030753612518310547, 0.003196239471435547, 0.003317117691040039, 0.0034379959106445312, 0.0035588741302490234, 0.0036797523498535156, 0.003800630569458008, 0.0039215087890625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 3.0, 18.0, 24.0, 23.0, 35.0, 48.0, 82.0, 149.0, 185.0, 157.0, 89.0, 66.0, 35.0, 22.0, 14.0, 9.0, 6.0, 7.0, 4.0, 7.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08575208485126495, -0.0818125531077385, -0.07787302881479263, -0.07393349707126617, -0.06999396532773972, -0.06605443358421326, -0.062114909291267395, -0.058175377547740936, -0.054235849529504776, -0.050296321511268616, -0.04635678976774216, -0.042417261749506, -0.038477733731269836, -0.03453820198774338, -0.030598673969507217, -0.026659144088625908, -0.0227196142077446, -0.01878008432686329, -0.014840555377304554, -0.010901026427745819, -0.00696149654686451, -0.0030219666659832, 0.0009175613522529602, 0.00485709123313427, 0.00879662111401558, 0.012736150994896889, 0.016675680875778198, 0.02061520889401436, 0.024554738774895668, 0.028494268655776978, 0.03243379667401314, 0.0363733246922493, 0.04031285643577576, 0.04425238445401192, 0.048191916197538376, 0.052131444215774536, 0.056070975959300995, 0.060010503977537155, 0.06395003199577332, 0.06788956373929977, 0.07182909548282623, 0.07576862722635269, 0.07970815151929855, 0.08364768326282501, 0.08758721500635147, 0.09152674674987793, 0.09546627104282379, 0.09940580278635025, 0.10334532707929611, 0.10728485882282257, 0.11122438311576843, 0.11516391485929489, 0.11910344660282135, 0.12304297089576721, 0.12698251008987427, 0.13092203438282013, 0.134861558675766, 0.13880108296871185, 0.1427406221628189, 0.14668014645576477, 0.15061967074871063, 0.1545592099428177, 0.15849873423576355, 0.1624382585287094, 0.16637779772281647]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 8.0, 8.0, 15.0, 11.0, 18.0, 15.0, 27.0, 25.0, 34.0, 42.0, 43.0, 42.0, 42.0, 53.0, 54.0, 45.0, 58.0, 47.0, 49.0, 38.0, 50.0, 33.0, 39.0, 29.0, 30.0, 23.0, 24.0, 20.0, 12.0, 13.0, 11.0, 6.0, 8.0, 5.0, 8.0, 8.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06840439885854721, -0.06641142070293427, -0.06441844254732132, -0.062425464391708374, -0.06043248623609543, -0.05843950808048248, -0.05644652992486954, -0.05445355176925659, -0.052460573613643646, -0.0504675954580307, -0.048474617302417755, -0.04648163914680481, -0.044488660991191864, -0.04249568283557892, -0.04050270467996597, -0.03850972652435303, -0.03651674464344978, -0.03452376648783684, -0.03253078833222389, -0.030537810176610947, -0.028544832020998, -0.026551853865385056, -0.02455887384712696, -0.022565895691514015, -0.02057291753590107, -0.018579939380288124, -0.01658696122467518, -0.014593982137739658, -0.012601003982126713, -0.010608025826513767, -0.008615046739578247, -0.0066220685839653015, -0.0046290867030620575, -0.0026361083146184683, -0.0006431299261748791, 0.0013498486950993538, 0.0033428268507122993, 0.005335805006325245, 0.007328784093260765, 0.00932176224887371, 0.011314740404486656, 0.013307718560099602, 0.015300696715712547, 0.017293676733970642, 0.019286654889583588, 0.021279633045196533, 0.02327261120080948, 0.025265589356422424, 0.02725856751203537, 0.029251545667648315, 0.03124452382326126, 0.03323750197887421, 0.03523048013448715, 0.0372234582901001, 0.03921643644571304, 0.04120941460132599, 0.043202392756938934, 0.04519537091255188, 0.047188349068164825, 0.04918132722377777, 0.05117430537939072, 0.05316728353500366, 0.05516026169061661, 0.05715323984622955, 0.0591462217271328]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 5.0, 8.0, 11.0, 21.0, 27.0, 30.0, 59.0, 70.0, 103.0, 155.0, 228.0, 316.0, 415.0, 645.0, 870.0, 1393.0, 1911.0, 2788.0, 4272.0, 6325.0, 9388.0, 14001.0, 21975.0, 34797.0, 55906.0, 93017.0, 158534.0, 221935.0, 163605.0, 96167.0, 57601.0, 35423.0, 22736.0, 14444.0, 9470.0, 6381.0, 4282.0, 2816.0, 1970.0, 1381.0, 930.0, 647.0, 442.0, 296.0, 226.0, 175.0, 107.0, 76.0, 66.0, 39.0, 29.0, 11.0, 12.0, 11.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.0836181640625, -0.08096599578857422, -0.07831382751464844, -0.07566165924072266, -0.07300949096679688, -0.0703573226928711, -0.06770515441894531, -0.06505298614501953, -0.06240081787109375, -0.05974864959716797, -0.05709648132324219, -0.054444313049316406, -0.051792144775390625, -0.049139976501464844, -0.04648780822753906, -0.04383563995361328, -0.0411834716796875, -0.03853130340576172, -0.03587913513183594, -0.033226966857910156, -0.030574798583984375, -0.027922630310058594, -0.025270462036132812, -0.02261829376220703, -0.01996612548828125, -0.01731395721435547, -0.014661788940429688, -0.012009620666503906, -0.009357452392578125, -0.006705284118652344, -0.0040531158447265625, -0.0014009475708007812, 0.001251220703125, 0.0039033889770507812, 0.0065555572509765625, 0.009207725524902344, 0.011859893798828125, 0.014512062072753906, 0.017164230346679688, 0.01981639862060547, 0.02246856689453125, 0.02512073516845703, 0.027772903442382812, 0.030425071716308594, 0.033077239990234375, 0.035729408264160156, 0.03838157653808594, 0.04103374481201172, 0.0436859130859375, 0.04633808135986328, 0.04899024963378906, 0.051642417907714844, 0.054294586181640625, 0.056946754455566406, 0.05959892272949219, 0.06225109100341797, 0.06490325927734375, 0.06755542755126953, 0.07020759582519531, 0.0728597640991211, 0.07551193237304688, 0.07816410064697266, 0.08081626892089844, 0.08346843719482422, 0.08612060546875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 12.0, 9.0, 15.0, 13.0, 13.0, 25.0, 28.0, 38.0, 31.0, 45.0, 47.0, 45.0, 41.0, 52.0, 50.0, 55.0, 61.0, 51.0, 41.0, 40.0, 35.0, 44.0, 24.0, 33.0, 22.0, 23.0, 25.0, 15.0, 12.0, 5.0, 8.0, 10.0, 6.0, 7.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05157470703125, -0.05003643035888672, -0.04849815368652344, -0.046959877014160156, -0.045421600341796875, -0.043883323669433594, -0.04234504699707031, -0.04080677032470703, -0.03926849365234375, -0.03773021697998047, -0.03619194030761719, -0.034653663635253906, -0.033115386962890625, -0.031577110290527344, -0.030038833618164062, -0.02850055694580078, -0.0269622802734375, -0.02542400360107422, -0.023885726928710938, -0.022347450256347656, -0.020809173583984375, -0.019270896911621094, -0.017732620239257812, -0.01619434356689453, -0.01465606689453125, -0.013117790222167969, -0.011579513549804688, -0.010041236877441406, -0.008502960205078125, -0.006964683532714844, -0.0054264068603515625, -0.0038881301879882812, -0.002349853515625, -0.0008115768432617188, 0.0007266998291015625, 0.0022649765014648438, 0.003803253173828125, 0.005341529846191406, 0.0068798065185546875, 0.008418083190917969, 0.00995635986328125, 0.011494636535644531, 0.013032913208007812, 0.014571189880371094, 0.016109466552734375, 0.017647743225097656, 0.019186019897460938, 0.02072429656982422, 0.0222625732421875, 0.02380084991455078, 0.025339126586914062, 0.026877403259277344, 0.028415679931640625, 0.029953956604003906, 0.03149223327636719, 0.03303050994873047, 0.03456878662109375, 0.03610706329345703, 0.03764533996582031, 0.039183616638183594, 0.040721893310546875, 0.042260169982910156, 0.04379844665527344, 0.04533672332763672, 0.046875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 10.0, 10.0, 13.0, 26.0, 41.0, 64.0, 69.0, 108.0, 146.0, 237.0, 339.0, 454.0, 677.0, 950.0, 1356.0, 1968.0, 2932.0, 4289.0, 6811.0, 10448.0, 16964.0, 29049.0, 51176.0, 95896.0, 190554.0, 276080.0, 162244.0, 82198.0, 44737.0, 25369.0, 15267.0, 9479.0, 5971.0, 3957.0, 2672.0, 1864.0, 1206.0, 919.0, 598.0, 450.0, 294.0, 213.0, 143.0, 96.0, 80.0, 51.0, 33.0, 19.0, 13.0, 8.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.08502197265625, -0.0823965072631836, -0.07977104187011719, -0.07714557647705078, -0.07452011108398438, -0.07189464569091797, -0.06926918029785156, -0.06664371490478516, -0.06401824951171875, -0.061392784118652344, -0.05876731872558594, -0.05614185333251953, -0.053516387939453125, -0.05089092254638672, -0.04826545715332031, -0.045639991760253906, -0.0430145263671875, -0.040389060974121094, -0.03776359558105469, -0.03513813018798828, -0.032512664794921875, -0.02988719940185547, -0.027261734008789062, -0.024636268615722656, -0.02201080322265625, -0.019385337829589844, -0.016759872436523438, -0.014134407043457031, -0.011508941650390625, -0.008883476257324219, -0.0062580108642578125, -0.0036325454711914062, -0.001007080078125, 0.0016183853149414062, 0.0042438507080078125, 0.006869316101074219, 0.009494781494140625, 0.012120246887207031, 0.014745712280273438, 0.017371177673339844, 0.01999664306640625, 0.022622108459472656, 0.025247573852539062, 0.02787303924560547, 0.030498504638671875, 0.03312397003173828, 0.03574943542480469, 0.038374900817871094, 0.0410003662109375, 0.043625831604003906, 0.04625129699707031, 0.04887676239013672, 0.051502227783203125, 0.05412769317626953, 0.05675315856933594, 0.059378623962402344, 0.06200408935546875, 0.06462955474853516, 0.06725502014160156, 0.06988048553466797, 0.07250595092773438, 0.07513141632080078, 0.07775688171386719, 0.0803823471069336, 0.0830078125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 9.0, 10.0, 9.0, 14.0, 15.0, 13.0, 22.0, 21.0, 20.0, 30.0, 30.0, 35.0, 28.0, 30.0, 31.0, 48.0, 35.0, 35.0, 40.0, 40.0, 33.0, 34.0, 38.0, 37.0, 34.0, 31.0, 25.0, 33.0, 24.0, 24.0, 22.0, 20.0, 17.0, 21.0, 11.0, 15.0, 11.0, 8.0, 9.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.021484375, -0.020735502243041992, -0.019986629486083984, -0.019237756729125977, -0.01848888397216797, -0.01774001121520996, -0.016991138458251953, -0.016242265701293945, -0.015493392944335938, -0.01474452018737793, -0.013995647430419922, -0.013246774673461914, -0.012497901916503906, -0.011749029159545898, -0.01100015640258789, -0.010251283645629883, -0.009502410888671875, -0.008753538131713867, -0.00800466537475586, -0.0072557926177978516, -0.006506919860839844, -0.005758047103881836, -0.005009174346923828, -0.00426030158996582, -0.0035114288330078125, -0.0027625560760498047, -0.002013683319091797, -0.001264810562133789, -0.0005159378051757812, 0.00023293495178222656, 0.0009818077087402344, 0.0017306804656982422, 0.00247955322265625, 0.003228425979614258, 0.003977298736572266, 0.0047261714935302734, 0.005475044250488281, 0.006223917007446289, 0.006972789764404297, 0.007721662521362305, 0.008470535278320312, 0.00921940803527832, 0.009968280792236328, 0.010717153549194336, 0.011466026306152344, 0.012214899063110352, 0.01296377182006836, 0.013712644577026367, 0.014461517333984375, 0.015210390090942383, 0.01595926284790039, 0.0167081356048584, 0.017457008361816406, 0.018205881118774414, 0.018954753875732422, 0.01970362663269043, 0.020452499389648438, 0.021201372146606445, 0.021950244903564453, 0.02269911766052246, 0.02344799041748047, 0.024196863174438477, 0.024945735931396484, 0.025694608688354492, 0.0264434814453125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 9.0, 9.0, 10.0, 15.0, 30.0, 42.0, 44.0, 70.0, 111.0, 192.0, 274.0, 445.0, 672.0, 1161.0, 1999.0, 3697.0, 7488.0, 17779.0, 59196.0, 894889.0, 35133.0, 12594.0, 5572.0, 2920.0, 1621.0, 923.0, 577.0, 377.0, 228.0, 162.0, 99.0, 84.0, 42.0, 20.0, 20.0, 17.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.107421875, -0.10429096221923828, -0.10116004943847656, -0.09802913665771484, -0.09489822387695312, -0.0917673110961914, -0.08863639831542969, -0.08550548553466797, -0.08237457275390625, -0.07924365997314453, -0.07611274719238281, -0.0729818344116211, -0.06985092163085938, -0.06672000885009766, -0.06358909606933594, -0.06045818328857422, -0.0573272705078125, -0.05419635772705078, -0.05106544494628906, -0.047934532165527344, -0.044803619384765625, -0.041672706604003906, -0.03854179382324219, -0.03541088104248047, -0.03227996826171875, -0.02914905548095703, -0.026018142700195312, -0.022887229919433594, -0.019756317138671875, -0.016625404357910156, -0.013494491577148438, -0.010363578796386719, -0.007232666015625, -0.004101753234863281, -0.0009708404541015625, 0.0021600723266601562, 0.005290985107421875, 0.008421897888183594, 0.011552810668945312, 0.014683723449707031, 0.01781463623046875, 0.02094554901123047, 0.024076461791992188, 0.027207374572753906, 0.030338287353515625, 0.033469200134277344, 0.03660011291503906, 0.03973102569580078, 0.0428619384765625, 0.04599285125732422, 0.04912376403808594, 0.052254676818847656, 0.055385589599609375, 0.058516502380371094, 0.06164741516113281, 0.06477832794189453, 0.06790924072265625, 0.07104015350341797, 0.07417106628417969, 0.0773019790649414, 0.08043289184570312, 0.08356380462646484, 0.08669471740722656, 0.08982563018798828, 0.09295654296875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 9.0, 11.0, 6.0, 7.0, 19.0, 22.0, 33.0, 21.0, 25.0, 39.0, 40.0, 61.0, 93.0, 65.0, 73.0, 67.0, 60.0, 92.0, 43.0, 35.0, 34.0, 22.0, 26.0, 17.0, 12.0, 13.0, 7.0, 7.0, 7.0, 10.0, 3.0, 1.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.5299530029296875e-06, -4.3995678424835205e-06, -4.2691826820373535e-06, -4.1387975215911865e-06, -4.0084123611450195e-06, -3.8780272006988525e-06, -3.7476420402526855e-06, -3.6172568798065186e-06, -3.4868717193603516e-06, -3.3564865589141846e-06, -3.2261013984680176e-06, -3.0957162380218506e-06, -2.9653310775756836e-06, -2.8349459171295166e-06, -2.7045607566833496e-06, -2.5741755962371826e-06, -2.4437904357910156e-06, -2.3134052753448486e-06, -2.1830201148986816e-06, -2.0526349544525146e-06, -1.9222497940063477e-06, -1.7918646335601807e-06, -1.6614794731140137e-06, -1.5310943126678467e-06, -1.4007091522216797e-06, -1.2703239917755127e-06, -1.1399388313293457e-06, -1.0095536708831787e-06, -8.791685104370117e-07, -7.487833499908447e-07, -6.183981895446777e-07, -4.880130290985107e-07, -3.5762786865234375e-07, -2.2724270820617676e-07, -9.685754776000977e-08, 3.3527612686157227e-08, 1.6391277313232422e-07, 2.942979335784912e-07, 4.246830940246582e-07, 5.550682544708252e-07, 6.854534149169922e-07, 8.158385753631592e-07, 9.462237358093262e-07, 1.0766088962554932e-06, 1.2069940567016602e-06, 1.3373792171478271e-06, 1.4677643775939941e-06, 1.5981495380401611e-06, 1.7285346984863281e-06, 1.8589198589324951e-06, 1.989305019378662e-06, 2.119690179824829e-06, 2.250075340270996e-06, 2.380460500717163e-06, 2.51084566116333e-06, 2.641230821609497e-06, 2.771615982055664e-06, 2.902001142501831e-06, 3.032386302947998e-06, 3.162771463394165e-06, 3.293156623840332e-06, 3.423541784286499e-06, 3.553926944732666e-06, 3.684312105178833e-06, 3.814697265625e-06]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 14.0, 18.0, 21.0, 24.0, 50.0, 62.0, 78.0, 110.0, 176.0, 236.0, 343.0, 522.0, 734.0, 1086.0, 1713.0, 2709.0, 4652.0, 8694.0, 19425.0, 64658.0, 881145.0, 33017.0, 12611.0, 6432.0, 3672.0, 2162.0, 1311.0, 910.0, 584.0, 400.0, 302.0, 174.0, 145.0, 107.0, 69.0, 49.0, 35.0, 29.0, 17.0, 10.0, 17.0, 11.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080810546875, -0.07822513580322266, -0.07563972473144531, -0.07305431365966797, -0.07046890258789062, -0.06788349151611328, -0.06529808044433594, -0.0627126693725586, -0.06012725830078125, -0.057541847229003906, -0.05495643615722656, -0.05237102508544922, -0.049785614013671875, -0.04720020294189453, -0.04461479187011719, -0.042029380798339844, -0.0394439697265625, -0.036858558654785156, -0.03427314758300781, -0.03168773651123047, -0.029102325439453125, -0.02651691436767578, -0.023931503295898438, -0.021346092224121094, -0.01876068115234375, -0.016175270080566406, -0.013589859008789062, -0.011004447937011719, -0.008419036865234375, -0.005833625793457031, -0.0032482147216796875, -0.0006628036499023438, 0.001922607421875, 0.004508018493652344, 0.0070934295654296875, 0.009678840637207031, 0.012264251708984375, 0.014849662780761719, 0.017435073852539062, 0.020020484924316406, 0.02260589599609375, 0.025191307067871094, 0.027776718139648438, 0.03036212921142578, 0.032947540283203125, 0.03553295135498047, 0.03811836242675781, 0.040703773498535156, 0.0432891845703125, 0.045874595642089844, 0.04846000671386719, 0.05104541778564453, 0.053630828857421875, 0.05621623992919922, 0.05880165100097656, 0.061387062072753906, 0.06397247314453125, 0.0665578842163086, 0.06914329528808594, 0.07172870635986328, 0.07431411743164062, 0.07689952850341797, 0.07948493957519531, 0.08207035064697266, 0.08465576171875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 4.0, 6.0, 10.0, 8.0, 13.0, 14.0, 16.0, 19.0, 24.0, 721.0, 19.0, 29.0, 22.0, 16.0, 8.0, 8.0, 9.0, 3.0, 5.0, 5.0, 3.0, 0.0, 7.0, 3.0, 1.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01934814453125, -0.01872849464416504, -0.018108844757080078, -0.017489194869995117, -0.016869544982910156, -0.016249895095825195, -0.015630245208740234, -0.015010595321655273, -0.014390945434570312, -0.013771295547485352, -0.01315164566040039, -0.01253199577331543, -0.011912345886230469, -0.011292695999145508, -0.010673046112060547, -0.010053396224975586, -0.009433746337890625, -0.008814096450805664, -0.008194446563720703, -0.007574796676635742, -0.006955146789550781, -0.00633549690246582, -0.005715847015380859, -0.0050961971282958984, -0.0044765472412109375, -0.0038568973541259766, -0.0032372474670410156, -0.0026175975799560547, -0.0019979476928710938, -0.0013782978057861328, -0.0007586479187011719, -0.00013899803161621094, 0.00048065185546875, 0.001100301742553711, 0.0017199516296386719, 0.002339601516723633, 0.0029592514038085938, 0.0035789012908935547, 0.004198551177978516, 0.0048182010650634766, 0.0054378509521484375, 0.0060575008392333984, 0.006677150726318359, 0.00729680061340332, 0.007916450500488281, 0.008536100387573242, 0.009155750274658203, 0.009775400161743164, 0.010395050048828125, 0.011014699935913086, 0.011634349822998047, 0.012253999710083008, 0.012873649597167969, 0.01349329948425293, 0.01411294937133789, 0.014732599258422852, 0.015352249145507812, 0.015971899032592773, 0.016591548919677734, 0.017211198806762695, 0.017830848693847656, 0.018450498580932617, 0.019070148468017578, 0.01968979835510254, 0.0203094482421875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 10.0, 12.0, 16.0, 23.0, 46.0, 56.0, 94.0, 141.0, 234.0, 177.0, 76.0, 37.0, 22.0, 14.0, 14.0, 7.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09046808630228043, -0.08663983643054962, -0.08281158655881882, -0.07898333668708801, -0.07515507936477661, -0.0713268369436264, -0.067498579621315, -0.0636703297495842, -0.059842079877853394, -0.05601383000612259, -0.052185580134391785, -0.04835732653737068, -0.04452907666563988, -0.04070082679390907, -0.03687257319688797, -0.033044323325157166, -0.02921607345342636, -0.025387823581695557, -0.021559571847319603, -0.01773132011294365, -0.013903070241212845, -0.01007482036948204, -0.006246568635106087, -0.002418316900730133, 0.0014099329710006714, 0.0052381837740540504, 0.00906643457710743, 0.012894685380160809, 0.016722936183214188, 0.020551186054944992, 0.024379437789320946, 0.0282076895236969, 0.03203593194484711, 0.03586418181657791, 0.039692431688308716, 0.04352068528532982, 0.04734893515706062, 0.05117718502879143, 0.05500543862581253, 0.058833688497543335, 0.06266193836927414, 0.06649018824100494, 0.07031843811273575, 0.07414668798446655, 0.07797494530677795, 0.08180318772792816, 0.08563144505023956, 0.08945969492197037, 0.09328794479370117, 0.09711619466543198, 0.10094444453716278, 0.10477269440889359, 0.10860094428062439, 0.11242920160293579, 0.1162574514746666, 0.1200857013463974, 0.1239139512181282, 0.127742201089859, 0.1315704584121704, 0.13539870083332062, 0.13922695815563202, 0.14305520057678223, 0.14688345789909363, 0.15071171522140503, 0.15453995764255524]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 0.0, 5.0, 9.0, 5.0, 11.0, 16.0, 16.0, 18.0, 24.0, 22.0, 40.0, 36.0, 46.0, 39.0, 49.0, 56.0, 50.0, 60.0, 47.0, 55.0, 52.0, 49.0, 39.0, 38.0, 45.0, 23.0, 28.0, 20.0, 20.0, 15.0, 17.0, 13.0, 10.0, 10.0, 3.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0564868189394474, -0.05477957800030708, -0.05307233706116676, -0.051365096122026443, -0.049657855182886124, -0.047950614243745804, -0.046243373304605484, -0.044536132365465164, -0.042828891426324844, -0.041121650487184525, -0.039414409548044205, -0.037707168608903885, -0.035999927669763565, -0.034292686730623245, -0.032585445791482925, -0.030878204852342606, -0.029170963913202286, -0.027463722974061966, -0.025756482034921646, -0.024049241095781326, -0.022342000156641006, -0.020634759217500687, -0.018927518278360367, -0.017220277339220047, -0.015513036400079727, -0.013805795460939407, -0.012098554521799088, -0.010391313582658768, -0.008684072643518448, -0.006976831704378128, -0.005269590765237808, -0.0035623498260974884, -0.0018551051616668701, -0.0001478642225265503, 0.0015593767166137695, 0.0032666176557540894, 0.004973858594894409, 0.006681099534034729, 0.008388340473175049, 0.010095581412315369, 0.011802822351455688, 0.013510063290596008, 0.015217304229736328, 0.016924545168876648, 0.018631786108016968, 0.020339027047157288, 0.022046267986297607, 0.023753508925437927, 0.025460749864578247, 0.027167990803718567, 0.028875231742858887, 0.030582472681999207, 0.032289713621139526, 0.033996954560279846, 0.035704195499420166, 0.037411436438560486, 0.039118677377700806, 0.040825918316841125, 0.042533159255981445, 0.044240400195121765, 0.045947641134262085, 0.047654882073402405, 0.049362123012542725, 0.051069363951683044, 0.052776604890823364]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 12.0, 7.0, 8.0, 18.0, 13.0, 34.0, 24.0, 51.0, 57.0, 82.0, 131.0, 188.0, 264.0, 357.0, 555.0, 874.0, 1220.0, 1821.0, 2780.0, 4247.0, 6652.0, 10640.0, 17454.0, 29745.0, 53666.0, 104033.0, 238657.0, 825802.0, 1901176.0, 592968.0, 195740.0, 88783.0, 46040.0, 26008.0, 15915.0, 9870.0, 6474.0, 4186.0, 2773.0, 1851.0, 1136.0, 730.0, 473.0, 294.0, 153.0, 125.0, 76.0, 49.0, 29.0, 18.0, 9.0, 6.0, 2.0, 1.0], "bins": [-0.07354736328125, -0.07163143157958984, -0.06971549987792969, -0.06779956817626953, -0.06588363647460938, -0.06396770477294922, -0.06205177307128906, -0.060135841369628906, -0.05821990966796875, -0.056303977966308594, -0.05438804626464844, -0.05247211456298828, -0.050556182861328125, -0.04864025115966797, -0.04672431945800781, -0.044808387756347656, -0.0428924560546875, -0.040976524353027344, -0.03906059265136719, -0.03714466094970703, -0.035228729248046875, -0.03331279754638672, -0.03139686584472656, -0.029480934143066406, -0.02756500244140625, -0.025649070739746094, -0.023733139038085938, -0.02181720733642578, -0.019901275634765625, -0.01798534393310547, -0.016069412231445312, -0.014153480529785156, -0.012237548828125, -0.010321617126464844, -0.008405685424804688, -0.006489753723144531, -0.004573822021484375, -0.0026578903198242188, -0.0007419586181640625, 0.0011739730834960938, 0.00308990478515625, 0.005005836486816406, 0.0069217681884765625, 0.008837699890136719, 0.010753631591796875, 0.012669563293457031, 0.014585494995117188, 0.016501426696777344, 0.0184173583984375, 0.020333290100097656, 0.022249221801757812, 0.02416515350341797, 0.026081085205078125, 0.02799701690673828, 0.029912948608398438, 0.031828880310058594, 0.03374481201171875, 0.035660743713378906, 0.03757667541503906, 0.03949260711669922, 0.041408538818359375, 0.04332447052001953, 0.04524040222167969, 0.047156333923339844, 0.049072265625]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 4.0, 10.0, 7.0, 13.0, 17.0, 14.0, 14.0, 21.0, 30.0, 37.0, 28.0, 40.0, 49.0, 50.0, 50.0, 57.0, 45.0, 53.0, 62.0, 47.0, 54.0, 42.0, 46.0, 34.0, 28.0, 21.0, 25.0, 17.0, 16.0, 15.0, 12.0, 13.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.035736083984375, -0.03474855422973633, -0.033761024475097656, -0.032773494720458984, -0.03178596496582031, -0.03079843521118164, -0.02981090545654297, -0.028823375701904297, -0.027835845947265625, -0.026848316192626953, -0.02586078643798828, -0.02487325668334961, -0.023885726928710938, -0.022898197174072266, -0.021910667419433594, -0.020923137664794922, -0.01993560791015625, -0.018948078155517578, -0.017960548400878906, -0.016973018646240234, -0.015985488891601562, -0.01499795913696289, -0.014010429382324219, -0.013022899627685547, -0.012035369873046875, -0.011047840118408203, -0.010060310363769531, -0.00907278060913086, -0.008085250854492188, -0.007097721099853516, -0.006110191345214844, -0.005122661590576172, -0.0041351318359375, -0.003147602081298828, -0.0021600723266601562, -0.0011725425720214844, -0.0001850128173828125, 0.0008025169372558594, 0.0017900466918945312, 0.002777576446533203, 0.003765106201171875, 0.004752635955810547, 0.005740165710449219, 0.006727695465087891, 0.0077152252197265625, 0.008702754974365234, 0.009690284729003906, 0.010677814483642578, 0.01166534423828125, 0.012652873992919922, 0.013640403747558594, 0.014627933502197266, 0.015615463256835938, 0.01660299301147461, 0.01759052276611328, 0.018578052520751953, 0.019565582275390625, 0.020553112030029297, 0.02154064178466797, 0.02252817153930664, 0.023515701293945312, 0.024503231048583984, 0.025490760803222656, 0.026478290557861328, 0.0274658203125]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 8.0, 15.0, 17.0, 13.0, 31.0, 40.0, 57.0, 70.0, 115.0, 139.0, 239.0, 263.0, 421.0, 641.0, 932.0, 1338.0, 2134.0, 3190.0, 5177.0, 8273.0, 14068.0, 24780.0, 46221.0, 93407.0, 209784.0, 579303.0, 1752486.0, 900569.0, 294286.0, 122264.0, 58607.0, 30471.0, 17230.0, 9907.0, 6281.0, 3898.0, 2569.0, 1593.0, 1082.0, 729.0, 511.0, 340.0, 215.0, 175.0, 136.0, 83.0, 45.0, 42.0, 32.0, 15.0, 13.0, 11.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0], "bins": [-0.0543212890625, -0.052659034729003906, -0.05099678039550781, -0.04933452606201172, -0.047672271728515625, -0.04601001739501953, -0.04434776306152344, -0.042685508728027344, -0.04102325439453125, -0.039361000061035156, -0.03769874572753906, -0.03603649139404297, -0.034374237060546875, -0.03271198272705078, -0.031049728393554688, -0.029387474060058594, -0.0277252197265625, -0.026062965393066406, -0.024400711059570312, -0.02273845672607422, -0.021076202392578125, -0.01941394805908203, -0.017751693725585938, -0.016089439392089844, -0.01442718505859375, -0.012764930725097656, -0.011102676391601562, -0.009440422058105469, -0.007778167724609375, -0.006115913391113281, -0.0044536590576171875, -0.0027914047241210938, -0.001129150390625, 0.0005331039428710938, 0.0021953582763671875, 0.0038576126098632812, 0.005519866943359375, 0.007182121276855469, 0.008844375610351562, 0.010506629943847656, 0.01216888427734375, 0.013831138610839844, 0.015493392944335938, 0.01715564727783203, 0.018817901611328125, 0.02048015594482422, 0.022142410278320312, 0.023804664611816406, 0.0254669189453125, 0.027129173278808594, 0.028791427612304688, 0.03045368194580078, 0.032115936279296875, 0.03377819061279297, 0.03544044494628906, 0.037102699279785156, 0.03876495361328125, 0.040427207946777344, 0.04208946228027344, 0.04375171661376953, 0.045413970947265625, 0.04707622528076172, 0.04873847961425781, 0.050400733947753906, 0.05206298828125]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 8.0, 8.0, 9.0, 22.0, 12.0, 29.0, 25.0, 33.0, 44.0, 67.0, 61.0, 98.0, 104.0, 124.0, 128.0, 149.0, 226.0, 271.0, 295.0, 294.0, 337.0, 313.0, 259.0, 210.0, 194.0, 159.0, 113.0, 113.0, 73.0, 69.0, 38.0, 38.0, 36.0, 19.0, 11.0, 17.0, 11.0, 7.0, 10.0, 5.0, 6.0, 4.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.01385498046875, -0.013395071029663086, -0.012935161590576172, -0.012475252151489258, -0.012015342712402344, -0.01155543327331543, -0.011095523834228516, -0.010635614395141602, -0.010175704956054688, -0.009715795516967773, -0.00925588607788086, -0.008795976638793945, -0.008336067199707031, -0.007876157760620117, -0.007416248321533203, -0.006956338882446289, -0.006496429443359375, -0.006036520004272461, -0.005576610565185547, -0.005116701126098633, -0.004656791687011719, -0.004196882247924805, -0.0037369728088378906, -0.0032770633697509766, -0.0028171539306640625, -0.0023572444915771484, -0.0018973350524902344, -0.0014374256134033203, -0.0009775161743164062, -0.0005176067352294922, -5.7697296142578125e-05, 0.00040221214294433594, 0.00086212158203125, 0.001322031021118164, 0.0017819404602050781, 0.002241849899291992, 0.0027017593383789062, 0.0031616687774658203, 0.0036215782165527344, 0.0040814876556396484, 0.0045413970947265625, 0.0050013065338134766, 0.005461215972900391, 0.005921125411987305, 0.006381034851074219, 0.006840944290161133, 0.007300853729248047, 0.007760763168334961, 0.008220672607421875, 0.008680582046508789, 0.009140491485595703, 0.009600400924682617, 0.010060310363769531, 0.010520219802856445, 0.01098012924194336, 0.011440038681030273, 0.011899948120117188, 0.012359857559204102, 0.012819766998291016, 0.01327967643737793, 0.013739585876464844, 0.014199495315551758, 0.014659404754638672, 0.015119314193725586, 0.0155792236328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 7.0, 13.0, 19.0, 39.0, 59.0, 86.0, 121.0, 190.0, 169.0, 110.0, 63.0, 28.0, 25.0, 19.0, 12.0, 8.0, 6.0, 5.0, 2.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06749097257852554, -0.06515972316265106, -0.06282848119735718, -0.0604972317814827, -0.058165982365608215, -0.05583473667502403, -0.05350349098443985, -0.05117224156856537, -0.048840995877981186, -0.046509750187397, -0.04417850077152252, -0.04184725508093834, -0.039516009390354156, -0.037184759974479675, -0.03485351428389549, -0.03252226859331131, -0.03019101917743683, -0.027859771624207497, -0.025528524070978165, -0.023197278380393982, -0.02086603082716465, -0.018534783273935318, -0.016203537583351135, -0.013872290030121803, -0.011541042476892471, -0.00920979492366314, -0.006878548301756382, -0.004547301214188337, -0.0022160541266202927, 0.0001151934266090393, 0.0024464400485157967, 0.004777686670422554, 0.007108934223651886, 0.009440181776881218, 0.011771428398787975, 0.014102675020694733, 0.016433922573924065, 0.018765170127153397, 0.02109641581773758, 0.02342766337096691, 0.025758910924196243, 0.028090158477425575, 0.030421406030654907, 0.03275265172123909, 0.03508389741182327, 0.037415146827697754, 0.03974639251828194, 0.04207763820886612, 0.0444088876247406, 0.04674013331532478, 0.049071382731199265, 0.05140262842178345, 0.05373387783765793, 0.05606512352824211, 0.058396369218826294, 0.060727618634700775, 0.06305886805057526, 0.06539011746644974, 0.06772135943174362, 0.0700526088476181, 0.07238385826349258, 0.07471510767936707, 0.07704634964466095, 0.07937759906053543, 0.08170884102582932]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 9.0, 10.0, 8.0, 13.0, 20.0, 22.0, 24.0, 23.0, 17.0, 22.0, 42.0, 37.0, 41.0, 41.0, 50.0, 40.0, 42.0, 53.0, 60.0, 54.0, 49.0, 38.0, 35.0, 38.0, 29.0, 25.0, 19.0, 25.0, 19.0, 19.0, 17.0, 10.0, 13.0, 8.0, 6.0, 6.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.03549375757575035, -0.03448797017335892, -0.033482182770967484, -0.03247639536857605, -0.031470607966184616, -0.03046482242643833, -0.029459035024046898, -0.028453247621655464, -0.02744746208190918, -0.026441674679517746, -0.025435887277126312, -0.02443009987473488, -0.023424314334988594, -0.02241852693259716, -0.021412739530205727, -0.020406952127814293, -0.01940116472542286, -0.018395377323031425, -0.017389589920639992, -0.016383804380893707, -0.015378016978502274, -0.01437222957611084, -0.013366442173719406, -0.012360654771327972, -0.011354868300259113, -0.01034908089786768, -0.00934329442679882, -0.008337507024407387, -0.00733172008767724, -0.006325933150947094, -0.00532014574855566, -0.004314358811825514, -0.0033085737377405167, -0.0023027868010103703, -0.0012969996314495802, -0.00029121246188879013, 0.0007145744748413563, 0.0017203614115715027, 0.0027261488139629364, 0.003731935750693083, 0.004737722687423229, 0.005743509624153376, 0.006749296560883522, 0.007755083963274956, 0.00876087136566639, 0.009766657836735249, 0.010772445239126682, 0.011778231710195541, 0.012784019112586975, 0.013789806514978409, 0.014795592986047268, 0.015801381319761276, 0.01680716685950756, 0.017812954261898994, 0.018818741664290428, 0.019824529066681862, 0.020830314606428146, 0.02183610200881958, 0.022841889411211014, 0.023847676813602448, 0.024853462353348732, 0.025859249755740166, 0.0268650371581316, 0.027870824560523033, 0.028876611962914467]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 2.0, 14.0, 12.0, 12.0, 13.0, 27.0, 37.0, 56.0, 77.0, 139.0, 167.0, 276.0, 404.0, 621.0, 980.0, 1618.0, 2678.0, 4647.0, 8804.0, 18962.0, 47298.0, 157159.0, 475914.0, 220664.0, 61139.0, 23054.0, 10179.0, 5376.0, 3162.0, 1823.0, 1154.0, 748.0, 461.0, 307.0, 173.0, 152.0, 82.0, 54.0, 36.0, 26.0, 18.0, 12.0, 11.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.04718017578125, -0.0457768440246582, -0.044373512268066406, -0.04297018051147461, -0.04156684875488281, -0.040163516998291016, -0.03876018524169922, -0.03735685348510742, -0.035953521728515625, -0.03455018997192383, -0.03314685821533203, -0.031743526458740234, -0.030340194702148438, -0.02893686294555664, -0.027533531188964844, -0.026130199432373047, -0.02472686767578125, -0.023323535919189453, -0.021920204162597656, -0.02051687240600586, -0.019113540649414062, -0.017710208892822266, -0.01630687713623047, -0.014903545379638672, -0.013500213623046875, -0.012096881866455078, -0.010693550109863281, -0.009290218353271484, -0.007886886596679688, -0.006483554840087891, -0.005080223083496094, -0.003676891326904297, -0.0022735595703125, -0.0008702278137207031, 0.0005331039428710938, 0.0019364356994628906, 0.0033397674560546875, 0.004743099212646484, 0.006146430969238281, 0.007549762725830078, 0.008953094482421875, 0.010356426239013672, 0.011759757995605469, 0.013163089752197266, 0.014566421508789062, 0.01596975326538086, 0.017373085021972656, 0.018776416778564453, 0.02017974853515625, 0.021583080291748047, 0.022986412048339844, 0.02438974380493164, 0.025793075561523438, 0.027196407318115234, 0.02859973907470703, 0.030003070831298828, 0.031406402587890625, 0.03280973434448242, 0.03421306610107422, 0.035616397857666016, 0.03701972961425781, 0.03842306137084961, 0.039826393127441406, 0.0412297248840332, 0.042633056640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 5.0, 6.0, 7.0, 9.0, 13.0, 14.0, 18.0, 27.0, 27.0, 25.0, 30.0, 32.0, 41.0, 39.0, 42.0, 49.0, 44.0, 42.0, 55.0, 47.0, 56.0, 46.0, 37.0, 43.0, 32.0, 30.0, 23.0, 25.0, 27.0, 23.0, 19.0, 12.0, 10.0, 10.0, 9.0, 9.0, 7.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.034454345703125, -0.03347444534301758, -0.032494544982910156, -0.031514644622802734, -0.030534744262695312, -0.02955484390258789, -0.02857494354248047, -0.027595043182373047, -0.026615142822265625, -0.025635242462158203, -0.02465534210205078, -0.02367544174194336, -0.022695541381835938, -0.021715641021728516, -0.020735740661621094, -0.019755840301513672, -0.01877593994140625, -0.017796039581298828, -0.016816139221191406, -0.015836238861083984, -0.014856338500976562, -0.01387643814086914, -0.012896537780761719, -0.011916637420654297, -0.010936737060546875, -0.009956836700439453, -0.008976936340332031, -0.00799703598022461, -0.0070171356201171875, -0.006037235260009766, -0.005057334899902344, -0.004077434539794922, -0.0030975341796875, -0.002117633819580078, -0.0011377334594726562, -0.00015783309936523438, 0.0008220672607421875, 0.0018019676208496094, 0.0027818679809570312, 0.003761768341064453, 0.004741668701171875, 0.005721569061279297, 0.006701469421386719, 0.007681369781494141, 0.008661270141601562, 0.009641170501708984, 0.010621070861816406, 0.011600971221923828, 0.01258087158203125, 0.013560771942138672, 0.014540672302246094, 0.015520572662353516, 0.016500473022460938, 0.01748037338256836, 0.01846027374267578, 0.019440174102783203, 0.020420074462890625, 0.021399974822998047, 0.02237987518310547, 0.02335977554321289, 0.024339675903320312, 0.025319576263427734, 0.026299476623535156, 0.027279376983642578, 0.02825927734375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 15.0, 19.0, 30.0, 35.0, 66.0, 85.0, 150.0, 220.0, 412.0, 633.0, 1070.0, 1862.0, 3538.0, 7158.0, 17434.0, 55626.0, 351097.0, 498897.0, 71771.0, 21067.0, 8380.0, 3978.0, 2072.0, 1131.0, 701.0, 415.0, 232.0, 157.0, 90.0, 63.0, 48.0, 36.0, 11.0, 11.0, 9.0, 8.0, 10.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053955078125, -0.052100181579589844, -0.05024528503417969, -0.04839038848876953, -0.046535491943359375, -0.04468059539794922, -0.04282569885253906, -0.040970802307128906, -0.03911590576171875, -0.037261009216308594, -0.03540611267089844, -0.03355121612548828, -0.031696319580078125, -0.02984142303466797, -0.027986526489257812, -0.026131629943847656, -0.0242767333984375, -0.022421836853027344, -0.020566940307617188, -0.01871204376220703, -0.016857147216796875, -0.015002250671386719, -0.013147354125976562, -0.011292457580566406, -0.00943756103515625, -0.007582664489746094, -0.0057277679443359375, -0.0038728713989257812, -0.002017974853515625, -0.00016307830810546875, 0.0016918182373046875, 0.0035467147827148438, 0.005401611328125, 0.007256507873535156, 0.009111404418945312, 0.010966300964355469, 0.012821197509765625, 0.014676094055175781, 0.016530990600585938, 0.018385887145996094, 0.02024078369140625, 0.022095680236816406, 0.023950576782226562, 0.02580547332763672, 0.027660369873046875, 0.02951526641845703, 0.03137016296386719, 0.033225059509277344, 0.0350799560546875, 0.036934852600097656, 0.03878974914550781, 0.04064464569091797, 0.042499542236328125, 0.04435443878173828, 0.04620933532714844, 0.048064231872558594, 0.04991912841796875, 0.051774024963378906, 0.05362892150878906, 0.05548381805419922, 0.057338714599609375, 0.05919361114501953, 0.06104850769042969, 0.06290340423583984, 0.06475830078125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 10.0, 10.0, 8.0, 13.0, 14.0, 14.0, 16.0, 27.0, 20.0, 33.0, 31.0, 34.0, 30.0, 43.0, 53.0, 40.0, 47.0, 36.0, 53.0, 37.0, 38.0, 41.0, 35.0, 39.0, 35.0, 28.0, 24.0, 23.0, 25.0, 28.0, 15.0, 19.0, 21.0, 8.0, 16.0, 6.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0189056396484375, -0.01831841468811035, -0.017731189727783203, -0.017143964767456055, -0.016556739807128906, -0.015969514846801758, -0.01538228988647461, -0.014795064926147461, -0.014207839965820312, -0.013620615005493164, -0.013033390045166016, -0.012446165084838867, -0.011858940124511719, -0.01127171516418457, -0.010684490203857422, -0.010097265243530273, -0.009510040283203125, -0.008922815322875977, -0.008335590362548828, -0.00774836540222168, -0.007161140441894531, -0.006573915481567383, -0.005986690521240234, -0.005399465560913086, -0.0048122406005859375, -0.004225015640258789, -0.0036377906799316406, -0.003050565719604492, -0.0024633407592773438, -0.0018761157989501953, -0.0012888908386230469, -0.0007016658782958984, -0.00011444091796875, 0.00047278404235839844, 0.0010600090026855469, 0.0016472339630126953, 0.0022344589233398438, 0.002821683883666992, 0.0034089088439941406, 0.003996133804321289, 0.0045833587646484375, 0.005170583724975586, 0.005757808685302734, 0.006345033645629883, 0.006932258605957031, 0.00751948356628418, 0.008106708526611328, 0.008693933486938477, 0.009281158447265625, 0.009868383407592773, 0.010455608367919922, 0.01104283332824707, 0.011630058288574219, 0.012217283248901367, 0.012804508209228516, 0.013391733169555664, 0.013978958129882812, 0.014566183090209961, 0.01515340805053711, 0.015740633010864258, 0.016327857971191406, 0.016915082931518555, 0.017502307891845703, 0.01808953285217285, 0.0186767578125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 2.0, 6.0, 8.0, 14.0, 29.0, 38.0, 66.0, 72.0, 105.0, 173.0, 252.0, 367.0, 514.0, 735.0, 1166.0, 1741.0, 2806.0, 4668.0, 7730.0, 14227.0, 28135.0, 63410.0, 184648.0, 457193.0, 163371.0, 57794.0, 26020.0, 13312.0, 7404.0, 4527.0, 2702.0, 1779.0, 1088.0, 741.0, 533.0, 346.0, 259.0, 191.0, 97.0, 87.0, 67.0, 39.0, 30.0, 18.0, 6.0, 10.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007537841796875, -0.007305562496185303, -0.0070732831954956055, -0.006841003894805908, -0.006608724594116211, -0.006376445293426514, -0.006144165992736816, -0.005911886692047119, -0.005679607391357422, -0.005447328090667725, -0.005215048789978027, -0.00498276948928833, -0.004750490188598633, -0.0045182108879089355, -0.004285931587219238, -0.004053652286529541, -0.0038213729858398438, -0.0035890936851501465, -0.0033568143844604492, -0.003124535083770752, -0.0028922557830810547, -0.0026599764823913574, -0.00242769718170166, -0.002195417881011963, -0.0019631385803222656, -0.0017308592796325684, -0.001498579978942871, -0.0012663006782531738, -0.0010340213775634766, -0.0008017420768737793, -0.000569462776184082, -0.00033718347549438477, -0.0001049041748046875, 0.00012737512588500977, 0.00035965442657470703, 0.0005919337272644043, 0.0008242130279541016, 0.0010564923286437988, 0.001288771629333496, 0.0015210509300231934, 0.0017533302307128906, 0.001985609531402588, 0.002217888832092285, 0.0024501681327819824, 0.0026824474334716797, 0.002914726734161377, 0.0031470060348510742, 0.0033792853355407715, 0.0036115646362304688, 0.003843843936920166, 0.004076123237609863, 0.0043084025382995605, 0.004540681838989258, 0.004772961139678955, 0.005005240440368652, 0.00523751974105835, 0.005469799041748047, 0.005702078342437744, 0.005934357643127441, 0.006166636943817139, 0.006398916244506836, 0.006631195545196533, 0.0068634748458862305, 0.007095754146575928, 0.007328033447265625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 2.0, 5.0, 9.0, 12.0, 14.0, 35.0, 56.0, 65.0, 148.0, 174.0, 164.0, 117.0, 60.0, 39.0, 18.0, 12.0, 16.0, 5.0, 4.0, 7.0, 0.0, 6.0, 5.0, 0.0, 4.0, 1.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7821788787841797e-05, -1.724250614643097e-05, -1.666322350502014e-05, -1.6083940863609314e-05, -1.5504658222198486e-05, -1.4925375580787659e-05, -1.4346092939376831e-05, -1.3766810297966003e-05, -1.3187527656555176e-05, -1.2608245015144348e-05, -1.202896237373352e-05, -1.1449679732322693e-05, -1.0870397090911865e-05, -1.0291114449501038e-05, -9.71183180809021e-06, -9.132549166679382e-06, -8.553266525268555e-06, -7.973983883857727e-06, -7.394701242446899e-06, -6.815418601036072e-06, -6.236135959625244e-06, -5.6568533182144165e-06, -5.077570676803589e-06, -4.498288035392761e-06, -3.919005393981934e-06, -3.339722752571106e-06, -2.7604401111602783e-06, -2.1811574697494507e-06, -1.601874828338623e-06, -1.0225921869277954e-06, -4.4330954551696777e-07, 1.3597309589385986e-07, 7.152557373046875e-07, 1.2945383787155151e-06, 1.8738210201263428e-06, 2.4531036615371704e-06, 3.032386302947998e-06, 3.6116689443588257e-06, 4.190951585769653e-06, 4.770234227180481e-06, 5.349516868591309e-06, 5.928799510002136e-06, 6.508082151412964e-06, 7.0873647928237915e-06, 7.666647434234619e-06, 8.245930075645447e-06, 8.825212717056274e-06, 9.404495358467102e-06, 9.98377799987793e-06, 1.0563060641288757e-05, 1.1142343282699585e-05, 1.1721625924110413e-05, 1.230090856552124e-05, 1.2880191206932068e-05, 1.3459473848342896e-05, 1.4038756489753723e-05, 1.461803913116455e-05, 1.5197321772575378e-05, 1.5776604413986206e-05, 1.6355887055397034e-05, 1.693516969680786e-05, 1.751445233821869e-05, 1.8093734979629517e-05, 1.8673017621040344e-05, 1.9252300262451172e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 4.0, 6.0, 9.0, 14.0, 19.0, 20.0, 40.0, 48.0, 74.0, 129.0, 195.0, 319.0, 512.0, 901.0, 1508.0, 2738.0, 5150.0, 10285.0, 22248.0, 53195.0, 150703.0, 454937.0, 218972.0, 70966.0, 28585.0, 12947.0, 6344.0, 3241.0, 1782.0, 1012.0, 660.0, 359.0, 235.0, 137.0, 91.0, 44.0, 44.0, 29.0, 12.0, 12.0, 11.0, 2.0, 2.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007762908935546875, -0.007525146007537842, -0.007287383079528809, -0.007049620151519775, -0.006811857223510742, -0.006574094295501709, -0.006336331367492676, -0.006098568439483643, -0.005860805511474609, -0.005623042583465576, -0.005385279655456543, -0.00514751672744751, -0.0049097537994384766, -0.004671990871429443, -0.00443422794342041, -0.004196465015411377, -0.003958702087402344, -0.0037209391593933105, -0.0034831762313842773, -0.003245413303375244, -0.003007650375366211, -0.0027698874473571777, -0.0025321245193481445, -0.0022943615913391113, -0.002056598663330078, -0.001818835735321045, -0.0015810728073120117, -0.0013433098793029785, -0.0011055469512939453, -0.0008677840232849121, -0.0006300210952758789, -0.0003922581672668457, -0.0001544952392578125, 8.32676887512207e-05, 0.0003210306167602539, 0.0005587935447692871, 0.0007965564727783203, 0.0010343194007873535, 0.0012720823287963867, 0.00150984525680542, 0.0017476081848144531, 0.0019853711128234863, 0.0022231340408325195, 0.0024608969688415527, 0.002698659896850586, 0.002936422824859619, 0.0031741857528686523, 0.0034119486808776855, 0.0036497116088867188, 0.003887474536895752, 0.004125237464904785, 0.004363000392913818, 0.0046007633209228516, 0.004838526248931885, 0.005076289176940918, 0.005314052104949951, 0.005551815032958984, 0.005789577960968018, 0.006027340888977051, 0.006265103816986084, 0.006502866744995117, 0.00674062967300415, 0.006978392601013184, 0.007216155529022217, 0.00745391845703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 5.0, 7.0, 10.0, 10.0, 11.0, 8.0, 12.0, 21.0, 24.0, 39.0, 37.0, 40.0, 55.0, 58.0, 71.0, 63.0, 78.0, 65.0, 70.0, 49.0, 44.0, 51.0, 25.0, 29.0, 24.0, 17.0, 13.0, 10.0, 7.0, 8.0, 7.0, 7.0, 8.0, 3.0, 4.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00147247314453125, -0.0014088153839111328, -0.0013451576232910156, -0.0012814998626708984, -0.0012178421020507812, -0.001154184341430664, -0.0010905265808105469, -0.0010268688201904297, -0.0009632110595703125, -0.0008995532989501953, -0.0008358955383300781, -0.0007722377777099609, -0.0007085800170898438, -0.0006449222564697266, -0.0005812644958496094, -0.0005176067352294922, -0.000453948974609375, -0.0003902912139892578, -0.0003266334533691406, -0.00026297569274902344, -0.00019931793212890625, -0.00013566017150878906, -7.200241088867188e-05, -8.344650268554688e-06, 5.53131103515625e-05, 0.00011897087097167969, 0.00018262863159179688, 0.00024628639221191406, 0.00030994415283203125, 0.00037360191345214844, 0.0004372596740722656, 0.0005009174346923828, 0.0005645751953125, 0.0006282329559326172, 0.0006918907165527344, 0.0007555484771728516, 0.0008192062377929688, 0.0008828639984130859, 0.0009465217590332031, 0.0010101795196533203, 0.0010738372802734375, 0.0011374950408935547, 0.0012011528015136719, 0.001264810562133789, 0.0013284683227539062, 0.0013921260833740234, 0.0014557838439941406, 0.0015194416046142578, 0.001583099365234375, 0.0016467571258544922, 0.0017104148864746094, 0.0017740726470947266, 0.0018377304077148438, 0.001901388168334961, 0.001965045928955078, 0.0020287036895751953, 0.0020923614501953125, 0.0021560192108154297, 0.002219676971435547, 0.002283334732055664, 0.0023469924926757812, 0.0024106502532958984, 0.0024743080139160156, 0.002537965774536133, 0.00260162353515625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 6.0, 14.0, 9.0, 25.0, 57.0, 71.0, 94.0, 178.0, 190.0, 129.0, 81.0, 39.0, 29.0, 18.0, 19.0, 8.0, 7.0, 8.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05892157554626465, -0.056685153394937515, -0.05444873124361038, -0.05221230909228325, -0.049975886940956116, -0.04773946851491928, -0.04550304636359215, -0.043266624212265015, -0.04103020206093788, -0.03879377990961075, -0.036557357758283615, -0.03432093560695648, -0.03208451718091965, -0.029848093166947365, -0.02761167287826538, -0.025375250726938248, -0.023138828575611115, -0.02090240642428398, -0.018665984272956848, -0.016429563984274864, -0.014193141832947731, -0.011956719681620598, -0.00972029846161604, -0.007483877241611481, -0.0052474550902843475, -0.0030110334046185017, -0.0007746117189526558, 0.00146180996671319, 0.003698231652379036, 0.005934653803706169, 0.008171075023710728, 0.010407496243715286, 0.012643925845623016, 0.01488034799695015, 0.017116770148277283, 0.019353190436959267, 0.0215896125882864, 0.023826034739613533, 0.026062455028295517, 0.02829887717962265, 0.030535299330949783, 0.032771721482276917, 0.03500814363360405, 0.03724456578493118, 0.03948098421096802, 0.04171741008758545, 0.043953828513622284, 0.04619025066494942, 0.04842667281627655, 0.050663094967603683, 0.05289951711893082, 0.05513593927025795, 0.05737236142158508, 0.05960877984762192, 0.06184520199894905, 0.06408162415027618, 0.06631805002689362, 0.06855446845293045, 0.07079089432954788, 0.07302731275558472, 0.07526373863220215, 0.07750015705823898, 0.07973658293485641, 0.08197300136089325, 0.08420941978693008]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 6.0, 4.0, 12.0, 8.0, 18.0, 11.0, 29.0, 21.0, 22.0, 19.0, 25.0, 34.0, 46.0, 41.0, 44.0, 44.0, 38.0, 53.0, 51.0, 52.0, 56.0, 58.0, 33.0, 36.0, 34.0, 32.0, 21.0, 21.0, 22.0, 20.0, 16.0, 19.0, 9.0, 13.0, 9.0, 6.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.034080080687999725, -0.0331118069589138, -0.03214352950453758, -0.03117525391280651, -0.03020697832107544, -0.029238702729344368, -0.028270427137613297, -0.027302153408527374, -0.026333875954151154, -0.025365600362420082, -0.02439732477068901, -0.02342904917895794, -0.022460773587226868, -0.021492497995495796, -0.020524222403764725, -0.019555948674678802, -0.01858767308294773, -0.01761939749121666, -0.016651121899485588, -0.015682846307754517, -0.014714570716023445, -0.013746295124292374, -0.012778020463883877, -0.011809744872152805, -0.010841469280421734, -0.009873193688690662, -0.008904918096959591, -0.007936643436551094, -0.006968367379158735, -0.006000091787427664, -0.00503181666135788, -0.004063541069626808, -0.0030952654778957367, -0.0021269898861646652, -0.0011587145272642374, -0.00019043916836380959, 0.0007778364233672619, 0.0017461120150983334, 0.0027143871411681175, 0.003682662732899189, 0.0046509383246302605, 0.005619213916361332, 0.006587489508092403, 0.007555764634162188, 0.008524039760231972, 0.009492315351963043, 0.010460590943694115, 0.011428866535425186, 0.012397142127156258, 0.013365417718887329, 0.0143336933106184, 0.015301968902349472, 0.016270244494080544, 0.017238520085811615, 0.018206793814897537, 0.019175071269273758, 0.02014334499835968, 0.02111162059009075, 0.022079896181821823, 0.023048171773552895, 0.024016447365283966, 0.024984722957015038, 0.02595299854874611, 0.02692127227783203, 0.027889549732208252]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 15.0, 13.0, 24.0, 35.0, 51.0, 56.0, 116.0, 114.0, 216.0, 323.0, 446.0, 607.0, 901.0, 1305.0, 1846.0, 2775.0, 3919.0, 5704.0, 8519.0, 13037.0, 20056.0, 30560.0, 48700.0, 80007.0, 136084.0, 215990.0, 186112.0, 109541.0, 65209.0, 40033.0, 25548.0, 16398.0, 10962.0, 7407.0, 4950.0, 3388.0, 2347.0, 1578.0, 1114.0, 740.0, 526.0, 393.0, 263.0, 206.0, 143.0, 84.0, 53.0, 45.0, 31.0, 23.0, 16.0, 10.0, 6.0, 2.0, 5.0, 3.0, 1.0], "bins": [-0.043365478515625, -0.042043209075927734, -0.04072093963623047, -0.0393986701965332, -0.03807640075683594, -0.03675413131713867, -0.035431861877441406, -0.03410959243774414, -0.032787322998046875, -0.03146505355834961, -0.030142784118652344, -0.028820514678955078, -0.027498245239257812, -0.026175975799560547, -0.02485370635986328, -0.023531436920166016, -0.02220916748046875, -0.020886898040771484, -0.01956462860107422, -0.018242359161376953, -0.016920089721679688, -0.015597820281982422, -0.014275550842285156, -0.01295328140258789, -0.011631011962890625, -0.01030874252319336, -0.008986473083496094, -0.007664203643798828, -0.0063419342041015625, -0.005019664764404297, -0.0036973953247070312, -0.0023751258850097656, -0.0010528564453125, 0.0002694129943847656, 0.0015916824340820312, 0.002913951873779297, 0.0042362213134765625, 0.005558490753173828, 0.006880760192871094, 0.00820302963256836, 0.009525299072265625, 0.01084756851196289, 0.012169837951660156, 0.013492107391357422, 0.014814376831054688, 0.016136646270751953, 0.01745891571044922, 0.018781185150146484, 0.02010345458984375, 0.021425724029541016, 0.02274799346923828, 0.024070262908935547, 0.025392532348632812, 0.026714801788330078, 0.028037071228027344, 0.02935934066772461, 0.030681610107421875, 0.03200387954711914, 0.033326148986816406, 0.03464841842651367, 0.03597068786621094, 0.0372929573059082, 0.03861522674560547, 0.039937496185302734, 0.041259765625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 6.0, 7.0, 13.0, 9.0, 16.0, 25.0, 17.0, 13.0, 18.0, 28.0, 22.0, 33.0, 40.0, 45.0, 31.0, 38.0, 48.0, 43.0, 50.0, 37.0, 62.0, 54.0, 40.0, 31.0, 39.0, 30.0, 26.0, 25.0, 23.0, 27.0, 24.0, 18.0, 14.0, 10.0, 8.0, 11.0, 4.0, 3.0, 7.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0247650146484375, -0.024006366729736328, -0.023247718811035156, -0.022489070892333984, -0.021730422973632812, -0.02097177505493164, -0.02021312713623047, -0.019454479217529297, -0.018695831298828125, -0.017937183380126953, -0.01717853546142578, -0.01641988754272461, -0.015661239624023438, -0.014902591705322266, -0.014143943786621094, -0.013385295867919922, -0.01262664794921875, -0.011868000030517578, -0.011109352111816406, -0.010350704193115234, -0.009592056274414062, -0.00883340835571289, -0.008074760437011719, -0.007316112518310547, -0.006557464599609375, -0.005798816680908203, -0.005040168762207031, -0.004281520843505859, -0.0035228729248046875, -0.0027642250061035156, -0.0020055770874023438, -0.0012469291687011719, -0.00048828125, 0.0002703666687011719, 0.0010290145874023438, 0.0017876625061035156, 0.0025463104248046875, 0.0033049583435058594, 0.004063606262207031, 0.004822254180908203, 0.005580902099609375, 0.006339550018310547, 0.007098197937011719, 0.00785684585571289, 0.008615493774414062, 0.009374141693115234, 0.010132789611816406, 0.010891437530517578, 0.01165008544921875, 0.012408733367919922, 0.013167381286621094, 0.013926029205322266, 0.014684677124023438, 0.01544332504272461, 0.01620197296142578, 0.016960620880126953, 0.017719268798828125, 0.018477916717529297, 0.01923656463623047, 0.01999521255493164, 0.020753860473632812, 0.021512508392333984, 0.022271156311035156, 0.023029804229736328, 0.0237884521484375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 10.0, 6.0, 13.0, 26.0, 40.0, 52.0, 85.0, 104.0, 176.0, 210.0, 310.0, 397.0, 643.0, 860.0, 1277.0, 1833.0, 2668.0, 3827.0, 5841.0, 8717.0, 13667.0, 21964.0, 36824.0, 63799.0, 115084.0, 197668.0, 228053.0, 144350.0, 80063.0, 45203.0, 26676.0, 16426.0, 10357.0, 6811.0, 4588.0, 3046.0, 2069.0, 1439.0, 978.0, 720.0, 500.0, 358.0, 230.0, 174.0, 141.0, 91.0, 56.0, 46.0, 30.0, 22.0, 13.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.0406494140625, -0.039386749267578125, -0.03812408447265625, -0.036861419677734375, -0.0355987548828125, -0.034336090087890625, -0.03307342529296875, -0.031810760498046875, -0.030548095703125, -0.029285430908203125, -0.02802276611328125, -0.026760101318359375, -0.0254974365234375, -0.024234771728515625, -0.02297210693359375, -0.021709442138671875, -0.02044677734375, -0.019184112548828125, -0.01792144775390625, -0.016658782958984375, -0.0153961181640625, -0.014133453369140625, -0.01287078857421875, -0.011608123779296875, -0.010345458984375, -0.009082794189453125, -0.00782012939453125, -0.006557464599609375, -0.0052947998046875, -0.004032135009765625, -0.00276947021484375, -0.001506805419921875, -0.000244140625, 0.001018524169921875, 0.00228118896484375, 0.003543853759765625, 0.0048065185546875, 0.006069183349609375, 0.00733184814453125, 0.008594512939453125, 0.009857177734375, 0.011119842529296875, 0.01238250732421875, 0.013645172119140625, 0.0149078369140625, 0.016170501708984375, 0.01743316650390625, 0.018695831298828125, 0.01995849609375, 0.021221160888671875, 0.02248382568359375, 0.023746490478515625, 0.0250091552734375, 0.026271820068359375, 0.02753448486328125, 0.028797149658203125, 0.030059814453125, 0.031322479248046875, 0.03258514404296875, 0.033847808837890625, 0.0351104736328125, 0.036373138427734375, 0.03763580322265625, 0.038898468017578125, 0.0401611328125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 4.0, 3.0, 4.0, 7.0, 11.0, 5.0, 13.0, 11.0, 12.0, 23.0, 24.0, 26.0, 25.0, 27.0, 28.0, 27.0, 38.0, 37.0, 31.0, 38.0, 38.0, 40.0, 37.0, 37.0, 31.0, 41.0, 39.0, 45.0, 36.0, 39.0, 31.0, 18.0, 26.0, 22.0, 26.0, 16.0, 14.0, 12.0, 13.0, 5.0, 9.0, 10.0, 4.0, 7.0, 5.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0142364501953125, -0.013802409172058105, -0.013368368148803711, -0.012934327125549316, -0.012500286102294922, -0.012066245079040527, -0.011632204055786133, -0.011198163032531738, -0.010764122009277344, -0.01033008098602295, -0.009896039962768555, -0.00946199893951416, -0.009027957916259766, -0.008593916893005371, -0.008159875869750977, -0.007725834846496582, -0.0072917938232421875, -0.006857752799987793, -0.0064237117767333984, -0.005989670753479004, -0.005555629730224609, -0.005121588706970215, -0.00468754768371582, -0.004253506660461426, -0.0038194656372070312, -0.0033854246139526367, -0.002951383590698242, -0.0025173425674438477, -0.002083301544189453, -0.0016492605209350586, -0.001215219497680664, -0.0007811784744262695, -0.000347137451171875, 8.690357208251953e-05, 0.0005209445953369141, 0.0009549856185913086, 0.0013890266418457031, 0.0018230676651000977, 0.002257108688354492, 0.0026911497116088867, 0.0031251907348632812, 0.0035592317581176758, 0.00399327278137207, 0.004427313804626465, 0.004861354827880859, 0.005295395851135254, 0.0057294368743896484, 0.006163477897644043, 0.0065975189208984375, 0.007031559944152832, 0.0074656009674072266, 0.007899641990661621, 0.008333683013916016, 0.00876772403717041, 0.009201765060424805, 0.0096358060836792, 0.010069847106933594, 0.010503888130187988, 0.010937929153442383, 0.011371970176696777, 0.011806011199951172, 0.012240052223205566, 0.012674093246459961, 0.013108134269714355, 0.01354217529296875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 2.0, 4.0, 2.0, 8.0, 14.0, 10.0, 22.0, 24.0, 24.0, 37.0, 58.0, 62.0, 129.0, 184.0, 240.0, 332.0, 553.0, 793.0, 1228.0, 2025.0, 3257.0, 5573.0, 10106.0, 19671.0, 41896.0, 704168.0, 176964.0, 39270.0, 18281.0, 9610.0, 5395.0, 3121.0, 1894.0, 1168.0, 800.0, 523.0, 316.0, 241.0, 155.0, 113.0, 84.0, 58.0, 26.0, 29.0, 22.0, 19.0, 14.0, 9.0, 6.0, 3.0, 5.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.028472900390625, -0.02758193016052246, -0.026690959930419922, -0.025799989700317383, -0.024909019470214844, -0.024018049240112305, -0.023127079010009766, -0.022236108779907227, -0.021345138549804688, -0.02045416831970215, -0.01956319808959961, -0.01867222785949707, -0.01778125762939453, -0.016890287399291992, -0.015999317169189453, -0.015108346939086914, -0.014217376708984375, -0.013326406478881836, -0.012435436248779297, -0.011544466018676758, -0.010653495788574219, -0.00976252555847168, -0.00887155532836914, -0.007980585098266602, -0.0070896148681640625, -0.0061986446380615234, -0.005307674407958984, -0.004416704177856445, -0.0035257339477539062, -0.002634763717651367, -0.0017437934875488281, -0.0008528232574462891, 3.814697265625e-05, 0.0009291172027587891, 0.0018200874328613281, 0.002711057662963867, 0.0036020278930664062, 0.004492998123168945, 0.005383968353271484, 0.0062749385833740234, 0.0071659088134765625, 0.008056879043579102, 0.00894784927368164, 0.00983881950378418, 0.010729789733886719, 0.011620759963989258, 0.012511730194091797, 0.013402700424194336, 0.014293670654296875, 0.015184640884399414, 0.016075611114501953, 0.016966581344604492, 0.01785755157470703, 0.01874852180480957, 0.01963949203491211, 0.02053046226501465, 0.021421432495117188, 0.022312402725219727, 0.023203372955322266, 0.024094343185424805, 0.024985313415527344, 0.025876283645629883, 0.026767253875732422, 0.02765822410583496, 0.0285491943359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 9.0, 8.0, 17.0, 17.0, 14.0, 35.0, 30.0, 49.0, 48.0, 58.0, 80.0, 124.0, 89.0, 90.0, 61.0, 51.0, 77.0, 15.0, 25.0, 17.0, 9.0, 22.0, 8.0, 7.0, 4.0, 4.0, 2.0, 7.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.291534423828125e-06, -4.161149263381958e-06, -4.030764102935791e-06, -3.900378942489624e-06, -3.769993782043457e-06, -3.63960862159729e-06, -3.509223461151123e-06, -3.378838300704956e-06, -3.248453140258789e-06, -3.118067979812622e-06, -2.987682819366455e-06, -2.857297658920288e-06, -2.726912498474121e-06, -2.596527338027954e-06, -2.466142177581787e-06, -2.33575701713562e-06, -2.205371856689453e-06, -2.074986696243286e-06, -1.944601535797119e-06, -1.8142163753509521e-06, -1.6838312149047852e-06, -1.5534460544586182e-06, -1.4230608940124512e-06, -1.2926757335662842e-06, -1.1622905731201172e-06, -1.0319054126739502e-06, -9.015202522277832e-07, -7.711350917816162e-07, -6.407499313354492e-07, -5.103647708892822e-07, -3.7997961044311523e-07, -2.4959444999694824e-07, -1.1920928955078125e-07, 1.1175870895385742e-08, 1.4156103134155273e-07, 2.7194619178771973e-07, 4.023313522338867e-07, 5.327165126800537e-07, 6.631016731262207e-07, 7.934868335723877e-07, 9.238719940185547e-07, 1.0542571544647217e-06, 1.1846423149108887e-06, 1.3150274753570557e-06, 1.4454126358032227e-06, 1.5757977962493896e-06, 1.7061829566955566e-06, 1.8365681171417236e-06, 1.9669532775878906e-06, 2.0973384380340576e-06, 2.2277235984802246e-06, 2.3581087589263916e-06, 2.4884939193725586e-06, 2.6188790798187256e-06, 2.7492642402648926e-06, 2.8796494007110596e-06, 3.0100345611572266e-06, 3.1404197216033936e-06, 3.2708048820495605e-06, 3.4011900424957275e-06, 3.5315752029418945e-06, 3.6619603633880615e-06, 3.7923455238342285e-06, 3.9227306842803955e-06, 4.0531158447265625e-06]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 9.0, 13.0, 12.0, 16.0, 20.0, 30.0, 35.0, 43.0, 52.0, 66.0, 76.0, 132.0, 196.0, 267.0, 359.0, 480.0, 642.0, 1001.0, 1450.0, 2176.0, 3396.0, 5220.0, 8617.0, 14924.0, 28519.0, 72039.0, 800174.0, 51362.0, 23258.0, 12548.0, 7477.0, 4587.0, 2986.0, 1933.0, 1254.0, 901.0, 651.0, 433.0, 282.0, 229.0, 192.0, 102.0, 94.0, 70.0, 58.0, 42.0, 26.0, 19.0, 15.0, 12.0, 15.0, 16.0, 13.0, 4.0, 6.0, 2.0, 4.0], "bins": [-0.025726318359375, -0.024955034255981445, -0.02418375015258789, -0.023412466049194336, -0.02264118194580078, -0.021869897842407227, -0.021098613739013672, -0.020327329635620117, -0.019556045532226562, -0.018784761428833008, -0.018013477325439453, -0.0172421932220459, -0.016470909118652344, -0.01569962501525879, -0.014928340911865234, -0.01415705680847168, -0.013385772705078125, -0.01261448860168457, -0.011843204498291016, -0.011071920394897461, -0.010300636291503906, -0.009529352188110352, -0.008758068084716797, -0.007986783981323242, -0.0072154998779296875, -0.006444215774536133, -0.005672931671142578, -0.0049016475677490234, -0.004130363464355469, -0.003359079360961914, -0.0025877952575683594, -0.0018165111541748047, -0.00104522705078125, -0.0002739429473876953, 0.0004973411560058594, 0.001268625259399414, 0.0020399093627929688, 0.0028111934661865234, 0.003582477569580078, 0.004353761672973633, 0.0051250457763671875, 0.005896329879760742, 0.006667613983154297, 0.0074388980865478516, 0.008210182189941406, 0.008981466293334961, 0.009752750396728516, 0.01052403450012207, 0.011295318603515625, 0.01206660270690918, 0.012837886810302734, 0.013609170913696289, 0.014380455017089844, 0.015151739120483398, 0.015923023223876953, 0.016694307327270508, 0.017465591430664062, 0.018236875534057617, 0.019008159637451172, 0.019779443740844727, 0.02055072784423828, 0.021322011947631836, 0.02209329605102539, 0.022864580154418945, 0.0236358642578125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 4.0, 11.0, 5.0, 6.0, 14.0, 11.0, 17.0, 19.0, 12.0, 25.0, 24.0, 46.0, 611.0, 42.0, 25.0, 16.0, 15.0, 12.0, 9.0, 8.0, 13.0, 7.0, 11.0, 3.0, 6.0, 9.0, 0.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.007175445556640625, -0.0069383978843688965, -0.006701350212097168, -0.0064643025398254395, -0.006227254867553711, -0.005990207195281982, -0.005753159523010254, -0.005516111850738525, -0.005279064178466797, -0.005042016506195068, -0.00480496883392334, -0.004567921161651611, -0.004330873489379883, -0.004093825817108154, -0.0038567781448364258, -0.0036197304725646973, -0.0033826828002929688, -0.0031456351280212402, -0.0029085874557495117, -0.002671539783477783, -0.0024344921112060547, -0.002197444438934326, -0.0019603967666625977, -0.0017233490943908691, -0.0014863014221191406, -0.0012492537498474121, -0.0010122060775756836, -0.0007751584053039551, -0.0005381107330322266, -0.00030106306076049805, -6.401538848876953e-05, 0.00017303228378295898, 0.0004100799560546875, 0.000647127628326416, 0.0008841753005981445, 0.001121222972869873, 0.0013582706451416016, 0.00159531831741333, 0.0018323659896850586, 0.002069413661956787, 0.0023064613342285156, 0.002543509006500244, 0.0027805566787719727, 0.003017604351043701, 0.0032546520233154297, 0.003491699695587158, 0.0037287473678588867, 0.003965795040130615, 0.004202842712402344, 0.004439890384674072, 0.004676938056945801, 0.004913985729217529, 0.005151033401489258, 0.005388081073760986, 0.005625128746032715, 0.005862176418304443, 0.006099224090576172, 0.0063362717628479, 0.006573319435119629, 0.006810367107391357, 0.007047414779663086, 0.0072844624519348145, 0.007521510124206543, 0.0077585577964782715, 0.00799560546875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 8.0, 10.0, 19.0, 27.0, 22.0, 33.0, 43.0, 72.0, 107.0, 121.0, 167.0, 99.0, 75.0, 51.0, 36.0, 29.0, 13.0, 10.0, 11.0, 7.0, 3.0, 4.0, 10.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03716970235109329, -0.03571251779794693, -0.03425533324480057, -0.032798148691654205, -0.03134096413850784, -0.02988377958536148, -0.02842659316956997, -0.026969408616423607, -0.025512224063277245, -0.024055039510130882, -0.02259785495698452, -0.02114066854119301, -0.019683483988046646, -0.018226299434900284, -0.01676911488175392, -0.01531193032860756, -0.013854745775461197, -0.012397561222314835, -0.010940376669168472, -0.009483191184699535, -0.008026006631553173, -0.006568822078406811, -0.005111636593937874, -0.0036544520407915115, -0.0021972674876451492, -0.0007400827016681433, 0.0007171020843088627, 0.0021742871031165123, 0.0036314716562628746, 0.005088656209409237, 0.006545841693878174, 0.008003026247024536, 0.009460210800170898, 0.01091739535331726, 0.012374579906463623, 0.01383176539093256, 0.015288949944078922, 0.01674613356590271, 0.01820331998169422, 0.019660504534840584, 0.021117689087986946, 0.02257487364113331, 0.02403205819427967, 0.025489244610071182, 0.026946429163217545, 0.028403613716363907, 0.02986079826951027, 0.03131798282265663, 0.032775167375802994, 0.034232351928949356, 0.03568953648209572, 0.03714672103524208, 0.03860390558838844, 0.040061090141534805, 0.041518278419971466, 0.04297546297311783, 0.04443264752626419, 0.04588983207941055, 0.047347016632556915, 0.04880420118570328, 0.05026138573884964, 0.051718570291996, 0.053175754845142365, 0.05463293939828873, 0.05609012395143509]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 11.0, 10.0, 18.0, 18.0, 6.0, 15.0, 22.0, 28.0, 22.0, 31.0, 29.0, 25.0, 46.0, 35.0, 51.0, 44.0, 40.0, 48.0, 58.0, 53.0, 38.0, 40.0, 34.0, 31.0, 42.0, 26.0, 27.0, 19.0, 22.0, 17.0, 21.0, 15.0, 14.0, 8.0, 8.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02734782174229622, -0.026530755683779716, -0.025713687762618065, -0.024896621704101562, -0.02407955564558506, -0.02326248772442341, -0.022445421665906906, -0.021628353744745255, -0.020811287686228752, -0.01999422162771225, -0.019177153706550598, -0.018360087648034096, -0.017543021589517593, -0.016725953668355942, -0.01590888760983944, -0.015091820620000362, -0.01427475456148386, -0.013457687571644783, -0.01264062151312828, -0.011823554523289204, -0.011006487533450127, -0.010189421474933624, -0.009372354485094547, -0.00855528749525547, -0.007738220971077681, -0.006921154446899891, -0.006104087457060814, -0.005287020932883024, -0.0044699544087052345, -0.0036528874188661575, -0.002835820894688368, -0.002018753904849291, -0.0012016873806715012, -0.00038462068187072873, 0.0004324460169300437, 0.0012495126575231552, 0.0020665794145315886, 0.002883646171540022, 0.0037007126957178116, 0.004517779685556889, 0.005334846209734678, 0.006151912733912468, 0.006968979723751545, 0.007786046247929335, 0.008603112772107124, 0.009420179761946201, 0.010237246751785278, 0.01105431281030178, 0.011871379800140858, 0.012688446789979935, 0.013505512848496437, 0.014322579838335514, 0.015139646828174591, 0.015956712886691093, 0.016773778945207596, 0.017590846866369247, 0.01840791292488575, 0.019224978983402252, 0.020042046904563904, 0.020859112963080406, 0.02167617902159691, 0.02249324694275856, 0.023310313001275063, 0.024127379059791565, 0.024944446980953217]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 11.0, 11.0, 16.0, 35.0, 50.0, 53.0, 78.0, 142.0, 218.0, 320.0, 508.0, 825.0, 1289.0, 1987.0, 3203.0, 5334.0, 8851.0, 15344.0, 26878.0, 49857.0, 97355.0, 219899.0, 768745.0, 2001926.0, 606847.0, 189688.0, 86580.0, 44759.0, 24952.0, 14371.0, 8905.0, 5519.0, 3499.0, 2179.0, 1346.0, 894.0, 575.0, 382.0, 274.0, 212.0, 107.0, 77.0, 61.0, 45.0, 20.0, 16.0, 13.0, 8.0, 8.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-0.037353515625, -0.03620147705078125, -0.0350494384765625, -0.03389739990234375, -0.032745361328125, -0.03159332275390625, -0.0304412841796875, -0.02928924560546875, -0.02813720703125, -0.02698516845703125, -0.0258331298828125, -0.02468109130859375, -0.023529052734375, -0.02237701416015625, -0.0212249755859375, -0.02007293701171875, -0.0189208984375, -0.01776885986328125, -0.0166168212890625, -0.01546478271484375, -0.014312744140625, -0.01316070556640625, -0.0120086669921875, -0.01085662841796875, -0.00970458984375, -0.00855255126953125, -0.0074005126953125, -0.00624847412109375, -0.005096435546875, -0.00394439697265625, -0.0027923583984375, -0.00164031982421875, -0.00048828125, 0.00066375732421875, 0.0018157958984375, 0.00296783447265625, 0.004119873046875, 0.00527191162109375, 0.0064239501953125, 0.00757598876953125, 0.00872802734375, 0.00988006591796875, 0.0110321044921875, 0.01218414306640625, 0.013336181640625, 0.01448822021484375, 0.0156402587890625, 0.01679229736328125, 0.0179443359375, 0.01909637451171875, 0.0202484130859375, 0.02140045166015625, 0.022552490234375, 0.02370452880859375, 0.0248565673828125, 0.02600860595703125, 0.02716064453125, 0.02831268310546875, 0.0294647216796875, 0.03061676025390625, 0.031768798828125, 0.03292083740234375, 0.0340728759765625, 0.03522491455078125, 0.036376953125]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 10.0, 6.0, 13.0, 10.0, 15.0, 13.0, 15.0, 14.0, 22.0, 20.0, 27.0, 18.0, 29.0, 27.0, 37.0, 35.0, 53.0, 46.0, 41.0, 46.0, 46.0, 44.0, 43.0, 39.0, 39.0, 35.0, 30.0, 20.0, 25.0, 31.0, 21.0, 18.0, 20.0, 18.0, 12.0, 23.0, 11.0, 3.0, 3.0, 3.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.0155487060546875, -0.015092134475708008, -0.014635562896728516, -0.014178991317749023, -0.013722419738769531, -0.013265848159790039, -0.012809276580810547, -0.012352705001831055, -0.011896133422851562, -0.01143956184387207, -0.010982990264892578, -0.010526418685913086, -0.010069847106933594, -0.009613275527954102, -0.00915670394897461, -0.008700132369995117, -0.008243560791015625, -0.007786989212036133, -0.007330417633056641, -0.0068738460540771484, -0.006417274475097656, -0.005960702896118164, -0.005504131317138672, -0.00504755973815918, -0.0045909881591796875, -0.004134416580200195, -0.003677845001220703, -0.003221273422241211, -0.0027647018432617188, -0.0023081302642822266, -0.0018515586853027344, -0.0013949871063232422, -0.00093841552734375, -0.0004818439483642578, -2.5272369384765625e-05, 0.00043129920959472656, 0.0008878707885742188, 0.001344442367553711, 0.0018010139465332031, 0.0022575855255126953, 0.0027141571044921875, 0.0031707286834716797, 0.003627300262451172, 0.004083871841430664, 0.004540443420410156, 0.0049970149993896484, 0.005453586578369141, 0.005910158157348633, 0.006366729736328125, 0.006823301315307617, 0.007279872894287109, 0.0077364444732666016, 0.008193016052246094, 0.008649587631225586, 0.009106159210205078, 0.00956273078918457, 0.010019302368164062, 0.010475873947143555, 0.010932445526123047, 0.011389017105102539, 0.011845588684082031, 0.012302160263061523, 0.012758731842041016, 0.013215303421020508, 0.013671875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 5.0, 15.0, 23.0, 24.0, 38.0, 56.0, 93.0, 133.0, 218.0, 352.0, 508.0, 770.0, 1283.0, 1926.0, 3268.0, 5192.0, 8808.0, 15275.0, 27324.0, 51744.0, 105165.0, 243054.0, 693803.0, 1818321.0, 733757.0, 253287.0, 109497.0, 53187.0, 28079.0, 15650.0, 9020.0, 5393.0, 3318.0, 2055.0, 1300.0, 777.0, 559.0, 332.0, 214.0, 163.0, 100.0, 65.0, 41.0, 27.0, 30.0, 5.0, 11.0, 3.0, 6.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0298004150390625, -0.0288240909576416, -0.027847766876220703, -0.026871442794799805, -0.025895118713378906, -0.024918794631958008, -0.02394247055053711, -0.02296614646911621, -0.021989822387695312, -0.021013498306274414, -0.020037174224853516, -0.019060850143432617, -0.01808452606201172, -0.01710820198059082, -0.016131877899169922, -0.015155553817749023, -0.014179229736328125, -0.013202905654907227, -0.012226581573486328, -0.01125025749206543, -0.010273933410644531, -0.009297609329223633, -0.008321285247802734, -0.007344961166381836, -0.0063686370849609375, -0.005392313003540039, -0.004415988922119141, -0.003439664840698242, -0.0024633407592773438, -0.0014870166778564453, -0.0005106925964355469, 0.00046563148498535156, 0.00144195556640625, 0.0024182796478271484, 0.003394603729248047, 0.004370927810668945, 0.005347251892089844, 0.006323575973510742, 0.007299900054931641, 0.008276224136352539, 0.009252548217773438, 0.010228872299194336, 0.011205196380615234, 0.012181520462036133, 0.013157844543457031, 0.01413416862487793, 0.015110492706298828, 0.016086816787719727, 0.017063140869140625, 0.018039464950561523, 0.019015789031982422, 0.01999211311340332, 0.02096843719482422, 0.021944761276245117, 0.022921085357666016, 0.023897409439086914, 0.024873733520507812, 0.02585005760192871, 0.02682638168334961, 0.027802705764770508, 0.028779029846191406, 0.029755353927612305, 0.030731678009033203, 0.0317080020904541, 0.032684326171875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 9.0, 16.0, 16.0, 19.0, 19.0, 17.0, 33.0, 42.0, 43.0, 59.0, 68.0, 87.0, 90.0, 121.0, 137.0, 167.0, 172.0, 204.0, 208.0, 255.0, 275.0, 273.0, 293.0, 218.0, 201.0, 189.0, 157.0, 104.0, 101.0, 88.0, 79.0, 55.0, 47.0, 39.0, 34.0, 24.0, 31.0, 12.0, 10.0, 12.0, 8.0, 9.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.007678985595703125, -0.00744551420211792, -0.007212042808532715, -0.00697857141494751, -0.006745100021362305, -0.0065116286277771, -0.0062781572341918945, -0.0060446858406066895, -0.005811214447021484, -0.005577743053436279, -0.005344271659851074, -0.005110800266265869, -0.004877328872680664, -0.004643857479095459, -0.004410386085510254, -0.004176914691925049, -0.003943443298339844, -0.0037099719047546387, -0.0034765005111694336, -0.0032430291175842285, -0.0030095577239990234, -0.0027760863304138184, -0.0025426149368286133, -0.002309143543243408, -0.002075672149658203, -0.001842200756072998, -0.001608729362487793, -0.0013752579689025879, -0.0011417865753173828, -0.0009083151817321777, -0.0006748437881469727, -0.0004413723945617676, -0.0002079010009765625, 2.5570392608642578e-05, 0.00025904178619384766, 0.0004925131797790527, 0.0007259845733642578, 0.0009594559669494629, 0.001192927360534668, 0.001426398754119873, 0.0016598701477050781, 0.0018933415412902832, 0.0021268129348754883, 0.0023602843284606934, 0.0025937557220458984, 0.0028272271156311035, 0.0030606985092163086, 0.0032941699028015137, 0.0035276412963867188, 0.003761112689971924, 0.003994584083557129, 0.004228055477142334, 0.004461526870727539, 0.004694998264312744, 0.004928469657897949, 0.005161941051483154, 0.005395412445068359, 0.0056288838386535645, 0.0058623552322387695, 0.006095826625823975, 0.00632929801940918, 0.006562769412994385, 0.00679624080657959, 0.007029712200164795, 0.00726318359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 11.0, 14.0, 20.0, 20.0, 38.0, 49.0, 68.0, 86.0, 135.0, 142.0, 104.0, 75.0, 60.0, 34.0, 27.0, 25.0, 17.0, 13.0, 13.0, 7.0, 9.0, 3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02560489997267723, -0.024678954854607582, -0.023753009736537933, -0.022827064618468285, -0.021901119500398636, -0.020975174382328987, -0.02004922926425934, -0.01912328414618969, -0.01819733902812004, -0.017271393910050392, -0.016345448791980743, -0.015419503673911095, -0.014493558555841446, -0.013567613437771797, -0.012641668319702148, -0.0117157232016325, -0.010789777152240276, -0.009863832034170628, -0.008937886916100979, -0.00801194179803133, -0.007085996679961681, -0.006160051096230745, -0.005234105978161097, -0.004308160860091448, -0.003382215742021799, -0.0024562706239521503, -0.0015303253894671798, -0.0006043801549822092, 0.00032156496308743954, 0.001247510313987732, 0.0021734554320573807, 0.0030994005501270294, 0.004025345668196678, 0.004951290786266327, 0.005877235904335976, 0.006803181022405624, 0.007729126140475273, 0.008655071258544922, 0.00958101637661457, 0.01050696149468422, 0.011432906612753868, 0.012358851730823517, 0.013284796848893166, 0.014210741966962814, 0.015136687085032463, 0.016062632203102112, 0.01698857732117176, 0.01791452243924141, 0.018840469419956207, 0.019766414538025856, 0.020692359656095505, 0.021618304774165154, 0.022544249892234802, 0.02347019501030445, 0.0243961401283741, 0.02532208524644375, 0.026248030364513397, 0.027173975482583046, 0.028099920600652695, 0.029025865718722343, 0.029951810836791992, 0.03087775595486164, 0.03180370107293129, 0.03272964805364609, 0.03365559130907059]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 11.0, 16.0, 21.0, 16.0, 24.0, 22.0, 26.0, 32.0, 37.0, 35.0, 25.0, 47.0, 46.0, 32.0, 43.0, 41.0, 50.0, 40.0, 41.0, 43.0, 37.0, 35.0, 33.0, 35.0, 25.0, 28.0, 26.0, 27.0, 14.0, 16.0, 14.0, 10.0, 6.0, 8.0, 7.0, 9.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.02004498615860939, -0.01951558329164982, -0.018986178562045097, -0.018456775695085526, -0.017927370965480804, -0.017397968098521233, -0.01686856336891651, -0.01633916050195694, -0.01580975577235222, -0.015280351974070072, -0.014750948175787926, -0.01422154437750578, -0.013692140579223633, -0.013162737712264061, -0.012633333913981915, -0.012103930115699768, -0.011574527248740196, -0.01104512345045805, -0.010515719652175903, -0.009986315853893757, -0.00945691205561161, -0.008927509188652039, -0.008398105390369892, -0.007868701592087746, -0.007339297793805599, -0.006809893995523453, -0.006280490197241306, -0.005751086864620447, -0.005221683066338301, -0.004692279268056154, -0.004162875935435295, -0.0036334721371531487, -0.0031040702015161514, -0.002574666403234005, -0.002045262837782502, -0.0015158591559156775, -0.000986455474048853, -0.00045705167576670647, 7.235188968479633e-05, 0.0006017554551362991, 0.0011311592534184456, 0.0016605629352852702, 0.002189966617152095, 0.0027193701826035976, 0.003248773980885744, 0.0037781777791678905, 0.00430758111178875, 0.004836984910070896, 0.005366388708353043, 0.005895792506635189, 0.0064251963049173355, 0.006954599637538195, 0.007484003435820341, 0.0080134067684412, 0.008542810566723347, 0.009072214365005493, 0.00960161816328764, 0.010131021961569786, 0.010660425759851933, 0.011189829558134079, 0.01171923242509365, 0.012248637154698372, 0.012778040021657944, 0.01330744381994009, 0.013836847618222237]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 5.0, 8.0, 9.0, 10.0, 12.0, 26.0, 29.0, 65.0, 69.0, 118.0, 135.0, 249.0, 389.0, 570.0, 1011.0, 1772.0, 2998.0, 5475.0, 9999.0, 20034.0, 43453.0, 113556.0, 349730.0, 317041.0, 101513.0, 40189.0, 18485.0, 9387.0, 5110.0, 2904.0, 1653.0, 932.0, 581.0, 376.0, 224.0, 156.0, 96.0, 50.0, 42.0, 28.0, 14.0, 25.0, 10.0, 6.0, 6.0, 6.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0258331298828125, -0.024970531463623047, -0.024107933044433594, -0.02324533462524414, -0.022382736206054688, -0.021520137786865234, -0.02065753936767578, -0.019794940948486328, -0.018932342529296875, -0.018069744110107422, -0.01720714569091797, -0.016344547271728516, -0.015481948852539062, -0.01461935043334961, -0.013756752014160156, -0.012894153594970703, -0.01203155517578125, -0.011168956756591797, -0.010306358337402344, -0.00944375991821289, -0.008581161499023438, -0.007718563079833984, -0.006855964660644531, -0.005993366241455078, -0.005130767822265625, -0.004268169403076172, -0.0034055709838867188, -0.0025429725646972656, -0.0016803741455078125, -0.0008177757263183594, 4.482269287109375e-05, 0.0009074211120605469, 0.00177001953125, 0.002632617950439453, 0.0034952163696289062, 0.004357814788818359, 0.0052204132080078125, 0.006083011627197266, 0.006945610046386719, 0.007808208465576172, 0.008670806884765625, 0.009533405303955078, 0.010396003723144531, 0.011258602142333984, 0.012121200561523438, 0.01298379898071289, 0.013846397399902344, 0.014708995819091797, 0.01557159423828125, 0.016434192657470703, 0.017296791076660156, 0.01815938949584961, 0.019021987915039062, 0.019884586334228516, 0.02074718475341797, 0.021609783172607422, 0.022472381591796875, 0.023334980010986328, 0.02419757843017578, 0.025060176849365234, 0.025922775268554688, 0.02678537368774414, 0.027647972106933594, 0.028510570526123047, 0.0293731689453125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 14.0, 12.0, 16.0, 17.0, 17.0, 24.0, 31.0, 29.0, 33.0, 25.0, 46.0, 40.0, 32.0, 48.0, 38.0, 35.0, 48.0, 39.0, 47.0, 46.0, 41.0, 25.0, 34.0, 40.0, 23.0, 30.0, 28.0, 23.0, 12.0, 19.0, 21.0, 8.0, 9.0, 9.0, 5.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0177764892578125, -0.017272114753723145, -0.01676774024963379, -0.016263365745544434, -0.015758991241455078, -0.015254616737365723, -0.014750242233276367, -0.014245867729187012, -0.013741493225097656, -0.0132371187210083, -0.012732744216918945, -0.01222836971282959, -0.011723995208740234, -0.011219620704650879, -0.010715246200561523, -0.010210871696472168, -0.009706497192382812, -0.009202122688293457, -0.008697748184204102, -0.008193373680114746, -0.007688999176025391, -0.007184624671936035, -0.00668025016784668, -0.006175875663757324, -0.005671501159667969, -0.005167126655578613, -0.004662752151489258, -0.004158377647399902, -0.003654003143310547, -0.0031496286392211914, -0.002645254135131836, -0.0021408796310424805, -0.001636505126953125, -0.0011321306228637695, -0.0006277561187744141, -0.0001233816146850586, 0.0003809928894042969, 0.0008853673934936523, 0.0013897418975830078, 0.0018941164016723633, 0.0023984909057617188, 0.0029028654098510742, 0.0034072399139404297, 0.003911614418029785, 0.004415988922119141, 0.004920363426208496, 0.0054247379302978516, 0.005929112434387207, 0.0064334869384765625, 0.006937861442565918, 0.0074422359466552734, 0.007946610450744629, 0.008450984954833984, 0.00895535945892334, 0.009459733963012695, 0.00996410846710205, 0.010468482971191406, 0.010972857475280762, 0.011477231979370117, 0.011981606483459473, 0.012485980987548828, 0.012990355491638184, 0.013494729995727539, 0.013999104499816895, 0.01450347900390625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 11.0, 15.0, 22.0, 20.0, 41.0, 39.0, 53.0, 63.0, 92.0, 134.0, 220.0, 310.0, 463.0, 720.0, 1190.0, 2118.0, 4000.0, 8551.0, 22363.0, 82211.0, 567714.0, 281682.0, 47446.0, 15031.0, 6245.0, 3126.0, 1747.0, 970.0, 677.0, 401.0, 254.0, 183.0, 116.0, 78.0, 44.0, 47.0, 35.0, 20.0, 25.0, 20.0, 19.0, 10.0, 5.0, 8.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.043060302734375, -0.04170703887939453, -0.04035377502441406, -0.039000511169433594, -0.037647247314453125, -0.036293983459472656, -0.03494071960449219, -0.03358745574951172, -0.03223419189453125, -0.03088092803955078, -0.029527664184570312, -0.028174400329589844, -0.026821136474609375, -0.025467872619628906, -0.024114608764648438, -0.02276134490966797, -0.0214080810546875, -0.02005481719970703, -0.018701553344726562, -0.017348289489746094, -0.015995025634765625, -0.014641761779785156, -0.013288497924804688, -0.011935234069824219, -0.01058197021484375, -0.009228706359863281, -0.007875442504882812, -0.006522178649902344, -0.005168914794921875, -0.0038156509399414062, -0.0024623870849609375, -0.0011091232299804688, 0.000244140625, 0.0015974044799804688, 0.0029506683349609375, 0.004303932189941406, 0.005657196044921875, 0.007010459899902344, 0.008363723754882812, 0.009716987609863281, 0.01107025146484375, 0.012423515319824219, 0.013776779174804688, 0.015130043029785156, 0.016483306884765625, 0.017836570739746094, 0.019189834594726562, 0.02054309844970703, 0.0218963623046875, 0.02324962615966797, 0.024602890014648438, 0.025956153869628906, 0.027309417724609375, 0.028662681579589844, 0.030015945434570312, 0.03136920928955078, 0.03272247314453125, 0.03407573699951172, 0.03542900085449219, 0.036782264709472656, 0.038135528564453125, 0.039488792419433594, 0.04084205627441406, 0.04219532012939453, 0.043548583984375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 12.0, 9.0, 13.0, 12.0, 22.0, 27.0, 15.0, 27.0, 27.0, 39.0, 47.0, 40.0, 31.0, 41.0, 53.0, 35.0, 46.0, 59.0, 45.0, 33.0, 40.0, 39.0, 32.0, 34.0, 31.0, 25.0, 21.0, 20.0, 20.0, 20.0, 11.0, 13.0, 15.0, 10.0, 3.0, 8.0, 8.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01010894775390625, -0.009773731231689453, -0.009438514709472656, -0.00910329818725586, -0.008768081665039062, -0.008432865142822266, -0.008097648620605469, -0.007762432098388672, -0.007427215576171875, -0.007091999053955078, -0.006756782531738281, -0.006421566009521484, -0.0060863494873046875, -0.005751132965087891, -0.005415916442871094, -0.005080699920654297, -0.0047454833984375, -0.004410266876220703, -0.004075050354003906, -0.0037398338317871094, -0.0034046173095703125, -0.0030694007873535156, -0.0027341842651367188, -0.002398967742919922, -0.002063751220703125, -0.0017285346984863281, -0.0013933181762695312, -0.0010581016540527344, -0.0007228851318359375, -0.0003876686096191406, -5.245208740234375e-05, 0.0002827644348144531, 0.00061798095703125, 0.0009531974792480469, 0.0012884140014648438, 0.0016236305236816406, 0.0019588470458984375, 0.0022940635681152344, 0.0026292800903320312, 0.002964496612548828, 0.003299713134765625, 0.003634929656982422, 0.003970146179199219, 0.004305362701416016, 0.0046405792236328125, 0.004975795745849609, 0.005311012268066406, 0.005646228790283203, 0.0059814453125, 0.006316661834716797, 0.006651878356933594, 0.006987094879150391, 0.0073223114013671875, 0.007657527923583984, 0.007992744445800781, 0.008327960968017578, 0.008663177490234375, 0.008998394012451172, 0.009333610534667969, 0.009668827056884766, 0.010004043579101562, 0.01033926010131836, 0.010674476623535156, 0.011009693145751953, 0.01134490966796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 10.0, 4.0, 12.0, 26.0, 15.0, 25.0, 46.0, 43.0, 80.0, 63.0, 134.0, 190.0, 263.0, 399.0, 545.0, 756.0, 1203.0, 1665.0, 2596.0, 4076.0, 6712.0, 11295.0, 21156.0, 46616.0, 133781.0, 485027.0, 207695.0, 62340.0, 26419.0, 13686.0, 7842.0, 4759.0, 2950.0, 1981.0, 1275.0, 857.0, 570.0, 395.0, 287.0, 216.0, 157.0, 95.0, 71.0, 61.0, 51.0, 26.0, 26.0, 14.0, 13.0, 6.0, 7.0, 8.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-0.004367828369140625, -0.0042340755462646484, -0.004100322723388672, -0.003966569900512695, -0.0038328170776367188, -0.003699064254760742, -0.0035653114318847656, -0.003431558609008789, -0.0032978057861328125, -0.003164052963256836, -0.0030303001403808594, -0.002896547317504883, -0.0027627944946289062, -0.0026290416717529297, -0.002495288848876953, -0.0023615360260009766, -0.002227783203125, -0.0020940303802490234, -0.001960277557373047, -0.0018265247344970703, -0.0016927719116210938, -0.0015590190887451172, -0.0014252662658691406, -0.001291513442993164, -0.0011577606201171875, -0.001024007797241211, -0.0008902549743652344, -0.0007565021514892578, -0.0006227493286132812, -0.0004889965057373047, -0.0003552436828613281, -0.00022149085998535156, -8.7738037109375e-05, 4.601478576660156e-05, 0.00017976760864257812, 0.0003135204315185547, 0.00044727325439453125, 0.0005810260772705078, 0.0007147789001464844, 0.0008485317230224609, 0.0009822845458984375, 0.001116037368774414, 0.0012497901916503906, 0.0013835430145263672, 0.0015172958374023438, 0.0016510486602783203, 0.0017848014831542969, 0.0019185543060302734, 0.00205230712890625, 0.0021860599517822266, 0.002319812774658203, 0.0024535655975341797, 0.0025873184204101562, 0.002721071243286133, 0.0028548240661621094, 0.002988576889038086, 0.0031223297119140625, 0.003256082534790039, 0.0033898353576660156, 0.003523588180541992, 0.0036573410034179688, 0.0037910938262939453, 0.003924846649169922, 0.0040585994720458984, 0.004192352294921875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 7.0, 4.0, 3.0, 7.0, 15.0, 23.0, 22.0, 25.0, 25.0, 39.0, 63.0, 89.0, 125.0, 147.0, 91.0, 86.0, 37.0, 36.0, 24.0, 30.0, 22.0, 15.0, 16.0, 13.0, 5.0, 5.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.895427703857422e-05, -1.836474984884262e-05, -1.7775222659111023e-05, -1.7185695469379425e-05, -1.6596168279647827e-05, -1.600664108991623e-05, -1.541711390018463e-05, -1.4827586710453033e-05, -1.4238059520721436e-05, -1.3648532330989838e-05, -1.305900514125824e-05, -1.2469477951526642e-05, -1.1879950761795044e-05, -1.1290423572063446e-05, -1.0700896382331848e-05, -1.011136919260025e-05, -9.521842002868652e-06, -8.932314813137054e-06, -8.342787623405457e-06, -7.753260433673859e-06, -7.163733243942261e-06, -6.574206054210663e-06, -5.984678864479065e-06, -5.395151674747467e-06, -4.805624485015869e-06, -4.216097295284271e-06, -3.6265701055526733e-06, -3.0370429158210754e-06, -2.4475157260894775e-06, -1.8579885363578796e-06, -1.2684613466262817e-06, -6.789341568946838e-07, -8.940696716308594e-08, 5.00120222568512e-07, 1.0896474123001099e-06, 1.6791746020317078e-06, 2.2687017917633057e-06, 2.8582289814949036e-06, 3.4477561712265015e-06, 4.037283360958099e-06, 4.626810550689697e-06, 5.216337740421295e-06, 5.805864930152893e-06, 6.395392119884491e-06, 6.984919309616089e-06, 7.574446499347687e-06, 8.163973689079285e-06, 8.753500878810883e-06, 9.34302806854248e-06, 9.932555258274078e-06, 1.0522082448005676e-05, 1.1111609637737274e-05, 1.1701136827468872e-05, 1.229066401720047e-05, 1.2880191206932068e-05, 1.3469718396663666e-05, 1.4059245586395264e-05, 1.4648772776126862e-05, 1.523829996585846e-05, 1.5827827155590057e-05, 1.6417354345321655e-05, 1.7006881535053253e-05, 1.759640872478485e-05, 1.818593591451645e-05, 1.8775463104248047e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 7.0, 13.0, 12.0, 20.0, 32.0, 29.0, 46.0, 80.0, 123.0, 182.0, 317.0, 442.0, 704.0, 1185.0, 1941.0, 3161.0, 5557.0, 10229.0, 19805.0, 41420.0, 97776.0, 276065.0, 356963.0, 128534.0, 51454.0, 23934.0, 12273.0, 6638.0, 3834.0, 2153.0, 1324.0, 776.0, 518.0, 334.0, 221.0, 138.0, 92.0, 73.0, 48.0, 31.0, 24.0, 13.0, 4.0, 11.0, 8.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0030975341796875, -0.0030011534690856934, -0.0029047727584838867, -0.00280839204788208, -0.0027120113372802734, -0.002615630626678467, -0.00251924991607666, -0.0024228692054748535, -0.002326488494873047, -0.0022301077842712402, -0.0021337270736694336, -0.002037346363067627, -0.0019409656524658203, -0.0018445849418640137, -0.001748204231262207, -0.0016518235206604004, -0.0015554428100585938, -0.0014590620994567871, -0.0013626813888549805, -0.0012663006782531738, -0.0011699199676513672, -0.0010735392570495605, -0.000977158546447754, -0.0008807778358459473, -0.0007843971252441406, -0.000688016414642334, -0.0005916357040405273, -0.0004952549934387207, -0.00039887428283691406, -0.0003024935722351074, -0.00020611286163330078, -0.00010973215103149414, -1.33514404296875e-05, 8.302927017211914e-05, 0.00017940998077392578, 0.0002757906913757324, 0.00037217140197753906, 0.0004685521125793457, 0.0005649328231811523, 0.000661313533782959, 0.0007576942443847656, 0.0008540749549865723, 0.0009504556655883789, 0.0010468363761901855, 0.0011432170867919922, 0.0012395977973937988, 0.0013359785079956055, 0.0014323592185974121, 0.0015287399291992188, 0.0016251206398010254, 0.001721501350402832, 0.0018178820610046387, 0.0019142627716064453, 0.002010643482208252, 0.0021070241928100586, 0.0022034049034118652, 0.002299785614013672, 0.0023961663246154785, 0.002492547035217285, 0.002588927745819092, 0.0026853084564208984, 0.002781689167022705, 0.0028780698776245117, 0.0029744505882263184, 0.003070831298828125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 5.0, 8.0, 4.0, 9.0, 11.0, 9.0, 15.0, 13.0, 22.0, 39.0, 32.0, 44.0, 61.0, 70.0, 72.0, 95.0, 88.0, 82.0, 73.0, 55.0, 36.0, 36.0, 24.0, 19.0, 9.0, 16.0, 6.0, 6.0, 4.0, 4.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0011348724365234375, -0.0011012852191925049, -0.0010676980018615723, -0.0010341107845306396, -0.001000523567199707, -0.0009669363498687744, -0.0009333491325378418, -0.0008997619152069092, -0.0008661746978759766, -0.0008325874805450439, -0.0007990002632141113, -0.0007654130458831787, -0.0007318258285522461, -0.0006982386112213135, -0.0006646513938903809, -0.0006310641765594482, -0.0005974769592285156, -0.000563889741897583, -0.0005303025245666504, -0.0004967153072357178, -0.00046312808990478516, -0.00042954087257385254, -0.0003959536552429199, -0.0003623664379119873, -0.0003287792205810547, -0.00029519200325012207, -0.00026160478591918945, -0.00022801756858825684, -0.00019443035125732422, -0.0001608431339263916, -0.00012725591659545898, -9.366869926452637e-05, -6.008148193359375e-05, -2.6494264602661133e-05, 7.092952728271484e-06, 4.06801700592041e-05, 7.426738739013672e-05, 0.00010785460472106934, 0.00014144182205200195, 0.00017502903938293457, 0.0002086162567138672, 0.0002422034740447998, 0.0002757906913757324, 0.00030937790870666504, 0.00034296512603759766, 0.0003765523433685303, 0.0004101395606994629, 0.0004437267780303955, 0.0004773139953613281, 0.0005109012126922607, 0.0005444884300231934, 0.000578075647354126, 0.0006116628646850586, 0.0006452500820159912, 0.0006788372993469238, 0.0007124245166778564, 0.0007460117340087891, 0.0007795989513397217, 0.0008131861686706543, 0.0008467733860015869, 0.0008803606033325195, 0.0009139478206634521, 0.0009475350379943848, 0.0009811222553253174, 0.00101470947265625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 8.0, 8.0, 12.0, 21.0, 24.0, 26.0, 47.0, 58.0, 94.0, 124.0, 150.0, 119.0, 86.0, 54.0, 25.0, 25.0, 24.0, 21.0, 13.0, 12.0, 6.0, 11.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.022909805178642273, -0.022049417719244957, -0.02118903025984764, -0.020328642800450325, -0.01946825534105301, -0.018607867881655693, -0.017747480422258377, -0.01688709296286106, -0.016026705503463745, -0.01516631804406643, -0.014305930584669113, -0.013445543125271797, -0.012585155665874481, -0.011724768206477165, -0.01086438074707985, -0.010003993287682533, -0.009143604896962643, -0.008283217437565327, -0.007422829978168011, -0.006562442518770695, -0.005702055059373379, -0.0048416671343147755, -0.0039812796749174595, -0.0031208922155201435, -0.0022605047561228275, -0.0014001172967255116, -0.0005397297209128737, 0.00032065785489976406, 0.00118104531429708, 0.0020414330065250397, 0.0029018204659223557, 0.0037622079253196716, 0.004622595384716988, 0.005482982844114304, 0.00634337030351162, 0.0072037577629089355, 0.008064145222306252, 0.008924532681703568, 0.009784920141100883, 0.0106453076004982, 0.011505695059895515, 0.012366082519292831, 0.013226469978690147, 0.014086857438087463, 0.01494724489748478, 0.015807632356882095, 0.01666801981627941, 0.017528407275676727, 0.018388796597719193, 0.01924918405711651, 0.020109571516513824, 0.02096995897591114, 0.021830346435308456, 0.022690733894705772, 0.02355112135410309, 0.024411508813500404, 0.02527189627289772, 0.026132283732295036, 0.026992671191692352, 0.02785305865108967, 0.028713446110486984, 0.0295738335698843, 0.030434221029281616, 0.03129461035132408, 0.03215499594807625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 8.0, 12.0, 18.0, 21.0, 19.0, 18.0, 30.0, 25.0, 34.0, 36.0, 32.0, 27.0, 48.0, 49.0, 35.0, 40.0, 48.0, 43.0, 42.0, 47.0, 37.0, 31.0, 35.0, 40.0, 29.0, 25.0, 33.0, 23.0, 24.0, 15.0, 10.0, 16.0, 9.0, 7.0, 9.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.018828339874744415, -0.018327655270695686, -0.017826968804001808, -0.01732628419995308, -0.01682559959590435, -0.01632491499185562, -0.015824228525161743, -0.015323543921113014, -0.01482285838574171, -0.014322172850370407, -0.013821488246321678, -0.013320802710950375, -0.012820117175579071, -0.012319432571530342, -0.011818747036159039, -0.011318061500787735, -0.010817376896739006, -0.010316691361367702, -0.009816006757318974, -0.00931532122194767, -0.008814636617898941, -0.008313951082527637, -0.007813265547156334, -0.007312580477446318, -0.006811895407736301, -0.006311210338026285, -0.005810525268316269, -0.005309839732944965, -0.004809154663234949, -0.004308469593524933, -0.003807784290984273, -0.003307098988443613, -0.0028064120560884476, -0.0023057269863784313, -0.0018050416838377714, -0.0013043564977124333, -0.0008036713115870953, -0.000302986241877079, 0.0001976990606635809, 0.0006983843632042408, 0.001199069432914257, 0.0016997546190395951, 0.002200439805164933, 0.002701125107705593, 0.0032018101774156094, 0.0037024952471256256, 0.004203180782496929, 0.004703865852206945, 0.005204550921916962, 0.005705235991626978, 0.006205921061336994, 0.006706606596708298, 0.007207291666418314, 0.00770797673612833, 0.008208662271499634, 0.008709346875548363, 0.009210032410919666, 0.00971071794629097, 0.010211402550339699, 0.010712088085711002, 0.011212773621082306, 0.011713458225131035, 0.012214143760502338, 0.012714829295873642, 0.013215513899922371]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 8.0, 9.0, 10.0, 6.0, 9.0, 26.0, 29.0, 46.0, 77.0, 85.0, 144.0, 226.0, 316.0, 446.0, 721.0, 926.0, 1325.0, 2065.0, 3044.0, 4591.0, 6932.0, 10429.0, 16307.0, 26854.0, 44274.0, 77877.0, 141259.0, 234726.0, 202521.0, 112028.0, 62536.0, 36123.0, 22085.0, 13738.0, 8821.0, 5800.0, 3912.0, 2572.0, 1698.0, 1233.0, 852.0, 589.0, 428.0, 275.0, 185.0, 107.0, 87.0, 57.0, 47.0, 36.0, 18.0, 16.0, 16.0, 8.0, 4.0, 5.0, 2.0], "bins": [-0.026580810546875, -0.025817155838012695, -0.02505350112915039, -0.024289846420288086, -0.02352619171142578, -0.022762537002563477, -0.021998882293701172, -0.021235227584838867, -0.020471572875976562, -0.019707918167114258, -0.018944263458251953, -0.01818060874938965, -0.017416954040527344, -0.01665329933166504, -0.015889644622802734, -0.01512598991394043, -0.014362335205078125, -0.01359868049621582, -0.012835025787353516, -0.012071371078491211, -0.011307716369628906, -0.010544061660766602, -0.009780406951904297, -0.009016752243041992, -0.008253097534179688, -0.007489442825317383, -0.006725788116455078, -0.0059621334075927734, -0.005198478698730469, -0.004434823989868164, -0.0036711692810058594, -0.0029075145721435547, -0.00214385986328125, -0.0013802051544189453, -0.0006165504455566406, 0.00014710426330566406, 0.0009107589721679688, 0.0016744136810302734, 0.002438068389892578, 0.003201723098754883, 0.0039653778076171875, 0.004729032516479492, 0.005492687225341797, 0.0062563419342041016, 0.007019996643066406, 0.007783651351928711, 0.008547306060791016, 0.00931096076965332, 0.010074615478515625, 0.01083827018737793, 0.011601924896240234, 0.012365579605102539, 0.013129234313964844, 0.013892889022827148, 0.014656543731689453, 0.015420198440551758, 0.016183853149414062, 0.016947507858276367, 0.017711162567138672, 0.018474817276000977, 0.01923847198486328, 0.020002126693725586, 0.02076578140258789, 0.021529436111450195, 0.0222930908203125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 7.0, 8.0, 14.0, 15.0, 21.0, 24.0, 18.0, 32.0, 24.0, 25.0, 33.0, 39.0, 41.0, 43.0, 42.0, 42.0, 46.0, 43.0, 44.0, 37.0, 42.0, 44.0, 24.0, 35.0, 34.0, 26.0, 33.0, 24.0, 21.0, 24.0, 14.0, 13.0, 9.0, 11.0, 12.0, 5.0, 5.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0144195556640625, -0.014011859893798828, -0.013604164123535156, -0.013196468353271484, -0.012788772583007812, -0.01238107681274414, -0.011973381042480469, -0.011565685272216797, -0.011157989501953125, -0.010750293731689453, -0.010342597961425781, -0.00993490219116211, -0.009527206420898438, -0.009119510650634766, -0.008711814880371094, -0.008304119110107422, -0.00789642333984375, -0.007488727569580078, -0.007081031799316406, -0.006673336029052734, -0.0062656402587890625, -0.005857944488525391, -0.005450248718261719, -0.005042552947998047, -0.004634857177734375, -0.004227161407470703, -0.0038194656372070312, -0.0034117698669433594, -0.0030040740966796875, -0.0025963783264160156, -0.0021886825561523438, -0.0017809867858886719, -0.001373291015625, -0.0009655952453613281, -0.0005578994750976562, -0.00015020370483398438, 0.0002574920654296875, 0.0006651878356933594, 0.0010728836059570312, 0.0014805793762207031, 0.001888275146484375, 0.002295970916748047, 0.0027036666870117188, 0.0031113624572753906, 0.0035190582275390625, 0.003926753997802734, 0.004334449768066406, 0.004742145538330078, 0.00514984130859375, 0.005557537078857422, 0.005965232849121094, 0.006372928619384766, 0.0067806243896484375, 0.007188320159912109, 0.007596015930175781, 0.008003711700439453, 0.008411407470703125, 0.008819103240966797, 0.009226799011230469, 0.00963449478149414, 0.010042190551757812, 0.010449886322021484, 0.010857582092285156, 0.011265277862548828, 0.0116729736328125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 12.0, 15.0, 27.0, 33.0, 40.0, 78.0, 121.0, 185.0, 299.0, 409.0, 670.0, 1053.0, 1743.0, 2798.0, 4747.0, 7798.0, 13645.0, 23851.0, 43319.0, 83165.0, 167329.0, 290758.0, 195492.0, 96330.0, 50000.0, 26922.0, 15177.0, 8893.0, 5226.0, 3228.0, 1853.0, 1209.0, 787.0, 478.0, 285.0, 198.0, 130.0, 84.0, 56.0, 41.0, 24.0, 17.0, 10.0, 5.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02618408203125, -0.025328636169433594, -0.024473190307617188, -0.02361774444580078, -0.022762298583984375, -0.02190685272216797, -0.021051406860351562, -0.020195960998535156, -0.01934051513671875, -0.018485069274902344, -0.017629623413085938, -0.01677417755126953, -0.015918731689453125, -0.015063285827636719, -0.014207839965820312, -0.013352394104003906, -0.0124969482421875, -0.011641502380371094, -0.010786056518554688, -0.009930610656738281, -0.009075164794921875, -0.008219718933105469, -0.0073642730712890625, -0.006508827209472656, -0.00565338134765625, -0.004797935485839844, -0.0039424896240234375, -0.0030870437622070312, -0.002231597900390625, -0.0013761520385742188, -0.0005207061767578125, 0.00033473968505859375, 0.001190185546875, 0.0020456314086914062, 0.0029010772705078125, 0.0037565231323242188, 0.004611968994140625, 0.005467414855957031, 0.0063228607177734375, 0.007178306579589844, 0.00803375244140625, 0.008889198303222656, 0.009744644165039062, 0.010600090026855469, 0.011455535888671875, 0.012310981750488281, 0.013166427612304688, 0.014021873474121094, 0.0148773193359375, 0.015732765197753906, 0.016588211059570312, 0.01744365692138672, 0.018299102783203125, 0.01915454864501953, 0.020009994506835938, 0.020865440368652344, 0.02172088623046875, 0.022576332092285156, 0.023431777954101562, 0.02428722381591797, 0.025142669677734375, 0.02599811553955078, 0.026853561401367188, 0.027709007263183594, 0.028564453125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 7.0, 5.0, 9.0, 17.0, 14.0, 18.0, 20.0, 21.0, 19.0, 28.0, 29.0, 34.0, 35.0, 31.0, 35.0, 41.0, 27.0, 44.0, 44.0, 42.0, 49.0, 30.0, 44.0, 33.0, 42.0, 25.0, 39.0, 35.0, 30.0, 21.0, 23.0, 26.0, 17.0, 7.0, 14.0, 15.0, 9.0, 2.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007568359375, -0.007318854331970215, -0.00706934928894043, -0.0068198442459106445, -0.006570339202880859, -0.006320834159851074, -0.006071329116821289, -0.005821824073791504, -0.005572319030761719, -0.005322813987731934, -0.0050733089447021484, -0.004823803901672363, -0.004574298858642578, -0.004324793815612793, -0.004075288772583008, -0.0038257837295532227, -0.0035762786865234375, -0.0033267736434936523, -0.003077268600463867, -0.002827763557434082, -0.002578258514404297, -0.0023287534713745117, -0.0020792484283447266, -0.0018297433853149414, -0.0015802383422851562, -0.001330733299255371, -0.001081228256225586, -0.0008317232131958008, -0.0005822181701660156, -0.00033271312713623047, -8.320808410644531e-05, 0.00016629695892333984, 0.000415802001953125, 0.0006653070449829102, 0.0009148120880126953, 0.0011643171310424805, 0.0014138221740722656, 0.0016633272171020508, 0.001912832260131836, 0.002162337303161621, 0.0024118423461914062, 0.0026613473892211914, 0.0029108524322509766, 0.0031603574752807617, 0.003409862518310547, 0.003659367561340332, 0.003908872604370117, 0.004158377647399902, 0.0044078826904296875, 0.004657387733459473, 0.004906892776489258, 0.005156397819519043, 0.005405902862548828, 0.005655407905578613, 0.0059049129486083984, 0.006154417991638184, 0.006403923034667969, 0.006653428077697754, 0.006902933120727539, 0.007152438163757324, 0.007401943206787109, 0.0076514482498168945, 0.00790095329284668, 0.008150458335876465, 0.00839996337890625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 10.0, 9.0, 14.0, 19.0, 24.0, 31.0, 41.0, 55.0, 101.0, 134.0, 182.0, 234.0, 388.0, 563.0, 900.0, 1316.0, 2150.0, 3273.0, 5675.0, 10038.0, 19188.0, 42003.0, 753905.0, 134404.0, 34563.0, 16647.0, 8960.0, 4979.0, 3112.0, 1880.0, 1218.0, 830.0, 496.0, 341.0, 279.0, 172.0, 132.0, 81.0, 65.0, 41.0, 32.0, 21.0, 17.0, 15.0, 4.0, 7.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.01300811767578125, -0.012612700462341309, -0.012217283248901367, -0.011821866035461426, -0.011426448822021484, -0.011031031608581543, -0.010635614395141602, -0.01024019718170166, -0.009844779968261719, -0.009449362754821777, -0.009053945541381836, -0.008658528327941895, -0.008263111114501953, -0.007867693901062012, -0.00747227668762207, -0.007076859474182129, -0.0066814422607421875, -0.006286025047302246, -0.005890607833862305, -0.005495190620422363, -0.005099773406982422, -0.0047043561935424805, -0.004308938980102539, -0.003913521766662598, -0.0035181045532226562, -0.003122687339782715, -0.0027272701263427734, -0.002331852912902832, -0.0019364356994628906, -0.0015410184860229492, -0.0011456012725830078, -0.0007501840591430664, -0.000354766845703125, 4.0650367736816406e-05, 0.0004360675811767578, 0.0008314847946166992, 0.0012269020080566406, 0.001622319221496582, 0.0020177364349365234, 0.002413153648376465, 0.0028085708618164062, 0.0032039880752563477, 0.003599405288696289, 0.0039948225021362305, 0.004390239715576172, 0.004785656929016113, 0.005181074142456055, 0.005576491355895996, 0.0059719085693359375, 0.006367325782775879, 0.00676274299621582, 0.007158160209655762, 0.007553577423095703, 0.007948994636535645, 0.008344411849975586, 0.008739829063415527, 0.009135246276855469, 0.00953066349029541, 0.009926080703735352, 0.010321497917175293, 0.010716915130615234, 0.011112332344055176, 0.011507749557495117, 0.011903166770935059, 0.012298583984375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 9.0, 3.0, 8.0, 10.0, 6.0, 14.0, 13.0, 19.0, 20.0, 21.0, 45.0, 55.0, 104.0, 73.0, 121.0, 67.0, 90.0, 78.0, 51.0, 47.0, 29.0, 21.0, 16.0, 8.0, 9.0, 3.0, 9.0, 10.0, 7.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.304813385009766e-06, -5.161389708518982e-06, -5.017966032028198e-06, -4.8745423555374146e-06, -4.731118679046631e-06, -4.587695002555847e-06, -4.4442713260650635e-06, -4.30084764957428e-06, -4.157423973083496e-06, -4.014000296592712e-06, -3.870576620101929e-06, -3.727152943611145e-06, -3.5837292671203613e-06, -3.4403055906295776e-06, -3.296881914138794e-06, -3.1534582376480103e-06, -3.0100345611572266e-06, -2.866610884666443e-06, -2.723187208175659e-06, -2.5797635316848755e-06, -2.436339855194092e-06, -2.292916178703308e-06, -2.1494925022125244e-06, -2.0060688257217407e-06, -1.862645149230957e-06, -1.7192214727401733e-06, -1.5757977962493896e-06, -1.432374119758606e-06, -1.2889504432678223e-06, -1.1455267667770386e-06, -1.0021030902862549e-06, -8.586794137954712e-07, -7.152557373046875e-07, -5.718320608139038e-07, -4.284083843231201e-07, -2.849847078323364e-07, -1.4156103134155273e-07, 1.862645149230957e-09, 1.4528632164001465e-07, 2.8870999813079834e-07, 4.3213367462158203e-07, 5.755573511123657e-07, 7.189810276031494e-07, 8.624047040939331e-07, 1.0058283805847168e-06, 1.1492520570755005e-06, 1.2926757335662842e-06, 1.4360994100570679e-06, 1.5795230865478516e-06, 1.7229467630386353e-06, 1.866370439529419e-06, 2.0097941160202026e-06, 2.1532177925109863e-06, 2.29664146900177e-06, 2.4400651454925537e-06, 2.5834888219833374e-06, 2.726912498474121e-06, 2.8703361749649048e-06, 3.0137598514556885e-06, 3.157183527946472e-06, 3.300607204437256e-06, 3.4440308809280396e-06, 3.5874545574188232e-06, 3.730878233909607e-06, 3.874301910400391e-06]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 7.0, 11.0, 17.0, 18.0, 21.0, 37.0, 43.0, 79.0, 114.0, 179.0, 255.0, 375.0, 564.0, 900.0, 1366.0, 2164.0, 3472.0, 5925.0, 10488.0, 21615.0, 55396.0, 803029.0, 82910.0, 28228.0, 13088.0, 7132.0, 4114.0, 2500.0, 1603.0, 982.0, 642.0, 411.0, 270.0, 183.0, 136.0, 77.0, 63.0, 41.0, 34.0, 16.0, 16.0, 13.0, 9.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.01323699951171875, -0.012843728065490723, -0.012450456619262695, -0.012057185173034668, -0.01166391372680664, -0.011270642280578613, -0.010877370834350586, -0.010484099388122559, -0.010090827941894531, -0.009697556495666504, -0.009304285049438477, -0.00891101360321045, -0.008517742156982422, -0.008124470710754395, -0.007731199264526367, -0.00733792781829834, -0.0069446563720703125, -0.006551384925842285, -0.006158113479614258, -0.0057648420333862305, -0.005371570587158203, -0.004978299140930176, -0.0045850276947021484, -0.004191756248474121, -0.0037984848022460938, -0.0034052133560180664, -0.003011941909790039, -0.0026186704635620117, -0.0022253990173339844, -0.001832127571105957, -0.0014388561248779297, -0.0010455846786499023, -0.000652313232421875, -0.00025904178619384766, 0.0001342296600341797, 0.000527501106262207, 0.0009207725524902344, 0.0013140439987182617, 0.001707315444946289, 0.0021005868911743164, 0.0024938583374023438, 0.002887129783630371, 0.0032804012298583984, 0.0036736726760864258, 0.004066944122314453, 0.0044602155685424805, 0.004853487014770508, 0.005246758460998535, 0.0056400299072265625, 0.00603330135345459, 0.006426572799682617, 0.0068198442459106445, 0.007213115692138672, 0.007606387138366699, 0.007999658584594727, 0.008392930030822754, 0.008786201477050781, 0.009179472923278809, 0.009572744369506836, 0.009966015815734863, 0.01035928726196289, 0.010752558708190918, 0.011145830154418945, 0.011539101600646973, 0.011932373046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 9.0, 5.0, 8.0, 10.0, 15.0, 16.0, 24.0, 24.0, 33.0, 40.0, 472.0, 156.0, 21.0, 30.0, 19.0, 16.0, 20.0, 15.0, 11.0, 3.0, 5.0, 4.0, 5.0, 6.0, 6.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00345611572265625, -0.003354191780090332, -0.003252267837524414, -0.003150343894958496, -0.003048419952392578, -0.00294649600982666, -0.002844572067260742, -0.0027426481246948242, -0.0026407241821289062, -0.0025388002395629883, -0.0024368762969970703, -0.0023349523544311523, -0.0022330284118652344, -0.0021311044692993164, -0.0020291805267333984, -0.0019272565841674805, -0.0018253326416015625, -0.0017234086990356445, -0.0016214847564697266, -0.0015195608139038086, -0.0014176368713378906, -0.0013157129287719727, -0.0012137889862060547, -0.0011118650436401367, -0.0010099411010742188, -0.0009080171585083008, -0.0008060932159423828, -0.0007041692733764648, -0.0006022453308105469, -0.0005003213882446289, -0.00039839744567871094, -0.00029647350311279297, -0.000194549560546875, -9.262561798095703e-05, 9.298324584960938e-06, 0.0001112222671508789, 0.00021314620971679688, 0.00031507015228271484, 0.0004169940948486328, 0.0005189180374145508, 0.0006208419799804688, 0.0007227659225463867, 0.0008246898651123047, 0.0009266138076782227, 0.0010285377502441406, 0.0011304616928100586, 0.0012323856353759766, 0.0013343095779418945, 0.0014362335205078125, 0.0015381574630737305, 0.0016400814056396484, 0.0017420053482055664, 0.0018439292907714844, 0.0019458532333374023, 0.0020477771759033203, 0.0021497011184692383, 0.0022516250610351562, 0.0023535490036010742, 0.002455472946166992, 0.00255739688873291, 0.002659320831298828, 0.002761244773864746, 0.002863168716430664, 0.002965092658996582, 0.0030670166015625]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 11.0, 9.0, 11.0, 18.0, 15.0, 24.0, 45.0, 51.0, 72.0, 98.0, 150.0, 138.0, 89.0, 63.0, 49.0, 31.0, 25.0, 20.0, 9.0, 6.0, 16.0, 11.0, 8.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02014574594795704, -0.019432228058576584, -0.01871870830655098, -0.018005188554525375, -0.01729167066514492, -0.016578152775764465, -0.01586463302373886, -0.015151114203035831, -0.014437595382332802, -0.013724076561629772, -0.013010557740926743, -0.012297038920223713, -0.011583520099520683, -0.010870001278817654, -0.010156482458114624, -0.009442963637411594, -0.008729444816708565, -0.008015925996005535, -0.0073024071753025055, -0.006588888354599476, -0.005875369533896446, -0.005161850713193417, -0.004448331892490387, -0.0037348130717873573, -0.0030212942510843277, -0.002307775430381298, -0.0015942566096782684, -0.0008807377889752388, -0.00016721896827220917, 0.0005462998524308205, 0.00125981867313385, 0.0019733374938368797, 0.0026868563145399094, 0.003400375135242939, 0.004113893955945969, 0.004827412776648998, 0.005540931597352028, 0.0062544504180550575, 0.006967969238758087, 0.007681488059461117, 0.008395006880164146, 0.009108525700867176, 0.009822044521570206, 0.010535563342273235, 0.011249082162976265, 0.011962600983679295, 0.012676119804382324, 0.013389638625085354, 0.014103157445788383, 0.014816676266491413, 0.015530195087194443, 0.016243714839220047, 0.016957232728600502, 0.017670750617980957, 0.01838427037000656, 0.019097790122032166, 0.01981130801141262, 0.020524825900793076, 0.02123834565281868, 0.021951865404844284, 0.02266538329422474, 0.023378901183605194, 0.0240924209356308, 0.024805940687656403, 0.025519458577036858]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 2.0, 2.0, 9.0, 3.0, 5.0, 14.0, 13.0, 16.0, 25.0, 26.0, 24.0, 37.0, 38.0, 26.0, 31.0, 48.0, 46.0, 58.0, 54.0, 45.0, 48.0, 47.0, 55.0, 46.0, 41.0, 34.0, 37.0, 25.0, 32.0, 20.0, 19.0, 18.0, 14.0, 9.0, 14.0, 5.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.0207980889827013, -0.020295774564146996, -0.01979346200823784, -0.019291147589683533, -0.018788833171129227, -0.01828651875257492, -0.017784204334020615, -0.017281891778111458, -0.016779577359557152, -0.016277262941002846, -0.01577495038509369, -0.015272635966539383, -0.014770321547985077, -0.014268007129430771, -0.01376569364219904, -0.013263380154967308, -0.012761065736413002, -0.012258751317858696, -0.011756437830626965, -0.011254124343395233, -0.010751809924840927, -0.010249495506286621, -0.00974718201905489, -0.009244868531823158, -0.008742554113268852, -0.008240239694714546, -0.007737926207482815, -0.007235612254589796, -0.006733298301696777, -0.006230984348803759, -0.00572867039591074, -0.005226356443017721, -0.004724044352769852, -0.004221730399876833, -0.0037194164469838142, -0.0032171024940907955, -0.002714788541197777, -0.002212474588304758, -0.0017101606354117393, -0.0012078466825187206, -0.0007055327296257019, -0.00020321877673268318, 0.00029909517616033554, 0.0008014091290533543, 0.001303723081946373, 0.0018060370348393917, 0.0023083509877324104, 0.002810664940625429, 0.003312978893518448, 0.0038152928464114666, 0.004317606799304485, 0.004819920752197504, 0.005322234705090523, 0.0058245486579835415, 0.00632686261087656, 0.006829176563769579, 0.007331490516662598, 0.007833804935216904, 0.008336118422448635, 0.008838431909680367, 0.009340746328234673, 0.009843060746788979, 0.01034537423402071, 0.010847687721252441, 0.011350002139806747]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 9.0, 11.0, 11.0, 27.0, 45.0, 44.0, 66.0, 102.0, 142.0, 237.0, 328.0, 540.0, 963.0, 1458.0, 2554.0, 4372.0, 7741.0, 14840.0, 28443.0, 60609.0, 148341.0, 501550.0, 2294975.0, 786314.0, 193769.0, 74925.0, 34622.0, 17179.0, 9070.0, 4781.0, 2659.0, 1492.0, 835.0, 495.0, 303.0, 149.0, 107.0, 75.0, 39.0, 17.0, 11.0, 15.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0], "bins": [-0.0311737060546875, -0.03036665916442871, -0.029559612274169922, -0.028752565383911133, -0.027945518493652344, -0.027138471603393555, -0.026331424713134766, -0.025524377822875977, -0.024717330932617188, -0.0239102840423584, -0.02310323715209961, -0.02229619026184082, -0.02148914337158203, -0.020682096481323242, -0.019875049591064453, -0.019068002700805664, -0.018260955810546875, -0.017453908920288086, -0.016646862030029297, -0.015839815139770508, -0.015032768249511719, -0.01422572135925293, -0.01341867446899414, -0.012611627578735352, -0.011804580688476562, -0.010997533798217773, -0.010190486907958984, -0.009383440017700195, -0.008576393127441406, -0.007769346237182617, -0.006962299346923828, -0.006155252456665039, -0.00534820556640625, -0.004541158676147461, -0.003734111785888672, -0.002927064895629883, -0.0021200180053710938, -0.0013129711151123047, -0.0005059242248535156, 0.00030112266540527344, 0.0011081695556640625, 0.0019152164459228516, 0.0027222633361816406, 0.0035293102264404297, 0.004336357116699219, 0.005143404006958008, 0.005950450897216797, 0.006757497787475586, 0.007564544677734375, 0.008371591567993164, 0.009178638458251953, 0.009985685348510742, 0.010792732238769531, 0.01159977912902832, 0.01240682601928711, 0.013213872909545898, 0.014020919799804688, 0.014827966690063477, 0.015635013580322266, 0.016442060470581055, 0.017249107360839844, 0.018056154251098633, 0.018863201141357422, 0.01967024803161621, 0.020477294921875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 7.0, 6.0, 19.0, 18.0, 13.0, 17.0, 33.0, 28.0, 37.0, 32.0, 35.0, 46.0, 51.0, 50.0, 58.0, 51.0, 48.0, 51.0, 55.0, 42.0, 39.0, 38.0, 37.0, 34.0, 25.0, 16.0, 21.0, 18.0, 16.0, 15.0, 11.0, 4.0, 8.0, 8.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.01309967041015625, -0.012785494327545166, -0.012471318244934082, -0.012157142162322998, -0.011842966079711914, -0.01152878999710083, -0.011214613914489746, -0.010900437831878662, -0.010586261749267578, -0.010272085666656494, -0.00995790958404541, -0.009643733501434326, -0.009329557418823242, -0.009015381336212158, -0.008701205253601074, -0.00838702917098999, -0.008072853088378906, -0.007758677005767822, -0.007444500923156738, -0.007130324840545654, -0.00681614875793457, -0.006501972675323486, -0.006187796592712402, -0.005873620510101318, -0.005559444427490234, -0.00524526834487915, -0.004931092262268066, -0.004616916179656982, -0.0043027400970458984, -0.0039885640144348145, -0.0036743879318237305, -0.0033602118492126465, -0.0030460357666015625, -0.0027318596839904785, -0.0024176836013793945, -0.0021035075187683105, -0.0017893314361572266, -0.0014751553535461426, -0.0011609792709350586, -0.0008468031883239746, -0.0005326271057128906, -0.00021845102310180664, 9.572505950927734e-05, 0.00040990114212036133, 0.0007240772247314453, 0.0010382533073425293, 0.0013524293899536133, 0.0016666054725646973, 0.0019807815551757812, 0.0022949576377868652, 0.0026091337203979492, 0.002923309803009033, 0.003237485885620117, 0.003551661968231201, 0.003865838050842285, 0.004180014133453369, 0.004494190216064453, 0.004808366298675537, 0.005122542381286621, 0.005436718463897705, 0.005750894546508789, 0.006065070629119873, 0.006379246711730957, 0.006693422794342041, 0.007007598876953125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 5.0, 13.0, 14.0, 26.0, 35.0, 49.0, 73.0, 91.0, 133.0, 209.0, 271.0, 371.0, 508.0, 771.0, 1131.0, 1561.0, 2224.0, 3294.0, 4864.0, 7784.0, 11932.0, 19089.0, 30541.0, 50699.0, 88330.0, 166443.0, 352148.0, 894745.0, 1414275.0, 586367.0, 251486.0, 125571.0, 68889.0, 40696.0, 24401.0, 15180.0, 9934.0, 6336.0, 4223.0, 2855.0, 2000.0, 1380.0, 971.0, 714.0, 495.0, 342.0, 243.0, 197.0, 112.0, 84.0, 65.0, 49.0, 25.0, 17.0, 13.0, 5.0, 9.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.013214111328125, -0.012791752815246582, -0.012369394302368164, -0.011947035789489746, -0.011524677276611328, -0.01110231876373291, -0.010679960250854492, -0.010257601737976074, -0.009835243225097656, -0.009412884712219238, -0.00899052619934082, -0.008568167686462402, -0.008145809173583984, -0.007723450660705566, -0.0073010921478271484, -0.0068787336349487305, -0.0064563751220703125, -0.0060340166091918945, -0.0056116580963134766, -0.005189299583435059, -0.004766941070556641, -0.004344582557678223, -0.003922224044799805, -0.0034998655319213867, -0.0030775070190429688, -0.0026551485061645508, -0.002232789993286133, -0.0018104314804077148, -0.0013880729675292969, -0.0009657144546508789, -0.0005433559417724609, -0.00012099742889404297, 0.000301361083984375, 0.000723719596862793, 0.001146078109741211, 0.001568436622619629, 0.001990795135498047, 0.002413153648376465, 0.002835512161254883, 0.0032578706741333008, 0.0036802291870117188, 0.004102587699890137, 0.004524946212768555, 0.004947304725646973, 0.005369663238525391, 0.005792021751403809, 0.0062143802642822266, 0.0066367387771606445, 0.0070590972900390625, 0.0074814558029174805, 0.007903814315795898, 0.008326172828674316, 0.008748531341552734, 0.009170889854431152, 0.00959324836730957, 0.010015606880187988, 0.010437965393066406, 0.010860323905944824, 0.011282682418823242, 0.01170504093170166, 0.012127399444580078, 0.012549757957458496, 0.012972116470336914, 0.013394474983215332, 0.01381683349609375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 6.0, 5.0, 6.0, 8.0, 9.0, 12.0, 17.0, 20.0, 37.0, 33.0, 34.0, 55.0, 52.0, 80.0, 98.0, 123.0, 133.0, 145.0, 179.0, 206.0, 223.0, 265.0, 263.0, 309.0, 248.0, 230.0, 215.0, 206.0, 169.0, 129.0, 110.0, 98.0, 82.0, 65.0, 45.0, 29.0, 21.0, 30.0, 18.0, 15.0, 8.0, 8.0, 3.0, 8.0, 4.0, 2.0, 2.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004161834716796875, -0.004023134708404541, -0.003884434700012207, -0.003745734691619873, -0.003607034683227539, -0.003468334674835205, -0.003329634666442871, -0.003190934658050537, -0.003052234649658203, -0.002913534641265869, -0.002774834632873535, -0.002636134624481201, -0.002497434616088867, -0.002358734607696533, -0.0022200345993041992, -0.0020813345909118652, -0.0019426345825195312, -0.0018039345741271973, -0.0016652345657348633, -0.0015265345573425293, -0.0013878345489501953, -0.0012491345405578613, -0.0011104345321655273, -0.0009717345237731934, -0.0008330345153808594, -0.0006943345069885254, -0.0005556344985961914, -0.0004169344902038574, -0.00027823448181152344, -0.00013953447341918945, -8.344650268554688e-07, 0.00013786554336547852, 0.0002765655517578125, 0.0004152655601501465, 0.0005539655685424805, 0.0006926655769348145, 0.0008313655853271484, 0.0009700655937194824, 0.0011087656021118164, 0.0012474656105041504, 0.0013861656188964844, 0.0015248656272888184, 0.0016635656356811523, 0.0018022656440734863, 0.0019409656524658203, 0.0020796656608581543, 0.0022183656692504883, 0.0023570656776428223, 0.0024957656860351562, 0.0026344656944274902, 0.0027731657028198242, 0.002911865711212158, 0.003050565719604492, 0.003189265727996826, 0.00332796573638916, 0.003466665744781494, 0.003605365753173828, 0.003744065761566162, 0.003882765769958496, 0.00402146577835083, 0.004160165786743164, 0.004298865795135498, 0.004437565803527832, 0.004576265811920166, 0.0047149658203125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 6.0, 5.0, 8.0, 14.0, 20.0, 31.0, 45.0, 62.0, 96.0, 125.0, 145.0, 151.0, 83.0, 56.0, 45.0, 25.0, 20.0, 12.0, 15.0, 4.0, 6.0, 6.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02188003435730934, -0.021284710615873337, -0.02068938873708248, -0.020094066858291626, -0.01949874311685562, -0.018903419375419617, -0.01830809749662876, -0.017712775617837906, -0.0171174518764019, -0.016522128134965897, -0.01592680625617504, -0.015331483446061611, -0.014736160635948181, -0.014140837825834751, -0.013545515015721321, -0.012950192205607891, -0.012354869395494461, -0.011759546585381031, -0.011164223775267601, -0.010568900965154171, -0.009973578155040741, -0.009378255344927311, -0.008782932534813881, -0.008187609724700451, -0.007592286914587021, -0.006996964104473591, -0.006401641294360161, -0.005806318484246731, -0.005210995674133301, -0.004615672864019871, -0.004020350053906441, -0.0034250272437930107, -0.00282970629632473, -0.0022343834862113, -0.0016390606760978699, -0.0010437378659844398, -0.0004484150558710098, 0.0001469077542424202, 0.0007422305643558502, 0.0013375533744692802, 0.0019328761845827103, 0.0025281989946961403, 0.0031235218048095703, 0.0037188446149230003, 0.00431416742503643, 0.00490949023514986, 0.00550481304526329, 0.00610013585537672, 0.0066954586654901505, 0.0072907814756035805, 0.00788610428571701, 0.00848142709583044, 0.00907674990594387, 0.0096720727160573, 0.01026739552617073, 0.01086271833628416, 0.01145804114639759, 0.01205336395651102, 0.01264868676662445, 0.01324400957673788, 0.01383933238685131, 0.01443465519696474, 0.01502997800707817, 0.015625301748514175, 0.01622062362730503]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 11.0, 8.0, 12.0, 14.0, 17.0, 34.0, 26.0, 32.0, 28.0, 40.0, 46.0, 49.0, 57.0, 40.0, 42.0, 50.0, 48.0, 53.0, 41.0, 65.0, 40.0, 35.0, 38.0, 34.0, 23.0, 25.0, 16.0, 18.0, 12.0, 18.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.01368509978055954, -0.013337675482034683, -0.012990251183509827, -0.01264282688498497, -0.012295402586460114, -0.011947978287935257, -0.0116005539894104, -0.011253129690885544, -0.010905705392360687, -0.01055828109383583, -0.010210856795310974, -0.009863432496786118, -0.009516008198261261, -0.009168583899736404, -0.008821159601211548, -0.008473735302686691, -0.008126311004161835, -0.007778886705636978, -0.007431462407112122, -0.007084038108587265, -0.0067366138100624084, -0.006389189511537552, -0.006041765213012695, -0.005694340914487839, -0.005346917547285557, -0.0049994932487607, -0.004652068950235844, -0.004304644651710987, -0.0039572203531861305, -0.003609796054661274, -0.003262371988967061, -0.0029149476904422045, -0.0025675231590867043, -0.0022200988605618477, -0.0018726745620369911, -0.0015252503799274564, -0.0011778260814025998, -0.0008304017828777432, -0.0004829776007682085, -0.00013555330224335194, 0.00021187099628150463, 0.0005592952948063612, 0.0009067195351235569, 0.0012541437754407525, 0.001601568073965609, 0.0019489923724904656, 0.0022964165546000004, 0.002643840853124857, 0.0029912651516497135, 0.00333868945017457, 0.0036861137486994267, 0.004033538047224283, 0.00438096234574914, 0.004728386644273996, 0.005075810477137566, 0.005423234775662422, 0.005770659074187279, 0.006118083372712135, 0.006465507671236992, 0.0068129319697618484, 0.007160356268286705, 0.007507780566811562, 0.007855204865336418, 0.008202629163861275, 0.008550053462386131]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 10.0, 9.0, 10.0, 25.0, 30.0, 45.0, 65.0, 87.0, 152.0, 246.0, 384.0, 601.0, 889.0, 1278.0, 2053.0, 3301.0, 5378.0, 9368.0, 16398.0, 31390.0, 65684.0, 157816.0, 355615.0, 220670.0, 88118.0, 40069.0, 20420.0, 11137.0, 6453.0, 3942.0, 2454.0, 1574.0, 1041.0, 613.0, 421.0, 282.0, 174.0, 122.0, 95.0, 55.0, 28.0, 17.0, 18.0, 13.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.015380859375, -0.014862537384033203, -0.014344215393066406, -0.01382589340209961, -0.013307571411132812, -0.012789249420166016, -0.012270927429199219, -0.011752605438232422, -0.011234283447265625, -0.010715961456298828, -0.010197639465332031, -0.009679317474365234, -0.009160995483398438, -0.00864267349243164, -0.008124351501464844, -0.007606029510498047, -0.00708770751953125, -0.006569385528564453, -0.006051063537597656, -0.005532741546630859, -0.0050144195556640625, -0.004496097564697266, -0.003977775573730469, -0.003459453582763672, -0.002941131591796875, -0.002422809600830078, -0.0019044876098632812, -0.0013861656188964844, -0.0008678436279296875, -0.0003495216369628906, 0.00016880035400390625, 0.0006871223449707031, 0.0012054443359375, 0.0017237663269042969, 0.0022420883178710938, 0.0027604103088378906, 0.0032787322998046875, 0.0037970542907714844, 0.004315376281738281, 0.004833698272705078, 0.005352020263671875, 0.005870342254638672, 0.006388664245605469, 0.006906986236572266, 0.0074253082275390625, 0.00794363021850586, 0.008461952209472656, 0.008980274200439453, 0.00949859619140625, 0.010016918182373047, 0.010535240173339844, 0.01105356216430664, 0.011571884155273438, 0.012090206146240234, 0.012608528137207031, 0.013126850128173828, 0.013645172119140625, 0.014163494110107422, 0.014681816101074219, 0.015200138092041016, 0.015718460083007812, 0.01623678207397461, 0.016755104064941406, 0.017273426055908203, 0.017791748046875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 11.0, 10.0, 14.0, 18.0, 19.0, 23.0, 33.0, 35.0, 28.0, 38.0, 41.0, 50.0, 56.0, 34.0, 45.0, 45.0, 50.0, 48.0, 46.0, 40.0, 49.0, 40.0, 29.0, 42.0, 31.0, 15.0, 23.0, 10.0, 14.0, 13.0, 16.0, 7.0, 9.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.01216888427734375, -0.011868894100189209, -0.011568903923034668, -0.011268913745880127, -0.010968923568725586, -0.010668933391571045, -0.010368943214416504, -0.010068953037261963, -0.009768962860107422, -0.00946897268295288, -0.00916898250579834, -0.008868992328643799, -0.008569002151489258, -0.008269011974334717, -0.007969021797180176, -0.007669031620025635, -0.007369041442871094, -0.007069051265716553, -0.006769061088562012, -0.006469070911407471, -0.00616908073425293, -0.005869090557098389, -0.005569100379943848, -0.005269110202789307, -0.004969120025634766, -0.004669129848480225, -0.004369139671325684, -0.004069149494171143, -0.0037691593170166016, -0.0034691691398620605, -0.0031691789627075195, -0.0028691887855529785, -0.0025691986083984375, -0.0022692084312438965, -0.0019692182540893555, -0.0016692280769348145, -0.0013692378997802734, -0.0010692477226257324, -0.0007692575454711914, -0.0004692673683166504, -0.00016927719116210938, 0.00013071298599243164, 0.00043070316314697266, 0.0007306933403015137, 0.0010306835174560547, 0.0013306736946105957, 0.0016306638717651367, 0.0019306540489196777, 0.0022306442260742188, 0.0025306344032287598, 0.0028306245803833008, 0.003130614757537842, 0.003430604934692383, 0.003730595111846924, 0.004030585289001465, 0.004330575466156006, 0.004630565643310547, 0.004930555820465088, 0.005230545997619629, 0.00553053617477417, 0.005830526351928711, 0.006130516529083252, 0.006430506706237793, 0.006730496883392334, 0.007030487060546875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 4.0, 6.0, 5.0, 12.0, 15.0, 25.0, 23.0, 40.0, 62.0, 98.0, 163.0, 233.0, 371.0, 578.0, 1057.0, 1675.0, 2968.0, 5819.0, 12726.0, 34818.0, 152656.0, 644716.0, 134053.0, 31839.0, 11917.0, 5648.0, 2921.0, 1556.0, 911.0, 566.0, 388.0, 233.0, 157.0, 102.0, 55.0, 39.0, 33.0, 23.0, 18.0, 7.0, 13.0, 4.0, 2.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0219268798828125, -0.021030664443969727, -0.020134449005126953, -0.01923823356628418, -0.018342018127441406, -0.017445802688598633, -0.01654958724975586, -0.015653371810913086, -0.014757156372070312, -0.013860940933227539, -0.012964725494384766, -0.012068510055541992, -0.011172294616699219, -0.010276079177856445, -0.009379863739013672, -0.008483648300170898, -0.007587432861328125, -0.0066912174224853516, -0.005795001983642578, -0.004898786544799805, -0.004002571105957031, -0.003106355667114258, -0.0022101402282714844, -0.001313924789428711, -0.0004177093505859375, 0.00047850608825683594, 0.0013747215270996094, 0.002270936965942383, 0.0031671524047851562, 0.00406336784362793, 0.004959583282470703, 0.0058557987213134766, 0.00675201416015625, 0.0076482295989990234, 0.008544445037841797, 0.00944066047668457, 0.010336875915527344, 0.011233091354370117, 0.01212930679321289, 0.013025522232055664, 0.013921737670898438, 0.014817953109741211, 0.015714168548583984, 0.016610383987426758, 0.01750659942626953, 0.018402814865112305, 0.019299030303955078, 0.02019524574279785, 0.021091461181640625, 0.0219876766204834, 0.022883892059326172, 0.023780107498168945, 0.02467632293701172, 0.025572538375854492, 0.026468753814697266, 0.02736496925354004, 0.028261184692382812, 0.029157400131225586, 0.03005361557006836, 0.030949831008911133, 0.031846046447753906, 0.03274226188659668, 0.03363847732543945, 0.03453469276428223, 0.035430908203125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 3.0, 9.0, 10.0, 13.0, 11.0, 11.0, 15.0, 22.0, 29.0, 23.0, 32.0, 31.0, 29.0, 28.0, 37.0, 34.0, 33.0, 45.0, 43.0, 42.0, 37.0, 45.0, 51.0, 42.0, 40.0, 33.0, 40.0, 33.0, 26.0, 19.0, 22.0, 17.0, 14.0, 12.0, 18.0, 13.0, 5.0, 9.0, 3.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005344390869140625, -0.005178511142730713, -0.005012631416320801, -0.004846751689910889, -0.0046808719635009766, -0.0045149922370910645, -0.004349112510681152, -0.00418323278427124, -0.004017353057861328, -0.003851473331451416, -0.003685593605041504, -0.003519713878631592, -0.0033538341522216797, -0.0031879544258117676, -0.0030220746994018555, -0.0028561949729919434, -0.0026903152465820312, -0.002524435520172119, -0.002358555793762207, -0.002192676067352295, -0.002026796340942383, -0.0018609166145324707, -0.0016950368881225586, -0.0015291571617126465, -0.0013632774353027344, -0.0011973977088928223, -0.0010315179824829102, -0.000865638256072998, -0.0006997585296630859, -0.0005338788032531738, -0.0003679990768432617, -0.0002021193504333496, -3.62396240234375e-05, 0.0001296401023864746, 0.0002955198287963867, 0.00046139955520629883, 0.0006272792816162109, 0.000793159008026123, 0.0009590387344360352, 0.0011249184608459473, 0.0012907981872558594, 0.0014566779136657715, 0.0016225576400756836, 0.0017884373664855957, 0.001954317092895508, 0.00212019681930542, 0.002286076545715332, 0.002451956272125244, 0.0026178359985351562, 0.0027837157249450684, 0.0029495954513549805, 0.0031154751777648926, 0.0032813549041748047, 0.003447234630584717, 0.003613114356994629, 0.003778994083404541, 0.003944873809814453, 0.004110753536224365, 0.004276633262634277, 0.0044425129890441895, 0.0046083927154541016, 0.004774272441864014, 0.004940152168273926, 0.005106031894683838, 0.00527191162109375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 5.0, 11.0, 15.0, 34.0, 35.0, 50.0, 79.0, 101.0, 150.0, 187.0, 266.0, 352.0, 548.0, 845.0, 1147.0, 1608.0, 2476.0, 4293.0, 7091.0, 13079.0, 25865.0, 59848.0, 178687.0, 478350.0, 162338.0, 55637.0, 24488.0, 12293.0, 6694.0, 4065.0, 2544.0, 1681.0, 1129.0, 767.0, 519.0, 375.0, 284.0, 196.0, 136.0, 95.0, 63.0, 44.0, 27.0, 20.0, 8.0, 4.0, 10.0, 1.0, 7.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0], "bins": [-0.003154754638671875, -0.0030575692653656006, -0.002960383892059326, -0.0028631985187530518, -0.0027660131454467773, -0.002668827772140503, -0.0025716423988342285, -0.002474457025527954, -0.0023772716522216797, -0.0022800862789154053, -0.002182900905609131, -0.0020857155323028564, -0.001988530158996582, -0.0018913447856903076, -0.0017941594123840332, -0.0016969740390777588, -0.0015997886657714844, -0.00150260329246521, -0.0014054179191589355, -0.0013082325458526611, -0.0012110471725463867, -0.0011138617992401123, -0.0010166764259338379, -0.0009194910526275635, -0.0008223056793212891, -0.0007251203060150146, -0.0006279349327087402, -0.0005307495594024658, -0.0004335641860961914, -0.000336378812789917, -0.00023919343948364258, -0.00014200806617736816, -4.482269287109375e-05, 5.2362680435180664e-05, 0.00014954805374145508, 0.0002467334270477295, 0.0003439188003540039, 0.0004411041736602783, 0.0005382895469665527, 0.0006354749202728271, 0.0007326602935791016, 0.000829845666885376, 0.0009270310401916504, 0.0010242164134979248, 0.0011214017868041992, 0.0012185871601104736, 0.001315772533416748, 0.0014129579067230225, 0.0015101432800292969, 0.0016073286533355713, 0.0017045140266418457, 0.0018016993999481201, 0.0018988847732543945, 0.001996070146560669, 0.0020932555198669434, 0.0021904408931732178, 0.002287626266479492, 0.0023848116397857666, 0.002481997013092041, 0.0025791823863983154, 0.00267636775970459, 0.0027735531330108643, 0.0028707385063171387, 0.002967923879623413, 0.0030651092529296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 4.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 7.0, 12.0, 22.0, 20.0, 23.0, 23.0, 43.0, 36.0, 37.0, 61.0, 72.0, 94.0, 94.0, 73.0, 70.0, 40.0, 38.0, 40.0, 33.0, 20.0, 26.0, 20.0, 15.0, 10.0, 11.0, 4.0, 2.0, 7.0, 3.0, 6.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9669532775878906e-05, -1.911260187625885e-05, -1.8555670976638794e-05, -1.7998740077018738e-05, -1.744180917739868e-05, -1.6884878277778625e-05, -1.632794737815857e-05, -1.5771016478538513e-05, -1.5214085578918457e-05, -1.4657154679298401e-05, -1.4100223779678345e-05, -1.3543292880058289e-05, -1.2986361980438232e-05, -1.2429431080818176e-05, -1.187250018119812e-05, -1.1315569281578064e-05, -1.0758638381958008e-05, -1.0201707482337952e-05, -9.644776582717896e-06, -9.08784568309784e-06, -8.530914783477783e-06, -7.973983883857727e-06, -7.417052984237671e-06, -6.860122084617615e-06, -6.303191184997559e-06, -5.7462602853775024e-06, -5.189329385757446e-06, -4.63239848613739e-06, -4.075467586517334e-06, -3.518536686897278e-06, -2.9616057872772217e-06, -2.4046748876571655e-06, -1.8477439880371094e-06, -1.2908130884170532e-06, -7.338821887969971e-07, -1.7695128917694092e-07, 3.7997961044311523e-07, 9.369105100631714e-07, 1.4938414096832275e-06, 2.0507723093032837e-06, 2.60770320892334e-06, 3.164634108543396e-06, 3.721565008163452e-06, 4.278495907783508e-06, 4.8354268074035645e-06, 5.392357707023621e-06, 5.949288606643677e-06, 6.506219506263733e-06, 7.063150405883789e-06, 7.620081305503845e-06, 8.177012205123901e-06, 8.733943104743958e-06, 9.290874004364014e-06, 9.84780490398407e-06, 1.0404735803604126e-05, 1.0961666703224182e-05, 1.1518597602844238e-05, 1.2075528502464294e-05, 1.263245940208435e-05, 1.3189390301704407e-05, 1.3746321201324463e-05, 1.4303252100944519e-05, 1.4860183000564575e-05, 1.541711390018463e-05, 1.5974044799804688e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 5.0, 10.0, 11.0, 16.0, 21.0, 28.0, 43.0, 65.0, 80.0, 123.0, 194.0, 257.0, 461.0, 776.0, 1264.0, 2556.0, 5077.0, 10910.0, 23978.0, 58560.0, 163177.0, 437904.0, 214384.0, 73189.0, 29480.0, 12862.0, 6223.0, 3011.0, 1597.0, 853.0, 468.0, 332.0, 213.0, 127.0, 79.0, 65.0, 43.0, 24.0, 28.0, 16.0, 5.0, 11.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002719879150390625, -0.0026364922523498535, -0.002553105354309082, -0.0024697184562683105, -0.002386331558227539, -0.0023029446601867676, -0.002219557762145996, -0.0021361708641052246, -0.002052783966064453, -0.0019693970680236816, -0.0018860101699829102, -0.0018026232719421387, -0.0017192363739013672, -0.0016358494758605957, -0.0015524625778198242, -0.0014690756797790527, -0.0013856887817382812, -0.0013023018836975098, -0.0012189149856567383, -0.0011355280876159668, -0.0010521411895751953, -0.0009687542915344238, -0.0008853673934936523, -0.0008019804954528809, -0.0007185935974121094, -0.0006352066993713379, -0.0005518198013305664, -0.0004684329032897949, -0.00038504600524902344, -0.00030165910720825195, -0.00021827220916748047, -0.00013488531112670898, -5.14984130859375e-05, 3.1888484954833984e-05, 0.00011527538299560547, 0.00019866228103637695, 0.00028204917907714844, 0.0003654360771179199, 0.0004488229751586914, 0.0005322098731994629, 0.0006155967712402344, 0.0006989836692810059, 0.0007823705673217773, 0.0008657574653625488, 0.0009491443634033203, 0.0010325312614440918, 0.0011159181594848633, 0.0011993050575256348, 0.0012826919555664062, 0.0013660788536071777, 0.0014494657516479492, 0.0015328526496887207, 0.0016162395477294922, 0.0016996264457702637, 0.0017830133438110352, 0.0018664002418518066, 0.0019497871398925781, 0.0020331740379333496, 0.002116560935974121, 0.0021999478340148926, 0.002283334732055664, 0.0023667216300964355, 0.002450108528137207, 0.0025334954261779785, 0.00261688232421875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 11.0, 12.0, 29.0, 33.0, 55.0, 57.0, 87.0, 92.0, 106.0, 112.0, 112.0, 85.0, 56.0, 56.0, 42.0, 20.0, 11.0, 7.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008835792541503906, -0.0008452907204627991, -0.0008070021867752075, -0.000768713653087616, -0.0007304251194000244, -0.0006921365857124329, -0.0006538480520248413, -0.0006155595183372498, -0.0005772709846496582, -0.0005389824509620667, -0.0005006939172744751, -0.00046240538358688354, -0.000424116849899292, -0.00038582831621170044, -0.0003475397825241089, -0.00030925124883651733, -0.0002709627151489258, -0.00023267418146133423, -0.00019438564777374268, -0.00015609711408615112, -0.00011780858039855957, -7.952004671096802e-05, -4.1231513023376465e-05, -2.942979335784912e-06, 3.534555435180664e-05, 7.36340880393982e-05, 0.00011192262172698975, 0.0001502111554145813, 0.00018849968910217285, 0.0002267882227897644, 0.00026507675647735596, 0.0003033652901649475, 0.00034165382385253906, 0.0003799423575401306, 0.00041823089122772217, 0.0004565194249153137, 0.0004948079586029053, 0.0005330964922904968, 0.0005713850259780884, 0.0006096735596656799, 0.0006479620933532715, 0.000686250627040863, 0.0007245391607284546, 0.0007628276944160461, 0.0008011162281036377, 0.0008394047617912292, 0.0008776932954788208, 0.0009159818291664124, 0.0009542703628540039, 0.0009925588965415955, 0.001030847430229187, 0.0010691359639167786, 0.0011074244976043701, 0.0011457130312919617, 0.0011840015649795532, 0.0012222900986671448, 0.0012605786323547363, 0.0012988671660423279, 0.0013371556997299194, 0.001375444233417511, 0.0014137327671051025, 0.001452021300792694, 0.0014903098344802856, 0.0015285983681678772, 0.0015668869018554688]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 0.0, 5.0, 6.0, 12.0, 15.0, 26.0, 32.0, 48.0, 72.0, 125.0, 120.0, 162.0, 123.0, 74.0, 49.0, 32.0, 22.0, 21.0, 11.0, 7.0, 7.0, 6.0, 7.0, 3.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01937452331185341, -0.018839702010154724, -0.01830487884581089, -0.017770057544112206, -0.01723523437976837, -0.016700413078069687, -0.016165591776371002, -0.01563076861202717, -0.015095947310328484, -0.014561125077307224, -0.014026302844285965, -0.01349148154258728, -0.012956659309566021, -0.012421837076544762, -0.011887015774846077, -0.011352193541824818, -0.010817371308803558, -0.010282549075782299, -0.00974772684276104, -0.009212905541062355, -0.008678083308041096, -0.008143261075019836, -0.007608439307659864, -0.007073617540299892, -0.006538795307278633, -0.006003973074257374, -0.005469151306897402, -0.00493432953953743, -0.0043995073065161705, -0.003864685306325555, -0.003329863306134939, -0.0027950413059443235, -0.002260221168398857, -0.0017253991682082415, -0.0011905771680176258, -0.0006557551678270102, -0.0001209331676363945, 0.00041388883255422115, 0.0009487108327448368, 0.0014835328329354525, 0.002018354833126068, 0.0025531768333166838, 0.0030879988335072994, 0.003622820833697915, 0.004157642833888531, 0.00469246506690979, 0.005227286834269762, 0.005762108601629734, 0.006296930834650993, 0.006831753067672253, 0.007366574835032225, 0.007901396602392197, 0.008436218835413456, 0.008971041068434715, 0.0095058623701334, 0.01004068460315466, 0.010575506836175919, 0.011110329069197178, 0.011645151302218437, 0.012179972603917122, 0.012714794836938381, 0.01324961706995964, 0.013784438371658325, 0.014319260604679585, 0.014854082837700844]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 6.0, 4.0, 12.0, 10.0, 11.0, 17.0, 25.0, 33.0, 31.0, 30.0, 38.0, 37.0, 52.0, 42.0, 64.0, 44.0, 54.0, 39.0, 49.0, 47.0, 51.0, 46.0, 47.0, 35.0, 33.0, 27.0, 31.0, 15.0, 14.0, 13.0, 20.0, 11.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.012406989932060242, -0.012095599435269833, -0.011784208938479424, -0.011472818441689014, -0.011161427944898605, -0.010850036516785622, -0.010538646019995213, -0.010227255523204803, -0.009915865026414394, -0.009604474529623985, -0.009293084032833576, -0.008981693536043167, -0.008670302107930183, -0.008358911611139774, -0.008047521114349365, -0.007736130617558956, -0.007424740120768547, -0.007113349623978138, -0.006801959127187729, -0.0064905681647360325, -0.006179177667945623, -0.005867787171155214, -0.005556396208703518, -0.005245005711913109, -0.0049336152151227, -0.004622224718332291, -0.0043108342215418816, -0.003999443259090185, -0.003688052762299776, -0.003376662265509367, -0.0030652715358883142, -0.0027538808062672615, -0.0024424903094768524, -0.0021310998126864433, -0.0018197090830653906, -0.0015083184698596597, -0.0011969278566539288, -0.0008855372434481978, -0.0005741466302424669, -0.0002627559006214142, 4.8634596168994904e-05, 0.0003600252093747258, 0.0006714158225804567, 0.0009828064357861876, 0.0012941970489919186, 0.0016055876621976495, 0.0019169782754033804, 0.002228369005024433, 0.0025397595018148422, 0.0028511499986052513, 0.003162540728226304, 0.003473931457847357, 0.003785321954637766, 0.004096712451428175, 0.004408103413879871, 0.0047194939106702805, 0.0050308844074606895, 0.005342274904251099, 0.005653665401041508, 0.005965056363493204, 0.006276446860283613, 0.006587837357074022, 0.006899228319525719, 0.007210618816316128, 0.007522009313106537]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 7.0, 10.0, 19.0, 22.0, 29.0, 51.0, 62.0, 84.0, 132.0, 202.0, 303.0, 512.0, 807.0, 1264.0, 1879.0, 2920.0, 4603.0, 7371.0, 12283.0, 20791.0, 36280.0, 65821.0, 125274.0, 229290.0, 240041.0, 133464.0, 70530.0, 38141.0, 22048.0, 13013.0, 7842.0, 4850.0, 3043.0, 1965.0, 1279.0, 817.0, 513.0, 343.0, 197.0, 147.0, 82.0, 76.0, 48.0, 40.0, 22.0, 15.0, 6.0, 4.0, 2.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.015716552734375, -0.015241026878356934, -0.014765501022338867, -0.0142899751663208, -0.013814449310302734, -0.013338923454284668, -0.012863397598266602, -0.012387871742248535, -0.011912345886230469, -0.011436820030212402, -0.010961294174194336, -0.01048576831817627, -0.010010242462158203, -0.009534716606140137, -0.00905919075012207, -0.008583664894104004, -0.008108139038085938, -0.007632613182067871, -0.007157087326049805, -0.006681561470031738, -0.006206035614013672, -0.0057305097579956055, -0.005254983901977539, -0.004779458045959473, -0.004303932189941406, -0.00382840633392334, -0.0033528804779052734, -0.002877354621887207, -0.0024018287658691406, -0.0019263029098510742, -0.0014507770538330078, -0.0009752511978149414, -0.000499725341796875, -2.4199485778808594e-05, 0.0004513263702392578, 0.0009268522262573242, 0.0014023780822753906, 0.001877903938293457, 0.0023534297943115234, 0.00282895565032959, 0.0033044815063476562, 0.0037800073623657227, 0.004255533218383789, 0.0047310590744018555, 0.005206584930419922, 0.005682110786437988, 0.006157636642456055, 0.006633162498474121, 0.0071086883544921875, 0.007584214210510254, 0.00805974006652832, 0.008535265922546387, 0.009010791778564453, 0.00948631763458252, 0.009961843490600586, 0.010437369346618652, 0.010912895202636719, 0.011388421058654785, 0.011863946914672852, 0.012339472770690918, 0.012814998626708984, 0.01329052448272705, 0.013766050338745117, 0.014241576194763184, 0.01471710205078125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 11.0, 13.0, 18.0, 20.0, 27.0, 31.0, 28.0, 39.0, 40.0, 38.0, 39.0, 39.0, 47.0, 44.0, 55.0, 43.0, 48.0, 48.0, 49.0, 47.0, 38.0, 37.0, 37.0, 29.0, 22.0, 25.0, 15.0, 4.0, 18.0, 15.0, 12.0, 4.0, 4.0, 2.0, 0.0, 2.0, 4.0, 1.0], "bins": [-0.01015472412109375, -0.009905576705932617, -0.009656429290771484, -0.009407281875610352, -0.009158134460449219, -0.008908987045288086, -0.008659839630126953, -0.00841069221496582, -0.008161544799804688, -0.007912397384643555, -0.007663249969482422, -0.007414102554321289, -0.007164955139160156, -0.0069158077239990234, -0.006666660308837891, -0.006417512893676758, -0.006168365478515625, -0.005919218063354492, -0.005670070648193359, -0.0054209232330322266, -0.005171775817871094, -0.004922628402709961, -0.004673480987548828, -0.004424333572387695, -0.0041751861572265625, -0.00392603874206543, -0.003676891326904297, -0.003427743911743164, -0.0031785964965820312, -0.0029294490814208984, -0.0026803016662597656, -0.002431154251098633, -0.0021820068359375, -0.0019328594207763672, -0.0016837120056152344, -0.0014345645904541016, -0.0011854171752929688, -0.0009362697601318359, -0.0006871223449707031, -0.0004379749298095703, -0.0001888275146484375, 6.031990051269531e-05, 0.0003094673156738281, 0.0005586147308349609, 0.0008077621459960938, 0.0010569095611572266, 0.0013060569763183594, 0.0015552043914794922, 0.001804351806640625, 0.002053499221801758, 0.0023026466369628906, 0.0025517940521240234, 0.0028009414672851562, 0.003050088882446289, 0.003299236297607422, 0.0035483837127685547, 0.0037975311279296875, 0.00404667854309082, 0.004295825958251953, 0.004544973373413086, 0.004794120788574219, 0.0050432682037353516, 0.005292415618896484, 0.005541563034057617, 0.00579071044921875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 11.0, 17.0, 31.0, 26.0, 49.0, 84.0, 93.0, 149.0, 219.0, 338.0, 475.0, 657.0, 930.0, 1377.0, 1873.0, 2800.0, 4020.0, 5678.0, 8736.0, 13287.0, 19567.0, 30426.0, 47265.0, 76117.0, 123935.0, 190902.0, 188572.0, 121731.0, 74106.0, 46446.0, 29538.0, 19151.0, 12693.0, 8673.0, 5801.0, 3944.0, 2643.0, 1845.0, 1306.0, 875.0, 650.0, 491.0, 312.0, 229.0, 144.0, 119.0, 84.0, 46.0, 29.0, 26.0, 13.0, 15.0, 7.0, 5.0, 1.0, 1.0, 1.0], "bins": [-0.01110076904296875, -0.010764122009277344, -0.010427474975585938, -0.010090827941894531, -0.009754180908203125, -0.009417533874511719, -0.009080886840820312, -0.008744239807128906, -0.0084075927734375, -0.008070945739746094, -0.0077342987060546875, -0.007397651672363281, -0.007061004638671875, -0.006724357604980469, -0.0063877105712890625, -0.006051063537597656, -0.00571441650390625, -0.005377769470214844, -0.0050411224365234375, -0.004704475402832031, -0.004367828369140625, -0.004031181335449219, -0.0036945343017578125, -0.0033578872680664062, -0.003021240234375, -0.0026845932006835938, -0.0023479461669921875, -0.0020112991333007812, -0.001674652099609375, -0.0013380050659179688, -0.0010013580322265625, -0.0006647109985351562, -0.00032806396484375, 8.58306884765625e-06, 0.0003452301025390625, 0.0006818771362304688, 0.001018524169921875, 0.0013551712036132812, 0.0016918182373046875, 0.0020284652709960938, 0.0023651123046875, 0.0027017593383789062, 0.0030384063720703125, 0.0033750534057617188, 0.003711700439453125, 0.004048347473144531, 0.0043849945068359375, 0.004721641540527344, 0.00505828857421875, 0.005394935607910156, 0.0057315826416015625, 0.006068229675292969, 0.006404876708984375, 0.006741523742675781, 0.0070781707763671875, 0.007414817810058594, 0.00775146484375, 0.008088111877441406, 0.008424758911132812, 0.008761405944824219, 0.009098052978515625, 0.009434700012207031, 0.009771347045898438, 0.010107994079589844, 0.01044464111328125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 9.0, 3.0, 8.0, 5.0, 8.0, 5.0, 7.0, 9.0, 18.0, 8.0, 17.0, 16.0, 15.0, 29.0, 17.0, 20.0, 24.0, 19.0, 36.0, 31.0, 31.0, 32.0, 46.0, 35.0, 36.0, 32.0, 42.0, 33.0, 37.0, 42.0, 35.0, 36.0, 30.0, 31.0, 30.0, 16.0, 30.0, 18.0, 17.0, 16.0, 18.0, 10.0, 10.0, 5.0, 3.0, 5.0, 7.0, 4.0, 2.0, 6.0, 6.0, 2.0, 3.0], "bins": [-0.00443267822265625, -0.004308074712753296, -0.004183471202850342, -0.004058867692947388, -0.003934264183044434, -0.0038096606731414795, -0.0036850571632385254, -0.0035604536533355713, -0.003435850143432617, -0.003311246633529663, -0.003186643123626709, -0.003062039613723755, -0.0029374361038208008, -0.0028128325939178467, -0.0026882290840148926, -0.0025636255741119385, -0.0024390220642089844, -0.0023144185543060303, -0.002189815044403076, -0.002065211534500122, -0.001940608024597168, -0.0018160045146942139, -0.0016914010047912598, -0.0015667974948883057, -0.0014421939849853516, -0.0013175904750823975, -0.0011929869651794434, -0.0010683834552764893, -0.0009437799453735352, -0.0008191764354705811, -0.000694572925567627, -0.0005699694156646729, -0.00044536590576171875, -0.00032076239585876465, -0.00019615888595581055, -7.155537605285645e-05, 5.3048133850097656e-05, 0.00017765164375305176, 0.00030225515365600586, 0.00042685866355895996, 0.0005514621734619141, 0.0006760656833648682, 0.0008006691932678223, 0.0009252727031707764, 0.0010498762130737305, 0.0011744797229766846, 0.0012990832328796387, 0.0014236867427825928, 0.0015482902526855469, 0.001672893762588501, 0.001797497272491455, 0.0019221007823944092, 0.0020467042922973633, 0.0021713078022003174, 0.0022959113121032715, 0.0024205148220062256, 0.0025451183319091797, 0.002669721841812134, 0.002794325351715088, 0.002918928861618042, 0.003043532371520996, 0.00316813588142395, 0.0032927393913269043, 0.0034173429012298584, 0.0035419464111328125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 8.0, 9.0, 12.0, 18.0, 23.0, 27.0, 32.0, 63.0, 63.0, 80.0, 127.0, 173.0, 224.0, 301.0, 429.0, 642.0, 954.0, 1386.0, 2100.0, 3555.0, 6071.0, 11109.0, 22294.0, 64000.0, 854315.0, 40587.0, 17130.0, 9042.0, 5019.0, 2931.0, 1851.0, 1160.0, 828.0, 538.0, 393.0, 269.0, 207.0, 136.0, 127.0, 76.0, 62.0, 47.0, 46.0, 23.0, 24.0, 16.0, 4.0, 9.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00467681884765625, -0.004532158374786377, -0.004387497901916504, -0.004242837429046631, -0.004098176956176758, -0.003953516483306885, -0.0038088560104370117, -0.0036641955375671387, -0.0035195350646972656, -0.0033748745918273926, -0.0032302141189575195, -0.0030855536460876465, -0.0029408931732177734, -0.0027962327003479004, -0.0026515722274780273, -0.0025069117546081543, -0.0023622512817382812, -0.002217590808868408, -0.002072930335998535, -0.0019282698631286621, -0.001783609390258789, -0.001638948917388916, -0.001494288444519043, -0.00134962797164917, -0.0012049674987792969, -0.0010603070259094238, -0.0009156465530395508, -0.0007709860801696777, -0.0006263256072998047, -0.00048166513442993164, -0.0003370046615600586, -0.00019234418869018555, -4.76837158203125e-05, 9.697675704956055e-05, 0.0002416372299194336, 0.00038629770278930664, 0.0005309581756591797, 0.0006756186485290527, 0.0008202791213989258, 0.0009649395942687988, 0.0011096000671386719, 0.001254260540008545, 0.001398921012878418, 0.001543581485748291, 0.001688241958618164, 0.0018329024314880371, 0.00197756290435791, 0.002122223377227783, 0.0022668838500976562, 0.0024115443229675293, 0.0025562047958374023, 0.0027008652687072754, 0.0028455257415771484, 0.0029901862144470215, 0.0031348466873168945, 0.0032795071601867676, 0.0034241676330566406, 0.0035688281059265137, 0.0037134885787963867, 0.0038581490516662598, 0.004002809524536133, 0.004147469997406006, 0.004292130470275879, 0.004436790943145752, 0.004581451416015625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 4.0, 9.0, 11.0, 4.0, 18.0, 10.0, 24.0, 19.0, 23.0, 46.0, 30.0, 38.0, 75.0, 58.0, 67.0, 108.0, 76.0, 61.0, 69.0, 47.0, 55.0, 36.0, 18.0, 24.0, 21.0, 8.0, 10.0, 5.0, 5.0, 5.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.649162292480469e-06, -4.5085325837135315e-06, -4.367902874946594e-06, -4.227273166179657e-06, -4.08664345741272e-06, -3.9460137486457825e-06, -3.8053840398788452e-06, -3.664754331111908e-06, -3.5241246223449707e-06, -3.3834949135780334e-06, -3.242865204811096e-06, -3.102235496044159e-06, -2.9616057872772217e-06, -2.8209760785102844e-06, -2.680346369743347e-06, -2.53971666097641e-06, -2.3990869522094727e-06, -2.2584572434425354e-06, -2.117827534675598e-06, -1.977197825908661e-06, -1.8365681171417236e-06, -1.6959384083747864e-06, -1.5553086996078491e-06, -1.4146789908409119e-06, -1.2740492820739746e-06, -1.1334195733070374e-06, -9.927898645401e-07, -8.521601557731628e-07, -7.115304470062256e-07, -5.709007382392883e-07, -4.302710294723511e-07, -2.896413207054138e-07, -1.4901161193847656e-07, -8.381903171539307e-09, 1.3224780559539795e-07, 2.728775143623352e-07, 4.1350722312927246e-07, 5.541369318962097e-07, 6.94766640663147e-07, 8.353963494300842e-07, 9.760260581970215e-07, 1.1166557669639587e-06, 1.257285475730896e-06, 1.3979151844978333e-06, 1.5385448932647705e-06, 1.6791746020317078e-06, 1.819804310798645e-06, 1.9604340195655823e-06, 2.1010637283325195e-06, 2.2416934370994568e-06, 2.382323145866394e-06, 2.5229528546333313e-06, 2.6635825634002686e-06, 2.804212272167206e-06, 2.944841980934143e-06, 3.0854716897010803e-06, 3.2261013984680176e-06, 3.366731107234955e-06, 3.507360816001892e-06, 3.6479905247688293e-06, 3.7886202335357666e-06, 3.929249942302704e-06, 4.069879651069641e-06, 4.210509359836578e-06, 4.351139068603516e-06]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 4.0, 14.0, 14.0, 33.0, 30.0, 44.0, 71.0, 117.0, 147.0, 257.0, 327.0, 482.0, 714.0, 1091.0, 1652.0, 2747.0, 4793.0, 8071.0, 15194.0, 37444.0, 870509.0, 60272.0, 19936.0, 9765.0, 5563.0, 3331.0, 2023.0, 1273.0, 784.0, 579.0, 400.0, 251.0, 174.0, 127.0, 85.0, 69.0, 53.0, 30.0, 24.0, 12.0, 14.0, 5.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005084991455078125, -0.004901230335235596, -0.004717469215393066, -0.004533708095550537, -0.004349946975708008, -0.0041661858558654785, -0.003982424736022949, -0.00379866361618042, -0.0036149024963378906, -0.0034311413764953613, -0.003247380256652832, -0.0030636191368103027, -0.0028798580169677734, -0.002696096897125244, -0.002512335777282715, -0.0023285746574401855, -0.0021448135375976562, -0.001961052417755127, -0.0017772912979125977, -0.0015935301780700684, -0.001409769058227539, -0.0012260079383850098, -0.0010422468185424805, -0.0008584856986999512, -0.0006747245788574219, -0.0004909634590148926, -0.0003072023391723633, -0.00012344121932983398, 6.031990051269531e-05, 0.0002440810203552246, 0.0004278421401977539, 0.0006116032600402832, 0.0007953643798828125, 0.0009791254997253418, 0.001162886619567871, 0.0013466477394104004, 0.0015304088592529297, 0.001714169979095459, 0.0018979310989379883, 0.0020816922187805176, 0.002265453338623047, 0.002449214458465576, 0.0026329755783081055, 0.0028167366981506348, 0.003000497817993164, 0.0031842589378356934, 0.0033680200576782227, 0.003551781177520752, 0.0037355422973632812, 0.0039193034172058105, 0.00410306453704834, 0.004286825656890869, 0.0044705867767333984, 0.004654347896575928, 0.004838109016418457, 0.005021870136260986, 0.005205631256103516, 0.005389392375946045, 0.005573153495788574, 0.0057569146156311035, 0.005940675735473633, 0.006124436855316162, 0.006308197975158691, 0.006491959095001221, 0.00667572021484375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 6.0, 6.0, 15.0, 8.0, 7.0, 11.0, 19.0, 26.0, 47.0, 694.0, 42.0, 23.0, 20.0, 9.0, 6.0, 8.0, 4.0, 7.0, 9.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00188446044921875, -0.0018329918384552002, -0.0017815232276916504, -0.0017300546169281006, -0.0016785860061645508, -0.001627117395401001, -0.0015756487846374512, -0.0015241801738739014, -0.0014727115631103516, -0.0014212429523468018, -0.001369774341583252, -0.0013183057308197021, -0.0012668371200561523, -0.0012153685092926025, -0.0011638998985290527, -0.001112431287765503, -0.0010609626770019531, -0.0010094940662384033, -0.0009580254554748535, -0.0009065568447113037, -0.0008550882339477539, -0.0008036196231842041, -0.0007521510124206543, -0.0007006824016571045, -0.0006492137908935547, -0.0005977451801300049, -0.0005462765693664551, -0.0004948079586029053, -0.00044333934783935547, -0.00039187073707580566, -0.00034040212631225586, -0.00028893351554870605, -0.00023746490478515625, -0.00018599629402160645, -0.00013452768325805664, -8.305907249450684e-05, -3.159046173095703e-05, 1.9878149032592773e-05, 7.134675979614258e-05, 0.00012281537055969238, 0.0001742839813232422, 0.000225752592086792, 0.0002772212028503418, 0.0003286898136138916, 0.0003801584243774414, 0.0004316270351409912, 0.000483095645904541, 0.0005345642566680908, 0.0005860328674316406, 0.0006375014781951904, 0.0006889700889587402, 0.00074043869972229, 0.0007919073104858398, 0.0008433759212493896, 0.0008948445320129395, 0.0009463131427764893, 0.000997781753540039, 0.0010492503643035889, 0.0011007189750671387, 0.0011521875858306885, 0.0012036561965942383, 0.001255124807357788, 0.0013065934181213379, 0.0013580620288848877, 0.0014095306396484375]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 6.0, 11.0, 18.0, 21.0, 39.0, 59.0, 84.0, 125.0, 177.0, 170.0, 88.0, 57.0, 38.0, 29.0, 21.0, 17.0, 10.0, 10.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020647283643484116, -0.020116202533245087, -0.019585121423006058, -0.01905404031276703, -0.018522959202528, -0.01799187622964382, -0.017460795119404793, -0.016929714009165764, -0.016398632898926735, -0.015867551788687706, -0.015336470678448677, -0.014805388636887074, -0.014274307526648045, -0.013743226416409016, -0.013212144374847412, -0.012681063264608383, -0.012149982154369354, -0.011618901044130325, -0.011087819933891296, -0.010556737892329693, -0.010025656782090664, -0.009494575671851635, -0.008963493630290031, -0.008432412520051003, -0.007901331409811974, -0.007370250299572945, -0.006839168723672628, -0.006308087147772312, -0.005777006037533283, -0.005245924927294254, -0.004714843351393938, -0.004183761775493622, -0.003652682527899742, -0.0031216011848300695, -0.002590519841760397, -0.0020594384986907244, -0.0015283571556210518, -0.0009972758125513792, -0.0004661944694817066, 6.488687358796597e-05, 0.0005959682166576385, 0.0011270495597273111, 0.0016581309027969837, 0.0021892122458666563, 0.002720293588936329, 0.0032513749320060015, 0.003782456275075674, 0.00431353785097599, 0.004844618961215019, 0.005375700071454048, 0.005906781647354364, 0.006437863223254681, 0.0069689443334937096, 0.0075000254437327385, 0.008031107485294342, 0.008562188595533371, 0.0090932697057724, 0.009624350816011429, 0.010155431926250458, 0.010686513967812061, 0.01121759507805109, 0.01174867618829012, 0.012279758229851723, 0.012810839340090752, 0.01334192045032978]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 4.0, 2.0, 4.0, 5.0, 7.0, 16.0, 12.0, 8.0, 23.0, 17.0, 20.0, 28.0, 34.0, 30.0, 35.0, 37.0, 25.0, 34.0, 34.0, 56.0, 49.0, 51.0, 53.0, 45.0, 38.0, 39.0, 44.0, 35.0, 31.0, 23.0, 25.0, 31.0, 27.0, 11.0, 16.0, 16.0, 11.0, 5.0, 11.0, 2.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.008906406350433826, -0.008667942136526108, -0.008429478853940964, -0.008191014640033245, -0.007952550426125526, -0.007714086677879095, -0.007475622929632664, -0.007237158715724945, -0.006998694967478514, -0.006760231219232082, -0.006521767005324364, -0.006283303257077932, -0.006044839043170214, -0.005806375294923782, -0.005567911081016064, -0.005329447332769632, -0.005090983584523201, -0.00485251983627677, -0.004614055622369051, -0.00437559187412262, -0.004137127660214901, -0.0038986639119684696, -0.0036601999308913946, -0.0034217359498143196, -0.003183271735906601, -0.002944807754829526, -0.002706343773752451, -0.0024678800255060196, -0.0022294160444289446, -0.0019909520633518696, -0.0017524880822747946, -0.0015140242176130414, -0.0012755603529512882, -0.0010370963718742132, -0.00079863250721246, -0.000560168526135385, -0.00032170460326597095, -8.324068039655685e-05, 0.00015522330068051815, 0.00039368716534227133, 0.0006321511464193463, 0.0008706150692887604, 0.0011090789921581745, 0.0013475429732352495, 0.0015860069543123245, 0.0018244708189740777, 0.0020629349164664745, 0.002301398664712906, 0.002539862645789981, 0.002778326626867056, 0.003016790607944131, 0.003255254589021206, 0.0034937183372676373, 0.0037321823183447123, 0.003970646299421787, 0.004209110047668219, 0.004447574261575937, 0.004686038009822369, 0.004924502223730087, 0.005162965971976519, 0.005401430185884237, 0.005639893934130669, 0.005878358148038387, 0.006116821896284819, 0.00635528564453125]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 11.0, 10.0, 21.0, 27.0, 54.0, 57.0, 93.0, 126.0, 183.0, 260.0, 386.0, 557.0, 805.0, 1241.0, 1950.0, 2948.0, 4633.0, 7785.0, 12990.0, 22795.0, 40796.0, 79761.0, 170991.0, 453501.0, 1599494.0, 1177211.0, 333454.0, 135987.0, 64709.0, 34206.0, 18838.0, 11090.0, 6743.0, 4071.0, 2380.0, 1497.0, 926.0, 610.0, 371.0, 218.0, 150.0, 88.0, 75.0, 49.0, 26.0, 31.0, 15.0, 17.0, 8.0, 11.0, 9.0, 7.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0091552734375, -0.008826613426208496, -0.008497953414916992, -0.008169293403625488, -0.007840633392333984, -0.0075119733810424805, -0.0071833133697509766, -0.006854653358459473, -0.006525993347167969, -0.006197333335876465, -0.005868673324584961, -0.005540013313293457, -0.005211353302001953, -0.004882693290710449, -0.004554033279418945, -0.004225373268127441, -0.0038967132568359375, -0.0035680532455444336, -0.0032393932342529297, -0.0029107332229614258, -0.002582073211669922, -0.002253413200378418, -0.001924753189086914, -0.0015960931777954102, -0.0012674331665039062, -0.0009387731552124023, -0.0006101131439208984, -0.00028145313262939453, 4.7206878662109375e-05, 0.0003758668899536133, 0.0007045269012451172, 0.001033186912536621, 0.001361846923828125, 0.001690506935119629, 0.002019166946411133, 0.0023478269577026367, 0.0026764869689941406, 0.0030051469802856445, 0.0033338069915771484, 0.0036624670028686523, 0.003991127014160156, 0.00431978702545166, 0.004648447036743164, 0.004977107048034668, 0.005305767059326172, 0.005634427070617676, 0.00596308708190918, 0.006291747093200684, 0.0066204071044921875, 0.006949067115783691, 0.007277727127075195, 0.007606387138366699, 0.007935047149658203, 0.008263707160949707, 0.008592367172241211, 0.008921027183532715, 0.009249687194824219, 0.009578347206115723, 0.009907007217407227, 0.01023566722869873, 0.010564327239990234, 0.010892987251281738, 0.011221647262573242, 0.011550307273864746, 0.01187896728515625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 2.0, 10.0, 7.0, 6.0, 18.0, 16.0, 15.0, 22.0, 15.0, 24.0, 24.0, 34.0, 39.0, 33.0, 28.0, 37.0, 47.0, 42.0, 43.0, 40.0, 46.0, 41.0, 48.0, 45.0, 41.0, 41.0, 29.0, 24.0, 23.0, 18.0, 28.0, 21.0, 22.0, 15.0, 13.0, 12.0, 8.0, 4.0, 3.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.00531768798828125, -0.0051721930503845215, -0.005026698112487793, -0.0048812031745910645, -0.004735708236694336, -0.004590213298797607, -0.004444718360900879, -0.00429922342300415, -0.004153728485107422, -0.004008233547210693, -0.003862738609313965, -0.0037172436714172363, -0.003571748733520508, -0.0034262537956237793, -0.0032807588577270508, -0.0031352639198303223, -0.0029897689819335938, -0.0028442740440368652, -0.0026987791061401367, -0.002553284168243408, -0.0024077892303466797, -0.002262294292449951, -0.0021167993545532227, -0.001971304416656494, -0.0018258094787597656, -0.0016803145408630371, -0.0015348196029663086, -0.00138932466506958, -0.0012438297271728516, -0.001098334789276123, -0.0009528398513793945, -0.000807344913482666, -0.0006618499755859375, -0.000516355037689209, -0.00037086009979248047, -0.00022536516189575195, -7.987022399902344e-05, 6.562471389770508e-05, 0.0002111196517944336, 0.0003566145896911621, 0.0005021095275878906, 0.0006476044654846191, 0.0007930994033813477, 0.0009385943412780762, 0.0010840892791748047, 0.0012295842170715332, 0.0013750791549682617, 0.0015205740928649902, 0.0016660690307617188, 0.0018115639686584473, 0.0019570589065551758, 0.0021025538444519043, 0.002248048782348633, 0.0023935437202453613, 0.00253903865814209, 0.0026845335960388184, 0.002830028533935547, 0.0029755234718322754, 0.003121018409729004, 0.0032665133476257324, 0.003412008285522461, 0.0035575032234191895, 0.003702998161315918, 0.0038484930992126465, 0.003993988037109375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 10.0, 17.0, 35.0, 51.0, 70.0, 112.0, 168.0, 249.0, 372.0, 602.0, 879.0, 1308.0, 2101.0, 3323.0, 5155.0, 8293.0, 12988.0, 22214.0, 38252.0, 67969.0, 127328.0, 256738.0, 583680.0, 1360172.0, 928998.0, 377693.0, 178477.0, 92375.0, 50417.0, 28849.0, 17101.0, 10327.0, 6453.0, 4088.0, 2591.0, 1680.0, 1096.0, 713.0, 476.0, 292.0, 197.0, 135.0, 86.0, 45.0, 39.0, 21.0, 13.0, 14.0, 10.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.00832366943359375, -0.008084118366241455, -0.00784456729888916, -0.007605016231536865, -0.00736546516418457, -0.007125914096832275, -0.0068863630294799805, -0.0066468119621276855, -0.006407260894775391, -0.006167709827423096, -0.005928158760070801, -0.005688607692718506, -0.005449056625366211, -0.005209505558013916, -0.004969954490661621, -0.004730403423309326, -0.004490852355957031, -0.004251301288604736, -0.004011750221252441, -0.0037721991539001465, -0.0035326480865478516, -0.0032930970191955566, -0.0030535459518432617, -0.002813994884490967, -0.002574443817138672, -0.002334892749786377, -0.002095341682434082, -0.0018557906150817871, -0.0016162395477294922, -0.0013766884803771973, -0.0011371374130249023, -0.0008975863456726074, -0.0006580352783203125, -0.0004184842109680176, -0.00017893314361572266, 6.0617923736572266e-05, 0.0003001689910888672, 0.0005397200584411621, 0.000779271125793457, 0.001018822193145752, 0.0012583732604980469, 0.0014979243278503418, 0.0017374753952026367, 0.0019770264625549316, 0.0022165775299072266, 0.0024561285972595215, 0.0026956796646118164, 0.0029352307319641113, 0.0031747817993164062, 0.003414332866668701, 0.003653883934020996, 0.003893435001373291, 0.004132986068725586, 0.004372537136077881, 0.004612088203430176, 0.004851639270782471, 0.005091190338134766, 0.0053307414054870605, 0.0055702924728393555, 0.00580984354019165, 0.006049394607543945, 0.00628894567489624, 0.006528496742248535, 0.00676804780960083, 0.007007598876953125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 5.0, 13.0, 15.0, 16.0, 21.0, 29.0, 22.0, 27.0, 39.0, 61.0, 62.0, 68.0, 89.0, 97.0, 125.0, 160.0, 160.0, 186.0, 202.0, 230.0, 255.0, 267.0, 237.0, 239.0, 195.0, 172.0, 164.0, 159.0, 135.0, 102.0, 102.0, 81.0, 59.0, 60.0, 54.0, 30.0, 29.0, 26.0, 12.0, 13.0, 8.0, 8.0, 9.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0020427703857421875, -0.001973867416381836, -0.0019049644470214844, -0.0018360614776611328, -0.0017671585083007812, -0.0016982555389404297, -0.0016293525695800781, -0.0015604496002197266, -0.001491546630859375, -0.0014226436614990234, -0.0013537406921386719, -0.0012848377227783203, -0.0012159347534179688, -0.0011470317840576172, -0.0010781288146972656, -0.001009225845336914, -0.0009403228759765625, -0.0008714199066162109, -0.0008025169372558594, -0.0007336139678955078, -0.0006647109985351562, -0.0005958080291748047, -0.0005269050598144531, -0.00045800209045410156, -0.00038909912109375, -0.00032019615173339844, -0.0002512931823730469, -0.0001823902130126953, -0.00011348724365234375, -4.458427429199219e-05, 2.4318695068359375e-05, 9.322166442871094e-05, 0.0001621246337890625, 0.00023102760314941406, 0.0002999305725097656, 0.0003688335418701172, 0.00043773651123046875, 0.0005066394805908203, 0.0005755424499511719, 0.0006444454193115234, 0.000713348388671875, 0.0007822513580322266, 0.0008511543273925781, 0.0009200572967529297, 0.0009889602661132812, 0.0010578632354736328, 0.0011267662048339844, 0.001195669174194336, 0.0012645721435546875, 0.001333475112915039, 0.0014023780822753906, 0.0014712810516357422, 0.0015401840209960938, 0.0016090869903564453, 0.0016779899597167969, 0.0017468929290771484, 0.0018157958984375, 0.0018846988677978516, 0.001953601837158203, 0.0020225048065185547, 0.0020914077758789062, 0.002160310745239258, 0.0022292137145996094, 0.002298116683959961, 0.0023670196533203125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 14.0, 7.0, 20.0, 17.0, 26.0, 48.0, 78.0, 97.0, 96.0, 164.0, 128.0, 86.0, 58.0, 41.0, 30.0, 23.0, 18.0, 13.0, 14.0, 4.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.012131369672715664, -0.011809755116701126, -0.011488141492009163, -0.011166526935994625, -0.010844912379980087, -0.010523298755288124, -0.010201684199273586, -0.009880069643259048, -0.009558456018567085, -0.009236841462552547, -0.008915227837860584, -0.008593613281846046, -0.008271999657154083, -0.007950385101139545, -0.007628770545125008, -0.007307156454771757, -0.006985542364418507, -0.006663928274065256, -0.006342314183712006, -0.006020699627697468, -0.005699085537344217, -0.005377471446990967, -0.005055856890976429, -0.0047342428006231785, -0.004412628710269928, -0.0040910146199166775, -0.0037694002967327833, -0.003447785973548889, -0.0031261718831956387, -0.002804557792842388, -0.002482943469658494, -0.0021613291464746, -0.001839715987443924, -0.0015181017806753516, -0.0011964875739067793, -0.000874873367138207, -0.0005532591603696346, -0.0002316449536010623, 8.996925316751003e-05, 0.0004115835763514042, 0.0007331976667046547, 0.001054811873473227, 0.0013764260802417994, 0.0016980402870103717, 0.002019654493778944, 0.0023412685841321945, 0.0026628829073160887, 0.002984497230499983, 0.0033061113208532333, 0.003627725411206484, 0.003949339501559734, 0.004270954057574272, 0.004592568147927523, 0.004914182238280773, 0.005235796794295311, 0.0055574108846485615, 0.005879024975001812, 0.0062006390653550625, 0.006522253155708313, 0.006843867711722851, 0.007165481802076101, 0.007487095892429352, 0.00780871044844389, 0.008130325004458427, 0.00845193862915039]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 6.0, 7.0, 6.0, 6.0, 14.0, 12.0, 20.0, 26.0, 18.0, 19.0, 29.0, 32.0, 37.0, 31.0, 38.0, 39.0, 46.0, 36.0, 48.0, 32.0, 39.0, 46.0, 37.0, 43.0, 43.0, 35.0, 25.0, 30.0, 31.0, 31.0, 20.0, 14.0, 14.0, 22.0, 17.0, 9.0, 10.0, 8.0, 11.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005460231099277735, -0.00530237564817071, -0.005144519731402397, -0.004986664280295372, -0.004828808829188347, -0.004670953378081322, -0.004513097926974297, -0.004355242010205984, -0.004197386559098959, -0.004039531107991934, -0.003881675424054265, -0.0037238197401165962, -0.003565964289009571, -0.003408108837902546, -0.003250253153964877, -0.0030923974700272083, -0.002934542018920183, -0.002776686567813158, -0.0026188308838754892, -0.0024609751999378204, -0.0023031197488307953, -0.00214526429772377, -0.0019874086137861013, -0.0018295530462637544, -0.0016716974787414074, -0.0015138419112190604, -0.0013559863436967134, -0.0011981307761743665, -0.0010402752086520195, -0.0008824196411296725, -0.0007245640736073256, -0.0005667085060849786, -0.0004088529385626316, -0.00025099737104028463, -9.314180351793766e-05, 6.471376400440931e-05, 0.0002225693315267563, 0.00038042489904910326, 0.0005382804665714502, 0.0006961360340937972, 0.0008539916016161442, 0.0010118471691384912, 0.0011697027366608381, 0.001327558304183185, 0.001485413871705532, 0.001643269439227879, 0.001801125006750226, 0.001958980690687895, 0.00211683614179492, 0.002274691592901945, 0.002432547276839614, 0.0025904029607772827, 0.002748258411884308, 0.002906113862991333, 0.003063969546929002, 0.0032218252308666706, 0.0033796806819736958, 0.003537536133080721, 0.0036953918170183897, 0.0038532475009560585, 0.004011102952063084, 0.004168958403170109, 0.004326813854277134, 0.004484669771045446, 0.0046425252221524715]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 6.0, 8.0, 7.0, 6.0, 16.0, 26.0, 43.0, 57.0, 82.0, 111.0, 213.0, 309.0, 519.0, 885.0, 1410.0, 2473.0, 4398.0, 7627.0, 14043.0, 26508.0, 51836.0, 106621.0, 231792.0, 301452.0, 150595.0, 70455.0, 35430.0, 18304.0, 10103.0, 5441.0, 2970.0, 1860.0, 1116.0, 659.0, 427.0, 262.0, 156.0, 106.0, 74.0, 50.0, 34.0, 27.0, 17.0, 12.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010040283203125, -0.009728670120239258, -0.009417057037353516, -0.009105443954467773, -0.008793830871582031, -0.008482217788696289, -0.008170604705810547, -0.007858991622924805, -0.0075473785400390625, -0.00723576545715332, -0.006924152374267578, -0.006612539291381836, -0.006300926208496094, -0.0059893131256103516, -0.005677700042724609, -0.005366086959838867, -0.005054473876953125, -0.004742860794067383, -0.004431247711181641, -0.0041196346282958984, -0.0038080215454101562, -0.003496408462524414, -0.003184795379638672, -0.0028731822967529297, -0.0025615692138671875, -0.0022499561309814453, -0.0019383430480957031, -0.001626729965209961, -0.0013151168823242188, -0.0010035037994384766, -0.0006918907165527344, -0.0003802776336669922, -6.866455078125e-05, 0.0002429485321044922, 0.0005545616149902344, 0.0008661746978759766, 0.0011777877807617188, 0.001489400863647461, 0.0018010139465332031, 0.0021126270294189453, 0.0024242401123046875, 0.0027358531951904297, 0.003047466278076172, 0.003359079360961914, 0.0036706924438476562, 0.0039823055267333984, 0.004293918609619141, 0.004605531692504883, 0.004917144775390625, 0.005228757858276367, 0.005540370941162109, 0.0058519840240478516, 0.006163597106933594, 0.006475210189819336, 0.006786823272705078, 0.00709843635559082, 0.0074100494384765625, 0.007721662521362305, 0.008033275604248047, 0.008344888687133789, 0.008656501770019531, 0.008968114852905273, 0.009279727935791016, 0.009591341018676758, 0.0099029541015625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 4.0, 2.0, 6.0, 14.0, 8.0, 14.0, 20.0, 13.0, 20.0, 26.0, 24.0, 33.0, 40.0, 36.0, 36.0, 44.0, 35.0, 44.0, 37.0, 47.0, 39.0, 46.0, 37.0, 42.0, 52.0, 27.0, 35.0, 44.0, 24.0, 20.0, 18.0, 19.0, 14.0, 16.0, 13.0, 10.0, 12.0, 4.0, 10.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004657745361328125, -0.004510223865509033, -0.004362702369689941, -0.00421518087387085, -0.004067659378051758, -0.003920137882232666, -0.0037726163864135742, -0.0036250948905944824, -0.0034775733947753906, -0.003330051898956299, -0.003182530403137207, -0.0030350089073181152, -0.0028874874114990234, -0.0027399659156799316, -0.00259244441986084, -0.002444922924041748, -0.0022974014282226562, -0.0021498799324035645, -0.0020023584365844727, -0.0018548369407653809, -0.001707315444946289, -0.0015597939491271973, -0.0014122724533081055, -0.0012647509574890137, -0.0011172294616699219, -0.0009697079658508301, -0.0008221864700317383, -0.0006746649742126465, -0.0005271434783935547, -0.0003796219825744629, -0.0002321004867553711, -8.45789909362793e-05, 6.29425048828125e-05, 0.0002104640007019043, 0.0003579854965209961, 0.0005055069923400879, 0.0006530284881591797, 0.0008005499839782715, 0.0009480714797973633, 0.001095592975616455, 0.0012431144714355469, 0.0013906359672546387, 0.0015381574630737305, 0.0016856789588928223, 0.001833200454711914, 0.001980721950531006, 0.0021282434463500977, 0.0022757649421691895, 0.0024232864379882812, 0.002570807933807373, 0.002718329429626465, 0.0028658509254455566, 0.0030133724212646484, 0.0031608939170837402, 0.003308415412902832, 0.003455936908721924, 0.0036034584045410156, 0.0037509799003601074, 0.0038985013961791992, 0.004046022891998291, 0.004193544387817383, 0.004341065883636475, 0.004488587379455566, 0.004636108875274658, 0.00478363037109375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 4.0, 11.0, 8.0, 13.0, 26.0, 21.0, 47.0, 62.0, 106.0, 158.0, 247.0, 400.0, 652.0, 1041.0, 1897.0, 3356.0, 6478.0, 14139.0, 36962.0, 141595.0, 597014.0, 171016.0, 41857.0, 15643.0, 7088.0, 3707.0, 2030.0, 1187.0, 654.0, 395.0, 243.0, 171.0, 114.0, 73.0, 49.0, 26.0, 31.0, 9.0, 8.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013763427734375, -0.013245105743408203, -0.012726783752441406, -0.01220846176147461, -0.011690139770507812, -0.011171817779541016, -0.010653495788574219, -0.010135173797607422, -0.009616851806640625, -0.009098529815673828, -0.008580207824707031, -0.008061885833740234, -0.0075435638427734375, -0.007025241851806641, -0.006506919860839844, -0.005988597869873047, -0.00547027587890625, -0.004951953887939453, -0.004433631896972656, -0.003915309906005859, -0.0033969879150390625, -0.0028786659240722656, -0.0023603439331054688, -0.0018420219421386719, -0.001323699951171875, -0.0008053779602050781, -0.00028705596923828125, 0.00023126602172851562, 0.0007495880126953125, 0.0012679100036621094, 0.0017862319946289062, 0.002304553985595703, 0.0028228759765625, 0.003341197967529297, 0.0038595199584960938, 0.004377841949462891, 0.0048961639404296875, 0.005414485931396484, 0.005932807922363281, 0.006451129913330078, 0.006969451904296875, 0.007487773895263672, 0.008006095886230469, 0.008524417877197266, 0.009042739868164062, 0.00956106185913086, 0.010079383850097656, 0.010597705841064453, 0.01111602783203125, 0.011634349822998047, 0.012152671813964844, 0.01267099380493164, 0.013189315795898438, 0.013707637786865234, 0.014225959777832031, 0.014744281768798828, 0.015262603759765625, 0.015780925750732422, 0.01629924774169922, 0.016817569732666016, 0.017335891723632812, 0.01785421371459961, 0.018372535705566406, 0.018890857696533203, 0.0194091796875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 6.0, 5.0, 12.0, 16.0, 14.0, 11.0, 13.0, 19.0, 21.0, 27.0, 19.0, 28.0, 37.0, 42.0, 36.0, 39.0, 48.0, 41.0, 51.0, 39.0, 41.0, 39.0, 40.0, 44.0, 38.0, 33.0, 24.0, 28.0, 32.0, 30.0, 16.0, 15.0, 23.0, 13.0, 11.0, 8.0, 13.0, 5.0, 4.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.00342559814453125, -0.003329366445541382, -0.0032331347465515137, -0.0031369030475616455, -0.0030406713485717773, -0.002944439649581909, -0.002848207950592041, -0.002751976251602173, -0.0026557445526123047, -0.0025595128536224365, -0.0024632811546325684, -0.0023670494556427, -0.002270817756652832, -0.002174586057662964, -0.0020783543586730957, -0.0019821226596832275, -0.0018858909606933594, -0.0017896592617034912, -0.001693427562713623, -0.0015971958637237549, -0.0015009641647338867, -0.0014047324657440186, -0.0013085007667541504, -0.0012122690677642822, -0.001116037368774414, -0.001019805669784546, -0.0009235739707946777, -0.0008273422718048096, -0.0007311105728149414, -0.0006348788738250732, -0.0005386471748352051, -0.0004424154758453369, -0.00034618377685546875, -0.0002499520778656006, -0.00015372037887573242, -5.748867988586426e-05, 3.8743019104003906e-05, 0.00013497471809387207, 0.00023120641708374023, 0.0003274381160736084, 0.00042366981506347656, 0.0005199015140533447, 0.0006161332130432129, 0.0007123649120330811, 0.0008085966110229492, 0.0009048283100128174, 0.0010010600090026855, 0.0010972917079925537, 0.0011935234069824219, 0.00128975510597229, 0.0013859868049621582, 0.0014822185039520264, 0.0015784502029418945, 0.0016746819019317627, 0.0017709136009216309, 0.001867145299911499, 0.001963376998901367, 0.0020596086978912354, 0.0021558403968811035, 0.0022520720958709717, 0.00234830379486084, 0.002444535493850708, 0.002540767192840576, 0.0026369988918304443, 0.0027332305908203125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 14.0, 8.0, 21.0, 26.0, 23.0, 33.0, 42.0, 77.0, 86.0, 115.0, 165.0, 200.0, 289.0, 363.0, 592.0, 781.0, 1231.0, 1969.0, 3204.0, 5786.0, 11758.0, 29464.0, 108029.0, 616099.0, 192684.0, 42088.0, 15387.0, 7138.0, 3823.0, 2267.0, 1480.0, 944.0, 648.0, 478.0, 348.0, 244.0, 180.0, 136.0, 99.0, 53.0, 39.0, 30.0, 34.0, 22.0, 21.0, 11.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00337982177734375, -0.0032730698585510254, -0.0031663179397583008, -0.003059566020965576, -0.0029528141021728516, -0.002846062183380127, -0.0027393102645874023, -0.0026325583457946777, -0.002525806427001953, -0.0024190545082092285, -0.002312302589416504, -0.0022055506706237793, -0.0020987987518310547, -0.00199204683303833, -0.0018852949142456055, -0.0017785429954528809, -0.0016717910766601562, -0.0015650391578674316, -0.001458287239074707, -0.0013515353202819824, -0.0012447834014892578, -0.0011380314826965332, -0.0010312795639038086, -0.000924527645111084, -0.0008177757263183594, -0.0007110238075256348, -0.0006042718887329102, -0.0004975199699401855, -0.00039076805114746094, -0.00028401613235473633, -0.00017726421356201172, -7.051229476928711e-05, 3.62396240234375e-05, 0.0001429915428161621, 0.0002497434616088867, 0.00035649538040161133, 0.00046324729919433594, 0.0005699992179870605, 0.0006767511367797852, 0.0007835030555725098, 0.0008902549743652344, 0.000997006893157959, 0.0011037588119506836, 0.0012105107307434082, 0.0013172626495361328, 0.0014240145683288574, 0.001530766487121582, 0.0016375184059143066, 0.0017442703247070312, 0.0018510222434997559, 0.0019577741622924805, 0.002064526081085205, 0.0021712779998779297, 0.0022780299186706543, 0.002384781837463379, 0.0024915337562561035, 0.002598285675048828, 0.0027050375938415527, 0.0028117895126342773, 0.002918541431427002, 0.0030252933502197266, 0.003132045269012451, 0.0032387971878051758, 0.0033455491065979004, 0.003452301025390625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 5.0, 7.0, 6.0, 21.0, 18.0, 16.0, 20.0, 23.0, 26.0, 25.0, 41.0, 57.0, 43.0, 42.0, 74.0, 92.0, 75.0, 68.0, 50.0, 36.0, 30.0, 37.0, 29.0, 26.0, 16.0, 20.0, 18.0, 14.0, 6.0, 10.0, 7.0, 7.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.9252300262451172e-05, -1.8700025975704193e-05, -1.8147751688957214e-05, -1.7595477402210236e-05, -1.7043203115463257e-05, -1.6490928828716278e-05, -1.59386545419693e-05, -1.538638025522232e-05, -1.4834105968475342e-05, -1.4281831681728363e-05, -1.3729557394981384e-05, -1.3177283108234406e-05, -1.2625008821487427e-05, -1.2072734534740448e-05, -1.152046024799347e-05, -1.096818596124649e-05, -1.0415911674499512e-05, -9.863637387752533e-06, -9.311363101005554e-06, -8.759088814258575e-06, -8.206814527511597e-06, -7.654540240764618e-06, -7.102265954017639e-06, -6.54999166727066e-06, -5.997717380523682e-06, -5.445443093776703e-06, -4.893168807029724e-06, -4.340894520282745e-06, -3.7886202335357666e-06, -3.236345946788788e-06, -2.684071660041809e-06, -2.1317973732948303e-06, -1.5795230865478516e-06, -1.0272487998008728e-06, -4.7497451305389404e-07, 7.729977369308472e-08, 6.295740604400635e-07, 1.1818483471870422e-06, 1.734122633934021e-06, 2.2863969206809998e-06, 2.8386712074279785e-06, 3.3909454941749573e-06, 3.943219780921936e-06, 4.495494067668915e-06, 5.0477683544158936e-06, 5.600042641162872e-06, 6.152316927909851e-06, 6.70459121465683e-06, 7.256865501403809e-06, 7.809139788150787e-06, 8.361414074897766e-06, 8.913688361644745e-06, 9.465962648391724e-06, 1.0018236935138702e-05, 1.0570511221885681e-05, 1.112278550863266e-05, 1.1675059795379639e-05, 1.2227334082126617e-05, 1.2779608368873596e-05, 1.3331882655620575e-05, 1.3884156942367554e-05, 1.4436431229114532e-05, 1.4988705515861511e-05, 1.554097980260849e-05, 1.609325408935547e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 3.0, 1.0, 4.0, 16.0, 22.0, 25.0, 34.0, 44.0, 64.0, 83.0, 139.0, 225.0, 278.0, 362.0, 592.0, 906.0, 1586.0, 2575.0, 4632.0, 8603.0, 17277.0, 37264.0, 94181.0, 308150.0, 373276.0, 113608.0, 43280.0, 19372.0, 9448.0, 4998.0, 2771.0, 1665.0, 1046.0, 650.0, 404.0, 284.0, 186.0, 152.0, 86.0, 80.0, 42.0, 25.0, 39.0, 21.0, 20.0, 11.0, 6.0, 11.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0016336441040039062, -0.0015810877084732056, -0.0015285313129425049, -0.0014759749174118042, -0.0014234185218811035, -0.0013708621263504028, -0.0013183057308197021, -0.0012657493352890015, -0.0012131929397583008, -0.0011606365442276, -0.0011080801486968994, -0.0010555237531661987, -0.001002967357635498, -0.0009504109621047974, -0.0008978545665740967, -0.000845298171043396, -0.0007927417755126953, -0.0007401853799819946, -0.0006876289844512939, -0.0006350725889205933, -0.0005825161933898926, -0.0005299597978591919, -0.0004774034023284912, -0.00042484700679779053, -0.00037229061126708984, -0.00031973421573638916, -0.0002671778202056885, -0.0002146214246749878, -0.0001620650291442871, -0.00010950863361358643, -5.695223808288574e-05, -4.395842552185059e-06, 4.8160552978515625e-05, 0.00010071694850921631, 0.000153273344039917, 0.00020582973957061768, 0.00025838613510131836, 0.00031094253063201904, 0.0003634989261627197, 0.0004160553216934204, 0.0004686117172241211, 0.0005211681127548218, 0.0005737245082855225, 0.0006262809038162231, 0.0006788372993469238, 0.0007313936948776245, 0.0007839500904083252, 0.0008365064859390259, 0.0008890628814697266, 0.0009416192770004272, 0.000994175672531128, 0.0010467320680618286, 0.0010992884635925293, 0.00115184485912323, 0.0012044012546539307, 0.0012569576501846313, 0.001309514045715332, 0.0013620704412460327, 0.0014146268367767334, 0.001467183232307434, 0.0015197396278381348, 0.0015722960233688354, 0.0016248524188995361, 0.0016774088144302368, 0.0017299652099609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 3.0, 11.0, 9.0, 9.0, 16.0, 21.0, 19.0, 27.0, 24.0, 42.0, 29.0, 41.0, 44.0, 48.0, 54.0, 44.0, 64.0, 47.0, 56.0, 52.0, 52.0, 42.0, 38.0, 33.0, 34.0, 26.0, 23.0, 16.0, 15.0, 18.0, 3.0, 6.0, 10.0, 3.0, 8.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003590583801269531, -0.0003480352461338043, -0.0003370121121406555, -0.0003259889781475067, -0.0003149658441543579, -0.0003039427101612091, -0.0002929195761680603, -0.0002818964421749115, -0.0002708733081817627, -0.0002598501741886139, -0.0002488270401954651, -0.00023780390620231628, -0.00022678077220916748, -0.00021575763821601868, -0.00020473450422286987, -0.00019371137022972107, -0.00018268823623657227, -0.00017166510224342346, -0.00016064196825027466, -0.00014961883425712585, -0.00013859570026397705, -0.00012757256627082825, -0.00011654943227767944, -0.00010552629828453064, -9.450316429138184e-05, -8.348003029823303e-05, -7.245689630508423e-05, -6.143376231193542e-05, -5.041062831878662e-05, -3.938749432563782e-05, -2.8364360332489014e-05, -1.734122633934021e-05, -6.318092346191406e-06, 4.7050416469573975e-06, 1.57281756401062e-05, 2.6751309633255005e-05, 3.777444362640381e-05, 4.879757761955261e-05, 5.9820711612701416e-05, 7.084384560585022e-05, 8.186697959899902e-05, 9.289011359214783e-05, 0.00010391324758529663, 0.00011493638157844543, 0.00012595951557159424, 0.00013698264956474304, 0.00014800578355789185, 0.00015902891755104065, 0.00017005205154418945, 0.00018107518553733826, 0.00019209831953048706, 0.00020312145352363586, 0.00021414458751678467, 0.00022516772150993347, 0.00023619085550308228, 0.0002472139894962311, 0.0002582371234893799, 0.0002692602574825287, 0.0002802833914756775, 0.0002913065254688263, 0.0003023296594619751, 0.0003133527934551239, 0.0003243759274482727, 0.0003353990614414215, 0.0003464221954345703]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 8.0, 10.0, 15.0, 15.0, 18.0, 19.0, 29.0, 44.0, 61.0, 74.0, 98.0, 128.0, 125.0, 83.0, 67.0, 55.0, 34.0, 18.0, 15.0, 20.0, 14.0, 6.0, 16.0, 8.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.007771916221827269, -0.007542204111814499, -0.007312492001801729, -0.0070827798917889595, -0.0068530673161149025, -0.006623355206102133, -0.006393643096089363, -0.006163930986076593, -0.005934218876063824, -0.005704506766051054, -0.005474794656038284, -0.005245082080364227, -0.005015369970351458, -0.004785657860338688, -0.004555945750325918, -0.0043262336403131485, -0.0040965210646390915, -0.003866808954626322, -0.0036370966117829084, -0.0034073845017701387, -0.0031776721589267254, -0.0029479600489139557, -0.002718247938901186, -0.0024885358288884163, -0.002258823486045003, -0.0020291113760322332, -0.0017993990331888199, -0.0015696869231760502, -0.0013399746967479587, -0.0011102624703198671, -0.0008805503603070974, -0.0006508381338790059, -0.0004211263731122017, -0.00019141417578794062, 3.829802153632045e-05, 0.00026801018975675106, 0.0004977224161848426, 0.0007274346426129341, 0.0009571467526257038, 0.0011868589790537953, 0.0014165712054818869, 0.0016462834319099784, 0.00187599565833807, 0.0021057077683508396, 0.0023354198783636093, 0.0025651322212070227, 0.0027948443312197924, 0.0030245566740632057, 0.0032542687840759754, 0.003483980894088745, 0.0037136932369321585, 0.0039434051141142845, 0.0041731176897883415, 0.004402829799801111, 0.004632541909813881, 0.004862254019826651, 0.00509196612983942, 0.00532167823985219, 0.00555139034986496, 0.005781102925539017, 0.006010815035551786, 0.006240527145564556, 0.006470239255577326, 0.0066999513655900955, 0.0069296639412641525]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 3.0, 9.0, 7.0, 7.0, 8.0, 15.0, 17.0, 21.0, 20.0, 16.0, 33.0, 25.0, 38.0, 32.0, 35.0, 40.0, 52.0, 35.0, 47.0, 40.0, 39.0, 51.0, 37.0, 43.0, 47.0, 30.0, 29.0, 33.0, 34.0, 27.0, 16.0, 17.0, 17.0, 23.0, 16.0, 8.0, 10.0, 7.0, 9.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004885593894869089, -0.004740923643112183, -0.004596253391355276, -0.004451583605259657, -0.00430691335350275, -0.004162243101745844, -0.004017572849988937, -0.003872902598232031, -0.003728232579305768, -0.0035835623275488615, -0.0034388923086225986, -0.003294222056865692, -0.0031495518051087856, -0.0030048817861825228, -0.0028602115344256163, -0.0027155415154993534, -0.002570871263742447, -0.0024262010119855404, -0.0022815309930592775, -0.002136860741302371, -0.001992190722376108, -0.0018475204706192017, -0.0017028502188622952, -0.0015581800835207105, -0.0014135099481791258, -0.001268839812837541, -0.0011241696774959564, -0.00097949942573905, -0.0008348292903974652, -0.0006901591550558805, -0.000545488961506635, -0.00040081876795738935, -0.000256149098277092, -0.00011147893383167684, 3.31912306137383e-05, 0.00017786139505915344, 0.0003225315595045686, 0.00046720169484615326, 0.0006118718883953989, 0.0007565420819446445, 0.0009012122172862291, 0.0010458823526278138, 0.0011905524879693985, 0.001335222739726305, 0.0014798928750678897, 0.0016245630104094744, 0.0017692332621663809, 0.0019139033975079656, 0.0020585735328495502, 0.0022032437846064568, 0.0023479138035327196, 0.002492584055289626, 0.002637254074215889, 0.0027819243259727955, 0.002926594577729702, 0.0030712648294866085, 0.0032159348484128714, 0.003360605100169778, 0.0035052751190960407, 0.0036499453708529472, 0.0037946156226098537, 0.00393928587436676, 0.0040839556604623795, 0.004228625912219286, 0.0043732961639761925]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 6.0, 15.0, 15.0, 22.0, 40.0, 74.0, 104.0, 177.0, 234.0, 388.0, 713.0, 1177.0, 2150.0, 4090.0, 7870.0, 15371.0, 31763.0, 69168.0, 164216.0, 342106.0, 230555.0, 94383.0, 41977.0, 20179.0, 10065.0, 5235.0, 2916.0, 1503.0, 855.0, 491.0, 271.0, 151.0, 101.0, 45.0, 36.0, 19.0, 20.0, 16.0, 11.0, 12.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0125885009765625, -0.012235760688781738, -0.011883020401000977, -0.011530280113220215, -0.011177539825439453, -0.010824799537658691, -0.01047205924987793, -0.010119318962097168, -0.009766578674316406, -0.009413838386535645, -0.009061098098754883, -0.008708357810974121, -0.00835561752319336, -0.008002877235412598, -0.007650136947631836, -0.007297396659851074, -0.0069446563720703125, -0.006591916084289551, -0.006239175796508789, -0.005886435508728027, -0.005533695220947266, -0.005180954933166504, -0.004828214645385742, -0.0044754743576049805, -0.004122734069824219, -0.003769993782043457, -0.0034172534942626953, -0.0030645132064819336, -0.002711772918701172, -0.00235903263092041, -0.0020062923431396484, -0.0016535520553588867, -0.001300811767578125, -0.0009480714797973633, -0.0005953311920166016, -0.00024259090423583984, 0.00011014938354492188, 0.0004628896713256836, 0.0008156299591064453, 0.001168370246887207, 0.0015211105346679688, 0.0018738508224487305, 0.002226591110229492, 0.002579331398010254, 0.0029320716857910156, 0.0032848119735717773, 0.003637552261352539, 0.003990292549133301, 0.0043430328369140625, 0.004695773124694824, 0.005048513412475586, 0.005401253700256348, 0.005753993988037109, 0.006106734275817871, 0.006459474563598633, 0.0068122148513793945, 0.007164955139160156, 0.007517695426940918, 0.00787043571472168, 0.008223176002502441, 0.008575916290283203, 0.008928656578063965, 0.009281396865844727, 0.009634137153625488, 0.00998687744140625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 4.0, 3.0, 8.0, 10.0, 9.0, 14.0, 20.0, 13.0, 27.0, 26.0, 19.0, 31.0, 34.0, 39.0, 36.0, 43.0, 56.0, 44.0, 53.0, 44.0, 46.0, 48.0, 45.0, 42.0, 42.0, 34.0, 32.0, 27.0, 35.0, 23.0, 17.0, 19.0, 19.0, 11.0, 8.0, 8.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004383087158203125, -0.004254519939422607, -0.00412595272064209, -0.003997385501861572, -0.0038688182830810547, -0.003740251064300537, -0.0036116838455200195, -0.003483116626739502, -0.0033545494079589844, -0.003225982189178467, -0.0030974149703979492, -0.0029688477516174316, -0.002840280532836914, -0.0027117133140563965, -0.002583146095275879, -0.0024545788764953613, -0.0023260116577148438, -0.002197444438934326, -0.0020688772201538086, -0.001940310001373291, -0.0018117427825927734, -0.0016831755638122559, -0.0015546083450317383, -0.0014260411262512207, -0.0012974739074707031, -0.0011689066886901855, -0.001040339469909668, -0.0009117722511291504, -0.0007832050323486328, -0.0006546378135681152, -0.0005260705947875977, -0.0003975033760070801, -0.0002689361572265625, -0.00014036893844604492, -1.1801719665527344e-05, 0.00011676549911499023, 0.0002453327178955078, 0.0003738999366760254, 0.000502467155456543, 0.0006310343742370605, 0.0007596015930175781, 0.0008881688117980957, 0.0010167360305786133, 0.0011453032493591309, 0.0012738704681396484, 0.001402437686920166, 0.0015310049057006836, 0.0016595721244812012, 0.0017881393432617188, 0.0019167065620422363, 0.002045273780822754, 0.0021738409996032715, 0.002302408218383789, 0.0024309754371643066, 0.0025595426559448242, 0.002688109874725342, 0.0028166770935058594, 0.002945244312286377, 0.0030738115310668945, 0.003202378749847412, 0.0033309459686279297, 0.0034595131874084473, 0.003588080406188965, 0.0037166476249694824, 0.00384521484375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 10.0, 10.0, 11.0, 24.0, 45.0, 56.0, 107.0, 133.0, 176.0, 290.0, 415.0, 659.0, 1159.0, 1748.0, 2644.0, 4027.0, 6168.0, 9040.0, 14048.0, 22013.0, 34977.0, 58530.0, 98610.0, 165503.0, 223401.0, 159672.0, 94838.0, 55715.0, 33806.0, 21036.0, 13530.0, 8934.0, 6009.0, 3856.0, 2565.0, 1770.0, 1082.0, 659.0, 444.0, 290.0, 200.0, 109.0, 84.0, 55.0, 38.0, 17.0, 17.0, 8.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.007076263427734375, -0.006870925426483154, -0.006665587425231934, -0.006460249423980713, -0.006254911422729492, -0.0060495734214782715, -0.005844235420227051, -0.00563889741897583, -0.005433559417724609, -0.005228221416473389, -0.005022883415222168, -0.004817545413970947, -0.0046122074127197266, -0.004406869411468506, -0.004201531410217285, -0.0039961934089660645, -0.0037908554077148438, -0.003585517406463623, -0.0033801794052124023, -0.0031748414039611816, -0.002969503402709961, -0.0027641654014587402, -0.0025588274002075195, -0.002353489398956299, -0.002148151397705078, -0.0019428133964538574, -0.0017374753952026367, -0.001532137393951416, -0.0013267993927001953, -0.0011214613914489746, -0.0009161233901977539, -0.0007107853889465332, -0.0005054473876953125, -0.0003001093864440918, -9.47713851928711e-05, 0.00011056661605834961, 0.0003159046173095703, 0.000521242618560791, 0.0007265806198120117, 0.0009319186210632324, 0.0011372566223144531, 0.0013425946235656738, 0.0015479326248168945, 0.0017532706260681152, 0.001958608627319336, 0.0021639466285705566, 0.0023692846298217773, 0.002574622631072998, 0.0027799606323242188, 0.0029852986335754395, 0.00319063663482666, 0.003395974636077881, 0.0036013126373291016, 0.0038066506385803223, 0.004011988639831543, 0.004217326641082764, 0.004422664642333984, 0.004628002643585205, 0.004833340644836426, 0.0050386786460876465, 0.005244016647338867, 0.005449354648590088, 0.005654692649841309, 0.005860030651092529, 0.00606536865234375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 6.0, 10.0, 9.0, 10.0, 26.0, 17.0, 23.0, 24.0, 16.0, 34.0, 36.0, 36.0, 31.0, 45.0, 29.0, 37.0, 46.0, 34.0, 45.0, 46.0, 35.0, 44.0, 42.0, 39.0, 33.0, 43.0, 23.0, 20.0, 24.0, 24.0, 23.0, 15.0, 16.0, 11.0, 10.0, 10.0, 4.0, 7.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0022525787353515625, -0.0021780431270599365, -0.0021035075187683105, -0.0020289719104766846, -0.0019544363021850586, -0.0018799006938934326, -0.0018053650856018066, -0.0017308294773101807, -0.0016562938690185547, -0.0015817582607269287, -0.0015072226524353027, -0.0014326870441436768, -0.0013581514358520508, -0.0012836158275604248, -0.0012090802192687988, -0.0011345446109771729, -0.0010600090026855469, -0.000985473394393921, -0.0009109377861022949, -0.0008364021778106689, -0.000761866569519043, -0.000687330961227417, -0.000612795352935791, -0.000538259744644165, -0.00046372413635253906, -0.0003891885280609131, -0.0003146529197692871, -0.00024011731147766113, -0.00016558170318603516, -9.104609489440918e-05, -1.6510486602783203e-05, 5.8025121688842773e-05, 0.00013256072998046875, 0.00020709633827209473, 0.0002816319465637207, 0.0003561675548553467, 0.00043070316314697266, 0.0005052387714385986, 0.0005797743797302246, 0.0006543099880218506, 0.0007288455963134766, 0.0008033812046051025, 0.0008779168128967285, 0.0009524524211883545, 0.0010269880294799805, 0.0011015236377716064, 0.0011760592460632324, 0.0012505948543548584, 0.0013251304626464844, 0.0013996660709381104, 0.0014742016792297363, 0.0015487372875213623, 0.0016232728958129883, 0.0016978085041046143, 0.0017723441123962402, 0.0018468797206878662, 0.0019214153289794922, 0.001995950937271118, 0.002070486545562744, 0.00214502215385437, 0.002219557762145996, 0.002294093370437622, 0.002368628978729248, 0.002443164587020874, 0.0025177001953125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 6.0, 8.0, 11.0, 16.0, 21.0, 31.0, 38.0, 59.0, 71.0, 121.0, 136.0, 209.0, 271.0, 373.0, 566.0, 742.0, 1175.0, 1831.0, 2962.0, 5142.0, 9349.0, 19373.0, 59916.0, 852997.0, 52792.0, 18138.0, 8990.0, 4816.0, 2849.0, 1785.0, 1165.0, 740.0, 544.0, 352.0, 259.0, 192.0, 120.0, 102.0, 80.0, 58.0, 40.0, 36.0, 20.0, 17.0, 11.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0009598731994628906, -0.0009293630719184875, -0.0008988529443740845, -0.0008683428168296814, -0.0008378326892852783, -0.0008073225617408752, -0.0007768124341964722, -0.0007463023066520691, -0.000715792179107666, -0.0006852820515632629, -0.0006547719240188599, -0.0006242617964744568, -0.0005937516689300537, -0.0005632415413856506, -0.0005327314138412476, -0.0005022212862968445, -0.0004717111587524414, -0.00044120103120803833, -0.00041069090366363525, -0.0003801807761192322, -0.0003496706485748291, -0.000319160521030426, -0.00028865039348602295, -0.0002581402659416199, -0.0002276301383972168, -0.00019712001085281372, -0.00016660988330841064, -0.00013609975576400757, -0.00010558962821960449, -7.507950067520142e-05, -4.456937313079834e-05, -1.4059245586395264e-05, 1.6450881958007812e-05, 4.696100950241089e-05, 7.747113704681396e-05, 0.00010798126459121704, 0.00013849139213562012, 0.0001690015196800232, 0.00019951164722442627, 0.00023002177476882935, 0.0002605319023132324, 0.0002910420298576355, 0.0003215521574020386, 0.00035206228494644165, 0.0003825724124908447, 0.0004130825400352478, 0.0004435926675796509, 0.00047410279512405396, 0.000504612922668457, 0.0005351230502128601, 0.0005656331777572632, 0.0005961433053016663, 0.0006266534328460693, 0.0006571635603904724, 0.0006876736879348755, 0.0007181838154792786, 0.0007486939430236816, 0.0007792040705680847, 0.0008097141981124878, 0.0008402243256568909, 0.0008707344532012939, 0.000901244580745697, 0.0009317547082901001, 0.0009622648358345032, 0.0009927749633789062]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 7.0, 9.0, 7.0, 21.0, 15.0, 40.0, 68.0, 64.0, 85.0, 136.0, 121.0, 95.0, 83.0, 76.0, 42.0, 32.0, 26.0, 12.0, 11.0, 10.0, 2.0, 4.0, 3.0, 6.0, 1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.781650543212891e-06, -5.584210157394409e-06, -5.386769771575928e-06, -5.189329385757446e-06, -4.991888999938965e-06, -4.794448614120483e-06, -4.597008228302002e-06, -4.3995678424835205e-06, -4.202127456665039e-06, -4.004687070846558e-06, -3.807246685028076e-06, -3.6098062992095947e-06, -3.4123659133911133e-06, -3.214925527572632e-06, -3.0174851417541504e-06, -2.820044755935669e-06, -2.6226043701171875e-06, -2.425163984298706e-06, -2.2277235984802246e-06, -2.030283212661743e-06, -1.8328428268432617e-06, -1.6354024410247803e-06, -1.4379620552062988e-06, -1.2405216693878174e-06, -1.043081283569336e-06, -8.456408977508545e-07, -6.48200511932373e-07, -4.507601261138916e-07, -2.5331974029541016e-07, -5.587935447692871e-08, 1.4156103134155273e-07, 3.390014171600342e-07, 5.364418029785156e-07, 7.338821887969971e-07, 9.313225746154785e-07, 1.12876296043396e-06, 1.3262033462524414e-06, 1.5236437320709229e-06, 1.7210841178894043e-06, 1.9185245037078857e-06, 2.115964889526367e-06, 2.3134052753448486e-06, 2.51084566116333e-06, 2.7082860469818115e-06, 2.905726432800293e-06, 3.1031668186187744e-06, 3.300607204437256e-06, 3.4980475902557373e-06, 3.6954879760742188e-06, 3.8929283618927e-06, 4.090368747711182e-06, 4.287809133529663e-06, 4.4852495193481445e-06, 4.682689905166626e-06, 4.880130290985107e-06, 5.077570676803589e-06, 5.27501106262207e-06, 5.472451448440552e-06, 5.669891834259033e-06, 5.867332220077515e-06, 6.064772605895996e-06, 6.2622129917144775e-06, 6.459653377532959e-06, 6.6570937633514404e-06, 6.854534149169922e-06]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 6.0, 15.0, 32.0, 34.0, 44.0, 71.0, 94.0, 129.0, 230.0, 313.0, 451.0, 694.0, 1183.0, 1893.0, 3134.0, 5652.0, 10035.0, 20344.0, 53243.0, 843529.0, 60436.0, 21924.0, 10645.0, 5760.0, 3204.0, 1997.0, 1212.0, 721.0, 477.0, 337.0, 211.0, 158.0, 115.0, 64.0, 55.0, 29.0, 17.0, 12.0, 21.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000949859619140625, -0.0009187608957290649, -0.0008876621723175049, -0.0008565634489059448, -0.0008254647254943848, -0.0007943660020828247, -0.0007632672786712646, -0.0007321685552597046, -0.0007010698318481445, -0.0006699711084365845, -0.0006388723850250244, -0.0006077736616134644, -0.0005766749382019043, -0.0005455762147903442, -0.0005144774913787842, -0.0004833787679672241, -0.00045228004455566406, -0.000421181321144104, -0.00039008259773254395, -0.0003589838743209839, -0.00032788515090942383, -0.00029678642749786377, -0.0002656877040863037, -0.00023458898067474365, -0.0002034902572631836, -0.00017239153385162354, -0.00014129281044006348, -0.00011019408702850342, -7.909536361694336e-05, -4.79966402053833e-05, -1.6897916793823242e-05, 1.4200806617736816e-05, 4.5299530029296875e-05, 7.639825344085693e-05, 0.00010749697685241699, 0.00013859570026397705, 0.0001696944236755371, 0.00020079314708709717, 0.00023189187049865723, 0.0002629905939102173, 0.00029408931732177734, 0.0003251880407333374, 0.00035628676414489746, 0.0003873854875564575, 0.0004184842109680176, 0.00044958293437957764, 0.0004806816577911377, 0.0005117803812026978, 0.0005428791046142578, 0.0005739778280258179, 0.0006050765514373779, 0.000636175274848938, 0.000667273998260498, 0.0006983727216720581, 0.0007294714450836182, 0.0007605701684951782, 0.0007916688919067383, 0.0008227676153182983, 0.0008538663387298584, 0.0008849650621414185, 0.0009160637855529785, 0.0009471625089645386, 0.0009782612323760986, 0.0010093599557876587, 0.0010404586791992188]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 4.0, 4.0, 10.0, 5.0, 6.0, 8.0, 5.0, 13.0, 13.0, 15.0, 16.0, 24.0, 199.0, 480.0, 63.0, 19.0, 21.0, 9.0, 10.0, 14.0, 11.0, 9.0, 4.0, 7.0, 11.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00025844573974609375, -0.000251108780503273, -0.00024377182126045227, -0.00023643486201763153, -0.0002290979027748108, -0.00022176094353199005, -0.0002144239842891693, -0.00020708702504634857, -0.00019975006580352783, -0.0001924131065607071, -0.00018507614731788635, -0.0001777391880750656, -0.00017040222883224487, -0.00016306526958942413, -0.0001557283103466034, -0.00014839135110378265, -0.00014105439186096191, -0.00013371743261814117, -0.00012638047337532043, -0.0001190435141324997, -0.00011170655488967896, -0.00010436959564685822, -9.703263640403748e-05, -8.969567716121674e-05, -8.2358717918396e-05, -7.502175867557526e-05, -6.768479943275452e-05, -6.034784018993378e-05, -5.301088094711304e-05, -4.56739217042923e-05, -3.833696246147156e-05, -3.100000321865082e-05, -2.3663043975830078e-05, -1.632608473300934e-05, -8.989125490188599e-06, -1.6521662473678589e-06, 5.684792995452881e-06, 1.302175223827362e-05, 2.035871148109436e-05, 2.76956707239151e-05, 3.503262996673584e-05, 4.236958920955658e-05, 4.970654845237732e-05, 5.704350769519806e-05, 6.43804669380188e-05, 7.171742618083954e-05, 7.905438542366028e-05, 8.639134466648102e-05, 9.372830390930176e-05, 0.0001010652631521225, 0.00010840222239494324, 0.00011573918163776398, 0.00012307614088058472, 0.00013041310012340546, 0.0001377500593662262, 0.00014508701860904694, 0.00015242397785186768, 0.00015976093709468842, 0.00016709789633750916, 0.0001744348555803299, 0.00018177181482315063, 0.00018910877406597137, 0.00019644573330879211, 0.00020378269255161285, 0.0002111196517944336]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 9.0, 8.0, 18.0, 18.0, 21.0, 28.0, 50.0, 49.0, 75.0, 84.0, 121.0, 118.0, 100.0, 80.0, 47.0, 24.0, 32.0, 29.0, 18.0, 17.0, 12.0, 10.0, 6.0, 2.0, 6.0, 2.0, 4.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005534959491342306, -0.005338046699762344, -0.005141133908182383, -0.004944221116602421, -0.004747308790683746, -0.0045503959991037846, -0.004353483207523823, -0.004156570415943861, -0.003959657624363899, -0.0037627448327839375, -0.0035658322740346193, -0.0033689194824546576, -0.0031720069237053394, -0.0029750941321253777, -0.002778181340545416, -0.002581268548965454, -0.0023843562230467796, -0.002187443431466818, -0.0019905308727174997, -0.001793618081137538, -0.001596705405972898, -0.001399792730808258, -0.0012028799392282963, -0.0010059672640636563, -0.0008090545888990164, -0.0006121419137343764, -0.00041522918036207557, -0.0002183164469897747, -2.1403771825134754e-05, 0.0001755089033395052, 0.00037242169491946697, 0.0005693343700841069, 0.0007662470452487469, 0.0009631597204133868, 0.0011600723955780268, 0.0013569851871579885, 0.0015538978623226285, 0.0017508105374872684, 0.0019477233290672302, 0.002144636120647192, 0.00234154867939651, 0.002538461470976472, 0.00273537402972579, 0.002932286821305752, 0.0031291996128857136, 0.0033261121716350317, 0.0035230249632149935, 0.0037199375219643116, 0.003916850313544273, 0.004113763105124235, 0.004310675896704197, 0.004507588222622871, 0.004704501014202833, 0.004901413805782795, 0.005098326597362757, 0.0052952393889427185, 0.005492151714861393, 0.005689064506441355, 0.0058859772980213165, 0.006082889623939991, 0.006279802415519953, 0.0064767152070999146, 0.006673627998679876, 0.006870540790259838, 0.0070674535818398]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 3.0, 7.0, 8.0, 11.0, 11.0, 20.0, 16.0, 13.0, 12.0, 20.0, 14.0, 24.0, 27.0, 30.0, 29.0, 33.0, 27.0, 30.0, 35.0, 46.0, 45.0, 44.0, 39.0, 47.0, 30.0, 36.0, 24.0, 35.0, 30.0, 29.0, 32.0, 24.0, 23.0, 19.0, 19.0, 22.0, 19.0, 17.0, 11.0, 7.0, 8.0, 9.0, 5.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00321229943074286, -0.0031003376934677362, -0.002988375723361969, -0.0028764139860868454, -0.002764452248811722, -0.002652490511536598, -0.002540528541430831, -0.0024285668041557074, -0.00231660483404994, -0.0022046430967748165, -0.0020926811266690493, -0.0019807193893939257, -0.001868757652118802, -0.0017567957984283566, -0.0016448339447379112, -0.0015328722074627876, -0.001420910470187664, -0.0013089486164972186, -0.001196986879222095, -0.0010850250255316496, -0.0009730632300488651, -0.0008611014345660806, -0.0007491395808756351, -0.0006371777853928506, -0.0005252159899100661, -0.0004132541944272816, -0.00030129236984066665, -0.00018933054525405169, -7.736874977126718e-05, 3.4593045711517334e-05, 0.00014655489940196276, 0.00025851669488474727, 0.00037047872319817543, 0.00048244051868095994, 0.0005944023141637444, 0.0007063641678541899, 0.0008183259633369744, 0.0009302877588197589, 0.0010422496125102043, 0.001154211349785328, 0.0012661732034757733, 0.0013781350571662188, 0.0014900967944413424, 0.0016020586481317878, 0.0017140205018222332, 0.0018259822390973568, 0.0019379440927878022, 0.0020499059464782476, 0.0021618676837533712, 0.002273829421028495, 0.002385791391134262, 0.0024977531284093857, 0.0026097148656845093, 0.002721676602959633, 0.0028336385730654, 0.0029456003103405237, 0.003057562280446291, 0.0031695240177214146, 0.003281485987827182, 0.0033934477251023054, 0.003505409462377429, 0.0036173714324831963, 0.00372933316975832, 0.0038412949070334435, 0.003953256644308567]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 8.0, 9.0, 11.0, 15.0, 33.0, 50.0, 74.0, 98.0, 143.0, 192.0, 290.0, 448.0, 631.0, 883.0, 1300.0, 1836.0, 2932.0, 4253.0, 6413.0, 10014.0, 15349.0, 24449.0, 40664.0, 70239.0, 129311.0, 266951.0, 704612.0, 1510322.0, 774910.0, 295217.0, 142399.0, 76904.0, 43432.0, 25694.0, 15826.0, 9807.0, 6371.0, 4129.0, 2690.0, 1795.0, 1250.0, 763.0, 517.0, 364.0, 215.0, 157.0, 107.0, 69.0, 42.0, 34.0, 19.0, 12.0, 12.0, 9.0, 4.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.004138946533203125, -0.003998875617980957, -0.003858804702758789, -0.003718733787536621, -0.003578662872314453, -0.003438591957092285, -0.003298521041870117, -0.0031584501266479492, -0.0030183792114257812, -0.0028783082962036133, -0.0027382373809814453, -0.0025981664657592773, -0.0024580955505371094, -0.0023180246353149414, -0.0021779537200927734, -0.0020378828048706055, -0.0018978118896484375, -0.0017577409744262695, -0.0016176700592041016, -0.0014775991439819336, -0.0013375282287597656, -0.0011974573135375977, -0.0010573863983154297, -0.0009173154830932617, -0.0007772445678710938, -0.0006371736526489258, -0.0004971027374267578, -0.00035703182220458984, -0.00021696090698242188, -7.68899917602539e-05, 6.318092346191406e-05, 0.00020325183868408203, 0.00034332275390625, 0.00048339366912841797, 0.0006234645843505859, 0.0007635354995727539, 0.0009036064147949219, 0.0010436773300170898, 0.0011837482452392578, 0.0013238191604614258, 0.0014638900756835938, 0.0016039609909057617, 0.0017440319061279297, 0.0018841028213500977, 0.0020241737365722656, 0.0021642446517944336, 0.0023043155670166016, 0.0024443864822387695, 0.0025844573974609375, 0.0027245283126831055, 0.0028645992279052734, 0.0030046701431274414, 0.0031447410583496094, 0.0032848119735717773, 0.0034248828887939453, 0.0035649538040161133, 0.0037050247192382812, 0.0038450956344604492, 0.003985166549682617, 0.004125237464904785, 0.004265308380126953, 0.004405379295349121, 0.004545450210571289, 0.004685521125793457, 0.004825592041015625]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 1.0, 2.0, 6.0, 6.0, 6.0, 10.0, 14.0, 16.0, 11.0, 11.0, 13.0, 17.0, 10.0, 23.0, 21.0, 19.0, 30.0, 30.0, 36.0, 32.0, 31.0, 35.0, 27.0, 48.0, 36.0, 47.0, 43.0, 34.0, 33.0, 30.0, 29.0, 28.0, 33.0, 29.0, 33.0, 21.0, 18.0, 11.0, 13.0, 21.0, 17.0, 14.0, 12.0, 9.0, 6.0, 11.0, 6.0, 5.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002124786376953125, -0.0020564496517181396, -0.0019881129264831543, -0.001919776201248169, -0.0018514394760131836, -0.0017831027507781982, -0.0017147660255432129, -0.0016464293003082275, -0.0015780925750732422, -0.0015097558498382568, -0.0014414191246032715, -0.0013730823993682861, -0.0013047456741333008, -0.0012364089488983154, -0.00116807222366333, -0.0010997354984283447, -0.0010313987731933594, -0.000963062047958374, -0.0008947253227233887, -0.0008263885974884033, -0.000758051872253418, -0.0006897151470184326, -0.0006213784217834473, -0.0005530416965484619, -0.00048470497131347656, -0.0004163682460784912, -0.00034803152084350586, -0.0002796947956085205, -0.00021135807037353516, -0.0001430213451385498, -7.468461990356445e-05, -6.3478946685791016e-06, 6.198883056640625e-05, 0.0001303255558013916, 0.00019866228103637695, 0.0002669990062713623, 0.00033533573150634766, 0.000403672456741333, 0.00047200918197631836, 0.0005403459072113037, 0.0006086826324462891, 0.0006770193576812744, 0.0007453560829162598, 0.0008136928081512451, 0.0008820295333862305, 0.0009503662586212158, 0.0010187029838562012, 0.0010870397090911865, 0.0011553764343261719, 0.0012237131595611572, 0.0012920498847961426, 0.001360386610031128, 0.0014287233352661133, 0.0014970600605010986, 0.001565396785736084, 0.0016337335109710693, 0.0017020702362060547, 0.00177040696144104, 0.0018387436866760254, 0.0019070804119110107, 0.001975417137145996, 0.0020437538623809814, 0.002112090587615967, 0.002180427312850952, 0.0022487640380859375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 9.0, 8.0, 12.0, 8.0, 19.0, 27.0, 43.0, 52.0, 58.0, 84.0, 126.0, 221.0, 305.0, 438.0, 658.0, 959.0, 1442.0, 2186.0, 3430.0, 5410.0, 8683.0, 14680.0, 24608.0, 43081.0, 77906.0, 147070.0, 296448.0, 678876.0, 1389109.0, 793754.0, 337002.0, 164463.0, 86042.0, 47934.0, 27228.0, 15900.0, 9305.0, 5914.0, 3750.0, 2333.0, 1503.0, 1051.0, 668.0, 469.0, 307.0, 226.0, 142.0, 88.0, 76.0, 51.0, 45.0, 25.0, 22.0, 13.0, 9.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0], "bins": [-0.004055023193359375, -0.003926634788513184, -0.003798246383666992, -0.0036698579788208008, -0.0035414695739746094, -0.003413081169128418, -0.0032846927642822266, -0.003156304359436035, -0.0030279159545898438, -0.0028995275497436523, -0.002771139144897461, -0.0026427507400512695, -0.002514362335205078, -0.0023859739303588867, -0.0022575855255126953, -0.002129197120666504, -0.0020008087158203125, -0.001872420310974121, -0.0017440319061279297, -0.0016156435012817383, -0.0014872550964355469, -0.0013588666915893555, -0.001230478286743164, -0.0011020898818969727, -0.0009737014770507812, -0.0008453130722045898, -0.0007169246673583984, -0.000588536262512207, -0.0004601478576660156, -0.0003317594528198242, -0.0002033710479736328, -7.49826431274414e-05, 5.340576171875e-05, 0.0001817941665649414, 0.0003101825714111328, 0.0004385709762573242, 0.0005669593811035156, 0.000695347785949707, 0.0008237361907958984, 0.0009521245956420898, 0.0010805130004882812, 0.0012089014053344727, 0.001337289810180664, 0.0014656782150268555, 0.0015940666198730469, 0.0017224550247192383, 0.0018508434295654297, 0.001979231834411621, 0.0021076202392578125, 0.002236008644104004, 0.0023643970489501953, 0.0024927854537963867, 0.002621173858642578, 0.0027495622634887695, 0.002877950668334961, 0.0030063390731811523, 0.0031347274780273438, 0.003263115882873535, 0.0033915042877197266, 0.003519892692565918, 0.0036482810974121094, 0.0037766695022583008, 0.003905057907104492, 0.004033446311950684, 0.004161834716796875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 3.0, 4.0, 5.0, 5.0, 9.0, 18.0, 20.0, 17.0, 22.0, 27.0, 52.0, 34.0, 51.0, 75.0, 86.0, 119.0, 118.0, 147.0, 139.0, 188.0, 232.0, 255.0, 205.0, 248.0, 240.0, 228.0, 231.0, 194.0, 179.0, 161.0, 127.0, 124.0, 93.0, 74.0, 73.0, 71.0, 49.0, 36.0, 30.0, 18.0, 13.0, 12.0, 14.0, 5.0, 3.0, 7.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0012636184692382812, -0.0012249499559402466, -0.001186281442642212, -0.0011476129293441772, -0.0011089444160461426, -0.001070275902748108, -0.0010316073894500732, -0.0009929388761520386, -0.0009542703628540039, -0.0009156018495559692, -0.0008769333362579346, -0.0008382648229598999, -0.0007995963096618652, -0.0007609277963638306, -0.0007222592830657959, -0.0006835907697677612, -0.0006449222564697266, -0.0006062537431716919, -0.0005675852298736572, -0.0005289167165756226, -0.0004902482032775879, -0.0004515796899795532, -0.00041291117668151855, -0.0003742426633834839, -0.0003355741500854492, -0.00029690563678741455, -0.0002582371234893799, -0.00021956861019134521, -0.00018090009689331055, -0.00014223158359527588, -0.00010356307029724121, -6.489455699920654e-05, -2.6226043701171875e-05, 1.2442469596862793e-05, 5.111098289489746e-05, 8.977949619293213e-05, 0.0001284480094909668, 0.00016711652278900146, 0.00020578503608703613, 0.0002444535493850708, 0.00028312206268310547, 0.00032179057598114014, 0.0003604590892791748, 0.00039912760257720947, 0.00043779611587524414, 0.0004764646291732788, 0.0005151331424713135, 0.0005538016557693481, 0.0005924701690673828, 0.0006311386823654175, 0.0006698071956634521, 0.0007084757089614868, 0.0007471442222595215, 0.0007858127355575562, 0.0008244812488555908, 0.0008631497621536255, 0.0009018182754516602, 0.0009404867887496948, 0.0009791553020477295, 0.0010178238153457642, 0.0010564923286437988, 0.0010951608419418335, 0.0011338293552398682, 0.0011724978685379028, 0.0012111663818359375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 9.0, 5.0, 12.0, 10.0, 21.0, 29.0, 40.0, 49.0, 73.0, 122.0, 165.0, 158.0, 116.0, 65.0, 43.0, 33.0, 19.0, 12.0, 11.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005865850951522589, -0.005662374664098024, -0.00545889837667346, -0.005255422554910183, -0.005051946267485619, -0.004848469980061054, -0.00464499369263649, -0.0044415174052119255, -0.0042380415834486485, -0.004034565296024084, -0.0038310892414301634, -0.003627612954005599, -0.0034241368994116783, -0.003220660611987114, -0.0030171843245625496, -0.002813708269968629, -0.0026102319825440645, -0.0024067556951195, -0.0022032796405255795, -0.001999803353101015, -0.0017963272985070944, -0.00159285101108253, -0.0013893748400732875, -0.001185898669064045, -0.0009824224980548024, -0.0007789463270455599, -0.0005754701560363173, -0.0003719939268194139, -0.00016851775581017137, 3.495847340673208e-05, 0.00023843464441597462, 0.00044191081542521715, 0.0006453869864344597, 0.0008488631574437022, 0.0010523393284529448, 0.0012558156158775091, 0.0014592916704714298, 0.0016627679578959942, 0.0018662441289052367, 0.0020697202999144793, 0.0022731963545084, 0.0024766726419329643, 0.002680148696526885, 0.0028836249839514494, 0.00308710103854537, 0.0032905773259699345, 0.003494053613394499, 0.0036975296679884195, 0.003901005955412984, 0.004104482010006905, 0.004307958297431469, 0.004511434584856033, 0.004714910872280598, 0.004918387159705162, 0.005121862981468439, 0.0053253392688930035, 0.005528815556317568, 0.005732291843742132, 0.0059357681311666965, 0.006139243952929974, 0.006342720240354538, 0.006546196527779102, 0.006749672815203667, 0.006953149102628231, 0.007156624924391508]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 6.0, 1.0, 4.0, 10.0, 8.0, 13.0, 11.0, 18.0, 16.0, 16.0, 16.0, 17.0, 19.0, 15.0, 33.0, 31.0, 27.0, 33.0, 40.0, 38.0, 39.0, 42.0, 61.0, 42.0, 37.0, 32.0, 44.0, 37.0, 37.0, 32.0, 34.0, 29.0, 30.0, 23.0, 24.0, 20.0, 13.0, 10.0, 12.0, 11.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025942407082766294, -0.0025094933807849884, -0.0024247460532933474, -0.0023399987258017063, -0.0022552513983100653, -0.0021705040708184242, -0.002085756743326783, -0.002001009415835142, -0.001916262088343501, -0.00183151476085186, -0.001746767433360219, -0.001662020105868578, -0.001577272778376937, -0.0014925254508852959, -0.0014077781233936548, -0.0013230307959020138, -0.0012382834684103727, -0.0011535361409187317, -0.0010687888134270906, -0.0009840414859354496, -0.0008992941584438086, -0.0008145468309521675, -0.0007297995034605265, -0.0006450521759688854, -0.0005603048484772444, -0.00047555752098560333, -0.0003908101934939623, -0.00030606286600232124, -0.0002213155385106802, -0.00013656821101903915, -5.182088352739811e-05, 3.2926443964242935e-05, 0.00011767353862524033, 0.00020242086611688137, 0.0002871681936085224, 0.00037191552110016346, 0.0004566628485918045, 0.0005414101760834455, 0.0006261575035750866, 0.0007109048310667276, 0.0007956521585583687, 0.0008803994860500097, 0.0009651468135416508, 0.0010498941410332918, 0.0011346414685249329, 0.001219388796016574, 0.001304136123508215, 0.001388883450999856, 0.001473630778491497, 0.001558378105983138, 0.0016431254334747791, 0.0017278727609664202, 0.0018126200884580612, 0.0018973674159497023, 0.0019821147434413433, 0.0020668620709329844, 0.0021516093984246254, 0.0022363567259162664, 0.0023211040534079075, 0.0024058513808995485, 0.0024905987083911896, 0.0025753460358828306, 0.0026600933633744717, 0.0027448406908661127, 0.0028295880183577538]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 10.0, 18.0, 30.0, 70.0, 79.0, 124.0, 226.0, 371.0, 609.0, 949.0, 1677.0, 2916.0, 5060.0, 8876.0, 16217.0, 29885.0, 55315.0, 108634.0, 230467.0, 287692.0, 144141.0, 71033.0, 37634.0, 20189.0, 11068.0, 6270.0, 3623.0, 2114.0, 1298.0, 744.0, 448.0, 293.0, 170.0, 84.0, 79.0, 51.0, 33.0, 19.0, 12.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00579071044921875, -0.005616247653961182, -0.005441784858703613, -0.005267322063446045, -0.0050928592681884766, -0.004918396472930908, -0.00474393367767334, -0.0045694708824157715, -0.004395008087158203, -0.004220545291900635, -0.004046082496643066, -0.003871619701385498, -0.0036971569061279297, -0.0035226941108703613, -0.003348231315612793, -0.0031737685203552246, -0.0029993057250976562, -0.002824842929840088, -0.0026503801345825195, -0.002475917339324951, -0.002301454544067383, -0.0021269917488098145, -0.001952528953552246, -0.0017780661582946777, -0.0016036033630371094, -0.001429140567779541, -0.0012546777725219727, -0.0010802149772644043, -0.0009057521820068359, -0.0007312893867492676, -0.0005568265914916992, -0.00038236379623413086, -0.0002079010009765625, -3.343820571899414e-05, 0.00014102458953857422, 0.0003154873847961426, 0.0004899501800537109, 0.0006644129753112793, 0.0008388757705688477, 0.001013338565826416, 0.0011878013610839844, 0.0013622641563415527, 0.001536726951599121, 0.0017111897468566895, 0.0018856525421142578, 0.002060115337371826, 0.0022345781326293945, 0.002409040927886963, 0.0025835037231445312, 0.0027579665184020996, 0.002932429313659668, 0.0031068921089172363, 0.0032813549041748047, 0.003455817699432373, 0.0036302804946899414, 0.0038047432899475098, 0.003979206085205078, 0.0041536688804626465, 0.004328131675720215, 0.004502594470977783, 0.0046770572662353516, 0.00485152006149292, 0.005025982856750488, 0.005200445652008057, 0.005374908447265625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 7.0, 2.0, 5.0, 8.0, 11.0, 18.0, 9.0, 14.0, 16.0, 16.0, 20.0, 19.0, 31.0, 33.0, 26.0, 37.0, 33.0, 30.0, 50.0, 34.0, 37.0, 64.0, 47.0, 35.0, 38.0, 45.0, 38.0, 38.0, 36.0, 38.0, 30.0, 23.0, 32.0, 13.0, 15.0, 13.0, 8.0, 14.0, 6.0, 5.0, 5.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00258636474609375, -0.0025066733360290527, -0.0024269819259643555, -0.002347290515899658, -0.002267599105834961, -0.0021879076957702637, -0.0021082162857055664, -0.002028524875640869, -0.0019488334655761719, -0.0018691420555114746, -0.0017894506454467773, -0.00170975923538208, -0.0016300678253173828, -0.0015503764152526855, -0.0014706850051879883, -0.001390993595123291, -0.0013113021850585938, -0.0012316107749938965, -0.0011519193649291992, -0.001072227954864502, -0.0009925365447998047, -0.0009128451347351074, -0.0008331537246704102, -0.0007534623146057129, -0.0006737709045410156, -0.0005940794944763184, -0.0005143880844116211, -0.00043469667434692383, -0.00035500526428222656, -0.0002753138542175293, -0.00019562244415283203, -0.00011593103408813477, -3.62396240234375e-05, 4.3451786041259766e-05, 0.00012314319610595703, 0.0002028346061706543, 0.00028252601623535156, 0.00036221742630004883, 0.0004419088363647461, 0.0005216002464294434, 0.0006012916564941406, 0.0006809830665588379, 0.0007606744766235352, 0.0008403658866882324, 0.0009200572967529297, 0.000999748706817627, 0.0010794401168823242, 0.0011591315269470215, 0.0012388229370117188, 0.001318514347076416, 0.0013982057571411133, 0.0014778971672058105, 0.0015575885772705078, 0.001637279987335205, 0.0017169713973999023, 0.0017966628074645996, 0.0018763542175292969, 0.001956045627593994, 0.0020357370376586914, 0.0021154284477233887, 0.002195119857788086, 0.002274811267852783, 0.0023545026779174805, 0.0024341940879821777, 0.002513885498046875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 9.0, 18.0, 20.0, 30.0, 52.0, 83.0, 165.0, 239.0, 408.0, 671.0, 1223.0, 2199.0, 4364.0, 9044.0, 22729.0, 77282.0, 531563.0, 312133.0, 53596.0, 17353.0, 7257.0, 3549.0, 1919.0, 1064.0, 672.0, 376.0, 211.0, 127.0, 78.0, 46.0, 26.0, 13.0, 7.0, 7.0, 3.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0087127685546875, -0.008388519287109375, -0.00806427001953125, -0.007740020751953125, -0.007415771484375, -0.007091522216796875, -0.00676727294921875, -0.006443023681640625, -0.0061187744140625, -0.005794525146484375, -0.00547027587890625, -0.005146026611328125, -0.00482177734375, -0.004497528076171875, -0.00417327880859375, -0.003849029541015625, -0.0035247802734375, -0.003200531005859375, -0.00287628173828125, -0.002552032470703125, -0.002227783203125, -0.001903533935546875, -0.00157928466796875, -0.001255035400390625, -0.0009307861328125, -0.000606536865234375, -0.00028228759765625, 4.1961669921875e-05, 0.0003662109375, 0.000690460205078125, 0.00101470947265625, 0.001338958740234375, 0.0016632080078125, 0.001987457275390625, 0.00231170654296875, 0.002635955810546875, 0.002960205078125, 0.003284454345703125, 0.00360870361328125, 0.003932952880859375, 0.0042572021484375, 0.004581451416015625, 0.00490570068359375, 0.005229949951171875, 0.00555419921875, 0.005878448486328125, 0.00620269775390625, 0.006526947021484375, 0.0068511962890625, 0.007175445556640625, 0.00749969482421875, 0.007823944091796875, 0.008148193359375, 0.008472442626953125, 0.00879669189453125, 0.009120941162109375, 0.0094451904296875, 0.009769439697265625, 0.01009368896484375, 0.010417938232421875, 0.0107421875, 0.011066436767578125, 0.01139068603515625, 0.011714935302734375, 0.0120391845703125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 3.0, 3.0, 9.0, 9.0, 13.0, 14.0, 18.0, 12.0, 27.0, 19.0, 36.0, 27.0, 38.0, 35.0, 36.0, 49.0, 50.0, 47.0, 41.0, 46.0, 31.0, 44.0, 51.0, 52.0, 31.0, 39.0, 33.0, 40.0, 30.0, 18.0, 15.0, 21.0, 19.0, 12.0, 16.0, 6.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016317367553710938, -0.0015757977962493896, -0.0015198588371276855, -0.0014639198780059814, -0.0014079809188842773, -0.0013520419597625732, -0.0012961030006408691, -0.001240164041519165, -0.001184225082397461, -0.0011282861232757568, -0.0010723471641540527, -0.0010164082050323486, -0.0009604692459106445, -0.0009045302867889404, -0.0008485913276672363, -0.0007926523685455322, -0.0007367134094238281, -0.000680774450302124, -0.0006248354911804199, -0.0005688965320587158, -0.0005129575729370117, -0.0004570186138153076, -0.0004010796546936035, -0.0003451406955718994, -0.0002892017364501953, -0.0002332627773284912, -0.0001773238182067871, -0.00012138485908508301, -6.54458999633789e-05, -9.506940841674805e-06, 4.64320182800293e-05, 0.0001023709774017334, 0.0001583099365234375, 0.0002142488956451416, 0.0002701878547668457, 0.0003261268138885498, 0.0003820657730102539, 0.000438004732131958, 0.0004939436912536621, 0.0005498826503753662, 0.0006058216094970703, 0.0006617605686187744, 0.0007176995277404785, 0.0007736384868621826, 0.0008295774459838867, 0.0008855164051055908, 0.0009414553642272949, 0.000997394323348999, 0.0010533332824707031, 0.0011092722415924072, 0.0011652112007141113, 0.0012211501598358154, 0.0012770891189575195, 0.0013330280780792236, 0.0013889670372009277, 0.0014449059963226318, 0.001500844955444336, 0.00155678391456604, 0.0016127228736877441, 0.0016686618328094482, 0.0017246007919311523, 0.0017805397510528564, 0.0018364787101745605, 0.0018924176692962646, 0.0019483566284179688]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 11.0, 13.0, 15.0, 31.0, 61.0, 65.0, 110.0, 160.0, 286.0, 414.0, 707.0, 1144.0, 1744.0, 3018.0, 5835.0, 13528.0, 41447.0, 231453.0, 629631.0, 79426.0, 21337.0, 8051.0, 4070.0, 2296.0, 1388.0, 848.0, 502.0, 361.0, 204.0, 140.0, 73.0, 57.0, 36.0, 22.0, 22.0, 16.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.0024471282958984375, -0.0023813843727111816, -0.0023156404495239258, -0.00224989652633667, -0.002184152603149414, -0.002118408679962158, -0.0020526647567749023, -0.0019869208335876465, -0.0019211769104003906, -0.0018554329872131348, -0.001789689064025879, -0.001723945140838623, -0.0016582012176513672, -0.0015924572944641113, -0.0015267133712768555, -0.0014609694480895996, -0.0013952255249023438, -0.0013294816017150879, -0.001263737678527832, -0.0011979937553405762, -0.0011322498321533203, -0.0010665059089660645, -0.0010007619857788086, -0.0009350180625915527, -0.0008692741394042969, -0.000803530216217041, -0.0007377862930297852, -0.0006720423698425293, -0.0006062984466552734, -0.0005405545234680176, -0.0004748106002807617, -0.00040906667709350586, -0.00034332275390625, -0.00027757883071899414, -0.00021183490753173828, -0.00014609098434448242, -8.034706115722656e-05, -1.4603137969970703e-05, 5.1140785217285156e-05, 0.00011688470840454102, 0.00018262863159179688, 0.00024837255477905273, 0.0003141164779663086, 0.00037986040115356445, 0.0004456043243408203, 0.0005113482475280762, 0.000577092170715332, 0.0006428360939025879, 0.0007085800170898438, 0.0007743239402770996, 0.0008400678634643555, 0.0009058117866516113, 0.0009715557098388672, 0.001037299633026123, 0.001103043556213379, 0.0011687874794006348, 0.0012345314025878906, 0.0013002753257751465, 0.0013660192489624023, 0.0014317631721496582, 0.001497507095336914, 0.00156325101852417, 0.0016289949417114258, 0.0016947388648986816, 0.0017604827880859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 0.0, 6.0, 7.0, 7.0, 11.0, 12.0, 18.0, 24.0, 37.0, 42.0, 68.0, 59.0, 75.0, 91.0, 102.0, 95.0, 82.0, 55.0, 52.0, 38.0, 39.0, 21.0, 9.0, 16.0, 6.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.0517578125e-05, -2.971850335597992e-05, -2.891942858695984e-05, -2.8120353817939758e-05, -2.7321279048919678e-05, -2.6522204279899597e-05, -2.5723129510879517e-05, -2.4924054741859436e-05, -2.4124979972839355e-05, -2.3325905203819275e-05, -2.2526830434799194e-05, -2.1727755665779114e-05, -2.0928680896759033e-05, -2.0129606127738953e-05, -1.9330531358718872e-05, -1.853145658969879e-05, -1.773238182067871e-05, -1.693330705165863e-05, -1.613423228263855e-05, -1.533515751361847e-05, -1.4536082744598389e-05, -1.3737007975578308e-05, -1.2937933206558228e-05, -1.2138858437538147e-05, -1.1339783668518066e-05, -1.0540708899497986e-05, -9.741634130477905e-06, -8.942559361457825e-06, -8.143484592437744e-06, -7.3444098234176636e-06, -6.545335054397583e-06, -5.7462602853775024e-06, -4.947185516357422e-06, -4.148110747337341e-06, -3.3490359783172607e-06, -2.54996120929718e-06, -1.7508864402770996e-06, -9.51811671257019e-07, -1.5273690223693848e-07, 6.463378667831421e-07, 1.4454126358032227e-06, 2.2444874048233032e-06, 3.043562173843384e-06, 3.842636942863464e-06, 4.641711711883545e-06, 5.4407864809036255e-06, 6.239861249923706e-06, 7.038936018943787e-06, 7.838010787963867e-06, 8.637085556983948e-06, 9.436160326004028e-06, 1.0235235095024109e-05, 1.103430986404419e-05, 1.183338463306427e-05, 1.263245940208435e-05, 1.3431534171104431e-05, 1.4230608940124512e-05, 1.5029683709144592e-05, 1.5828758478164673e-05, 1.6627833247184753e-05, 1.7426908016204834e-05, 1.8225982785224915e-05, 1.9025057554244995e-05, 1.9824132323265076e-05, 2.0623207092285156e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 13.0, 19.0, 23.0, 33.0, 43.0, 82.0, 106.0, 179.0, 247.0, 359.0, 560.0, 748.0, 1193.0, 1716.0, 2618.0, 4330.0, 6808.0, 12029.0, 22412.0, 47493.0, 121749.0, 419535.0, 250934.0, 79218.0, 33992.0, 16986.0, 9357.0, 5523.0, 3484.0, 2255.0, 1479.0, 1013.0, 643.0, 389.0, 320.0, 217.0, 131.0, 93.0, 87.0, 39.0, 34.0, 17.0, 9.0, 12.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0008344650268554688, -0.000809013843536377, -0.0007835626602172852, -0.0007581114768981934, -0.0007326602935791016, -0.0007072091102600098, -0.000681757926940918, -0.0006563067436218262, -0.0006308555603027344, -0.0006054043769836426, -0.0005799531936645508, -0.000554502010345459, -0.0005290508270263672, -0.0005035996437072754, -0.0004781484603881836, -0.0004526972770690918, -0.00042724609375, -0.0004017949104309082, -0.0003763437271118164, -0.0003508925437927246, -0.0003254413604736328, -0.000299990177154541, -0.0002745389938354492, -0.0002490878105163574, -0.00022363662719726562, -0.00019818544387817383, -0.00017273426055908203, -0.00014728307723999023, -0.00012183189392089844, -9.638071060180664e-05, -7.092952728271484e-05, -4.547834396362305e-05, -2.002716064453125e-05, 5.424022674560547e-06, 3.0875205993652344e-05, 5.632638931274414e-05, 8.177757263183594e-05, 0.00010722875595092773, 0.00013267993927001953, 0.00015813112258911133, 0.00018358230590820312, 0.00020903348922729492, 0.00023448467254638672, 0.0002599358558654785, 0.0002853870391845703, 0.0003108382225036621, 0.0003362894058227539, 0.0003617405891418457, 0.0003871917724609375, 0.0004126429557800293, 0.0004380941390991211, 0.0004635453224182129, 0.0004889965057373047, 0.0005144476890563965, 0.0005398988723754883, 0.0005653500556945801, 0.0005908012390136719, 0.0006162524223327637, 0.0006417036056518555, 0.0006671547889709473, 0.0006926059722900391, 0.0007180571556091309, 0.0007435083389282227, 0.0007689595222473145, 0.0007944107055664062]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 8.0, 1.0, 8.0, 9.0, 8.0, 14.0, 21.0, 18.0, 21.0, 26.0, 20.0, 35.0, 51.0, 46.0, 59.0, 69.0, 73.0, 68.0, 82.0, 67.0, 46.0, 63.0, 28.0, 35.0, 22.0, 27.0, 25.0, 11.0, 9.0, 9.0, 9.0, 6.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00020945072174072266, -0.00020335428416728973, -0.0001972578465938568, -0.0001911614090204239, -0.00018506497144699097, -0.00017896853387355804, -0.00017287209630012512, -0.0001667756587266922, -0.00016067922115325928, -0.00015458278357982635, -0.00014848634600639343, -0.0001423899084329605, -0.0001362934708595276, -0.00013019703328609467, -0.00012410059571266174, -0.00011800415813922882, -0.0001119077205657959, -0.00010581128299236298, -9.971484541893005e-05, -9.361840784549713e-05, -8.752197027206421e-05, -8.142553269863129e-05, -7.532909512519836e-05, -6.923265755176544e-05, -6.313621997833252e-05, -5.70397824048996e-05, -5.0943344831466675e-05, -4.484690725803375e-05, -3.875046968460083e-05, -3.265403211116791e-05, -2.6557594537734985e-05, -2.0461156964302063e-05, -1.436471939086914e-05, -8.268281817436218e-06, -2.171844244003296e-06, 3.9245933294296265e-06, 1.0021030902862549e-05, 1.611746847629547e-05, 2.2213906049728394e-05, 2.8310343623161316e-05, 3.440678119659424e-05, 4.050321877002716e-05, 4.659965634346008e-05, 5.2696093916893005e-05, 5.879253149032593e-05, 6.488896906375885e-05, 7.098540663719177e-05, 7.70818442106247e-05, 8.317828178405762e-05, 8.927471935749054e-05, 9.537115693092346e-05, 0.00010146759450435638, 0.0001075640320777893, 0.00011366046965122223, 0.00011975690722465515, 0.00012585334479808807, 0.000131949782371521, 0.00013804621994495392, 0.00014414265751838684, 0.00015023909509181976, 0.00015633553266525269, 0.0001624319702386856, 0.00016852840781211853, 0.00017462484538555145, 0.00018072128295898438]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 7.0, 12.0, 8.0, 17.0, 20.0, 27.0, 38.0, 43.0, 79.0, 119.0, 163.0, 128.0, 110.0, 63.0, 45.0, 33.0, 26.0, 12.0, 15.0, 8.0, 5.0, 8.0, 6.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003399189794436097, -0.0032499174121767282, -0.003100645262748003, -0.002951372880488634, -0.002802100731059909, -0.00265282834880054, -0.0025035561993718147, -0.002354283817112446, -0.002205011434853077, -0.002055739052593708, -0.0019064669031649828, -0.001757194520905614, -0.0016079223714768887, -0.0014586499892175198, -0.0013093777233734727, -0.0011601054575294256, -0.0010108333081007004, -0.0008615610422566533, -0.0007122887764126062, -0.0005630164523608983, -0.0004137441865168512, -0.0002644719206728041, -0.00011519959662109613, 3.4072669222950935e-05, 0.000183344935066998, 0.0003326172009110451, 0.0004818894958589226, 0.0006311617908068001, 0.0007804340566508472, 0.0009297063224948943, 0.0010789786465466022, 0.0012282509123906493, 0.00137752341106534, 0.0015267956769093871, 0.0016760679427534342, 0.001825340325012803, 0.0019746124744415283, 0.002123884856700897, 0.002273157238960266, 0.0024224293883889914, 0.0025717015378177166, 0.0027209739200770855, 0.0028702460695058107, 0.0030195184517651796, 0.003168790601193905, 0.0033180629834532738, 0.0034673353657126427, 0.003616607515141368, 0.003765879897400737, 0.003915152046829462, 0.004064424429088831, 0.0042136968113482, 0.004362969193607569, 0.00451224111020565, 0.004661513492465019, 0.004810785874724388, 0.004960058256983757, 0.005109330639243126, 0.005258603021502495, 0.005407874938100576, 0.005557147320359945, 0.005706419702619314, 0.005855692084878683, 0.006004964001476765, 0.006154236383736134]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 9.0, 9.0, 17.0, 16.0, 17.0, 17.0, 15.0, 16.0, 17.0, 21.0, 30.0, 28.0, 29.0, 35.0, 44.0, 40.0, 39.0, 43.0, 57.0, 46.0, 29.0, 41.0, 39.0, 39.0, 34.0, 40.0, 26.0, 34.0, 29.0, 30.0, 18.0, 20.0, 11.0, 10.0, 9.0, 13.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002225827192887664, -0.0021506878547370434, -0.0020755482837557793, -0.002000408945605159, -0.0019252696074545383, -0.001850130152888596, -0.0017749906983226538, -0.0016998513601720333, -0.001624711905606091, -0.0015495724510401487, -0.0014744331128895283, -0.001399293658323586, -0.0013241542037576437, -0.0012490148656070232, -0.001173875411041081, -0.0010987359564751387, -0.0010235966183245182, -0.0009484572219662368, -0.0008733178256079555, -0.0007981783710420132, -0.0007230389746837318, -0.0006478995783254504, -0.0005727601237595081, -0.0004976207274012268, -0.0004224813310429454, -0.000347341934684664, -0.0002722025092225522, -0.00019706309831235558, -0.00012192368740215898, -4.67842910438776e-05, 2.835513441823423e-05, 0.00010349455988034606, 0.0001786341890692711, 0.00025377358542755246, 0.0003289130108896643, 0.0004040524363517761, 0.0004791918327100575, 0.0005543312290683389, 0.0006294706836342812, 0.0007046100799925625, 0.0007797494763508439, 0.0008548888727091253, 0.0009300282690674067, 0.001005167723633349, 0.0010803071781992912, 0.0011554465163499117, 0.001230585970915854, 0.0013057254254817963, 0.0013808647636324167, 0.001456004218198359, 0.0015311435563489795, 0.0016062830109149218, 0.0016814223490655422, 0.0017565618036314845, 0.0018317012581974268, 0.0019068405963480473, 0.0019819801673293114, 0.002057119505479932, 0.002132259076461196, 0.0022073984146118164, 0.002282537752762437, 0.0023576770909130573, 0.0024328166618943214, 0.002507956000044942, 0.0025830953381955624]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 12.0, 6.0, 13.0, 20.0, 31.0, 26.0, 47.0, 68.0, 112.0, 138.0, 214.0, 307.0, 515.0, 764.0, 1195.0, 1914.0, 3294.0, 5271.0, 8605.0, 13354.0, 22422.0, 37395.0, 64783.0, 116266.0, 210795.0, 236668.0, 137883.0, 75991.0, 43434.0, 25742.0, 15729.0, 9614.0, 6085.0, 3630.0, 2293.0, 1378.0, 843.0, 569.0, 374.0, 244.0, 153.0, 93.0, 84.0, 54.0, 33.0, 36.0, 19.0, 11.0, 9.0, 9.0, 3.0, 3.0, 1.0, 0.0, 4.0, 4.0], "bins": [-0.004436492919921875, -0.004302620887756348, -0.00416874885559082, -0.004034876823425293, -0.0039010047912597656, -0.0037671327590942383, -0.003633260726928711, -0.0034993886947631836, -0.0033655166625976562, -0.003231644630432129, -0.0030977725982666016, -0.0029639005661010742, -0.002830028533935547, -0.0026961565017700195, -0.002562284469604492, -0.002428412437438965, -0.0022945404052734375, -0.00216066837310791, -0.002026796340942383, -0.0018929243087768555, -0.0017590522766113281, -0.0016251802444458008, -0.0014913082122802734, -0.001357436180114746, -0.0012235641479492188, -0.0010896921157836914, -0.0009558200836181641, -0.0008219480514526367, -0.0006880760192871094, -0.000554203987121582, -0.0004203319549560547, -0.00028645992279052734, -0.000152587890625, -1.8715858459472656e-05, 0.00011515617370605469, 0.00024902820587158203, 0.0003829002380371094, 0.0005167722702026367, 0.0006506443023681641, 0.0007845163345336914, 0.0009183883666992188, 0.001052260398864746, 0.0011861324310302734, 0.0013200044631958008, 0.0014538764953613281, 0.0015877485275268555, 0.0017216205596923828, 0.0018554925918579102, 0.0019893646240234375, 0.002123236656188965, 0.002257108688354492, 0.0023909807205200195, 0.002524852752685547, 0.0026587247848510742, 0.0027925968170166016, 0.002926468849182129, 0.0030603408813476562, 0.0031942129135131836, 0.003328084945678711, 0.0034619569778442383, 0.0035958290100097656, 0.003729701042175293, 0.0038635730743408203, 0.003997445106506348, 0.004131317138671875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 4.0, 10.0, 9.0, 10.0, 16.0, 12.0, 16.0, 15.0, 17.0, 21.0, 21.0, 21.0, 39.0, 24.0, 27.0, 35.0, 60.0, 22.0, 46.0, 36.0, 44.0, 41.0, 34.0, 42.0, 50.0, 34.0, 37.0, 25.0, 35.0, 29.0, 20.0, 22.0, 15.0, 26.0, 10.0, 12.0, 11.0, 10.0, 11.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0018672943115234375, -0.0018113404512405396, -0.0017553865909576416, -0.0016994327306747437, -0.0016434788703918457, -0.0015875250101089478, -0.0015315711498260498, -0.0014756172895431519, -0.001419663429260254, -0.001363709568977356, -0.001307755708694458, -0.00125180184841156, -0.0011958479881286621, -0.0011398941278457642, -0.0010839402675628662, -0.0010279864072799683, -0.0009720325469970703, -0.0009160786867141724, -0.0008601248264312744, -0.0008041709661483765, -0.0007482171058654785, -0.0006922632455825806, -0.0006363093852996826, -0.0005803555250167847, -0.0005244016647338867, -0.00046844780445098877, -0.0004124939441680908, -0.00035654008388519287, -0.0003005862236022949, -0.00024463236331939697, -0.00018867850303649902, -0.00013272464275360107, -7.677078247070312e-05, -2.0816922187805176e-05, 3.5136938095092773e-05, 9.109079837799072e-05, 0.00014704465866088867, 0.00020299851894378662, 0.00025895237922668457, 0.0003149062395095825, 0.00037086009979248047, 0.0004268139600753784, 0.00048276782035827637, 0.0005387216806411743, 0.0005946755409240723, 0.0006506294012069702, 0.0007065832614898682, 0.0007625371217727661, 0.0008184909820556641, 0.000874444842338562, 0.00093039870262146, 0.000986352562904358, 0.0010423064231872559, 0.0010982602834701538, 0.0011542141437530518, 0.0012101680040359497, 0.0012661218643188477, 0.0013220757246017456, 0.0013780295848846436, 0.0014339834451675415, 0.0014899373054504395, 0.0015458911657333374, 0.0016018450260162354, 0.0016577988862991333, 0.0017137527465820312]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 9.0, 13.0, 8.0, 22.0, 42.0, 45.0, 89.0, 95.0, 193.0, 309.0, 519.0, 845.0, 1352.0, 2448.0, 4053.0, 6751.0, 11174.0, 19624.0, 34149.0, 63495.0, 125192.0, 249357.0, 253434.0, 127864.0, 64415.0, 34955.0, 19590.0, 11490.0, 6941.0, 4126.0, 2349.0, 1429.0, 848.0, 520.0, 308.0, 185.0, 101.0, 85.0, 36.0, 35.0, 25.0, 15.0, 11.0, 3.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00466156005859375, -0.00452035665512085, -0.004379153251647949, -0.004237949848175049, -0.0040967464447021484, -0.003955543041229248, -0.0038143396377563477, -0.0036731362342834473, -0.003531932830810547, -0.0033907294273376465, -0.003249526023864746, -0.0031083226203918457, -0.0029671192169189453, -0.002825915813446045, -0.0026847124099731445, -0.002543509006500244, -0.0024023056030273438, -0.0022611021995544434, -0.002119898796081543, -0.0019786953926086426, -0.0018374919891357422, -0.0016962885856628418, -0.0015550851821899414, -0.001413881778717041, -0.0012726783752441406, -0.0011314749717712402, -0.0009902715682983398, -0.0008490681648254395, -0.0007078647613525391, -0.0005666613578796387, -0.0004254579544067383, -0.0002842545509338379, -0.0001430511474609375, -1.8477439880371094e-06, 0.00013935565948486328, 0.00028055906295776367, 0.00042176246643066406, 0.0005629658699035645, 0.0007041692733764648, 0.0008453726768493652, 0.0009865760803222656, 0.001127779483795166, 0.0012689828872680664, 0.0014101862907409668, 0.0015513896942138672, 0.0016925930976867676, 0.001833796501159668, 0.0019749999046325684, 0.0021162033081054688, 0.002257406711578369, 0.0023986101150512695, 0.00253981351852417, 0.0026810169219970703, 0.0028222203254699707, 0.002963423728942871, 0.0031046271324157715, 0.003245830535888672, 0.0033870339393615723, 0.0035282373428344727, 0.003669440746307373, 0.0038106441497802734, 0.003951847553253174, 0.004093050956726074, 0.004234254360198975, 0.004375457763671875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 7.0, 11.0, 9.0, 8.0, 16.0, 20.0, 10.0, 21.0, 22.0, 28.0, 22.0, 19.0, 34.0, 34.0, 39.0, 30.0, 49.0, 43.0, 43.0, 41.0, 33.0, 30.0, 40.0, 35.0, 41.0, 36.0, 27.0, 28.0, 26.0, 30.0, 33.0, 20.0, 16.0, 23.0, 18.0, 8.0, 6.0, 8.0, 4.0, 9.0, 5.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001110076904296875, -0.0010740309953689575, -0.00103798508644104, -0.0010019391775131226, -0.0009658932685852051, -0.0009298473596572876, -0.0008938014507293701, -0.0008577555418014526, -0.0008217096328735352, -0.0007856637239456177, -0.0007496178150177002, -0.0007135719060897827, -0.0006775259971618652, -0.0006414800882339478, -0.0006054341793060303, -0.0005693882703781128, -0.0005333423614501953, -0.0004972964525222778, -0.00046125054359436035, -0.00042520463466644287, -0.0003891587257385254, -0.0003531128168106079, -0.00031706690788269043, -0.00028102099895477295, -0.00024497509002685547, -0.000208929181098938, -0.0001728832721710205, -0.00013683736324310303, -0.00010079145431518555, -6.474554538726807e-05, -2.8699636459350586e-05, 7.3462724685668945e-06, 4.3392181396484375e-05, 7.943809032440186e-05, 0.00011548399925231934, 0.00015152990818023682, 0.0001875758171081543, 0.00022362172603607178, 0.00025966763496398926, 0.00029571354389190674, 0.0003317594528198242, 0.0003678053617477417, 0.0004038512706756592, 0.00043989717960357666, 0.00047594308853149414, 0.0005119889974594116, 0.0005480349063873291, 0.0005840808153152466, 0.0006201267242431641, 0.0006561726331710815, 0.000692218542098999, 0.0007282644510269165, 0.000764310359954834, 0.0008003562688827515, 0.0008364021778106689, 0.0008724480867385864, 0.0009084939956665039, 0.0009445399045944214, 0.0009805858135223389, 0.0010166317224502563, 0.0010526776313781738, 0.0010887235403060913, 0.0011247694492340088, 0.0011608153581619263, 0.0011968612670898438]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 5.0, 9.0, 20.0, 20.0, 27.0, 38.0, 55.0, 74.0, 101.0, 146.0, 186.0, 222.0, 304.0, 425.0, 588.0, 823.0, 1182.0, 1919.0, 3096.0, 5750.0, 10881.0, 27598.0, 929868.0, 36025.0, 12682.0, 6304.0, 3527.0, 2086.0, 1299.0, 906.0, 634.0, 451.0, 338.0, 272.0, 159.0, 125.0, 123.0, 70.0, 67.0, 42.0, 30.0, 19.0, 22.0, 7.0, 7.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0008387565612792969, -0.000813022255897522, -0.0007872879505157471, -0.0007615536451339722, -0.0007358193397521973, -0.0007100850343704224, -0.0006843507289886475, -0.0006586164236068726, -0.0006328821182250977, -0.0006071478128433228, -0.0005814135074615479, -0.000555679202079773, -0.000529944896697998, -0.0005042105913162231, -0.00047847628593444824, -0.00045274198055267334, -0.00042700767517089844, -0.00040127336978912354, -0.00037553906440734863, -0.00034980475902557373, -0.00032407045364379883, -0.0002983361482620239, -0.000272601842880249, -0.0002468675374984741, -0.00022113323211669922, -0.00019539892673492432, -0.00016966462135314941, -0.0001439303159713745, -0.00011819601058959961, -9.246170520782471e-05, -6.67273998260498e-05, -4.09930944442749e-05, -1.52587890625e-05, 1.0475516319274902e-05, 3.6209821701049805e-05, 6.194412708282471e-05, 8.767843246459961e-05, 0.00011341273784637451, 0.00013914704322814941, 0.00016488134860992432, 0.00019061565399169922, 0.00021634995937347412, 0.00024208426475524902, 0.0002678185701370239, 0.00029355287551879883, 0.00031928718090057373, 0.00034502148628234863, 0.00037075579166412354, 0.00039649009704589844, 0.00042222440242767334, 0.00044795870780944824, 0.00047369301319122314, 0.000499427318572998, 0.000525161623954773, 0.0005508959293365479, 0.0005766302347183228, 0.0006023645401000977, 0.0006280988454818726, 0.0006538331508636475, 0.0006795674562454224, 0.0007053017616271973, 0.0007310360670089722, 0.0007567703723907471, 0.000782504677772522, 0.0008082389831542969]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 10.0, 6.0, 6.0, 18.0, 8.0, 8.0, 23.0, 11.0, 25.0, 11.0, 21.0, 45.0, 24.0, 71.0, 52.0, 56.0, 109.0, 64.0, 89.0, 38.0, 24.0, 66.0, 27.0, 41.0, 18.0, 16.0, 32.0, 8.0, 7.0, 17.0, 7.0, 8.0, 2.0, 4.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8014183044433594e-06, -2.7185305953025818e-06, -2.635642886161804e-06, -2.5527551770210266e-06, -2.469867467880249e-06, -2.3869797587394714e-06, -2.304092049598694e-06, -2.2212043404579163e-06, -2.1383166313171387e-06, -2.055428922176361e-06, -1.9725412130355835e-06, -1.889653503894806e-06, -1.8067657947540283e-06, -1.7238780856132507e-06, -1.6409903764724731e-06, -1.5581026673316956e-06, -1.475214958190918e-06, -1.3923272490501404e-06, -1.3094395399093628e-06, -1.2265518307685852e-06, -1.1436641216278076e-06, -1.06077641248703e-06, -9.778887033462524e-07, -8.950009942054749e-07, -8.121132850646973e-07, -7.292255759239197e-07, -6.463378667831421e-07, -5.634501576423645e-07, -4.805624485015869e-07, -3.976747393608093e-07, -3.1478703022003174e-07, -2.3189932107925415e-07, -1.4901161193847656e-07, -6.612390279769897e-08, 1.6763806343078613e-08, 9.96515154838562e-08, 1.825392246246338e-07, 2.654269337654114e-07, 3.4831464290618896e-07, 4.3120235204696655e-07, 5.140900611877441e-07, 5.969777703285217e-07, 6.798654794692993e-07, 7.627531886100769e-07, 8.456408977508545e-07, 9.285286068916321e-07, 1.0114163160324097e-06, 1.0943040251731873e-06, 1.1771917343139648e-06, 1.2600794434547424e-06, 1.34296715259552e-06, 1.4258548617362976e-06, 1.5087425708770752e-06, 1.5916302800178528e-06, 1.6745179891586304e-06, 1.757405698299408e-06, 1.8402934074401855e-06, 1.923181116580963e-06, 2.0060688257217407e-06, 2.0889565348625183e-06, 2.171844244003296e-06, 2.2547319531440735e-06, 2.337619662284851e-06, 2.4205073714256287e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0, 9.0, 12.0, 17.0, 18.0, 27.0, 36.0, 59.0, 73.0, 104.0, 154.0, 224.0, 273.0, 404.0, 555.0, 811.0, 1094.0, 1538.0, 2285.0, 3474.0, 5420.0, 9156.0, 16593.0, 99242.0, 858121.0, 20131.0, 10315.0, 6162.0, 3784.0, 2543.0, 1736.0, 1194.0, 841.0, 581.0, 456.0, 322.0, 226.0, 168.0, 112.0, 85.0, 52.0, 43.0, 31.0, 22.0, 19.0, 10.0, 6.0, 6.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.0007710456848144531, -0.0007470399141311646, -0.000723034143447876, -0.0006990283727645874, -0.0006750226020812988, -0.0006510168313980103, -0.0006270110607147217, -0.0006030052900314331, -0.0005789995193481445, -0.000554993748664856, -0.0005309879779815674, -0.0005069822072982788, -0.00048297643661499023, -0.00045897066593170166, -0.0004349648952484131, -0.0004109591245651245, -0.00038695335388183594, -0.00036294758319854736, -0.0003389418125152588, -0.0003149360418319702, -0.00029093027114868164, -0.00026692450046539307, -0.0002429187297821045, -0.00021891295909881592, -0.00019490718841552734, -0.00017090141773223877, -0.0001468956470489502, -0.00012288987636566162, -9.888410568237305e-05, -7.487833499908447e-05, -5.08725643157959e-05, -2.6866793632507324e-05, -2.86102294921875e-06, 2.1144747734069824e-05, 4.51505184173584e-05, 6.915628910064697e-05, 9.316205978393555e-05, 0.00011716783046722412, 0.0001411736011505127, 0.00016517937183380127, 0.00018918514251708984, 0.00021319091320037842, 0.000237196683883667, 0.00026120245456695557, 0.00028520822525024414, 0.0003092139959335327, 0.0003332197666168213, 0.00035722553730010986, 0.00038123130798339844, 0.000405237078666687, 0.0004292428493499756, 0.00045324862003326416, 0.00047725439071655273, 0.0005012601613998413, 0.0005252659320831299, 0.0005492717027664185, 0.000573277473449707, 0.0005972832441329956, 0.0006212890148162842, 0.0006452947854995728, 0.0006693005561828613, 0.0006933063268661499, 0.0007173120975494385, 0.000741317868232727, 0.0007653236389160156]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 7.0, 5.0, 6.0, 13.0, 10.0, 23.0, 579.0, 250.0, 21.0, 8.0, 2.0, 6.0, 10.0, 7.0, 4.0, 1.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00021564960479736328, -0.00020887888967990875, -0.00020210817456245422, -0.0001953374594449997, -0.00018856674432754517, -0.00018179602921009064, -0.0001750253140926361, -0.00016825459897518158, -0.00016148388385772705, -0.00015471316874027252, -0.000147942453622818, -0.00014117173850536346, -0.00013440102338790894, -0.0001276303082704544, -0.00012085959315299988, -0.00011408887803554535, -0.00010731816291809082, -0.00010054744780063629, -9.377673268318176e-05, -8.700601756572723e-05, -8.02353024482727e-05, -7.346458733081818e-05, -6.669387221336365e-05, -5.992315709590912e-05, -5.315244197845459e-05, -4.638172686100006e-05, -3.961101174354553e-05, -3.2840296626091003e-05, -2.6069581508636475e-05, -1.9298866391181946e-05, -1.2528151273727417e-05, -5.757436156272888e-06, 1.0132789611816406e-06, 7.78399407863617e-06, 1.4554709196090698e-05, 2.1325424313545227e-05, 2.8096139430999756e-05, 3.4866854548454285e-05, 4.1637569665908813e-05, 4.840828478336334e-05, 5.517899990081787e-05, 6.19497150182724e-05, 6.872043013572693e-05, 7.549114525318146e-05, 8.226186037063599e-05, 8.903257548809052e-05, 9.580329060554504e-05, 0.00010257400572299957, 0.0001093447208404541, 0.00011611543595790863, 0.00012288615107536316, 0.0001296568661928177, 0.00013642758131027222, 0.00014319829642772675, 0.00014996901154518127, 0.0001567397266626358, 0.00016351044178009033, 0.00017028115689754486, 0.0001770518720149994, 0.00018382258713245392, 0.00019059330224990845, 0.00019736401736736298, 0.0002041347324848175, 0.00021090544760227203, 0.00021767616271972656]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 8.0, 2.0, 9.0, 12.0, 12.0, 13.0, 27.0, 26.0, 46.0, 59.0, 71.0, 103.0, 103.0, 103.0, 93.0, 69.0, 49.0, 45.0, 34.0, 25.0, 16.0, 18.0, 11.0, 12.0, 11.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0025737187825143337, -0.002476002089679241, -0.002378285164013505, -0.0022805684711784124, -0.0021828515455126762, -0.0020851348526775837, -0.001987418159842491, -0.0018897013505920768, -0.0017919845413416624, -0.001694267732091248, -0.0015965509228408337, -0.0014988342300057411, -0.0014011174207553267, -0.0013034006115049124, -0.0012056839186698198, -0.0011079671094194055, -0.001010250300168991, -0.0009125334909185767, -0.0008148167398758233, -0.0007170999888330698, -0.0006193831795826554, -0.0005216663703322411, -0.0004239496192894876, -0.00032623286824673414, -0.00022851605899631977, -0.00013079927884973586, -3.308249870315194e-05, 6.463428144343197e-05, 0.0001623510615900159, 0.00026006787084043026, 0.0003577846218831837, 0.0004555013729259372, 0.0005532179493457079, 0.0006509347585961223, 0.0007486515096388757, 0.0008463682606816292, 0.0009440850699320436, 0.001041801879182458, 0.0011395185720175505, 0.0012372353812679648, 0.0013349521905183792, 0.0014326689997687936, 0.001530385809019208, 0.0016281025018543005, 0.0017258193111047149, 0.0018235361203551292, 0.0019212528131902218, 0.0020189695060253143, 0.0021166864316910505, 0.002214403124526143, 0.0023121200501918793, 0.002409836743026972, 0.0025075534358620644, 0.0026052703615278006, 0.002702987054362893, 0.0028007039800286293, 0.002898420672863722, 0.0029961373656988144, 0.0030938542913645506, 0.003191570984199643, 0.0032892879098653793, 0.003387004602700472, 0.0034847212955355644, 0.003582437988370657, 0.003680154914036393]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 7.0, 8.0, 7.0, 5.0, 6.0, 21.0, 17.0, 18.0, 23.0, 22.0, 32.0, 36.0, 23.0, 33.0, 47.0, 38.0, 43.0, 36.0, 43.0, 42.0, 49.0, 49.0, 54.0, 41.0, 46.0, 47.0, 32.0, 36.0, 24.0, 17.0, 20.0, 12.0, 18.0, 14.0, 13.0, 8.0, 7.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00232955371029675, -0.002257940825074911, -0.002186327939853072, -0.002114715054631233, -0.0020431019365787506, -0.0019714890513569117, -0.0018998761661350727, -0.0018282632809132338, -0.0017566503956913948, -0.0016850375104695559, -0.001613424625247717, -0.0015418116236105561, -0.0014701987383887172, -0.0013985858531668782, -0.0013269728515297174, -0.0012553599663078785, -0.0011837470810860395, -0.0011121341958642006, -0.0010405213106423616, -0.0009689083090052009, -0.0008972954237833619, -0.000825682538561523, -0.0007540695951320231, -0.0006824566517025232, -0.0006108437664806843, -0.0005392308812588453, -0.00046761793782934546, -0.00039600502350367606, -0.00032439210917800665, -0.00025277919485233724, -0.00018116628052666783, -0.00010955333709716797, -3.794068470597267e-05, 3.3672229619696736e-05, 0.00010528514394536614, 0.00017689805827103555, 0.00024851097259670496, 0.00032012388692237437, 0.0003917368012480438, 0.00046334974467754364, 0.0005349626298993826, 0.0006065755151212215, 0.0006781884585507214, 0.0007498014019802213, 0.0008214142872020602, 0.0008930271724238992, 0.000964640115853399, 0.001036253059282899, 0.0011078659445047379, 0.0011794788297265768, 0.0012510917149484158, 0.0013227047165855765, 0.0013943176018074155, 0.0014659304870292544, 0.0015375434886664152, 0.0016091563738882542, 0.0016807692591100931, 0.001752382144331932, 0.001823995029553771, 0.0018956080311909318, 0.0019672210328280926, 0.0020388339180499315, 0.0021104468032717705, 0.0021820596884936094, 0.0022536725737154484]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 15.0, 38.0, 53.0, 77.0, 115.0, 239.0, 391.0, 636.0, 1033.0, 1752.0, 2825.0, 4720.0, 8158.0, 13950.0, 25519.0, 47470.0, 95633.0, 213680.0, 654258.0, 1870906.0, 782423.0, 254415.0, 109351.0, 51623.0, 25475.0, 13230.0, 7153.0, 3993.0, 2137.0, 1172.0, 691.0, 356.0, 253.0, 154.0, 101.0, 65.0, 54.0, 42.0, 21.0, 25.0, 15.0, 17.0, 14.0, 5.0, 6.0, 12.0, 5.0, 3.0, 7.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025177001953125, -0.0024191737174987793, -0.0023206472396850586, -0.002222120761871338, -0.002123594284057617, -0.0020250678062438965, -0.0019265413284301758, -0.001828014850616455, -0.0017294883728027344, -0.0016309618949890137, -0.001532435417175293, -0.0014339089393615723, -0.0013353824615478516, -0.0012368559837341309, -0.0011383295059204102, -0.0010398030281066895, -0.0009412765502929688, -0.000842750072479248, -0.0007442235946655273, -0.0006456971168518066, -0.0005471706390380859, -0.00044864416122436523, -0.00035011768341064453, -0.00025159120559692383, -0.00015306472778320312, -5.453824996948242e-05, 4.398822784423828e-05, 0.00014251470565795898, 0.0002410411834716797, 0.0003395676612854004, 0.0004380941390991211, 0.0005366206169128418, 0.0006351470947265625, 0.0007336735725402832, 0.0008322000503540039, 0.0009307265281677246, 0.0010292530059814453, 0.001127779483795166, 0.0012263059616088867, 0.0013248324394226074, 0.0014233589172363281, 0.0015218853950500488, 0.0016204118728637695, 0.0017189383506774902, 0.001817464828491211, 0.0019159913063049316, 0.0020145177841186523, 0.002113044261932373, 0.0022115707397460938, 0.0023100972175598145, 0.002408623695373535, 0.002507150173187256, 0.0026056766510009766, 0.0027042031288146973, 0.002802729606628418, 0.0029012560844421387, 0.0029997825622558594, 0.00309830904006958, 0.0031968355178833008, 0.0032953619956970215, 0.003393888473510742, 0.003492414951324463, 0.0035909414291381836, 0.0036894679069519043, 0.003787994384765625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 7.0, 17.0, 13.0, 12.0, 21.0, 27.0, 28.0, 25.0, 36.0, 29.0, 37.0, 42.0, 43.0, 38.0, 44.0, 47.0, 43.0, 45.0, 46.0, 47.0, 46.0, 46.0, 35.0, 37.0, 26.0, 29.0, 22.0, 16.0, 11.0, 11.0, 12.0, 14.0, 8.0, 7.0, 4.0, 0.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0014657974243164062, -0.0014225095510482788, -0.0013792216777801514, -0.001335933804512024, -0.0012926459312438965, -0.001249358057975769, -0.0012060701847076416, -0.0011627823114395142, -0.0011194944381713867, -0.0010762065649032593, -0.0010329186916351318, -0.0009896308183670044, -0.000946342945098877, -0.0009030550718307495, -0.0008597671985626221, -0.0008164793252944946, -0.0007731914520263672, -0.0007299035787582397, -0.0006866157054901123, -0.0006433278322219849, -0.0006000399589538574, -0.00055675208568573, -0.0005134642124176025, -0.0004701763391494751, -0.00042688846588134766, -0.0003836005926132202, -0.0003403127193450928, -0.00029702484607696533, -0.0002537369728088379, -0.00021044909954071045, -0.000167161226272583, -0.00012387335300445557, -8.058547973632812e-05, -3.7297606468200684e-05, 5.990266799926758e-06, 4.92781400680542e-05, 9.256601333618164e-05, 0.00013585388660430908, 0.00017914175987243652, 0.00022242963314056396, 0.0002657175064086914, 0.00030900537967681885, 0.0003522932529449463, 0.00039558112621307373, 0.00043886899948120117, 0.0004821568727493286, 0.0005254447460174561, 0.0005687326192855835, 0.0006120204925537109, 0.0006553083658218384, 0.0006985962390899658, 0.0007418841123580933, 0.0007851719856262207, 0.0008284598588943481, 0.0008717477321624756, 0.000915035605430603, 0.0009583234786987305, 0.001001611351966858, 0.0010448992252349854, 0.0010881870985031128, 0.0011314749717712402, 0.0011747628450393677, 0.0012180507183074951, 0.0012613385915756226, 0.00130462646484375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 9.0, 7.0, 12.0, 17.0, 29.0, 39.0, 39.0, 68.0, 112.0, 179.0, 260.0, 352.0, 564.0, 795.0, 1287.0, 1965.0, 3159.0, 4658.0, 7478.0, 11610.0, 18364.0, 29430.0, 49374.0, 84929.0, 152625.0, 293847.0, 638751.0, 1295778.0, 810448.0, 358731.0, 181348.0, 98856.0, 57240.0, 33871.0, 21212.0, 13265.0, 8256.0, 5437.0, 3397.0, 2210.0, 1418.0, 995.0, 614.0, 432.0, 257.0, 172.0, 135.0, 86.0, 59.0, 37.0, 12.0, 21.0, 14.0, 12.0, 7.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.001842498779296875, -0.0017803311347961426, -0.0017181634902954102, -0.0016559958457946777, -0.0015938282012939453, -0.0015316605567932129, -0.0014694929122924805, -0.001407325267791748, -0.0013451576232910156, -0.0012829899787902832, -0.0012208223342895508, -0.0011586546897888184, -0.001096487045288086, -0.0010343194007873535, -0.0009721517562866211, -0.0009099841117858887, -0.0008478164672851562, -0.0007856488227844238, -0.0007234811782836914, -0.000661313533782959, -0.0005991458892822266, -0.0005369782447814941, -0.0004748106002807617, -0.0004126429557800293, -0.0003504753112792969, -0.00028830766677856445, -0.00022614002227783203, -0.0001639723777770996, -0.00010180473327636719, -3.9637088775634766e-05, 2.2530555725097656e-05, 8.469820022583008e-05, 0.0001468658447265625, 0.00020903348922729492, 0.00027120113372802734, 0.00033336877822875977, 0.0003955364227294922, 0.0004577040672302246, 0.000519871711730957, 0.0005820393562316895, 0.0006442070007324219, 0.0007063746452331543, 0.0007685422897338867, 0.0008307099342346191, 0.0008928775787353516, 0.000955045223236084, 0.0010172128677368164, 0.0010793805122375488, 0.0011415481567382812, 0.0012037158012390137, 0.001265883445739746, 0.0013280510902404785, 0.001390218734741211, 0.0014523863792419434, 0.0015145540237426758, 0.0015767216682434082, 0.0016388893127441406, 0.001701056957244873, 0.0017632246017456055, 0.0018253922462463379, 0.0018875598907470703, 0.0019497275352478027, 0.002011895179748535, 0.0020740628242492676, 0.00213623046875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 8.0, 11.0, 7.0, 8.0, 20.0, 20.0, 27.0, 32.0, 30.0, 53.0, 69.0, 64.0, 69.0, 101.0, 101.0, 131.0, 158.0, 182.0, 196.0, 222.0, 237.0, 245.0, 233.0, 244.0, 250.0, 199.0, 199.0, 169.0, 145.0, 111.0, 106.0, 98.0, 77.0, 54.0, 51.0, 24.0, 26.0, 18.0, 22.0, 16.0, 10.0, 10.0, 5.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.000728607177734375, -0.0007084012031555176, -0.0006881952285766602, -0.0006679892539978027, -0.0006477832794189453, -0.0006275773048400879, -0.0006073713302612305, -0.000587165355682373, -0.0005669593811035156, -0.0005467534065246582, -0.0005265474319458008, -0.0005063414573669434, -0.00048613548278808594, -0.0004659295082092285, -0.0004457235336303711, -0.00042551755905151367, -0.00040531158447265625, -0.00038510560989379883, -0.0003648996353149414, -0.000344693660736084, -0.00032448768615722656, -0.00030428171157836914, -0.0002840757369995117, -0.0002638697624206543, -0.00024366378784179688, -0.00022345781326293945, -0.00020325183868408203, -0.0001830458641052246, -0.0001628398895263672, -0.00014263391494750977, -0.00012242794036865234, -0.00010222196578979492, -8.20159912109375e-05, -6.181001663208008e-05, -4.1604042053222656e-05, -2.1398067474365234e-05, -1.1920928955078125e-06, 1.901388168334961e-05, 3.921985626220703e-05, 5.942583084106445e-05, 7.963180541992188e-05, 9.98377799987793e-05, 0.00012004375457763672, 0.00014024972915649414, 0.00016045570373535156, 0.00018066167831420898, 0.0002008676528930664, 0.00022107362747192383, 0.00024127960205078125, 0.00026148557662963867, 0.0002816915512084961, 0.0003018975257873535, 0.00032210350036621094, 0.00034230947494506836, 0.0003625154495239258, 0.0003827214241027832, 0.0004029273986816406, 0.00042313337326049805, 0.00044333934783935547, 0.0004635453224182129, 0.0004837512969970703, 0.0005039572715759277, 0.0005241632461547852, 0.0005443692207336426, 0.0005645751953125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 2.0, 4.0, 3.0, 5.0, 9.0, 5.0, 6.0, 13.0, 8.0, 16.0, 24.0, 34.0, 56.0, 60.0, 64.0, 94.0, 103.0, 97.0, 84.0, 60.0, 57.0, 46.0, 43.0, 18.0, 15.0, 10.0, 17.0, 13.0, 4.0, 5.0, 7.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001890539308078587, -0.0018278262577950954, -0.0017651133239269257, -0.001702400273643434, -0.0016396872233599424, -0.0015769742894917727, -0.001514261239208281, -0.0014515481889247894, -0.0013888352550566196, -0.001326122204773128, -0.0012634092709049582, -0.0012006962206214666, -0.001137983170337975, -0.0010752701200544834, -0.0010125571861863136, -0.000949844135902822, -0.0008871310856193304, -0.0008244180935434997, -0.0007617050432600081, -0.0006989920511841774, -0.0006362790009006858, -0.0005735660088248551, -0.0005108530167490244, -0.00044813999556936324, -0.0003854269743897021, -0.0003227139532100409, -0.00026000093203037977, -0.00019728793995454907, -0.00013457491877488792, -7.186189759522676e-05, -9.148905519396067e-06, 5.356411566026509e-05, 0.00011627725325524807, 0.00017899027443490922, 0.00024170328106265515, 0.0003044162876904011, 0.00036712930887006223, 0.0004298423300497234, 0.0004925553221255541, 0.0005552683724090457, 0.0006179813644848764, 0.0006806943565607071, 0.0007434074068441987, 0.0008061203989200294, 0.0008688333909958601, 0.0009315464412793517, 0.0009942594915628433, 0.001056972425431013, 0.0011196854757145047, 0.0011823985259979963, 0.0012451114598661661, 0.0013078245101496577, 0.0013705375604331493, 0.0014332504943013191, 0.0014959635445848107, 0.0015586765948683023, 0.0016213895287364721, 0.0016841025790199637, 0.0017468155128881335, 0.0018095285631716251, 0.0018722416134551167, 0.0019349546637386084, 0.001997667597606778, 0.002060380531474948, 0.0021230936981737614]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 8.0, 4.0, 8.0, 13.0, 12.0, 16.0, 16.0, 17.0, 24.0, 34.0, 16.0, 25.0, 31.0, 30.0, 27.0, 34.0, 26.0, 46.0, 41.0, 35.0, 46.0, 37.0, 43.0, 38.0, 33.0, 43.0, 36.0, 34.0, 30.0, 17.0, 24.0, 21.0, 19.0, 23.0, 25.0, 5.0, 11.0, 9.0, 11.0, 6.0, 6.0, 4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013730599312111735, -0.0013317173579707742, -0.0012903747847303748, -0.0012490322114899755, -0.0012076895218342543, -0.001166346948593855, -0.0011250043753534555, -0.0010836618021130562, -0.0010423192288726568, -0.0010009766556322575, -0.0009596340823918581, -0.0009182914509437978, -0.0008769488777033985, -0.0008356063044629991, -0.0007942636730149388, -0.0007529210997745395, -0.0007115785265341401, -0.0006702359532937407, -0.0006288933800533414, -0.0005875507486052811, -0.0005462081753648818, -0.0005048656021244824, -0.0004635229997802526, -0.00042218039743602276, -0.0003808378241956234, -0.00033949525095522404, -0.0002981526486109942, -0.0002568100462667644, -0.00021546747302636504, -0.00017412488523405045, -0.00013278229744173586, -9.143969509750605e-05, -5.0097121857106686e-05, -8.754534064792097e-06, 3.258805372752249e-05, 7.393064151983708e-05, 0.00011527322931215167, 0.00015661581710446626, 0.00019795840489678085, 0.00023930100724101067, 0.00028064358048141, 0.0003219861537218094, 0.0003633287560660392, 0.000404671358410269, 0.0004460139316506684, 0.00048735650489106774, 0.000528699136339128, 0.0005700417095795274, 0.0006113842828199267, 0.0006527268560603261, 0.0006940694293007255, 0.0007354120607487857, 0.0007767546339891851, 0.0008180972072295845, 0.0008594398386776447, 0.0009007824119180441, 0.0009421249851584435, 0.0009834675583988428, 0.0010248101316392422, 0.0010661527048796415, 0.001107495278120041, 0.001148837967775762, 0.0011901805410161614, 0.0012315231142565608, 0.0012728656874969602]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 7.0, 7.0, 10.0, 20.0, 21.0, 32.0, 58.0, 76.0, 118.0, 157.0, 279.0, 394.0, 520.0, 764.0, 1175.0, 1762.0, 2670.0, 3943.0, 5994.0, 9033.0, 14137.0, 20681.0, 32035.0, 49537.0, 75854.0, 116684.0, 168298.0, 177251.0, 126846.0, 83593.0, 53992.0, 35126.0, 23131.0, 14992.0, 9741.0, 6508.0, 4403.0, 2797.0, 1925.0, 1264.0, 929.0, 606.0, 378.0, 265.0, 178.0, 114.0, 79.0, 61.0, 38.0, 28.0, 21.0, 12.0, 7.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0018558502197265625, -0.0017961859703063965, -0.0017365217208862305, -0.0016768574714660645, -0.0016171932220458984, -0.0015575289726257324, -0.0014978647232055664, -0.0014382004737854004, -0.0013785362243652344, -0.0013188719749450684, -0.0012592077255249023, -0.0011995434761047363, -0.0011398792266845703, -0.0010802149772644043, -0.0010205507278442383, -0.0009608864784240723, -0.0009012222290039062, -0.0008415579795837402, -0.0007818937301635742, -0.0007222294807434082, -0.0006625652313232422, -0.0006029009819030762, -0.0005432367324829102, -0.00048357248306274414, -0.0004239082336425781, -0.0003642439842224121, -0.0003045797348022461, -0.0002449154853820801, -0.00018525123596191406, -0.00012558698654174805, -6.592273712158203e-05, -6.258487701416016e-06, 5.340576171875e-05, 0.00011307001113891602, 0.00017273426055908203, 0.00023239850997924805, 0.00029206275939941406, 0.0003517270088195801, 0.0004113912582397461, 0.0004710555076599121, 0.0005307197570800781, 0.0005903840065002441, 0.0006500482559204102, 0.0007097125053405762, 0.0007693767547607422, 0.0008290410041809082, 0.0008887052536010742, 0.0009483695030212402, 0.0010080337524414062, 0.0010676980018615723, 0.0011273622512817383, 0.0011870265007019043, 0.0012466907501220703, 0.0013063549995422363, 0.0013660192489624023, 0.0014256834983825684, 0.0014853477478027344, 0.0015450119972229004, 0.0016046762466430664, 0.0016643404960632324, 0.0017240047454833984, 0.0017836689949035645, 0.0018433332443237305, 0.0019029974937438965, 0.0019626617431640625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 1.0, 4.0, 5.0, 6.0, 8.0, 13.0, 9.0, 17.0, 9.0, 23.0, 20.0, 21.0, 24.0, 26.0, 35.0, 26.0, 35.0, 26.0, 32.0, 26.0, 32.0, 36.0, 39.0, 46.0, 36.0, 38.0, 36.0, 46.0, 33.0, 46.0, 32.0, 21.0, 17.0, 36.0, 19.0, 21.0, 22.0, 19.0, 16.0, 9.0, 6.0, 4.0, 14.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0011987686157226562, -0.001163586974143982, -0.0011284053325653076, -0.0010932236909866333, -0.001058042049407959, -0.0010228604078292847, -0.0009876787662506104, -0.000952497124671936, -0.0009173154830932617, -0.0008821338415145874, -0.0008469521999359131, -0.0008117705583572388, -0.0007765889167785645, -0.0007414072751998901, -0.0007062256336212158, -0.0006710439920425415, -0.0006358623504638672, -0.0006006807088851929, -0.0005654990673065186, -0.0005303174257278442, -0.0004951357841491699, -0.0004599541425704956, -0.0004247725009918213, -0.00038959085941314697, -0.00035440921783447266, -0.00031922757625579834, -0.000284045934677124, -0.0002488642930984497, -0.0002136826515197754, -0.00017850100994110107, -0.00014331936836242676, -0.00010813772678375244, -7.295608520507812e-05, -3.777444362640381e-05, -2.592802047729492e-06, 3.2588839530944824e-05, 6.777048110961914e-05, 0.00010295212268829346, 0.00013813376426696777, 0.0001733154058456421, 0.0002084970474243164, 0.00024367868900299072, 0.00027886033058166504, 0.00031404197216033936, 0.00034922361373901367, 0.000384405255317688, 0.0004195868968963623, 0.0004547685384750366, 0.0004899501800537109, 0.0005251318216323853, 0.0005603134632110596, 0.0005954951047897339, 0.0006306767463684082, 0.0006658583879470825, 0.0007010400295257568, 0.0007362216711044312, 0.0007714033126831055, 0.0008065849542617798, 0.0008417665958404541, 0.0008769482374191284, 0.0009121298789978027, 0.000947311520576477, 0.0009824931621551514, 0.0010176748037338257, 0.0010528564453125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 5.0, 5.0, 8.0, 9.0, 23.0, 27.0, 30.0, 75.0, 102.0, 150.0, 224.0, 366.0, 575.0, 885.0, 1482.0, 2539.0, 4363.0, 8057.0, 15843.0, 35894.0, 110614.0, 506397.0, 250879.0, 60855.0, 23605.0, 11234.0, 5966.0, 3353.0, 1860.0, 1155.0, 718.0, 449.0, 276.0, 150.0, 143.0, 78.0, 58.0, 32.0, 26.0, 15.0, 12.0, 11.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00438690185546875, -0.00426068902015686, -0.004134476184844971, -0.004008263349533081, -0.0038820505142211914, -0.0037558376789093018, -0.003629624843597412, -0.0035034120082855225, -0.003377199172973633, -0.003250986337661743, -0.0031247735023498535, -0.002998560667037964, -0.0028723478317260742, -0.0027461349964141846, -0.002619922161102295, -0.0024937093257904053, -0.0023674964904785156, -0.002241283655166626, -0.0021150708198547363, -0.0019888579845428467, -0.001862645149230957, -0.0017364323139190674, -0.0016102194786071777, -0.001484006643295288, -0.0013577938079833984, -0.0012315809726715088, -0.0011053681373596191, -0.0009791553020477295, -0.0008529424667358398, -0.0007267296314239502, -0.0006005167961120605, -0.0004743039608001709, -0.00034809112548828125, -0.0002218782901763916, -9.566545486450195e-05, 3.0547380447387695e-05, 0.00015676021575927734, 0.000282973051071167, 0.00040918588638305664, 0.0005353987216949463, 0.0006616115570068359, 0.0007878243923187256, 0.0009140372276306152, 0.0010402500629425049, 0.0011664628982543945, 0.0012926757335662842, 0.0014188885688781738, 0.0015451014041900635, 0.0016713142395019531, 0.0017975270748138428, 0.0019237399101257324, 0.002049952745437622, 0.0021761655807495117, 0.0023023784160614014, 0.002428591251373291, 0.0025548040866851807, 0.0026810169219970703, 0.00280722975730896, 0.0029334425926208496, 0.0030596554279327393, 0.003185868263244629, 0.0033120810985565186, 0.003438293933868408, 0.003564506769180298, 0.0036907196044921875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 4.0, 5.0, 7.0, 9.0, 16.0, 5.0, 13.0, 18.0, 15.0, 13.0, 18.0, 24.0, 25.0, 32.0, 25.0, 36.0, 38.0, 38.0, 33.0, 37.0, 39.0, 45.0, 50.0, 48.0, 42.0, 41.0, 27.0, 38.0, 36.0, 27.0, 26.0, 31.0, 22.0, 12.0, 18.0, 15.0, 15.0, 18.0, 12.0, 7.0, 10.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000736236572265625, -0.0007123500108718872, -0.0006884634494781494, -0.0006645768880844116, -0.0006406903266906738, -0.000616803765296936, -0.0005929172039031982, -0.0005690306425094604, -0.0005451440811157227, -0.0005212575197219849, -0.0004973709583282471, -0.0004734843969345093, -0.0004495978355407715, -0.0004257112741470337, -0.0004018247127532959, -0.0003779381513595581, -0.0003540515899658203, -0.0003301650285720825, -0.0003062784671783447, -0.00028239190578460693, -0.00025850534439086914, -0.00023461878299713135, -0.00021073222160339355, -0.00018684566020965576, -0.00016295909881591797, -0.00013907253742218018, -0.00011518597602844238, -9.129941463470459e-05, -6.74128532409668e-05, -4.3526291847229004e-05, -1.963973045349121e-05, 4.246830940246582e-06, 2.8133392333984375e-05, 5.201995372772217e-05, 7.590651512145996e-05, 9.979307651519775e-05, 0.00012367963790893555, 0.00014756619930267334, 0.00017145276069641113, 0.00019533932209014893, 0.00021922588348388672, 0.0002431124448776245, 0.0002669990062713623, 0.0002908855676651001, 0.0003147721290588379, 0.0003386586904525757, 0.0003625452518463135, 0.00038643181324005127, 0.00041031837463378906, 0.00043420493602752686, 0.00045809149742126465, 0.00048197805881500244, 0.0005058646202087402, 0.000529751181602478, 0.0005536377429962158, 0.0005775243043899536, 0.0006014108657836914, 0.0006252974271774292, 0.000649183988571167, 0.0006730705499649048, 0.0006969571113586426, 0.0007208436727523804, 0.0007447302341461182, 0.000768616795539856, 0.0007925033569335938]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 18.0, 19.0, 21.0, 30.0, 35.0, 50.0, 85.0, 106.0, 181.0, 251.0, 406.0, 578.0, 837.0, 1376.0, 2118.0, 3452.0, 6125.0, 12079.0, 30034.0, 96018.0, 520571.0, 270040.0, 60787.0, 20931.0, 9340.0, 4941.0, 2848.0, 1728.0, 1130.0, 739.0, 513.0, 371.0, 256.0, 149.0, 115.0, 86.0, 58.0, 44.0, 28.0, 14.0, 17.0, 10.0, 7.0, 8.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008230209350585938, -0.0007963180541992188, -0.0007696151733398438, -0.0007429122924804688, -0.0007162094116210938, -0.0006895065307617188, -0.0006628036499023438, -0.0006361007690429688, -0.0006093978881835938, -0.0005826950073242188, -0.0005559921264648438, -0.0005292892456054688, -0.0005025863647460938, -0.00047588348388671875, -0.00044918060302734375, -0.00042247772216796875, -0.00039577484130859375, -0.00036907196044921875, -0.00034236907958984375, -0.00031566619873046875, -0.00028896331787109375, -0.00026226043701171875, -0.00023555755615234375, -0.00020885467529296875, -0.00018215179443359375, -0.00015544891357421875, -0.00012874603271484375, -0.00010204315185546875, -7.534027099609375e-05, -4.863739013671875e-05, -2.193450927734375e-05, 4.76837158203125e-06, 3.147125244140625e-05, 5.817413330078125e-05, 8.487701416015625e-05, 0.00011157989501953125, 0.00013828277587890625, 0.00016498565673828125, 0.00019168853759765625, 0.00021839141845703125, 0.00024509429931640625, 0.00027179718017578125, 0.00029850006103515625, 0.00032520294189453125, 0.00035190582275390625, 0.00037860870361328125, 0.00040531158447265625, 0.00043201446533203125, 0.00045871734619140625, 0.00048542022705078125, 0.0005121231079101562, 0.0005388259887695312, 0.0005655288696289062, 0.0005922317504882812, 0.0006189346313476562, 0.0006456375122070312, 0.0006723403930664062, 0.0006990432739257812, 0.0007257461547851562, 0.0007524490356445312, 0.0007791519165039062, 0.0008058547973632812, 0.0008325576782226562, 0.0008592605590820312, 0.0008859634399414062]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 2.0, 8.0, 9.0, 6.0, 13.0, 16.0, 14.0, 22.0, 22.0, 32.0, 30.0, 44.0, 37.0, 38.0, 41.0, 61.0, 61.0, 45.0, 69.0, 50.0, 50.0, 46.0, 40.0, 42.0, 25.0, 36.0, 18.0, 24.0, 14.0, 19.0, 13.0, 9.0, 4.0, 11.0, 6.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4185905456542969e-05, -1.3724900782108307e-05, -1.3263896107673645e-05, -1.2802891433238983e-05, -1.2341886758804321e-05, -1.188088208436966e-05, -1.1419877409934998e-05, -1.0958872735500336e-05, -1.0497868061065674e-05, -1.0036863386631012e-05, -9.57585871219635e-06, -9.114854037761688e-06, -8.653849363327026e-06, -8.192844688892365e-06, -7.731840014457703e-06, -7.270835340023041e-06, -6.809830665588379e-06, -6.348825991153717e-06, -5.887821316719055e-06, -5.426816642284393e-06, -4.9658119678497314e-06, -4.50480729341507e-06, -4.043802618980408e-06, -3.582797944545746e-06, -3.121793270111084e-06, -2.660788595676422e-06, -2.1997839212417603e-06, -1.7387792468070984e-06, -1.2777745723724365e-06, -8.167698979377747e-07, -3.557652235031128e-07, 1.0523945093154907e-07, 5.662441253662109e-07, 1.0272487998008728e-06, 1.4882534742355347e-06, 1.9492581486701965e-06, 2.4102628231048584e-06, 2.8712674975395203e-06, 3.332272171974182e-06, 3.793276846408844e-06, 4.254281520843506e-06, 4.715286195278168e-06, 5.17629086971283e-06, 5.6372955441474915e-06, 6.098300218582153e-06, 6.559304893016815e-06, 7.020309567451477e-06, 7.481314241886139e-06, 7.9423189163208e-06, 8.403323590755463e-06, 8.864328265190125e-06, 9.325332939624786e-06, 9.786337614059448e-06, 1.024734228849411e-05, 1.0708346962928772e-05, 1.1169351637363434e-05, 1.1630356311798096e-05, 1.2091360986232758e-05, 1.255236566066742e-05, 1.3013370335102081e-05, 1.3474375009536743e-05, 1.3935379683971405e-05, 1.4396384358406067e-05, 1.4857389032840729e-05, 1.531839370727539e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 17.0, 11.0, 26.0, 39.0, 65.0, 88.0, 169.0, 210.0, 360.0, 481.0, 784.0, 1188.0, 1917.0, 3205.0, 5139.0, 8942.0, 15938.0, 28981.0, 56006.0, 124156.0, 317067.0, 268078.0, 104748.0, 50077.0, 25833.0, 14232.0, 8131.0, 4806.0, 2946.0, 1720.0, 1101.0, 696.0, 530.0, 316.0, 186.0, 115.0, 74.0, 60.0, 43.0, 24.0, 19.0, 13.0, 5.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003600120544433594, -0.0003493949770927429, -0.00033877789974212646, -0.00032816082239151, -0.00031754374504089355, -0.0003069266676902771, -0.00029630959033966064, -0.0002856925129890442, -0.00027507543563842773, -0.0002644583582878113, -0.0002538412809371948, -0.00024322420358657837, -0.00023260712623596191, -0.00022199004888534546, -0.000211372971534729, -0.00020075589418411255, -0.0001901388168334961, -0.00017952173948287964, -0.00016890466213226318, -0.00015828758478164673, -0.00014767050743103027, -0.00013705343008041382, -0.00012643635272979736, -0.00011581927537918091, -0.00010520219802856445, -9.4585120677948e-05, -8.396804332733154e-05, -7.335096597671509e-05, -6.273388862609863e-05, -5.211681127548218e-05, -4.149973392486572e-05, -3.088265657424927e-05, -2.0265579223632812e-05, -9.648501873016357e-06, 9.685754776000977e-07, 1.1585652828216553e-05, 2.2202730178833008e-05, 3.281980752944946e-05, 4.343688488006592e-05, 5.405396223068237e-05, 6.467103958129883e-05, 7.528811693191528e-05, 8.590519428253174e-05, 9.65222716331482e-05, 0.00010713934898376465, 0.0001177564263343811, 0.00012837350368499756, 0.00013899058103561401, 0.00014960765838623047, 0.00016022473573684692, 0.00017084181308746338, 0.00018145889043807983, 0.0001920759677886963, 0.00020269304513931274, 0.0002133101224899292, 0.00022392719984054565, 0.0002345442771911621, 0.00024516135454177856, 0.000255778431892395, 0.0002663955092430115, 0.00027701258659362793, 0.0002876296639442444, 0.00029824674129486084, 0.0003088638186454773, 0.00031948089599609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 5.0, 3.0, 7.0, 6.0, 7.0, 9.0, 9.0, 11.0, 15.0, 20.0, 19.0, 35.0, 38.0, 42.0, 43.0, 45.0, 43.0, 54.0, 68.0, 52.0, 55.0, 54.0, 60.0, 50.0, 43.0, 40.0, 21.0, 27.0, 21.0, 16.0, 19.0, 15.0, 7.0, 6.0, 4.0, 7.0, 8.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.113550186157227e-05, -8.814781904220581e-05, -8.516013622283936e-05, -8.21724534034729e-05, -7.918477058410645e-05, -7.619708776473999e-05, -7.320940494537354e-05, -7.022172212600708e-05, -6.723403930664062e-05, -6.424635648727417e-05, -6.125867366790771e-05, -5.827099084854126e-05, -5.5283308029174805e-05, -5.229562520980835e-05, -4.9307942390441895e-05, -4.632025957107544e-05, -4.3332576751708984e-05, -4.034489393234253e-05, -3.7357211112976074e-05, -3.436952829360962e-05, -3.1381845474243164e-05, -2.839416265487671e-05, -2.5406479835510254e-05, -2.24187970161438e-05, -1.9431114196777344e-05, -1.644343137741089e-05, -1.3455748558044434e-05, -1.0468065738677979e-05, -7.4803829193115234e-06, -4.492700099945068e-06, -1.5050172805786133e-06, 1.4826655387878418e-06, 4.470348358154297e-06, 7.458031177520752e-06, 1.0445713996887207e-05, 1.3433396816253662e-05, 1.6421079635620117e-05, 1.9408762454986572e-05, 2.2396445274353027e-05, 2.5384128093719482e-05, 2.8371810913085938e-05, 3.135949373245239e-05, 3.434717655181885e-05, 3.73348593711853e-05, 4.032254219055176e-05, 4.331022500991821e-05, 4.629790782928467e-05, 4.928559064865112e-05, 5.227327346801758e-05, 5.526095628738403e-05, 5.824863910675049e-05, 6.123632192611694e-05, 6.42240047454834e-05, 6.721168756484985e-05, 7.019937038421631e-05, 7.318705320358276e-05, 7.617473602294922e-05, 7.916241884231567e-05, 8.215010166168213e-05, 8.513778448104858e-05, 8.812546730041504e-05, 9.11131501197815e-05, 9.410083293914795e-05, 9.70885157585144e-05, 0.00010007619857788086]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 7.0, 8.0, 8.0, 11.0, 20.0, 15.0, 26.0, 37.0, 51.0, 69.0, 109.0, 117.0, 128.0, 94.0, 74.0, 46.0, 38.0, 36.0, 17.0, 11.0, 15.0, 12.0, 10.0, 13.0, 7.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016265162266790867, -0.00156866863835603, -0.0015108210500329733, -0.0014529735781252384, -0.0013951259898021817, -0.001337278401479125, -0.0012794309295713902, -0.0012215833412483335, -0.0011637357529252768, -0.00110588816460222, -0.0010480405762791634, -0.0009901931043714285, -0.0009323455160483718, -0.0008744979277253151, -0.0008166503976099193, -0.0007588028674945235, -0.0007009552791714668, -0.0006431076908484101, -0.0005852601607330143, -0.0005274126306176186, -0.00046956504229456186, -0.0004117174830753356, -0.0003538699238561094, -0.00029602236463688314, -0.0002381748054176569, -0.00018032724619843066, -0.00012247968697920442, -6.463212775997818e-05, -6.784568540751934e-06, 5.106299067847431e-05, 0.00010891054989770055, 0.0001667581091169268, 0.00022460566833615303, 0.00028245322755537927, 0.0003403007867746055, 0.00039814834599383175, 0.000455995905213058, 0.0005138434935361147, 0.0005716910236515105, 0.0006295385537669063, 0.000687386142089963, 0.0007452337304130197, 0.0008030812605284154, 0.0008609287906438112, 0.0009187763789668679, 0.0009766239672899246, 0.0010344714391976595, 0.0010923190275207162, 0.0011501666158437729, 0.0012080142041668296, 0.0012658617924898863, 0.0013237092643976212, 0.0013815568527206779, 0.0014394044410437346, 0.0014972519129514694, 0.0015550995012745261, 0.0016129470895975828, 0.0016707946779206395, 0.0017286422662436962, 0.001786489738151431, 0.0018443373264744878, 0.0019021849147975445, 0.0019600323867052794, 0.002017880091443658, 0.0020757275633513927]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 11.0, 3.0, 5.0, 8.0, 7.0, 13.0, 12.0, 12.0, 16.0, 23.0, 21.0, 28.0, 19.0, 28.0, 34.0, 19.0, 30.0, 42.0, 26.0, 36.0, 34.0, 48.0, 48.0, 28.0, 40.0, 38.0, 40.0, 29.0, 41.0, 36.0, 35.0, 16.0, 21.0, 30.0, 15.0, 23.0, 25.0, 8.0, 9.0, 9.0, 10.0, 7.0, 7.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010892567224800587, -0.0010554756736382842, -0.001021694508381188, -0.0009879134595394135, -0.0009541322942823172, -0.0009203512454405427, -0.0008865701383911073, -0.0008527890313416719, -0.0008190079242922366, -0.0007852268172428012, -0.0007514457101933658, -0.0007176646031439304, -0.000683883554302156, -0.0006501023890450597, -0.0006163213402032852, -0.0005825402331538498, -0.0005487591261044145, -0.0005149780190549791, -0.0004811969120055437, -0.0004474158340599388, -0.0004136347270105034, -0.00037985361996106803, -0.0003460725420154631, -0.00031229143496602774, -0.00027851032791659236, -0.000244729220867157, -0.00021094812836963683, -0.00017716703587211668, -0.0001433859288226813, -0.00010960482177324593, -7.582372927572578e-05, -4.204263677820563e-05, -8.261529728770256e-06, 2.5519570044707507e-05, 5.930066981818527e-05, 9.308176959166303e-05, 0.0001268628693651408, 0.00016064397641457617, 0.00019442506891209632, 0.00022820616140961647, 0.00026198726845905185, 0.0002957683755084872, 0.0003295494825579226, 0.0003633305605035275, 0.0003971116675529629, 0.0004308927746023983, 0.0004646738525480032, 0.0004984549595974386, 0.000532236066646874, 0.0005660171736963093, 0.0005997982807457447, 0.0006335793877951801, 0.0006673604948446155, 0.0007011415436863899, 0.0007349226507358253, 0.0007687037577852607, 0.0008024848648346961, 0.0008362659718841314, 0.0008700470789335668, 0.0009038281859830022, 0.0009376092348247766, 0.0009713904000818729, 0.0010051714489236474, 0.0010389524977654219, 0.0010727336630225182]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 16.0, 20.0, 32.0, 42.0, 66.0, 102.0, 145.0, 191.0, 301.0, 458.0, 719.0, 1029.0, 1553.0, 2285.0, 3520.0, 5448.0, 8385.0, 12650.0, 20363.0, 33435.0, 55931.0, 98031.0, 170118.0, 230204.0, 165415.0, 94777.0, 54669.0, 32572.0, 19873.0, 12485.0, 8079.0, 5359.0, 3411.0, 2269.0, 1500.0, 968.0, 678.0, 485.0, 319.0, 202.0, 141.0, 97.0, 61.0, 42.0, 34.0, 27.0, 16.0, 9.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0019893646240234375, -0.0019281059503555298, -0.001866847276687622, -0.0018055886030197144, -0.0017443299293518066, -0.001683071255683899, -0.0016218125820159912, -0.0015605539083480835, -0.0014992952346801758, -0.001438036561012268, -0.0013767778873443604, -0.0013155192136764526, -0.001254260540008545, -0.0011930018663406372, -0.0011317431926727295, -0.0010704845190048218, -0.001009225845336914, -0.0009479671716690063, -0.0008867084980010986, -0.0008254498243331909, -0.0007641911506652832, -0.0007029324769973755, -0.0006416738033294678, -0.0005804151296615601, -0.0005191564559936523, -0.00045789778232574463, -0.0003966391086578369, -0.0003353804349899292, -0.0002741217613220215, -0.00021286308765411377, -0.00015160441398620605, -9.034574031829834e-05, -2.9087066650390625e-05, 3.217160701751709e-05, 9.34302806854248e-05, 0.00015468895435333252, 0.00021594762802124023, 0.00027720630168914795, 0.00033846497535705566, 0.0003997236490249634, 0.0004609823226928711, 0.0005222409963607788, 0.0005834996700286865, 0.0006447583436965942, 0.000706017017364502, 0.0007672756910324097, 0.0008285343647003174, 0.0008897930383682251, 0.0009510517120361328, 0.0010123103857040405, 0.0010735690593719482, 0.001134827733039856, 0.0011960864067077637, 0.0012573450803756714, 0.001318603754043579, 0.0013798624277114868, 0.0014411211013793945, 0.0015023797750473022, 0.00156363844871521, 0.0016248971223831177, 0.0016861557960510254, 0.001747414469718933, 0.0018086731433868408, 0.0018699318170547485, 0.0019311904907226562]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 7.0, 5.0, 15.0, 13.0, 17.0, 8.0, 16.0, 20.0, 29.0, 13.0, 25.0, 26.0, 31.0, 27.0, 43.0, 34.0, 30.0, 41.0, 41.0, 37.0, 54.0, 33.0, 38.0, 28.0, 33.0, 25.0, 40.0, 27.0, 31.0, 26.0, 29.0, 23.0, 19.0, 15.0, 24.0, 14.0, 6.0, 9.0, 9.0, 9.0, 5.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007987022399902344, -0.0007727816700935364, -0.0007468611001968384, -0.0007209405303001404, -0.0006950199604034424, -0.0006690993905067444, -0.0006431788206100464, -0.0006172582507133484, -0.0005913376808166504, -0.0005654171109199524, -0.0005394965410232544, -0.0005135759711265564, -0.0004876554012298584, -0.0004617348313331604, -0.0004358142614364624, -0.0004098936915397644, -0.0003839731216430664, -0.0003580525517463684, -0.0003321319818496704, -0.0003062114119529724, -0.0002802908420562744, -0.0002543702721595764, -0.00022844970226287842, -0.00020252913236618042, -0.00017660856246948242, -0.00015068799257278442, -0.00012476742267608643, -9.884685277938843e-05, -7.292628288269043e-05, -4.700571298599243e-05, -2.1085143089294434e-05, 4.8354268074035645e-06, 3.075599670410156e-05, 5.667656660079956e-05, 8.259713649749756e-05, 0.00010851770639419556, 0.00013443827629089355, 0.00016035884618759155, 0.00018627941608428955, 0.00021219998598098755, 0.00023812055587768555, 0.00026404112577438354, 0.00028996169567108154, 0.00031588226556777954, 0.00034180283546447754, 0.00036772340536117554, 0.00039364397525787354, 0.00041956454515457153, 0.00044548511505126953, 0.00047140568494796753, 0.0004973262548446655, 0.0005232468247413635, 0.0005491673946380615, 0.0005750879645347595, 0.0006010085344314575, 0.0006269291043281555, 0.0006528496742248535, 0.0006787702441215515, 0.0007046908140182495, 0.0007306113839149475, 0.0007565319538116455, 0.0007824525237083435, 0.0008083730936050415, 0.0008342936635017395, 0.0008602142333984375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 5.0, 10.0, 8.0, 12.0, 20.0, 35.0, 34.0, 67.0, 83.0, 125.0, 196.0, 291.0, 432.0, 595.0, 845.0, 1374.0, 2012.0, 2994.0, 4337.0, 6379.0, 9489.0, 14294.0, 21572.0, 32192.0, 49954.0, 80213.0, 130017.0, 192299.0, 179009.0, 115637.0, 71225.0, 44563.0, 28957.0, 19378.0, 13153.0, 8817.0, 5765.0, 3916.0, 2702.0, 1804.0, 1160.0, 793.0, 562.0, 405.0, 290.0, 175.0, 132.0, 77.0, 57.0, 36.0, 30.0, 17.0, 7.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00144195556640625, -0.0013952553272247314, -0.0013485550880432129, -0.0013018548488616943, -0.0012551546096801758, -0.0012084543704986572, -0.0011617541313171387, -0.0011150538921356201, -0.0010683536529541016, -0.001021653413772583, -0.0009749531745910645, -0.0009282529354095459, -0.0008815526962280273, -0.0008348524570465088, -0.0007881522178649902, -0.0007414519786834717, -0.0006947517395019531, -0.0006480515003204346, -0.000601351261138916, -0.0005546510219573975, -0.0005079507827758789, -0.00046125054359436035, -0.0004145503044128418, -0.00036785006523132324, -0.0003211498260498047, -0.00027444958686828613, -0.00022774934768676758, -0.00018104910850524902, -0.00013434886932373047, -8.764863014221191e-05, -4.094839096069336e-05, 5.751848220825195e-06, 5.245208740234375e-05, 9.91523265838623e-05, 0.00014585256576538086, 0.00019255280494689941, 0.00023925304412841797, 0.0002859532833099365, 0.0003326535224914551, 0.00037935376167297363, 0.0004260540008544922, 0.00047275424003601074, 0.0005194544792175293, 0.0005661547183990479, 0.0006128549575805664, 0.000659555196762085, 0.0007062554359436035, 0.0007529556751251221, 0.0007996559143066406, 0.0008463561534881592, 0.0008930563926696777, 0.0009397566318511963, 0.0009864568710327148, 0.0010331571102142334, 0.001079857349395752, 0.0011265575885772705, 0.001173257827758789, 0.0012199580669403076, 0.0012666583061218262, 0.0013133585453033447, 0.0013600587844848633, 0.0014067590236663818, 0.0014534592628479004, 0.001500159502029419, 0.0015468597412109375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 4.0, 10.0, 6.0, 8.0, 11.0, 14.0, 19.0, 22.0, 20.0, 32.0, 34.0, 34.0, 37.0, 31.0, 34.0, 36.0, 32.0, 32.0, 41.0, 32.0, 48.0, 37.0, 43.0, 40.0, 29.0, 32.0, 25.0, 26.0, 32.0, 32.0, 20.0, 21.0, 16.0, 21.0, 26.0, 10.0, 8.0, 10.0, 5.0, 3.0, 3.0, 6.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00048470497131347656, -0.0004676990211009979, -0.0004506930708885193, -0.00043368712067604065, -0.000416681170463562, -0.0003996752202510834, -0.00038266927003860474, -0.0003656633198261261, -0.00034865736961364746, -0.0003316514194011688, -0.0003146454691886902, -0.00029763951897621155, -0.0002806335687637329, -0.00026362761855125427, -0.00024662166833877563, -0.000229615718126297, -0.00021260976791381836, -0.00019560381770133972, -0.00017859786748886108, -0.00016159191727638245, -0.0001445859670639038, -0.00012758001685142517, -0.00011057406663894653, -9.35681164264679e-05, -7.656216621398926e-05, -5.955621600151062e-05, -4.255026578903198e-05, -2.5544315576553345e-05, -8.538365364074707e-06, 8.46758484840393e-06, 2.547353506088257e-05, 4.2479485273361206e-05, 5.9485435485839844e-05, 7.649138569831848e-05, 9.349733591079712e-05, 0.00011050328612327576, 0.0001275092363357544, 0.00014451518654823303, 0.00016152113676071167, 0.0001785270869731903, 0.00019553303718566895, 0.00021253898739814758, 0.00022954493761062622, 0.00024655088782310486, 0.0002635568380355835, 0.00028056278824806213, 0.00029756873846054077, 0.0003145746886730194, 0.00033158063888549805, 0.0003485865890979767, 0.0003655925393104553, 0.00038259848952293396, 0.0003996044397354126, 0.00041661038994789124, 0.0004336163401603699, 0.0004506222903728485, 0.00046762824058532715, 0.0004846341907978058, 0.0005016401410102844, 0.0005186460912227631, 0.0005356520414352417, 0.0005526579916477203, 0.000569663941860199, 0.0005866698920726776, 0.0006036758422851562]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 7.0, 14.0, 9.0, 15.0, 21.0, 40.0, 62.0, 66.0, 104.0, 135.0, 172.0, 227.0, 344.0, 485.0, 693.0, 1013.0, 1395.0, 2071.0, 3109.0, 4524.0, 7129.0, 12028.0, 23662.0, 138347.0, 784951.0, 29439.0, 14313.0, 8110.0, 5249.0, 3232.0, 2295.0, 1571.0, 1077.0, 745.0, 542.0, 388.0, 264.0, 196.0, 131.0, 77.0, 76.0, 57.0, 37.0, 37.0, 23.0, 18.0, 12.0, 10.0, 5.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.00023508071899414062, -0.00022776424884796143, -0.00022044777870178223, -0.00021313130855560303, -0.00020581483840942383, -0.00019849836826324463, -0.00019118189811706543, -0.00018386542797088623, -0.00017654895782470703, -0.00016923248767852783, -0.00016191601753234863, -0.00015459954738616943, -0.00014728307723999023, -0.00013996660709381104, -0.00013265013694763184, -0.00012533366680145264, -0.00011801719665527344, -0.00011070072650909424, -0.00010338425636291504, -9.606778621673584e-05, -8.875131607055664e-05, -8.143484592437744e-05, -7.411837577819824e-05, -6.680190563201904e-05, -5.9485435485839844e-05, -5.2168965339660645e-05, -4.4852495193481445e-05, -3.7536025047302246e-05, -3.0219554901123047e-05, -2.2903084754943848e-05, -1.558661460876465e-05, -8.27014446258545e-06, -9.5367431640625e-07, 6.362795829772949e-06, 1.3679265975952148e-05, 2.0995736122131348e-05, 2.8312206268310547e-05, 3.5628676414489746e-05, 4.2945146560668945e-05, 5.0261616706848145e-05, 5.7578086853027344e-05, 6.489455699920654e-05, 7.221102714538574e-05, 7.952749729156494e-05, 8.684396743774414e-05, 9.416043758392334e-05, 0.00010147690773010254, 0.00010879337787628174, 0.00011610984802246094, 0.00012342631816864014, 0.00013074278831481934, 0.00013805925846099854, 0.00014537572860717773, 0.00015269219875335693, 0.00016000866889953613, 0.00016732513904571533, 0.00017464160919189453, 0.00018195807933807373, 0.00018927454948425293, 0.00019659101963043213, 0.00020390748977661133, 0.00021122395992279053, 0.00021854043006896973, 0.00022585690021514893, 0.00023317337036132812]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 7.0, 8.0, 3.0, 23.0, 16.0, 17.0, 54.0, 38.0, 36.0, 44.0, 75.0, 55.0, 60.0, 50.0, 126.0, 46.0, 49.0, 93.0, 29.0, 27.0, 22.0, 41.0, 17.0, 5.0, 17.0, 12.0, 6.0, 3.0, 7.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-06, -2.3078173398971558e-06, -2.2314488887786865e-06, -2.1550804376602173e-06, -2.078711986541748e-06, -2.002343535423279e-06, -1.9259750843048096e-06, -1.8496066331863403e-06, -1.773238182067871e-06, -1.6968697309494019e-06, -1.6205012798309326e-06, -1.5441328287124634e-06, -1.4677643775939941e-06, -1.391395926475525e-06, -1.3150274753570557e-06, -1.2386590242385864e-06, -1.1622905731201172e-06, -1.085922122001648e-06, -1.0095536708831787e-06, -9.331852197647095e-07, -8.568167686462402e-07, -7.80448317527771e-07, -7.040798664093018e-07, -6.277114152908325e-07, -5.513429641723633e-07, -4.7497451305389404e-07, -3.986060619354248e-07, -3.2223761081695557e-07, -2.4586915969848633e-07, -1.695007085800171e-07, -9.313225746154785e-08, -1.6763806343078613e-08, 5.960464477539063e-08, 1.3597309589385986e-07, 2.123415470123291e-07, 2.8870999813079834e-07, 3.650784492492676e-07, 4.414469003677368e-07, 5.178153514862061e-07, 5.941838026046753e-07, 6.705522537231445e-07, 7.469207048416138e-07, 8.23289155960083e-07, 8.996576070785522e-07, 9.760260581970215e-07, 1.0523945093154907e-06, 1.12876296043396e-06, 1.2051314115524292e-06, 1.2814998626708984e-06, 1.3578683137893677e-06, 1.434236764907837e-06, 1.5106052160263062e-06, 1.5869736671447754e-06, 1.6633421182632446e-06, 1.7397105693817139e-06, 1.816079020500183e-06, 1.8924474716186523e-06, 1.9688159227371216e-06, 2.045184373855591e-06, 2.12155282497406e-06, 2.1979212760925293e-06, 2.2742897272109985e-06, 2.3506581783294678e-06, 2.427026629447937e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 8.0, 12.0, 8.0, 26.0, 20.0, 43.0, 61.0, 81.0, 102.0, 158.0, 222.0, 322.0, 482.0, 734.0, 1091.0, 1601.0, 2287.0, 3446.0, 5253.0, 8340.0, 15281.0, 32246.0, 882928.0, 47708.0, 18380.0, 9782.0, 5835.0, 3967.0, 2596.0, 1776.0, 1181.0, 805.0, 534.0, 383.0, 246.0, 186.0, 126.0, 89.0, 59.0, 35.0, 35.0, 24.0, 10.0, 17.0, 6.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0003044605255126953, -0.0002941899001598358, -0.0002839192748069763, -0.0002736486494541168, -0.0002633780241012573, -0.00025310739874839783, -0.00024283677339553833, -0.00023256614804267883, -0.00022229552268981934, -0.00021202489733695984, -0.00020175427198410034, -0.00019148364663124084, -0.00018121302127838135, -0.00017094239592552185, -0.00016067177057266235, -0.00015040114521980286, -0.00014013051986694336, -0.00012985989451408386, -0.00011958926916122437, -0.00010931864380836487, -9.904801845550537e-05, -8.877739310264587e-05, -7.850676774978638e-05, -6.823614239692688e-05, -5.796551704406738e-05, -4.7694891691207886e-05, -3.742426633834839e-05, -2.715364098548889e-05, -1.6883015632629395e-05, -6.6123902797698975e-06, 3.6582350730895996e-06, 1.3928860425949097e-05, 2.4199485778808594e-05, 3.447011113166809e-05, 4.474073648452759e-05, 5.5011361837387085e-05, 6.528198719024658e-05, 7.555261254310608e-05, 8.582323789596558e-05, 9.609386324882507e-05, 0.00010636448860168457, 0.00011663511395454407, 0.00012690573930740356, 0.00013717636466026306, 0.00014744699001312256, 0.00015771761536598206, 0.00016798824071884155, 0.00017825886607170105, 0.00018852949142456055, 0.00019880011677742004, 0.00020907074213027954, 0.00021934136748313904, 0.00022961199283599854, 0.00023988261818885803, 0.00025015324354171753, 0.000260423868894577, 0.0002706944942474365, 0.000280965119600296, 0.0002912357449531555, 0.000301506370306015, 0.0003117769956588745, 0.000322047621011734, 0.0003323182463645935, 0.000342588871717453, 0.0003528594970703125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 6.0, 2.0, 4.0, 8.0, 9.0, 9.0, 5.0, 10.0, 21.0, 38.0, 632.0, 149.0, 10.0, 12.0, 9.0, 13.0, 10.0, 5.0, 3.0, 2.0, 2.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.147954940795898e-05, -7.85384327173233e-05, -7.559731602668762e-05, -7.265619933605194e-05, -6.971508264541626e-05, -6.677396595478058e-05, -6.38328492641449e-05, -6.0891732573509216e-05, -5.7950615882873535e-05, -5.5009499192237854e-05, -5.206838250160217e-05, -4.912726581096649e-05, -4.618614912033081e-05, -4.324503242969513e-05, -4.030391573905945e-05, -3.736279904842377e-05, -3.4421682357788086e-05, -3.1480565667152405e-05, -2.8539448976516724e-05, -2.5598332285881042e-05, -2.265721559524536e-05, -1.971609890460968e-05, -1.6774982213974e-05, -1.3833865523338318e-05, -1.0892748832702637e-05, -7.951632142066956e-06, -5.010515451431274e-06, -2.0693987607955933e-06, 8.717179298400879e-07, 3.812834620475769e-06, 6.75395131111145e-06, 9.695068001747131e-06, 1.2636184692382812e-05, 1.5577301383018494e-05, 1.8518418073654175e-05, 2.1459534764289856e-05, 2.4400651454925537e-05, 2.7341768145561218e-05, 3.02828848361969e-05, 3.322400152683258e-05, 3.616511821746826e-05, 3.910623490810394e-05, 4.2047351598739624e-05, 4.4988468289375305e-05, 4.7929584980010986e-05, 5.087070167064667e-05, 5.381181836128235e-05, 5.675293505191803e-05, 5.969405174255371e-05, 6.263516843318939e-05, 6.557628512382507e-05, 6.851740181446075e-05, 7.145851850509644e-05, 7.439963519573212e-05, 7.73407518863678e-05, 8.028186857700348e-05, 8.322298526763916e-05, 8.616410195827484e-05, 8.910521864891052e-05, 9.20463353395462e-05, 9.498745203018188e-05, 9.792856872081757e-05, 0.00010086968541145325, 0.00010381080210208893, 0.00010675191879272461]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 4.0, 6.0, 4.0, 11.0, 17.0, 9.0, 12.0, 18.0, 16.0, 34.0, 44.0, 38.0, 46.0, 100.0, 109.0, 108.0, 98.0, 87.0, 53.0, 44.0, 34.0, 29.0, 19.0, 8.0, 12.0, 6.0, 10.0, 5.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015584576176479459, -0.0015129238599911332, -0.0014673902187496424, -0.0014218564610928297, -0.001376322703436017, -0.0013307890621945262, -0.0012852553045377135, -0.0012397216632962227, -0.00119418790563941, -0.0011486541479825974, -0.0011031205067411065, -0.0010575867490842938, -0.0010120529914274812, -0.0009665193501859903, -0.0009209855925291777, -0.0008754518930800259, -0.0008299181354232132, -0.0007843844359740615, -0.0007388506783172488, -0.0006933169788680971, -0.0006477832794189453, -0.0006022495217621326, -0.0005567158223129809, -0.0005111821228638291, -0.0004656483943108469, -0.0004201146657578647, -0.00037458096630871296, -0.00032904723775573075, -0.00028351350920274854, -0.00023797980975359678, -0.00019244608120061457, -0.00014691238175146282, -0.0001013786531984806, -5.5844935559434816e-05, -1.0311217920389026e-05, 3.522250335663557e-05, 8.075621735770255e-05, 0.00012628993135876954, 0.00017182365991175175, 0.0002173573593609035, 0.0002628910879138857, 0.0003084248164668679, 0.0003539585159160197, 0.0003994922444690019, 0.0004450259730219841, 0.0004905596724711359, 0.0005360933719202876, 0.0005816271295771003, 0.000627160829026252, 0.0006726945284754038, 0.0007182282861322165, 0.0007637619855813682, 0.00080929568503052, 0.0008548294426873326, 0.0009003631421364844, 0.0009458968415856361, 0.0009914305992424488, 0.0010369643568992615, 0.0010824979981407523, 0.001128031755797565, 0.0011735655134543777, 0.0012190991546958685, 0.0012646329123526812, 0.0013101666700094938, 0.0013557003112509847]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 6.0, 7.0, 7.0, 9.0, 9.0, 10.0, 14.0, 22.0, 13.0, 18.0, 21.0, 19.0, 34.0, 29.0, 42.0, 33.0, 37.0, 32.0, 31.0, 45.0, 33.0, 51.0, 34.0, 38.0, 32.0, 42.0, 36.0, 29.0, 39.0, 39.0, 33.0, 21.0, 18.0, 24.0, 12.0, 11.0, 15.0, 13.0, 6.0, 9.0, 8.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000905559107195586, -0.0008773088338784873, -0.0008490585605613887, -0.0008208082872442901, -0.0007925580721348524, -0.0007643077988177538, -0.0007360575255006552, -0.0007078072521835566, -0.0006795569788664579, -0.0006513067055493593, -0.0006230564322322607, -0.0005948061589151621, -0.0005665558855980635, -0.0005383056122809649, -0.0005100553971715271, -0.00048180512385442853, -0.0004535548505373299, -0.0004253045772202313, -0.0003970543039031327, -0.0003688040596898645, -0.0003405537863727659, -0.0003123035130556673, -0.0002840532688423991, -0.0002558029955253005, -0.00022755272220820189, -0.00019930244889110327, -0.00017105219012591988, -0.0001428019313607365, -0.00011455165804363787, -8.630138472653925e-05, -5.8051125961355865e-05, -2.9800867196172476e-05, -1.5505938790738583e-06, 2.6699672162067145e-05, 5.494993820320815e-05, 8.320020424434915e-05, 0.00011145047028549016, 0.00013970074360258877, 0.00016795100236777216, 0.00019620126113295555, 0.00022445153445005417, 0.0002527018077671528, 0.0002809520810842514, 0.00030920232529751956, 0.0003374525986146182, 0.0003657028719317168, 0.00039395311614498496, 0.0004222033894620836, 0.0004504536627791822, 0.0004787039360962808, 0.0005069542094133794, 0.000535204482730478, 0.0005634546978399158, 0.0005917049711570144, 0.000619955244474113, 0.0006482055177912116, 0.0006764557911083102, 0.0007047060644254088, 0.0007329563377425075, 0.0007612066110596061, 0.0007894568843767047, 0.0008177071576938033, 0.000845957372803241, 0.0008742076461203396, 0.0009024579194374382]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 5.0, 11.0, 20.0, 25.0, 44.0, 46.0, 71.0, 117.0, 174.0, 258.0, 400.0, 575.0, 923.0, 1323.0, 2072.0, 3168.0, 5105.0, 8172.0, 13380.0, 22299.0, 37829.0, 67779.0, 128501.0, 278962.0, 829547.0, 1669209.0, 628268.0, 236266.0, 113571.0, 60099.0, 33571.0, 19744.0, 12011.0, 7467.0, 4594.0, 2982.0, 1933.0, 1340.0, 822.0, 513.0, 375.0, 253.0, 155.0, 103.0, 70.0, 47.0, 31.0, 13.0, 15.0, 12.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0012884140014648438, -0.0012498199939727783, -0.0012112259864807129, -0.0011726319789886475, -0.001134037971496582, -0.0010954439640045166, -0.0010568499565124512, -0.0010182559490203857, -0.0009796619415283203, -0.0009410679340362549, -0.0009024739265441895, -0.000863879919052124, -0.0008252859115600586, -0.0007866919040679932, -0.0007480978965759277, -0.0007095038890838623, -0.0006709098815917969, -0.0006323158740997314, -0.000593721866607666, -0.0005551278591156006, -0.0005165338516235352, -0.0004779398441314697, -0.0004393458366394043, -0.00040075182914733887, -0.00036215782165527344, -0.000323563814163208, -0.0002849698066711426, -0.00024637579917907715, -0.00020778179168701172, -0.0001691877841949463, -0.00013059377670288086, -9.199976921081543e-05, -5.340576171875e-05, -1.481175422668457e-05, 2.378225326538086e-05, 6.237626075744629e-05, 0.00010097026824951172, 0.00013956427574157715, 0.00017815828323364258, 0.000216752290725708, 0.00025534629821777344, 0.00029394030570983887, 0.0003325343132019043, 0.0003711283206939697, 0.00040972232818603516, 0.0004483163356781006, 0.000486910343170166, 0.0005255043506622314, 0.0005640983581542969, 0.0006026923656463623, 0.0006412863731384277, 0.0006798803806304932, 0.0007184743881225586, 0.000757068395614624, 0.0007956624031066895, 0.0008342564105987549, 0.0008728504180908203, 0.0009114444255828857, 0.0009500384330749512, 0.0009886324405670166, 0.001027226448059082, 0.0010658204555511475, 0.0011044144630432129, 0.0011430084705352783, 0.0011816024780273438]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 3.0, 6.0, 5.0, 6.0, 3.0, 10.0, 15.0, 14.0, 11.0, 16.0, 24.0, 14.0, 18.0, 24.0, 25.0, 28.0, 30.0, 30.0, 34.0, 29.0, 37.0, 29.0, 49.0, 34.0, 38.0, 35.0, 18.0, 36.0, 51.0, 41.0, 24.0, 35.0, 29.0, 27.0, 19.0, 23.0, 10.0, 20.0, 16.0, 12.0, 10.0, 11.0, 7.0, 10.0, 4.0, 6.0, 9.0, 2.0, 0.0, 3.0, 5.0, 3.0, 2.0, 4.0], "bins": [-0.0005316734313964844, -0.0005159229040145874, -0.0005001723766326904, -0.00048442184925079346, -0.0004686713218688965, -0.0004529207944869995, -0.00043717026710510254, -0.00042141973972320557, -0.0004056692123413086, -0.0003899186849594116, -0.00037416815757751465, -0.0003584176301956177, -0.0003426671028137207, -0.00032691657543182373, -0.00031116604804992676, -0.0002954155206680298, -0.0002796649932861328, -0.00026391446590423584, -0.00024816393852233887, -0.0002324134111404419, -0.00021666288375854492, -0.00020091235637664795, -0.00018516182899475098, -0.000169411301612854, -0.00015366077423095703, -0.00013791024684906006, -0.00012215971946716309, -0.00010640919208526611, -9.065866470336914e-05, -7.490813732147217e-05, -5.9157609939575195e-05, -4.340708255767822e-05, -2.765655517578125e-05, -1.1906027793884277e-05, 3.844499588012695e-06, 1.9595026969909668e-05, 3.534555435180664e-05, 5.109608173370361e-05, 6.684660911560059e-05, 8.259713649749756e-05, 9.834766387939453e-05, 0.0001140981912612915, 0.00012984871864318848, 0.00014559924602508545, 0.00016134977340698242, 0.0001771003007888794, 0.00019285082817077637, 0.00020860135555267334, 0.0002243518829345703, 0.00024010241031646729, 0.00025585293769836426, 0.00027160346508026123, 0.0002873539924621582, 0.0003031045198440552, 0.00031885504722595215, 0.0003346055746078491, 0.0003503561019897461, 0.00036610662937164307, 0.00038185715675354004, 0.000397607684135437, 0.000413358211517334, 0.00042910873889923096, 0.00044485926628112793, 0.0004606097936630249, 0.0004763603210449219]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 8.0, 4.0, 2.0, 3.0, 14.0, 11.0, 20.0, 34.0, 41.0, 83.0, 110.0, 192.0, 297.0, 484.0, 735.0, 1186.0, 2019.0, 3106.0, 5421.0, 9191.0, 15936.0, 27947.0, 50469.0, 93098.0, 183016.0, 398642.0, 1017669.0, 1348534.0, 539505.0, 236587.0, 117092.0, 61745.0, 34214.0, 19301.0, 11012.0, 6543.0, 3939.0, 2288.0, 1433.0, 870.0, 567.0, 336.0, 198.0, 141.0, 98.0, 51.0, 37.0, 26.0, 11.0, 8.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00098419189453125, -0.0009515732526779175, -0.000918954610824585, -0.0008863359689712524, -0.0008537173271179199, -0.0008210986852645874, -0.0007884800434112549, -0.0007558614015579224, -0.0007232427597045898, -0.0006906241178512573, -0.0006580054759979248, -0.0006253868341445923, -0.0005927681922912598, -0.0005601495504379272, -0.0005275309085845947, -0.0004949122667312622, -0.0004622936248779297, -0.00042967498302459717, -0.00039705634117126465, -0.00036443769931793213, -0.0003318190574645996, -0.0002992004156112671, -0.00026658177375793457, -0.00023396313190460205, -0.00020134449005126953, -0.000168725848197937, -0.0001361072063446045, -0.00010348856449127197, -7.086992263793945e-05, -3.8251280784606934e-05, -5.632638931274414e-06, 2.6986002922058105e-05, 5.9604644775390625e-05, 9.222328662872314e-05, 0.00012484192848205566, 0.00015746057033538818, 0.0001900792121887207, 0.00022269785404205322, 0.00025531649589538574, 0.00028793513774871826, 0.0003205537796020508, 0.0003531724214553833, 0.0003857910633087158, 0.00041840970516204834, 0.00045102834701538086, 0.0004836469888687134, 0.0005162656307220459, 0.0005488842725753784, 0.0005815029144287109, 0.0006141215562820435, 0.000646740198135376, 0.0006793588399887085, 0.000711977481842041, 0.0007445961236953735, 0.0007772147655487061, 0.0008098334074020386, 0.0008424520492553711, 0.0008750706911087036, 0.0009076893329620361, 0.0009403079748153687, 0.0009729266166687012, 0.0010055452585220337, 0.0010381639003753662, 0.0010707825422286987, 0.0011034011840820312]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 10.0, 5.0, 10.0, 19.0, 25.0, 36.0, 32.0, 42.0, 58.0, 66.0, 90.0, 85.0, 116.0, 156.0, 176.0, 188.0, 253.0, 261.0, 264.0, 281.0, 281.0, 256.0, 218.0, 203.0, 188.0, 141.0, 130.0, 106.0, 105.0, 68.0, 45.0, 47.0, 23.0, 27.0, 19.0, 12.0, 4.0, 12.0, 3.0, 7.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028634071350097656, -0.0002759285271167755, -0.00026551634073257446, -0.0002551041543483734, -0.00024469196796417236, -0.0002342797815799713, -0.00022386759519577026, -0.00021345540881156921, -0.00020304322242736816, -0.00019263103604316711, -0.00018221884965896606, -0.00017180666327476501, -0.00016139447689056396, -0.00015098229050636292, -0.00014057010412216187, -0.00013015791773796082, -0.00011974573135375977, -0.00010933354496955872, -9.892135858535767e-05, -8.850917220115662e-05, -7.809698581695557e-05, -6.768479943275452e-05, -5.727261304855347e-05, -4.686042666435242e-05, -3.644824028015137e-05, -2.6036053895950317e-05, -1.5623867511749268e-05, -5.211681127548218e-06, 5.200505256652832e-06, 1.5612691640853882e-05, 2.602487802505493e-05, 3.643706440925598e-05, 4.684925079345703e-05, 5.726143717765808e-05, 6.767362356185913e-05, 7.808580994606018e-05, 8.849799633026123e-05, 9.891018271446228e-05, 0.00010932236909866333, 0.00011973455548286438, 0.00013014674186706543, 0.00014055892825126648, 0.00015097111463546753, 0.00016138330101966858, 0.00017179548740386963, 0.00018220767378807068, 0.00019261986017227173, 0.00020303204655647278, 0.00021344423294067383, 0.00022385641932487488, 0.00023426860570907593, 0.000244680792093277, 0.00025509297847747803, 0.0002655051648616791, 0.0002759173512458801, 0.0002863295376300812, 0.0002967417240142822, 0.0003071539103984833, 0.0003175660967826843, 0.0003279782831668854, 0.0003383904695510864, 0.0003488026559352875, 0.0003592148423194885, 0.0003696270287036896, 0.0003800392150878906]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 8.0, 19.0, 23.0, 16.0, 34.0, 38.0, 60.0, 77.0, 100.0, 139.0, 118.0, 87.0, 88.0, 55.0, 43.0, 22.0, 13.0, 11.0, 10.0, 11.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012677049962803721, -0.001231212168931961, -0.00119471934158355, -0.001158226397819817, -0.001121733570471406, -0.001085240743122995, -0.0010487479157745838, -0.0010122550884261727, -0.0009757622028701007, -0.0009392693755216897, -0.0009027764899656177, -0.0008662836626172066, -0.0008297908352687955, -0.0007932979497127235, -0.0007568051223643124, -0.0007203122368082404, -0.0006838194094598293, -0.0006473265821114182, -0.0006108336965553463, -0.0005743408692069352, -0.0005378479836508632, -0.0005013551563024521, -0.000464862328954041, -0.00042836947250179946, -0.0003918766160495579, -0.0003553837595973164, -0.00031889090314507484, -0.00028239807579666376, -0.0002459052193444222, -0.00020941236289218068, -0.00017291952099185437, -0.00013642667909152806, -9.993370622396469e-05, -6.344085704768077e-05, -2.694800787139684e-05, 9.544841304887086e-06, 4.603769048117101e-05, 8.253054693341255e-05, 0.00011902338883373886, 0.00015551623073406518, 0.00019200908718630672, 0.00022850194363854825, 0.0002649948000907898, 0.0003014876274392009, 0.0003379804838914424, 0.00037447334034368396, 0.00041096616769209504, 0.0004474590241443366, 0.0004839518805965781, 0.0005204447079449892, 0.0005569375935010612, 0.0005934304208494723, 0.0006299233064055443, 0.0006664161337539554, 0.0007029089611023664, 0.0007394017884507775, 0.0007758946740068495, 0.0008123875013552606, 0.0008488803869113326, 0.0008853732142597437, 0.0009218660416081548, 0.0009583589271642268, 0.0009948518127202988, 0.0010313446400687099, 0.001067837467417121]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 2.0, 4.0, 11.0, 15.0, 12.0, 13.0, 13.0, 25.0, 29.0, 20.0, 29.0, 25.0, 25.0, 31.0, 29.0, 48.0, 16.0, 36.0, 38.0, 36.0, 44.0, 32.0, 45.0, 33.0, 33.0, 39.0, 29.0, 25.0, 33.0, 27.0, 22.0, 33.0, 23.0, 16.0, 15.0, 14.0, 19.0, 11.0, 6.0, 6.0, 8.0, 10.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.0006234552711248398, -0.0006053918041288853, -0.0005873283371329308, -0.0005692648701369762, -0.0005512014031410217, -0.0005331379943527281, -0.0005150745273567736, -0.0004970110603608191, -0.0004789475933648646, -0.0004608841263689101, -0.00044282065937295556, -0.0004247572214808315, -0.000406693754484877, -0.0003886302874889225, -0.0003705668495967984, -0.0003525033826008439, -0.0003344399156048894, -0.0003163764486089349, -0.00029831298161298037, -0.0002802495437208563, -0.0002621860767249018, -0.00024412260972894728, -0.000226059157284908, -0.0002079957048408687, -0.0001899322378449142, -0.00017186877084895968, -0.0001538053184049204, -0.00013574186596088111, -0.0001176783989649266, -9.96149392449297e-05, -8.15514795249328e-05, -6.348802708089352e-05, -4.5424560084939e-05, -2.7361100364942104e-05, -9.297640644945204e-06, 8.765819075051695e-06, 2.6829278795048594e-05, 4.4892738515045494e-05, 6.295619823504239e-05, 8.101965067908168e-05, 9.908311767503619e-05, 0.00011714657739503309, 0.00013521003711503, 0.00015327348955906928, 0.0001713369565550238, 0.0001894004235509783, 0.0002074638759950176, 0.00022552732843905687, 0.0002435907954350114, 0.0002616542624309659, 0.0002797177294269204, 0.00029778116731904447, 0.000315844634314999, 0.0003339081013109535, 0.00035197153920307755, 0.00037003500619903207, 0.0003880984731949866, 0.0004061619401909411, 0.0004242254071868956, 0.00044228884507901967, 0.0004603523120749742, 0.0004784157790709287, 0.0004964792169630527, 0.0005145426839590073, 0.0005326061509549618]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 8.0, 5.0, 12.0, 15.0, 25.0, 44.0, 70.0, 115.0, 177.0, 258.0, 387.0, 560.0, 940.0, 1483.0, 2347.0, 3957.0, 6652.0, 11535.0, 19886.0, 36821.0, 69033.0, 132243.0, 239451.0, 237772.0, 131146.0, 68868.0, 36628.0, 19728.0, 11421.0, 6669.0, 3939.0, 2311.0, 1462.0, 857.0, 600.0, 411.0, 254.0, 149.0, 115.0, 75.0, 45.0, 31.0, 13.0, 13.0, 9.0, 13.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012025833129882812, -0.0011661350727081299, -0.0011296868324279785, -0.0010932385921478271, -0.0010567903518676758, -0.0010203421115875244, -0.000983893871307373, -0.0009474456310272217, -0.0009109973907470703, -0.0008745491504669189, -0.0008381009101867676, -0.0008016526699066162, -0.0007652044296264648, -0.0007287561893463135, -0.0006923079490661621, -0.0006558597087860107, -0.0006194114685058594, -0.000582963228225708, -0.0005465149879455566, -0.0005100667476654053, -0.0004736185073852539, -0.00043717026710510254, -0.00040072202682495117, -0.0003642737865447998, -0.00032782554626464844, -0.00029137730598449707, -0.0002549290657043457, -0.00021848082542419434, -0.00018203258514404297, -0.0001455843448638916, -0.00010913610458374023, -7.268786430358887e-05, -3.62396240234375e-05, 2.086162567138672e-07, 3.6656856536865234e-05, 7.31050968170166e-05, 0.00010955333709716797, 0.00014600157737731934, 0.0001824498176574707, 0.00021889805793762207, 0.00025534629821777344, 0.0002917945384979248, 0.00032824277877807617, 0.00036469101905822754, 0.0004011392593383789, 0.0004375874996185303, 0.00047403573989868164, 0.000510483980178833, 0.0005469322204589844, 0.0005833804607391357, 0.0006198287010192871, 0.0006562769412994385, 0.0006927251815795898, 0.0007291734218597412, 0.0007656216621398926, 0.0008020699024200439, 0.0008385181427001953, 0.0008749663829803467, 0.000911414623260498, 0.0009478628635406494, 0.0009843111038208008, 0.0010207593441009521, 0.0010572075843811035, 0.0010936558246612549, 0.0011301040649414062]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 16.0, 8.0, 17.0, 16.0, 19.0, 17.0, 24.0, 15.0, 28.0, 30.0, 31.0, 31.0, 41.0, 34.0, 36.0, 37.0, 37.0, 45.0, 39.0, 29.0, 51.0, 54.0, 40.0, 19.0, 39.0, 42.0, 24.0, 22.0, 22.0, 26.0, 17.0, 18.0, 13.0, 11.0, 5.0, 5.0, 6.0, 7.0, 10.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0005669593811035156, -0.0005502030253410339, -0.0005334466695785522, -0.0005166903138160706, -0.0004999339580535889, -0.0004831776022911072, -0.0004664212465286255, -0.0004496648907661438, -0.0004329085350036621, -0.0004161521792411804, -0.00039939582347869873, -0.00038263946771621704, -0.00036588311195373535, -0.00034912675619125366, -0.00033237040042877197, -0.0003156140446662903, -0.0002988576889038086, -0.0002821013331413269, -0.0002653449773788452, -0.0002485886216163635, -0.00023183226585388184, -0.00021507591009140015, -0.00019831955432891846, -0.00018156319856643677, -0.00016480684280395508, -0.0001480504870414734, -0.0001312941312789917, -0.00011453777551651001, -9.778141975402832e-05, -8.102506399154663e-05, -6.426870822906494e-05, -4.751235246658325e-05, -3.075599670410156e-05, -1.3999640941619873e-05, 2.7567148208618164e-06, 1.9513070583343506e-05, 3.6269426345825195e-05, 5.3025782108306885e-05, 6.978213787078857e-05, 8.653849363327026e-05, 0.00010329484939575195, 0.00012005120515823364, 0.00013680756092071533, 0.00015356391668319702, 0.0001703202724456787, 0.0001870766282081604, 0.0002038329839706421, 0.00022058933973312378, 0.00023734569549560547, 0.00025410205125808716, 0.00027085840702056885, 0.00028761476278305054, 0.0003043711185455322, 0.0003211274743080139, 0.0003378838300704956, 0.0003546401858329773, 0.000371396541595459, 0.0003881528973579407, 0.00040490925312042236, 0.00042166560888290405, 0.00043842196464538574, 0.00045517832040786743, 0.0004719346761703491, 0.0004886910319328308, 0.0005054473876953125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 5.0, 4.0, 14.0, 18.0, 21.0, 30.0, 49.0, 60.0, 121.0, 141.0, 242.0, 366.0, 507.0, 773.0, 1120.0, 1774.0, 2771.0, 4480.0, 7671.0, 14178.0, 30532.0, 86351.0, 388288.0, 363390.0, 82383.0, 29523.0, 14124.0, 7352.0, 4413.0, 2714.0, 1750.0, 1062.0, 742.0, 487.0, 335.0, 245.0, 160.0, 112.0, 74.0, 59.0, 26.0, 17.0, 13.0, 18.0, 8.0, 1.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0015764236450195312, -0.0015255361795425415, -0.0014746487140655518, -0.001423761248588562, -0.0013728737831115723, -0.0013219863176345825, -0.0012710988521575928, -0.001220211386680603, -0.0011693239212036133, -0.0011184364557266235, -0.0010675489902496338, -0.001016661524772644, -0.0009657740592956543, -0.0009148865938186646, -0.0008639991283416748, -0.0008131116628646851, -0.0007622241973876953, -0.0007113367319107056, -0.0006604492664337158, -0.0006095618009567261, -0.0005586743354797363, -0.0005077868700027466, -0.00045689940452575684, -0.0004060119390487671, -0.00035512447357177734, -0.0003042370080947876, -0.00025334954261779785, -0.0002024620771408081, -0.00015157461166381836, -0.00010068714618682861, -4.979968070983887e-05, 1.087784767150879e-06, 5.1975250244140625e-05, 0.00010286271572113037, 0.00015375018119812012, 0.00020463764667510986, 0.0002555251121520996, 0.00030641257762908936, 0.0003573000431060791, 0.00040818750858306885, 0.0004590749740600586, 0.0005099624395370483, 0.0005608499050140381, 0.0006117373704910278, 0.0006626248359680176, 0.0007135123014450073, 0.0007643997669219971, 0.0008152872323989868, 0.0008661746978759766, 0.0009170621633529663, 0.0009679496288299561, 0.0010188370943069458, 0.0010697245597839355, 0.0011206120252609253, 0.001171499490737915, 0.0012223869562149048, 0.0012732744216918945, 0.0013241618871688843, 0.001375049352645874, 0.0014259368181228638, 0.0014768242835998535, 0.0015277117490768433, 0.001578599214553833, 0.0016294866800308228, 0.0016803741455078125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 9.0, 5.0, 8.0, 10.0, 10.0, 20.0, 17.0, 22.0, 19.0, 29.0, 18.0, 28.0, 18.0, 31.0, 28.0, 37.0, 38.0, 38.0, 44.0, 38.0, 45.0, 39.0, 38.0, 34.0, 46.0, 46.0, 40.0, 35.0, 25.0, 16.0, 26.0, 26.0, 17.0, 15.0, 17.0, 12.0, 9.0, 7.0, 7.0, 8.0, 3.0, 2.0, 3.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0003409385681152344, -0.0003301352262496948, -0.0003193318843841553, -0.0003085285425186157, -0.00029772520065307617, -0.0002869218587875366, -0.00027611851692199707, -0.0002653151750564575, -0.00025451183319091797, -0.00024370849132537842, -0.00023290514945983887, -0.00022210180759429932, -0.00021129846572875977, -0.00020049512386322021, -0.00018969178199768066, -0.0001788884401321411, -0.00016808509826660156, -0.000157281756401062, -0.00014647841453552246, -0.0001356750726699829, -0.00012487173080444336, -0.00011406838893890381, -0.00010326504707336426, -9.246170520782471e-05, -8.165836334228516e-05, -7.08550214767456e-05, -6.0051679611206055e-05, -4.9248337745666504e-05, -3.844499588012695e-05, -2.7641654014587402e-05, -1.683831214904785e-05, -6.034970283508301e-06, 4.76837158203125e-06, 1.55717134475708e-05, 2.637505531311035e-05, 3.71783971786499e-05, 4.798173904418945e-05, 5.8785080909729004e-05, 6.958842277526855e-05, 8.03917646408081e-05, 9.119510650634766e-05, 0.00010199844837188721, 0.00011280179023742676, 0.0001236051321029663, 0.00013440847396850586, 0.0001452118158340454, 0.00015601515769958496, 0.0001668184995651245, 0.00017762184143066406, 0.0001884251832962036, 0.00019922852516174316, 0.00021003186702728271, 0.00022083520889282227, 0.00023163855075836182, 0.00024244189262390137, 0.0002532452344894409, 0.00026404857635498047, 0.00027485191822052, 0.00028565526008605957, 0.0002964586019515991, 0.00030726194381713867, 0.0003180652856826782, 0.0003288686275482178, 0.0003396719694137573, 0.0003504753112792969]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 3.0, 8.0, 5.0, 15.0, 22.0, 22.0, 44.0, 55.0, 69.0, 126.0, 175.0, 260.0, 387.0, 523.0, 828.0, 1337.0, 2403.0, 4734.0, 10711.0, 30747.0, 136655.0, 677194.0, 131176.0, 29811.0, 10417.0, 4525.0, 2397.0, 1381.0, 797.0, 549.0, 375.0, 234.0, 178.0, 112.0, 96.0, 58.0, 35.0, 25.0, 19.0, 16.0, 10.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005893707275390625, -0.0005717724561691284, -0.0005541741847991943, -0.0005365759134292603, -0.0005189776420593262, -0.0005013793706893921, -0.000483781099319458, -0.0004661828279495239, -0.00044858455657958984, -0.00043098628520965576, -0.0004133880138397217, -0.0003957897424697876, -0.0003781914710998535, -0.00036059319972991943, -0.00034299492835998535, -0.00032539665699005127, -0.0003077983856201172, -0.0002902001142501831, -0.000272601842880249, -0.00025500357151031494, -0.00023740530014038086, -0.00021980702877044678, -0.0002022087574005127, -0.0001846104860305786, -0.00016701221466064453, -0.00014941394329071045, -0.00013181567192077637, -0.00011421740055084229, -9.66191291809082e-05, -7.902085781097412e-05, -6.142258644104004e-05, -4.382431507110596e-05, -2.6226043701171875e-05, -8.627772331237793e-06, 8.970499038696289e-06, 2.656877040863037e-05, 4.416704177856445e-05, 6.176531314849854e-05, 7.936358451843262e-05, 9.69618558883667e-05, 0.00011456012725830078, 0.00013215839862823486, 0.00014975666999816895, 0.00016735494136810303, 0.0001849532127380371, 0.0002025514841079712, 0.00022014975547790527, 0.00023774802684783936, 0.00025534629821777344, 0.0002729445695877075, 0.0002905428409576416, 0.0003081411123275757, 0.00032573938369750977, 0.00034333765506744385, 0.00036093592643737793, 0.000378534197807312, 0.0003961324691772461, 0.0004137307405471802, 0.00043132901191711426, 0.00044892728328704834, 0.0004665255546569824, 0.0004841238260269165, 0.0005017220973968506, 0.0005193203687667847, 0.0005369186401367188]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 4.0, 5.0, 8.0, 13.0, 17.0, 22.0, 30.0, 19.0, 40.0, 45.0, 63.0, 88.0, 111.0, 112.0, 99.0, 70.0, 53.0, 30.0, 23.0, 37.0, 19.0, 15.0, 17.0, 11.0, 3.0, 11.0, 4.0, 3.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.6510486602783203e-05, -1.5994533896446228e-05, -1.5478581190109253e-05, -1.4962628483772278e-05, -1.4446675777435303e-05, -1.3930723071098328e-05, -1.3414770364761353e-05, -1.2898817658424377e-05, -1.2382864952087402e-05, -1.1866912245750427e-05, -1.1350959539413452e-05, -1.0835006833076477e-05, -1.0319054126739502e-05, -9.803101420402527e-06, -9.287148714065552e-06, -8.771196007728577e-06, -8.255243301391602e-06, -7.739290595054626e-06, -7.223337888717651e-06, -6.707385182380676e-06, -6.191432476043701e-06, -5.675479769706726e-06, -5.159527063369751e-06, -4.643574357032776e-06, -4.127621650695801e-06, -3.6116689443588257e-06, -3.0957162380218506e-06, -2.5797635316848755e-06, -2.0638108253479004e-06, -1.5478581190109253e-06, -1.0319054126739502e-06, -5.159527063369751e-07, 0.0, 5.159527063369751e-07, 1.0319054126739502e-06, 1.5478581190109253e-06, 2.0638108253479004e-06, 2.5797635316848755e-06, 3.0957162380218506e-06, 3.6116689443588257e-06, 4.127621650695801e-06, 4.643574357032776e-06, 5.159527063369751e-06, 5.675479769706726e-06, 6.191432476043701e-06, 6.707385182380676e-06, 7.223337888717651e-06, 7.739290595054626e-06, 8.255243301391602e-06, 8.771196007728577e-06, 9.287148714065552e-06, 9.803101420402527e-06, 1.0319054126739502e-05, 1.0835006833076477e-05, 1.1350959539413452e-05, 1.1866912245750427e-05, 1.2382864952087402e-05, 1.2898817658424377e-05, 1.3414770364761353e-05, 1.3930723071098328e-05, 1.4446675777435303e-05, 1.4962628483772278e-05, 1.5478581190109253e-05, 1.5994533896446228e-05, 1.6510486602783203e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 11.0, 11.0, 18.0, 22.0, 29.0, 48.0, 67.0, 81.0, 97.0, 189.0, 274.0, 359.0, 545.0, 800.0, 1147.0, 1745.0, 2541.0, 4061.0, 6453.0, 10273.0, 17303.0, 31036.0, 57391.0, 119485.0, 300799.0, 262580.0, 107055.0, 52225.0, 28544.0, 16199.0, 9689.0, 6218.0, 3853.0, 2395.0, 1590.0, 1053.0, 734.0, 455.0, 370.0, 239.0, 182.0, 131.0, 78.0, 58.0, 43.0, 37.0, 16.0, 14.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00015056133270263672, -0.00014535710215568542, -0.00014015287160873413, -0.00013494864106178284, -0.00012974441051483154, -0.00012454017996788025, -0.00011933594942092896, -0.00011413171887397766, -0.00010892748832702637, -0.00010372325778007507, -9.851902723312378e-05, -9.331479668617249e-05, -8.811056613922119e-05, -8.29063355922699e-05, -7.77021050453186e-05, -7.249787449836731e-05, -6.729364395141602e-05, -6.208941340446472e-05, -5.688518285751343e-05, -5.1680952310562134e-05, -4.647672176361084e-05, -4.1272491216659546e-05, -3.606826066970825e-05, -3.086403012275696e-05, -2.5659799575805664e-05, -2.045556902885437e-05, -1.5251338481903076e-05, -1.0047107934951782e-05, -4.842877388000488e-06, 3.6135315895080566e-07, 5.5655837059021e-06, 1.0769814252853394e-05, 1.5974044799804688e-05, 2.117827534675598e-05, 2.6382505893707275e-05, 3.158673644065857e-05, 3.679096698760986e-05, 4.199519753456116e-05, 4.719942808151245e-05, 5.2403658628463745e-05, 5.760788917541504e-05, 6.281211972236633e-05, 6.801635026931763e-05, 7.322058081626892e-05, 7.842481136322021e-05, 8.362904191017151e-05, 8.88332724571228e-05, 9.40375030040741e-05, 9.924173355102539e-05, 0.00010444596409797668, 0.00010965019464492798, 0.00011485442519187927, 0.00012005865573883057, 0.00012526288628578186, 0.00013046711683273315, 0.00013567134737968445, 0.00014087557792663574, 0.00014607980847358704, 0.00015128403902053833, 0.00015648826956748962, 0.00016169250011444092, 0.0001668967306613922, 0.0001721009612083435, 0.0001773051917552948, 0.0001825094223022461]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 8.0, 3.0, 6.0, 8.0, 2.0, 7.0, 14.0, 12.0, 20.0, 23.0, 32.0, 43.0, 37.0, 80.0, 62.0, 100.0, 94.0, 93.0, 78.0, 41.0, 50.0, 45.0, 27.0, 28.0, 18.0, 18.0, 7.0, 9.0, 8.0, 4.0, 1.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.543231964111328e-05, -5.347002297639847e-05, -5.1507726311683655e-05, -4.954542964696884e-05, -4.758313298225403e-05, -4.5620836317539215e-05, -4.36585396528244e-05, -4.169624298810959e-05, -3.9733946323394775e-05, -3.777164965867996e-05, -3.580935299396515e-05, -3.3847056329250336e-05, -3.188475966453552e-05, -2.992246299982071e-05, -2.7960166335105896e-05, -2.5997869670391083e-05, -2.403557300567627e-05, -2.2073276340961456e-05, -2.0110979676246643e-05, -1.814868301153183e-05, -1.6186386346817017e-05, -1.4224089682102203e-05, -1.226179301738739e-05, -1.0299496352672577e-05, -8.337199687957764e-06, -6.3749030232429504e-06, -4.412606358528137e-06, -2.450309693813324e-06, -4.880130290985107e-07, 1.4742836356163025e-06, 3.4365803003311157e-06, 5.398876965045929e-06, 7.361173629760742e-06, 9.323470294475555e-06, 1.1285766959190369e-05, 1.3248063623905182e-05, 1.5210360288619995e-05, 1.717265695333481e-05, 1.913495361804962e-05, 2.1097250282764435e-05, 2.3059546947479248e-05, 2.502184361219406e-05, 2.6984140276908875e-05, 2.8946436941623688e-05, 3.09087336063385e-05, 3.2871030271053314e-05, 3.483332693576813e-05, 3.679562360048294e-05, 3.8757920265197754e-05, 4.072021692991257e-05, 4.268251359462738e-05, 4.4644810259342194e-05, 4.660710692405701e-05, 4.856940358877182e-05, 5.053170025348663e-05, 5.2493996918201447e-05, 5.445629358291626e-05, 5.641859024763107e-05, 5.8380886912345886e-05, 6.03431835770607e-05, 6.230548024177551e-05, 6.426777690649033e-05, 6.623007357120514e-05, 6.819237023591995e-05, 7.015466690063477e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 3.0, 1.0, 5.0, 1.0, 11.0, 9.0, 14.0, 20.0, 21.0, 37.0, 29.0, 49.0, 59.0, 79.0, 124.0, 124.0, 92.0, 97.0, 57.0, 37.0, 33.0, 28.0, 15.0, 7.0, 8.0, 12.0, 9.0, 6.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000870297197252512, -0.0008431752794422209, -0.0008160533616319299, -0.0007889314438216388, -0.0007618095260113478, -0.0007346876082010567, -0.0007075656903907657, -0.0006804438307881355, -0.0006533218547701836, -0.0006261999369598925, -0.0005990780191496015, -0.0005719561013393104, -0.0005448341835290194, -0.0005177122657187283, -0.0004905903479084373, -0.00046346845920197666, -0.00043634657049551606, -0.000409224652685225, -0.00038210273487493396, -0.0003549808170646429, -0.00032785889925435185, -0.0003007369814440608, -0.0002736150927376002, -0.00024649317492730916, -0.0002193712571170181, -0.00019224933930672705, -0.000165127421496436, -0.00013800551823806018, -0.00011088360042776912, -8.376168261747807e-05, -5.663977935910225e-05, -2.9517861548811197e-05, -2.395885530859232e-06, 2.4726028641453013e-05, 5.184794281376526e-05, 7.89698533480987e-05, 0.00010609177115838975, 0.0001332136889686808, 0.00016033559222705662, 0.00018745751003734767, 0.00021457942784763873, 0.00024170134565792978, 0.00026882326346822083, 0.0002959451521746814, 0.0003230670699849725, 0.00035018898779526353, 0.0003773109056055546, 0.00040443282341584563, 0.0004315547412261367, 0.00045867665903642774, 0.0004857985768467188, 0.0005129204946570098, 0.0005400424124673009, 0.0005671643302775919, 0.000594286248087883, 0.0006214081076905131, 0.0006485300837084651, 0.0006756520015187562, 0.0007027739193290472, 0.0007298958371393383, 0.0007570177549496293, 0.0007841396727599204, 0.0008112615905702114, 0.0008383834501728415, 0.0008655053679831326]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 3.0, 12.0, 7.0, 12.0, 16.0, 12.0, 19.0, 23.0, 23.0, 27.0, 33.0, 25.0, 25.0, 34.0, 35.0, 28.0, 34.0, 46.0, 42.0, 30.0, 33.0, 43.0, 36.0, 43.0, 41.0, 21.0, 31.0, 37.0, 25.0, 24.0, 28.0, 25.0, 19.0, 20.0, 10.0, 13.0, 14.0, 7.0, 8.0, 8.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.0005403722170740366, -0.0005248453235253692, -0.0005093184299767017, -0.0004937915364280343, -0.0004782646428793669, -0.00046273774933069944, -0.000447210855782032, -0.0004316839622333646, -0.00041615706868469715, -0.0004006301751360297, -0.0003851032815873623, -0.00036957638803869486, -0.00035404949449002743, -0.00033852260094136, -0.00032299570739269257, -0.00030746881384402514, -0.0002919419202953577, -0.0002764150267466903, -0.00026088813319802284, -0.0002453612396493554, -0.00022983434610068798, -0.00021430745255202055, -0.00019878055900335312, -0.0001832536654546857, -0.00016772677190601826, -0.00015219987835735083, -0.0001366729848086834, -0.00012114609126001596, -0.00010561919771134853, -9.00923041626811e-05, -7.456541061401367e-05, -5.903851706534624e-05, -4.35115653090179e-05, -2.7984671760350466e-05, -1.2457778211683035e-05, 3.069115336984396e-06, 1.8596008885651827e-05, 3.412290243431926e-05, 4.964979598298669e-05, 6.517668953165412e-05, 8.070358308032155e-05, 9.623047662898898e-05, 0.00011175737017765641, 0.00012728426372632384, 0.00014281115727499127, 0.0001583380508236587, 0.00017386494437232614, 0.00018939183792099357, 0.000204918731469661, 0.00022044562501832843, 0.00023597251856699586, 0.0002514994121156633, 0.0002670263056643307, 0.00028255319921299815, 0.0002980800927616656, 0.000313606986310333, 0.00032913387985900044, 0.0003446607734076679, 0.0003601876669563353, 0.00037571456050500274, 0.00039124145405367017, 0.0004067683476023376, 0.00042229524115100503, 0.00043782213469967246, 0.0004533490282483399]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 13.0, 13.0, 22.0, 33.0, 48.0, 73.0, 109.0, 145.0, 193.0, 288.0, 433.0, 699.0, 991.0, 1509.0, 2275.0, 3437.0, 5510.0, 8453.0, 13378.0, 20628.0, 33758.0, 57520.0, 103321.0, 192325.0, 248467.0, 150180.0, 81087.0, 46716.0, 28066.0, 17286.0, 11045.0, 7039.0, 4615.0, 2979.0, 1955.0, 1311.0, 850.0, 625.0, 382.0, 277.0, 164.0, 116.0, 68.0, 40.0, 33.0, 31.0, 15.0, 9.0, 13.0, 7.0, 6.0, 3.0, 1.0, 4.0], "bins": [-0.00102996826171875, -0.000999942421913147, -0.0009699165821075439, -0.0009398907423019409, -0.0009098649024963379, -0.0008798390626907349, -0.0008498132228851318, -0.0008197873830795288, -0.0007897615432739258, -0.0007597357034683228, -0.0007297098636627197, -0.0006996840238571167, -0.0006696581840515137, -0.0006396323442459106, -0.0006096065044403076, -0.0005795806646347046, -0.0005495548248291016, -0.0005195289850234985, -0.0004895031452178955, -0.0004594773054122925, -0.00042945146560668945, -0.0003994256258010864, -0.0003693997859954834, -0.00033937394618988037, -0.00030934810638427734, -0.0002793222665786743, -0.0002492964267730713, -0.00021927058696746826, -0.00018924474716186523, -0.0001592189073562622, -0.00012919306755065918, -9.916722774505615e-05, -6.914138793945312e-05, -3.91155481338501e-05, -9.08970832824707e-06, 2.0936131477355957e-05, 5.0961971282958984e-05, 8.098781108856201e-05, 0.00011101365089416504, 0.00014103949069976807, 0.0001710653305053711, 0.00020109117031097412, 0.00023111701011657715, 0.0002611428499221802, 0.0002911686897277832, 0.00032119452953338623, 0.00035122036933898926, 0.0003812462091445923, 0.0004112720489501953, 0.00044129788875579834, 0.00047132372856140137, 0.0005013495683670044, 0.0005313754081726074, 0.0005614012479782104, 0.0005914270877838135, 0.0006214529275894165, 0.0006514787673950195, 0.0006815046072006226, 0.0007115304470062256, 0.0007415562868118286, 0.0007715821266174316, 0.0008016079664230347, 0.0008316338062286377, 0.0008616596460342407, 0.0008916854858398438]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 8.0, 10.0, 4.0, 10.0, 12.0, 17.0, 20.0, 14.0, 20.0, 19.0, 22.0, 24.0, 28.0, 31.0, 29.0, 33.0, 29.0, 43.0, 35.0, 37.0, 33.0, 52.0, 44.0, 25.0, 41.0, 36.0, 25.0, 26.0, 37.0, 31.0, 29.0, 15.0, 19.0, 23.0, 11.0, 18.0, 11.0, 13.0, 15.0, 9.0, 9.0, 11.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.00041794776916503906, -0.0004060231149196625, -0.0003940984606742859, -0.0003821738064289093, -0.0003702491521835327, -0.00035832449793815613, -0.00034639984369277954, -0.00033447518944740295, -0.00032255053520202637, -0.0003106258809566498, -0.0002987012267112732, -0.0002867765724658966, -0.00027485191822052, -0.00026292726397514343, -0.00025100260972976685, -0.00023907795548439026, -0.00022715330123901367, -0.00021522864699363708, -0.0002033039927482605, -0.0001913793385028839, -0.00017945468425750732, -0.00016753003001213074, -0.00015560537576675415, -0.00014368072152137756, -0.00013175606727600098, -0.00011983141303062439, -0.0001079067587852478, -9.598210453987122e-05, -8.405745029449463e-05, -7.213279604911804e-05, -6.0208141803741455e-05, -4.828348755836487e-05, -3.635883331298828e-05, -2.4434179067611694e-05, -1.2509524822235107e-05, -5.848705768585205e-07, 1.1339783668518066e-05, 2.3264437913894653e-05, 3.518909215927124e-05, 4.711374640464783e-05, 5.9038400650024414e-05, 7.0963054895401e-05, 8.288770914077759e-05, 9.481236338615417e-05, 0.00010673701763153076, 0.00011866167187690735, 0.00013058632612228394, 0.00014251098036766052, 0.0001544356346130371, 0.0001663602888584137, 0.00017828494310379028, 0.00019020959734916687, 0.00020213425159454346, 0.00021405890583992004, 0.00022598356008529663, 0.00023790821433067322, 0.0002498328685760498, 0.0002617575228214264, 0.000273682177066803, 0.00028560683131217957, 0.00029753148555755615, 0.00030945613980293274, 0.0003213807940483093, 0.0003333054482936859, 0.0003452301025390625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 9.0, 7.0, 9.0, 19.0, 18.0, 45.0, 51.0, 104.0, 130.0, 216.0, 304.0, 419.0, 599.0, 877.0, 1265.0, 1838.0, 2742.0, 4232.0, 6203.0, 9089.0, 14285.0, 22114.0, 34788.0, 55137.0, 88080.0, 140504.0, 197683.0, 169619.0, 109480.0, 68256.0, 42465.0, 26864.0, 17242.0, 11174.0, 7378.0, 4904.0, 3322.0, 2180.0, 1581.0, 1049.0, 710.0, 475.0, 347.0, 237.0, 165.0, 120.0, 80.0, 54.0, 32.0, 25.0, 18.0, 13.0, 7.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0007696151733398438, -0.0007467940449714661, -0.0007239729166030884, -0.0007011517882347107, -0.000678330659866333, -0.0006555095314979553, -0.0006326884031295776, -0.0006098672747612, -0.0005870461463928223, -0.0005642250180244446, -0.0005414038896560669, -0.0005185827612876892, -0.0004957616329193115, -0.00047294050455093384, -0.00045011937618255615, -0.00042729824781417847, -0.0004044771194458008, -0.0003816559910774231, -0.0003588348627090454, -0.0003360137343406677, -0.00031319260597229004, -0.00029037147760391235, -0.00026755034923553467, -0.000244729220867157, -0.0002219080924987793, -0.0001990869641304016, -0.00017626583576202393, -0.00015344470739364624, -0.00013062357902526855, -0.00010780245065689087, -8.498132228851318e-05, -6.21601939201355e-05, -3.933906555175781e-05, -1.6517937183380127e-05, 6.303191184997559e-06, 2.9124319553375244e-05, 5.194544792175293e-05, 7.476657629013062e-05, 9.75877046585083e-05, 0.00012040883302688599, 0.00014322996139526367, 0.00016605108976364136, 0.00018887221813201904, 0.00021169334650039673, 0.00023451447486877441, 0.0002573356032371521, 0.0002801567316055298, 0.00030297785997390747, 0.00032579898834228516, 0.00034862011671066284, 0.00037144124507904053, 0.0003942623734474182, 0.0004170835018157959, 0.0004399046301841736, 0.00046272575855255127, 0.00048554688692092896, 0.0005083680152893066, 0.0005311891436576843, 0.000554010272026062, 0.0005768314003944397, 0.0005996525287628174, 0.0006224736571311951, 0.0006452947854995728, 0.0006681159138679504, 0.0006909370422363281]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 2.0, 7.0, 12.0, 12.0, 13.0, 17.0, 12.0, 18.0, 18.0, 15.0, 26.0, 23.0, 23.0, 32.0, 32.0, 33.0, 26.0, 32.0, 32.0, 31.0, 26.0, 34.0, 35.0, 38.0, 40.0, 32.0, 44.0, 36.0, 29.0, 23.0, 32.0, 22.0, 28.0, 35.0, 21.0, 17.0, 17.0, 9.0, 9.0, 17.0, 11.0, 11.0, 2.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002532005310058594, -0.0002452731132507324, -0.00023734569549560547, -0.00022941827774047852, -0.00022149085998535156, -0.0002135634422302246, -0.00020563602447509766, -0.0001977086067199707, -0.00018978118896484375, -0.0001818537712097168, -0.00017392635345458984, -0.0001659989356994629, -0.00015807151794433594, -0.00015014410018920898, -0.00014221668243408203, -0.00013428926467895508, -0.00012636184692382812, -0.00011843442916870117, -0.00011050701141357422, -0.00010257959365844727, -9.465217590332031e-05, -8.672475814819336e-05, -7.87973403930664e-05, -7.086992263793945e-05, -6.29425048828125e-05, -5.501508712768555e-05, -4.7087669372558594e-05, -3.916025161743164e-05, -3.123283386230469e-05, -2.3305416107177734e-05, -1.537799835205078e-05, -7.450580596923828e-06, 4.76837158203125e-07, 8.404254913330078e-06, 1.633167266845703e-05, 2.4259090423583984e-05, 3.218650817871094e-05, 4.011392593383789e-05, 4.8041343688964844e-05, 5.59687614440918e-05, 6.389617919921875e-05, 7.18235969543457e-05, 7.975101470947266e-05, 8.767843246459961e-05, 9.560585021972656e-05, 0.00010353326797485352, 0.00011146068572998047, 0.00011938810348510742, 0.00012731552124023438, 0.00013524293899536133, 0.00014317035675048828, 0.00015109777450561523, 0.0001590251922607422, 0.00016695261001586914, 0.0001748800277709961, 0.00018280744552612305, 0.00019073486328125, 0.00019866228103637695, 0.0002065896987915039, 0.00021451711654663086, 0.0002224445343017578, 0.00023037195205688477, 0.00023829936981201172, 0.00024622678756713867, 0.0002541542053222656]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 9.0, 17.0, 16.0, 18.0, 32.0, 59.0, 87.0, 132.0, 155.0, 238.0, 327.0, 467.0, 620.0, 951.0, 1411.0, 2054.0, 3157.0, 4765.0, 7983.0, 14140.0, 31484.0, 908913.0, 33915.0, 14423.0, 8313.0, 4892.0, 3215.0, 2092.0, 1368.0, 997.0, 658.0, 484.0, 300.0, 252.0, 173.0, 141.0, 81.0, 60.0, 39.0, 30.0, 17.0, 18.0, 9.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.00019121170043945312, -0.00018514692783355713, -0.00017908215522766113, -0.00017301738262176514, -0.00016695261001586914, -0.00016088783740997314, -0.00015482306480407715, -0.00014875829219818115, -0.00014269351959228516, -0.00013662874698638916, -0.00013056397438049316, -0.00012449920177459717, -0.00011843442916870117, -0.00011236965656280518, -0.00010630488395690918, -0.00010024011135101318, -9.417533874511719e-05, -8.811056613922119e-05, -8.20457935333252e-05, -7.59810209274292e-05, -6.99162483215332e-05, -6.385147571563721e-05, -5.778670310974121e-05, -5.1721930503845215e-05, -4.565715789794922e-05, -3.959238529205322e-05, -3.3527612686157227e-05, -2.746284008026123e-05, -2.1398067474365234e-05, -1.5333294868469238e-05, -9.268522262573242e-06, -3.203749656677246e-06, 2.86102294921875e-06, 8.925795555114746e-06, 1.4990568161010742e-05, 2.1055340766906738e-05, 2.7120113372802734e-05, 3.318488597869873e-05, 3.9249658584594727e-05, 4.531443119049072e-05, 5.137920379638672e-05, 5.7443976402282715e-05, 6.350874900817871e-05, 6.957352161407471e-05, 7.56382942199707e-05, 8.17030668258667e-05, 8.77678394317627e-05, 9.383261203765869e-05, 9.989738464355469e-05, 0.00010596215724945068, 0.00011202692985534668, 0.00011809170246124268, 0.00012415647506713867, 0.00013022124767303467, 0.00013628602027893066, 0.00014235079288482666, 0.00014841556549072266, 0.00015448033809661865, 0.00016054511070251465, 0.00016660988330841064, 0.00017267465591430664, 0.00017873942852020264, 0.00018480420112609863, 0.00019086897373199463, 0.00019693374633789062]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 7.0, 2.0, 7.0, 13.0, 26.0, 20.0, 26.0, 45.0, 51.0, 61.0, 69.0, 88.0, 209.0, 84.0, 60.0, 36.0, 40.0, 28.0, 26.0, 16.0, 20.0, 9.0, 12.0, 4.0, 4.0, 4.0, 4.0, 7.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.1457672119140625e-06, -2.078711986541748e-06, -2.0116567611694336e-06, -1.944601535797119e-06, -1.8775463104248047e-06, -1.8104910850524902e-06, -1.7434358596801758e-06, -1.6763806343078613e-06, -1.6093254089355469e-06, -1.5422701835632324e-06, -1.475214958190918e-06, -1.4081597328186035e-06, -1.341104507446289e-06, -1.2740492820739746e-06, -1.2069940567016602e-06, -1.1399388313293457e-06, -1.0728836059570312e-06, -1.0058283805847168e-06, -9.387731552124023e-07, -8.717179298400879e-07, -8.046627044677734e-07, -7.37607479095459e-07, -6.705522537231445e-07, -6.034970283508301e-07, -5.364418029785156e-07, -4.6938657760620117e-07, -4.023313522338867e-07, -3.3527612686157227e-07, -2.682209014892578e-07, -2.0116567611694336e-07, -1.341104507446289e-07, -6.705522537231445e-08, 0.0, 6.705522537231445e-08, 1.341104507446289e-07, 2.0116567611694336e-07, 2.682209014892578e-07, 3.3527612686157227e-07, 4.023313522338867e-07, 4.6938657760620117e-07, 5.364418029785156e-07, 6.034970283508301e-07, 6.705522537231445e-07, 7.37607479095459e-07, 8.046627044677734e-07, 8.717179298400879e-07, 9.387731552124023e-07, 1.0058283805847168e-06, 1.0728836059570312e-06, 1.1399388313293457e-06, 1.2069940567016602e-06, 1.2740492820739746e-06, 1.341104507446289e-06, 1.4081597328186035e-06, 1.475214958190918e-06, 1.5422701835632324e-06, 1.6093254089355469e-06, 1.6763806343078613e-06, 1.7434358596801758e-06, 1.8104910850524902e-06, 1.8775463104248047e-06, 1.944601535797119e-06, 2.0116567611694336e-06, 2.078711986541748e-06, 2.1457672119140625e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 12.0, 6.0, 29.0, 24.0, 49.0, 65.0, 80.0, 138.0, 167.0, 239.0, 365.0, 546.0, 765.0, 1193.0, 1697.0, 2687.0, 4123.0, 6763.0, 10969.0, 18350.0, 40353.0, 895614.0, 25720.0, 14473.0, 8788.0, 5364.0, 3295.0, 2195.0, 1423.0, 960.0, 627.0, 452.0, 319.0, 206.0, 142.0, 128.0, 62.0, 57.0, 38.0, 18.0, 16.0, 10.0, 13.0, 5.0, 2.0, 8.0, 1.0, 1.0, 3.0], "bins": [-0.0002951622009277344, -0.0002870243042707443, -0.00027888640761375427, -0.0002707485109567642, -0.00026261061429977417, -0.0002544727176427841, -0.00024633482098579407, -0.00023819692432880402, -0.00023005902767181396, -0.00022192113101482391, -0.00021378323435783386, -0.0002056453377008438, -0.00019750744104385376, -0.0001893695443868637, -0.00018123164772987366, -0.0001730937510728836, -0.00016495585441589355, -0.0001568179577589035, -0.00014868006110191345, -0.0001405421644449234, -0.00013240426778793335, -0.0001242663711309433, -0.00011612847447395325, -0.0001079905778169632, -9.985268115997314e-05, -9.17147845029831e-05, -8.357688784599304e-05, -7.543899118900299e-05, -6.730109453201294e-05, -5.916319787502289e-05, -5.102530121803284e-05, -4.2887404561042786e-05, -3.4749507904052734e-05, -2.6611611247062683e-05, -1.8473714590072632e-05, -1.033581793308258e-05, -2.1979212760925293e-06, 5.939975380897522e-06, 1.4077872037887573e-05, 2.2215768694877625e-05, 3.0353665351867676e-05, 3.849156200885773e-05, 4.662945866584778e-05, 5.476735532283783e-05, 6.290525197982788e-05, 7.104314863681793e-05, 7.918104529380798e-05, 8.731894195079803e-05, 9.545683860778809e-05, 0.00010359473526477814, 0.00011173263192176819, 0.00011987052857875824, 0.0001280084252357483, 0.00013614632189273834, 0.0001442842185497284, 0.00015242211520671844, 0.0001605600118637085, 0.00016869790852069855, 0.0001768358051776886, 0.00018497370183467865, 0.0001931115984916687, 0.00020124949514865875, 0.0002093873918056488, 0.00021752528846263885, 0.0002256631851196289]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 3.0, 6.0, 9.0, 8.0, 7.0, 8.0, 6.0, 6.0, 619.0, 216.0, 12.0, 2.0, 10.0, 3.0, 5.0, 9.0, 7.0, 8.0, 5.0, 3.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.195638656616211e-05, -7.967185229063034e-05, -7.738731801509857e-05, -7.51027837395668e-05, -7.281824946403503e-05, -7.053371518850327e-05, -6.82491809129715e-05, -6.596464663743973e-05, -6.368011236190796e-05, -6.139557808637619e-05, -5.911104381084442e-05, -5.682650953531265e-05, -5.4541975259780884e-05, -5.2257440984249115e-05, -4.9972906708717346e-05, -4.768837243318558e-05, -4.540383815765381e-05, -4.311930388212204e-05, -4.083476960659027e-05, -3.85502353310585e-05, -3.6265701055526733e-05, -3.3981166779994965e-05, -3.1696632504463196e-05, -2.9412098228931427e-05, -2.7127563953399658e-05, -2.484302967786789e-05, -2.255849540233612e-05, -2.0273961126804352e-05, -1.7989426851272583e-05, -1.5704892575740814e-05, -1.3420358300209045e-05, -1.1135824024677277e-05, -8.851289749145508e-06, -6.566755473613739e-06, -4.28222119808197e-06, -1.9976869225502014e-06, 2.868473529815674e-07, 2.571381628513336e-06, 4.855915904045105e-06, 7.140450179576874e-06, 9.424984455108643e-06, 1.1709518730640411e-05, 1.399405300617218e-05, 1.627858728170395e-05, 1.8563121557235718e-05, 2.0847655832767487e-05, 2.3132190108299255e-05, 2.5416724383831024e-05, 2.7701258659362793e-05, 2.9985792934894562e-05, 3.227032721042633e-05, 3.45548614859581e-05, 3.683939576148987e-05, 3.912393003702164e-05, 4.1408464312553406e-05, 4.3692998588085175e-05, 4.597753286361694e-05, 4.826206713914871e-05, 5.054660141468048e-05, 5.283113569021225e-05, 5.511566996574402e-05, 5.740020424127579e-05, 5.9684738516807556e-05, 6.196927279233932e-05, 6.42538070678711e-05]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 10.0, 6.0, 14.0, 9.0, 19.0, 21.0, 24.0, 34.0, 48.0, 68.0, 77.0, 120.0, 121.0, 83.0, 77.0, 74.0, 57.0, 32.0, 21.0, 19.0, 16.0, 14.0, 3.0, 3.0, 5.0, 5.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007306183688342571, -0.0007079864153638482, -0.0006853545201011002, -0.0006627225666306913, -0.0006400906713679433, -0.0006174587178975344, -0.0005948267644271255, -0.0005721948109567165, -0.0005495629156939685, -0.0005269309622235596, -0.0005042990669608116, -0.0004816671134904027, -0.00045903518912382424, -0.0004364032647572458, -0.00041377131128683686, -0.0003911393869202584, -0.00036850746255367994, -0.0003458755381871015, -0.000323243613820523, -0.0003006116603501141, -0.00027797973598353565, -0.0002553478116169572, -0.0002327158726984635, -0.0002100839337799698, -0.00018745200941339135, -0.0001648200850468129, -0.0001421881461283192, -0.00011955621448578313, -9.692428284324706e-05, -7.429235120071098e-05, -5.166041955817491e-05, -2.902848063968122e-05, -6.39655627310276e-06, 1.6235375369433314e-05, 3.886730701196939e-05, 6.149923865450546e-05, 8.413117029704154e-05, 0.00010676310193957761, 0.00012939503358211368, 0.00015202697250060737, 0.00017465889686718583, 0.0001972908212337643, 0.00021992276015225798, 0.00024255469907075167, 0.0002651866234373301, 0.0002878185478039086, 0.0003104505012743175, 0.00033308242564089596, 0.0003557143500074744, 0.0003783462743740529, 0.00040097819874063134, 0.00042361015221104026, 0.0004462420765776187, 0.0004688740009441972, 0.0004915059544146061, 0.000514137907885015, 0.000536769803147763, 0.0005594017566181719, 0.0005820336518809199, 0.0006046656053513288, 0.0006272975588217378, 0.0006499294540844858, 0.0006725614075548947, 0.0006951933028176427, 0.0007178252562880516]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 7.0, 9.0, 3.0, 5.0, 13.0, 16.0, 13.0, 18.0, 21.0, 16.0, 25.0, 27.0, 28.0, 42.0, 39.0, 34.0, 35.0, 34.0, 29.0, 43.0, 31.0, 34.0, 43.0, 53.0, 39.0, 47.0, 26.0, 26.0, 17.0, 29.0, 27.0, 19.0, 16.0, 21.0, 20.0, 13.0, 13.0, 7.0, 12.0, 8.0, 7.0, 9.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00042779522482305765, -0.0004148656444158405, -0.0004019360349047929, -0.00038900645449757576, -0.00037607684498652816, -0.000363147264579311, -0.00035021768417209387, -0.00033728807466104627, -0.00032435846514999866, -0.0003114288847427815, -0.0002984992752317339, -0.0002855696948245168, -0.00027264008531346917, -0.000259710504906252, -0.0002467809244990349, -0.00023385131498798728, -0.00022092173458077013, -0.00020799213962163776, -0.0001950625446625054, -0.00018213296425528824, -0.00016920335474424064, -0.0001562737743370235, -0.00014334417937789112, -0.00013041458441875875, -0.00011748498945962638, -0.000104555394500494, -9.162579954136163e-05, -7.869621185818687e-05, -6.57666168990545e-05, -5.2837021939922124e-05, -3.9907434256747365e-05, -2.697783929761499e-05, -1.4048244338482618e-05, -1.1186511983396485e-06, 1.1810941941803321e-05, 2.4740533262956887e-05, 3.767012822208926e-05, 5.0599723181221634e-05, 6.35293108643964e-05, 7.645890582352877e-05, 8.938850078266114e-05, 0.00010231809574179351, 0.00011524769070092589, 0.00012817728566005826, 0.0001411068660672754, 0.000154036475578323, 0.00016696605598554015, 0.00017989565094467252, 0.0001928252459038049, 0.00020575484086293727, 0.00021868443582206964, 0.0002316140162292868, 0.0002445436257403344, 0.00025747320614755154, 0.00027040281565859914, 0.0002833323960658163, 0.00029626197647303343, 0.0003091915568802506, 0.0003221211663912982, 0.0003350507467985153, 0.0003479803563095629, 0.00036090993671678007, 0.0003738395171239972, 0.0003867691266350448, 0.0003996987361460924]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 10.0, 8.0, 21.0, 21.0, 34.0, 45.0, 84.0, 110.0, 159.0, 234.0, 330.0, 444.0, 725.0, 1052.0, 1632.0, 2402.0, 3579.0, 5567.0, 8864.0, 13684.0, 22462.0, 36918.0, 64420.0, 117720.0, 246308.0, 700900.0, 1658987.0, 751339.0, 263843.0, 125610.0, 67660.0, 38445.0, 22940.0, 13866.0, 8509.0, 5565.0, 3433.0, 2141.0, 1475.0, 962.0, 621.0, 393.0, 269.0, 179.0, 119.0, 68.0, 44.0, 33.0, 22.0, 12.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0005669593811035156, -0.0005495250225067139, -0.0005320906639099121, -0.0005146563053131104, -0.0004972219467163086, -0.00047978758811950684, -0.0004623532295227051, -0.0004449188709259033, -0.00042748451232910156, -0.0004100501537322998, -0.00039261579513549805, -0.0003751814365386963, -0.00035774707794189453, -0.0003403127193450928, -0.000322878360748291, -0.00030544400215148926, -0.0002880096435546875, -0.00027057528495788574, -0.000253140926361084, -0.00023570656776428223, -0.00021827220916748047, -0.0002008378505706787, -0.00018340349197387695, -0.0001659691333770752, -0.00014853477478027344, -0.00013110041618347168, -0.00011366605758666992, -9.623169898986816e-05, -7.87973403930664e-05, -6.136298179626465e-05, -4.392862319946289e-05, -2.6494264602661133e-05, -9.059906005859375e-06, 8.374452590942383e-06, 2.580881118774414e-05, 4.32431697845459e-05, 6.0677528381347656e-05, 7.811188697814941e-05, 9.554624557495117e-05, 0.00011298060417175293, 0.0001304149627685547, 0.00014784932136535645, 0.0001652836799621582, 0.00018271803855895996, 0.00020015239715576172, 0.00021758675575256348, 0.00023502111434936523, 0.000252455472946167, 0.00026988983154296875, 0.0002873241901397705, 0.00030475854873657227, 0.000322192907333374, 0.0003396272659301758, 0.00035706162452697754, 0.0003744959831237793, 0.00039193034172058105, 0.0004093647003173828, 0.00042679905891418457, 0.00044423341751098633, 0.0004616677761077881, 0.00047910213470458984, 0.0004965364933013916, 0.0005139708518981934, 0.0005314052104949951, 0.0005488395690917969]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 5.0, 4.0, 4.0, 7.0, 10.0, 14.0, 14.0, 14.0, 20.0, 17.0, 16.0, 23.0, 32.0, 36.0, 23.0, 38.0, 28.0, 38.0, 42.0, 33.0, 39.0, 43.0, 46.0, 36.0, 48.0, 41.0, 36.0, 38.0, 20.0, 32.0, 24.0, 24.0, 21.0, 22.0, 10.0, 18.0, 14.0, 12.0, 6.0, 13.0, 7.0, 5.0, 2.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0], "bins": [-0.0002617835998535156, -0.00025396794080734253, -0.00024615228176116943, -0.00023833662271499634, -0.00023052096366882324, -0.00022270530462265015, -0.00021488964557647705, -0.00020707398653030396, -0.00019925832748413086, -0.00019144266843795776, -0.00018362700939178467, -0.00017581135034561157, -0.00016799569129943848, -0.00016018003225326538, -0.00015236437320709229, -0.0001445487141609192, -0.0001367330551147461, -0.000128917396068573, -0.0001211017370223999, -0.0001132860779762268, -0.00010547041893005371, -9.765475988388062e-05, -8.983910083770752e-05, -8.202344179153442e-05, -7.420778274536133e-05, -6.639212369918823e-05, -5.857646465301514e-05, -5.076080560684204e-05, -4.2945146560668945e-05, -3.512948751449585e-05, -2.7313828468322754e-05, -1.9498169422149658e-05, -1.1682510375976562e-05, -3.866851329803467e-06, 3.948807716369629e-06, 1.1764466762542725e-05, 1.958012580871582e-05, 2.7395784854888916e-05, 3.521144390106201e-05, 4.302710294723511e-05, 5.08427619934082e-05, 5.86584210395813e-05, 6.64740800857544e-05, 7.428973913192749e-05, 8.210539817810059e-05, 8.992105722427368e-05, 9.773671627044678e-05, 0.00010555237531661987, 0.00011336803436279297, 0.00012118369340896606, 0.00012899935245513916, 0.00013681501150131226, 0.00014463067054748535, 0.00015244632959365845, 0.00016026198863983154, 0.00016807764768600464, 0.00017589330673217773, 0.00018370896577835083, 0.00019152462482452393, 0.00019934028387069702, 0.00020715594291687012, 0.0002149716019630432, 0.0002227872610092163, 0.0002306029200553894, 0.0002384185791015625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 8.0, 12.0, 18.0, 30.0, 50.0, 61.0, 92.0, 165.0, 233.0, 311.0, 521.0, 830.0, 1213.0, 2002.0, 3312.0, 5268.0, 8580.0, 14591.0, 24372.0, 41830.0, 75303.0, 141019.0, 287353.0, 680622.0, 1456191.0, 780824.0, 320811.0, 155169.0, 82134.0, 45546.0, 25901.0, 15682.0, 9249.0, 5602.0, 3445.0, 2115.0, 1400.0, 809.0, 560.0, 369.0, 233.0, 142.0, 103.0, 66.0, 43.0, 30.0, 21.0, 11.0, 13.0, 10.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004813671112060547, -0.0004661194980144501, -0.00045087188482284546, -0.00043562427163124084, -0.00042037665843963623, -0.0004051290452480316, -0.000389881432056427, -0.0003746338188648224, -0.0003593862056732178, -0.00034413859248161316, -0.00032889097929000854, -0.00031364336609840393, -0.0002983957529067993, -0.0002831481397151947, -0.0002679005265235901, -0.0002526529133319855, -0.00023740530014038086, -0.00022215768694877625, -0.00020691007375717163, -0.00019166246056556702, -0.0001764148473739624, -0.0001611672341823578, -0.00014591962099075317, -0.00013067200779914856, -0.00011542439460754395, -0.00010017678141593933, -8.492916822433472e-05, -6.96815550327301e-05, -5.443394184112549e-05, -3.9186328649520874e-05, -2.393871545791626e-05, -8.691102266311646e-06, 6.556510925292969e-06, 2.1804124116897583e-05, 3.70517373085022e-05, 5.229935050010681e-05, 6.754696369171143e-05, 8.279457688331604e-05, 9.804219007492065e-05, 0.00011328980326652527, 0.00012853741645812988, 0.0001437850296497345, 0.0001590326428413391, 0.00017428025603294373, 0.00018952786922454834, 0.00020477548241615295, 0.00022002309560775757, 0.00023527070879936218, 0.0002505183219909668, 0.0002657659351825714, 0.000281013548374176, 0.00029626116156578064, 0.00031150877475738525, 0.00032675638794898987, 0.0003420040011405945, 0.0003572516143321991, 0.0003724992275238037, 0.0003877468407154083, 0.00040299445390701294, 0.00041824206709861755, 0.00043348968029022217, 0.0004487372934818268, 0.0004639849066734314, 0.000479232519865036, 0.0004944801330566406]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 15.0, 11.0, 16.0, 31.0, 28.0, 36.0, 59.0, 71.0, 88.0, 96.0, 111.0, 120.0, 176.0, 188.0, 224.0, 261.0, 281.0, 282.0, 293.0, 270.0, 231.0, 218.0, 181.0, 153.0, 126.0, 118.0, 74.0, 56.0, 58.0, 41.0, 38.0, 30.0, 25.0, 12.0, 11.0, 8.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00015616416931152344, -0.00015125423669815063, -0.00014634430408477783, -0.00014143437147140503, -0.00013652443885803223, -0.00013161450624465942, -0.00012670457363128662, -0.00012179464101791382, -0.00011688470840454102, -0.00011197477579116821, -0.00010706484317779541, -0.00010215491056442261, -9.72449779510498e-05, -9.2335045337677e-05, -8.74251127243042e-05, -8.25151801109314e-05, -7.76052474975586e-05, -7.269531488418579e-05, -6.778538227081299e-05, -6.287544965744019e-05, -5.796551704406738e-05, -5.305558443069458e-05, -4.814565181732178e-05, -4.3235719203948975e-05, -3.832578659057617e-05, -3.341585397720337e-05, -2.8505921363830566e-05, -2.3595988750457764e-05, -1.868605613708496e-05, -1.3776123523712158e-05, -8.866190910339355e-06, -3.956258296966553e-06, 9.5367431640625e-07, 5.863606929779053e-06, 1.0773539543151855e-05, 1.5683472156524658e-05, 2.059340476989746e-05, 2.5503337383270264e-05, 3.0413269996643066e-05, 3.532320261001587e-05, 4.023313522338867e-05, 4.5143067836761475e-05, 5.005300045013428e-05, 5.496293306350708e-05, 5.987286567687988e-05, 6.478279829025269e-05, 6.969273090362549e-05, 7.460266351699829e-05, 7.95125961303711e-05, 8.44225287437439e-05, 8.93324613571167e-05, 9.42423939704895e-05, 9.91523265838623e-05, 0.00010406225919723511, 0.00010897219181060791, 0.00011388212442398071, 0.00011879205703735352, 0.00012370198965072632, 0.00012861192226409912, 0.00013352185487747192, 0.00013843178749084473, 0.00014334172010421753, 0.00014825165271759033, 0.00015316158533096313, 0.00015807151794433594]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 7.0, 7.0, 12.0, 11.0, 19.0, 17.0, 26.0, 22.0, 32.0, 45.0, 63.0, 73.0, 71.0, 85.0, 86.0, 78.0, 66.0, 56.0, 43.0, 43.0, 26.0, 24.0, 24.0, 10.0, 10.0, 7.0, 5.0, 7.0, 3.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00044371484545990825, -0.00043095386354252696, -0.0004181928525213152, -0.00040543187060393393, -0.0003926708595827222, -0.0003799098776653409, -0.0003671488957479596, -0.00035438788472674787, -0.0003416269028093666, -0.0003288659208919853, -0.00031610490987077355, -0.00030334392795339227, -0.0002905829169321805, -0.00027782193501479924, -0.0002650609239935875, -0.0002522999420762062, -0.0002395389456069097, -0.00022677794913761318, -0.00021401695266831666, -0.00020125595619902015, -0.00018849497428163886, -0.00017573397781234235, -0.00016297298134304583, -0.00015021199942566454, -0.0001374509884044528, -0.00012468999193515629, -0.00011192900274181738, -9.916800627252087e-05, -8.640701707918197e-05, -7.364602060988545e-05, -6.088502414058894e-05, -4.812403494725004e-05, -3.536304575391114e-05, -2.260205292259343e-05, -9.841058272286318e-06, 2.919936378020793e-06, 1.56809292093385e-05, 2.844192204065621e-05, 4.1202918509952724e-05, 5.3963907703291625e-05, 6.672490417258814e-05, 7.948590064188465e-05, 9.224688983522356e-05, 0.00010500788630452007, 0.00011776888277381659, 0.00013052986469119787, 0.00014329087571240962, 0.0001560518576297909, 0.00016881285409908742, 0.00018157385056838393, 0.00019433484703768045, 0.00020709584350697696, 0.00021985682542435825, 0.00023261782189365476, 0.0002453788183629513, 0.00025813980028033257, 0.0002709008113015443, 0.0002836617932189256, 0.00029642280424013734, 0.0003091837861575186, 0.00032194479717873037, 0.00033470577909611166, 0.0003474667901173234, 0.0003602277720347047, 0.00037298875395208597]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 2.0, 5.0, 2.0, 6.0, 6.0, 8.0, 13.0, 17.0, 11.0, 14.0, 14.0, 24.0, 23.0, 23.0, 28.0, 33.0, 29.0, 32.0, 35.0, 36.0, 34.0, 45.0, 32.0, 29.0, 30.0, 34.0, 38.0, 46.0, 41.0, 35.0, 26.0, 30.0, 17.0, 29.0, 23.0, 24.0, 12.0, 21.0, 15.0, 14.0, 7.0, 8.0, 11.0, 10.0, 10.0, 5.0, 7.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0002826947020366788, -0.00027439312543720007, -0.00026609154883772135, -0.0002577899722382426, -0.0002494883956387639, -0.00024118681903928518, -0.0002328852569917217, -0.00022458368039224297, -0.00021628210379276425, -0.00020798052719328552, -0.0001996789505938068, -0.00019137737399432808, -0.0001830758119467646, -0.00017477423534728587, -0.00016647265874780715, -0.00015817108214832842, -0.0001498695055488497, -0.00014156792894937098, -0.00013326635234989226, -0.00012496477575041354, -0.00011666320642689243, -0.00010836162982741371, -0.0001000600605038926, -9.175848390441388e-05, -8.345690730493516e-05, -7.515533070545644e-05, -6.685375410597771e-05, -5.855218478245661e-05, -5.0250608182977885e-05, -4.1949031583499163e-05, -3.364745862199925e-05, -2.5345885660499334e-05, -1.704433816485107e-05, -8.742763384361751e-06, -4.411886038724333e-07, 7.860386176616885e-06, 1.6161960957106203e-05, 2.4463537556584924e-05, 3.276511051808484e-05, 4.1066683479584754e-05, 4.9368260079063475e-05, 5.76698366785422e-05, 6.597141327802092e-05, 7.427298260154203e-05, 8.257455920102075e-05, 9.087613580049947e-05, 9.917770512402058e-05, 0.0001074792817234993, 0.00011578085832297802, 0.00012408243492245674, 0.00013238401152193546, 0.00014068558812141418, 0.0001489871647208929, 0.00015728874132037163, 0.00016559030336793512, 0.00017389187996741384, 0.00018219345656689256, 0.00019049503316637129, 0.00019879660976585, 0.00020709818636532873, 0.00021539974841289222, 0.00022370132501237094, 0.00023200290161184967, 0.0002403044782113284, 0.0002486060548108071]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 2.0, 7.0, 18.0, 22.0, 38.0, 55.0, 69.0, 103.0, 174.0, 261.0, 446.0, 642.0, 1055.0, 1833.0, 3052.0, 5113.0, 8677.0, 15314.0, 26756.0, 48405.0, 88402.0, 158182.0, 243155.0, 194833.0, 111306.0, 61004.0, 33977.0, 18934.0, 10913.0, 6252.0, 3829.0, 2210.0, 1338.0, 754.0, 510.0, 331.0, 198.0, 136.0, 88.0, 47.0, 40.0, 21.0, 18.0, 11.0, 10.0, 10.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0005984306335449219, -0.0005811825394630432, -0.0005639344453811646, -0.0005466863512992859, -0.0005294382572174072, -0.0005121901631355286, -0.0004949420690536499, -0.00047769397497177124, -0.0004604458808898926, -0.0004431977868080139, -0.00042594969272613525, -0.0004087015986442566, -0.00039145350456237793, -0.00037420541048049927, -0.0003569573163986206, -0.00033970922231674194, -0.0003224611282348633, -0.0003052130341529846, -0.00028796494007110596, -0.0002707168459892273, -0.00025346875190734863, -0.00023622065782546997, -0.0002189725637435913, -0.00020172446966171265, -0.00018447637557983398, -0.00016722828149795532, -0.00014998018741607666, -0.000132732093334198, -0.00011548399925231934, -9.823590517044067e-05, -8.098781108856201e-05, -6.373971700668335e-05, -4.649162292480469e-05, -2.9243528842926025e-05, -1.1995434761047363e-05, 5.252659320831299e-06, 2.250075340270996e-05, 3.974884748458862e-05, 5.6996941566467285e-05, 7.424503564834595e-05, 9.149312973022461e-05, 0.00010874122381210327, 0.00012598931789398193, 0.0001432374119758606, 0.00016048550605773926, 0.00017773360013961792, 0.00019498169422149658, 0.00021222978830337524, 0.0002294778823852539, 0.00024672597646713257, 0.00026397407054901123, 0.0002812221646308899, 0.00029847025871276855, 0.0003157183527946472, 0.0003329664468765259, 0.00035021454095840454, 0.0003674626350402832, 0.00038471072912216187, 0.00040195882320404053, 0.0004192069172859192, 0.00043645501136779785, 0.0004537031054496765, 0.0004709511995315552, 0.00048819929361343384, 0.0005054473876953125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 9.0, 5.0, 14.0, 10.0, 6.0, 7.0, 19.0, 11.0, 25.0, 23.0, 32.0, 21.0, 27.0, 39.0, 33.0, 26.0, 34.0, 44.0, 34.0, 38.0, 25.0, 30.0, 44.0, 33.0, 44.0, 43.0, 30.0, 38.0, 24.0, 30.0, 22.0, 23.0, 21.0, 23.0, 13.0, 24.0, 10.0, 12.0, 8.0, 9.0, 9.0, 4.0, 8.0, 3.0, 3.0, 1.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.00023627281188964844, -0.0002291649580001831, -0.00022205710411071777, -0.00021494925022125244, -0.0002078413963317871, -0.00020073354244232178, -0.00019362568855285645, -0.0001865178346633911, -0.00017940998077392578, -0.00017230212688446045, -0.00016519427299499512, -0.00015808641910552979, -0.00015097856521606445, -0.00014387071132659912, -0.0001367628574371338, -0.00012965500354766846, -0.00012254714965820312, -0.00011543929576873779, -0.00010833144187927246, -0.00010122358798980713, -9.41157341003418e-05, -8.700788021087646e-05, -7.990002632141113e-05, -7.27921724319458e-05, -6.568431854248047e-05, -5.857646465301514e-05, -5.1468610763549805e-05, -4.436075687408447e-05, -3.725290298461914e-05, -3.014504909515381e-05, -2.3037195205688477e-05, -1.5929341316223145e-05, -8.821487426757812e-06, -1.7136335372924805e-06, 5.3942203521728516e-06, 1.2502074241638184e-05, 1.9609928131103516e-05, 2.6717782020568848e-05, 3.382563591003418e-05, 4.093348979949951e-05, 4.8041343688964844e-05, 5.5149197578430176e-05, 6.225705146789551e-05, 6.936490535736084e-05, 7.647275924682617e-05, 8.35806131362915e-05, 9.068846702575684e-05, 9.779632091522217e-05, 0.0001049041748046875, 0.00011201202869415283, 0.00011911988258361816, 0.0001262277364730835, 0.00013333559036254883, 0.00014044344425201416, 0.0001475512981414795, 0.00015465915203094482, 0.00016176700592041016, 0.0001688748598098755, 0.00017598271369934082, 0.00018309056758880615, 0.00019019842147827148, 0.00019730627536773682, 0.00020441412925720215, 0.00021152198314666748, 0.0002186298370361328]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 13.0, 10.0, 17.0, 19.0, 37.0, 67.0, 89.0, 167.0, 240.0, 399.0, 691.0, 1223.0, 1983.0, 3554.0, 6710.0, 13745.0, 31972.0, 112327.0, 599752.0, 196001.0, 43726.0, 17402.0, 8220.0, 4379.0, 2334.0, 1370.0, 846.0, 470.0, 294.0, 177.0, 102.0, 74.0, 51.0, 26.0, 14.0, 17.0, 13.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010204315185546875, -0.0009901076555252075, -0.0009597837924957275, -0.0009294599294662476, -0.0008991360664367676, -0.0008688122034072876, -0.0008384883403778076, -0.0008081644773483276, -0.0007778406143188477, -0.0007475167512893677, -0.0007171928882598877, -0.0006868690252304077, -0.0006565451622009277, -0.0006262212991714478, -0.0005958974361419678, -0.0005655735731124878, -0.0005352497100830078, -0.0005049258470535278, -0.00047460198402404785, -0.00044427812099456787, -0.0004139542579650879, -0.0003836303949356079, -0.00035330653190612793, -0.00032298266887664795, -0.00029265880584716797, -0.000262334942817688, -0.000232011079788208, -0.00020168721675872803, -0.00017136335372924805, -0.00014103949069976807, -0.00011071562767028809, -8.03917646408081e-05, -5.0067901611328125e-05, -1.9744038581848145e-05, 1.0579824447631836e-05, 4.0903687477111816e-05, 7.12275505065918e-05, 0.00010155141353607178, 0.00013187527656555176, 0.00016219913959503174, 0.00019252300262451172, 0.0002228468656539917, 0.0002531707286834717, 0.00028349459171295166, 0.00031381845474243164, 0.0003441423177719116, 0.0003744661808013916, 0.0004047900438308716, 0.00043511390686035156, 0.00046543776988983154, 0.0004957616329193115, 0.0005260854959487915, 0.0005564093589782715, 0.0005867332220077515, 0.0006170570850372314, 0.0006473809480667114, 0.0006777048110961914, 0.0007080286741256714, 0.0007383525371551514, 0.0007686764001846313, 0.0007990002632141113, 0.0008293241262435913, 0.0008596479892730713, 0.0008899718523025513, 0.0009202957153320312]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 4.0, 7.0, 5.0, 11.0, 13.0, 9.0, 12.0, 12.0, 23.0, 16.0, 21.0, 23.0, 25.0, 33.0, 42.0, 21.0, 32.0, 41.0, 39.0, 30.0, 33.0, 29.0, 29.0, 39.0, 44.0, 43.0, 38.0, 43.0, 33.0, 27.0, 22.0, 19.0, 24.0, 25.0, 23.0, 21.0, 7.0, 18.0, 14.0, 7.0, 9.0, 10.0, 6.0, 5.0, 5.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.00014972686767578125, -0.00014508888125419617, -0.00014045089483261108, -0.000135812908411026, -0.00013117492198944092, -0.00012653693556785583, -0.00012189894914627075, -0.00011726096272468567, -0.00011262297630310059, -0.0001079849898815155, -0.00010334700345993042, -9.870901703834534e-05, -9.407103061676025e-05, -8.943304419517517e-05, -8.479505777359009e-05, -8.0157071352005e-05, -7.551908493041992e-05, -7.088109850883484e-05, -6.624311208724976e-05, -6.160512566566467e-05, -5.696713924407959e-05, -5.232915282249451e-05, -4.7691166400909424e-05, -4.305317997932434e-05, -3.841519355773926e-05, -3.3777207136154175e-05, -2.9139220714569092e-05, -2.450123429298401e-05, -1.9863247871398926e-05, -1.5225261449813843e-05, -1.058727502822876e-05, -5.949288606643677e-06, -1.3113021850585938e-06, 3.3266842365264893e-06, 7.964670658111572e-06, 1.2602657079696655e-05, 1.7240643501281738e-05, 2.187862992286682e-05, 2.6516616344451904e-05, 3.115460276603699e-05, 3.579258918762207e-05, 4.043057560920715e-05, 4.5068562030792236e-05, 4.970654845237732e-05, 5.43445348739624e-05, 5.8982521295547485e-05, 6.362050771713257e-05, 6.825849413871765e-05, 7.289648056030273e-05, 7.753446698188782e-05, 8.21724534034729e-05, 8.681043982505798e-05, 9.144842624664307e-05, 9.608641266822815e-05, 0.00010072439908981323, 0.00010536238551139832, 0.0001100003719329834, 0.00011463835835456848, 0.00011927634477615356, 0.00012391433119773865, 0.00012855231761932373, 0.0001331903040409088, 0.0001378282904624939, 0.00014246627688407898, 0.00014710426330566406]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 9.0, 13.0, 21.0, 25.0, 43.0, 54.0, 78.0, 111.0, 175.0, 254.0, 395.0, 610.0, 979.0, 1573.0, 2933.0, 5861.0, 13402.0, 45023.0, 446596.0, 458027.0, 45825.0, 13544.0, 5697.0, 2886.0, 1610.0, 953.0, 612.0, 408.0, 251.0, 183.0, 108.0, 79.0, 66.0, 38.0, 29.0, 14.0, 17.0, 15.0, 3.0, 5.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0003705024719238281, -0.000359605997800827, -0.00034870952367782593, -0.00033781304955482483, -0.00032691657543182373, -0.00031602010130882263, -0.00030512362718582153, -0.00029422715306282043, -0.00028333067893981934, -0.00027243420481681824, -0.00026153773069381714, -0.00025064125657081604, -0.00023974478244781494, -0.00022884830832481384, -0.00021795183420181274, -0.00020705536007881165, -0.00019615888595581055, -0.00018526241183280945, -0.00017436593770980835, -0.00016346946358680725, -0.00015257298946380615, -0.00014167651534080505, -0.00013078004121780396, -0.00011988356709480286, -0.00010898709297180176, -9.809061884880066e-05, -8.719414472579956e-05, -7.629767060279846e-05, -6.540119647979736e-05, -5.4504722356796265e-05, -4.3608248233795166e-05, -3.271177411079407e-05, -2.181529998779297e-05, -1.091882586479187e-05, -2.2351741790771484e-08, 1.0874122381210327e-05, 2.1770596504211426e-05, 3.2667070627212524e-05, 4.356354475021362e-05, 5.446001887321472e-05, 6.535649299621582e-05, 7.625296711921692e-05, 8.714944124221802e-05, 9.804591536521912e-05, 0.00010894238948822021, 0.00011983886361122131, 0.0001307353377342224, 0.0001416318118572235, 0.0001525282859802246, 0.0001634247601032257, 0.0001743212342262268, 0.0001852177083492279, 0.000196114182472229, 0.0002070106565952301, 0.0002179071307182312, 0.0002288036048412323, 0.0002397000789642334, 0.0002505965530872345, 0.0002614930272102356, 0.0002723895013332367, 0.0002832859754562378, 0.0002941824495792389, 0.00030507892370224, 0.0003159753978252411, 0.0003268718719482422]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 4.0, 5.0, 8.0, 7.0, 8.0, 15.0, 19.0, 10.0, 31.0, 31.0, 75.0, 97.0, 151.0, 171.0, 114.0, 78.0, 45.0, 42.0, 18.0, 20.0, 10.0, 6.0, 5.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2576580047607422e-05, -1.2184493243694305e-05, -1.1792406439781189e-05, -1.1400319635868073e-05, -1.1008232831954956e-05, -1.061614602804184e-05, -1.0224059224128723e-05, -9.831972420215607e-06, -9.43988561630249e-06, -9.047798812389374e-06, -8.655712008476257e-06, -8.263625204563141e-06, -7.871538400650024e-06, -7.479451596736908e-06, -7.0873647928237915e-06, -6.695277988910675e-06, -6.303191184997559e-06, -5.911104381084442e-06, -5.519017577171326e-06, -5.126930773258209e-06, -4.734843969345093e-06, -4.342757165431976e-06, -3.95067036151886e-06, -3.5585835576057434e-06, -3.166496753692627e-06, -2.7744099497795105e-06, -2.382323145866394e-06, -1.9902363419532776e-06, -1.5981495380401611e-06, -1.2060627341270447e-06, -8.139759302139282e-07, -4.2188912630081177e-07, -2.9802322387695312e-08, 3.6228448152542114e-07, 7.543712854385376e-07, 1.146458089351654e-06, 1.5385448932647705e-06, 1.930631697177887e-06, 2.3227185010910034e-06, 2.71480530500412e-06, 3.1068921089172363e-06, 3.4989789128303528e-06, 3.891065716743469e-06, 4.283152520656586e-06, 4.675239324569702e-06, 5.067326128482819e-06, 5.459412932395935e-06, 5.8514997363090515e-06, 6.243586540222168e-06, 6.6356733441352844e-06, 7.027760148048401e-06, 7.419846951961517e-06, 7.811933755874634e-06, 8.20402055978775e-06, 8.596107363700867e-06, 8.988194167613983e-06, 9.3802809715271e-06, 9.772367775440216e-06, 1.0164454579353333e-05, 1.0556541383266449e-05, 1.0948628187179565e-05, 1.1340714991092682e-05, 1.1732801795005798e-05, 1.2124888598918915e-05, 1.2516975402832031e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 1.0, 6.0, 11.0, 14.0, 27.0, 28.0, 46.0, 56.0, 53.0, 90.0, 126.0, 177.0, 215.0, 286.0, 412.0, 530.0, 722.0, 1056.0, 1496.0, 2271.0, 3679.0, 5569.0, 9147.0, 15994.0, 29832.0, 67478.0, 186225.0, 428301.0, 165566.0, 61444.0, 27900.0, 14828.0, 8835.0, 5315.0, 3406.0, 2259.0, 1493.0, 972.0, 676.0, 569.0, 352.0, 276.0, 203.0, 182.0, 119.0, 80.0, 63.0, 48.0, 44.0, 26.0, 17.0, 12.0, 8.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.00010633468627929688, -0.00010284222662448883, -9.934976696968079e-05, -9.585730731487274e-05, -9.23648476600647e-05, -8.887238800525665e-05, -8.537992835044861e-05, -8.188746869564056e-05, -7.839500904083252e-05, -7.490254938602448e-05, -7.141008973121643e-05, -6.791763007640839e-05, -6.442517042160034e-05, -6.09327107667923e-05, -5.744025111198425e-05, -5.394779145717621e-05, -5.0455331802368164e-05, -4.696287214756012e-05, -4.3470412492752075e-05, -3.997795283794403e-05, -3.6485493183135986e-05, -3.299303352832794e-05, -2.9500573873519897e-05, -2.6008114218711853e-05, -2.251565456390381e-05, -1.9023194909095764e-05, -1.553073525428772e-05, -1.2038275599479675e-05, -8.545815944671631e-06, -5.0533562898635864e-06, -1.560896635055542e-06, 1.9315630197525024e-06, 5.424022674560547e-06, 8.916482329368591e-06, 1.2408941984176636e-05, 1.590140163898468e-05, 1.9393861293792725e-05, 2.288632094860077e-05, 2.6378780603408813e-05, 2.9871240258216858e-05, 3.33636999130249e-05, 3.685615956783295e-05, 4.034861922264099e-05, 4.3841078877449036e-05, 4.733353853225708e-05, 5.0825998187065125e-05, 5.431845784187317e-05, 5.781091749668121e-05, 6.130337715148926e-05, 6.47958368062973e-05, 6.828829646110535e-05, 7.178075611591339e-05, 7.527321577072144e-05, 7.876567542552948e-05, 8.225813508033752e-05, 8.575059473514557e-05, 8.924305438995361e-05, 9.273551404476166e-05, 9.62279736995697e-05, 9.972043335437775e-05, 0.00010321289300918579, 0.00010670535266399384, 0.00011019781231880188, 0.00011369027197360992, 0.00011718273162841797]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 4.0, 6.0, 14.0, 10.0, 14.0, 13.0, 23.0, 25.0, 27.0, 43.0, 51.0, 63.0, 80.0, 71.0, 89.0, 95.0, 70.0, 68.0, 54.0, 42.0, 29.0, 26.0, 21.0, 14.0, 13.0, 6.0, 10.0, 6.0, 6.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5033950805664062e-05, -2.4049542844295502e-05, -2.306513488292694e-05, -2.208072692155838e-05, -2.109631896018982e-05, -2.011191099882126e-05, -1.9127503037452698e-05, -1.8143095076084137e-05, -1.7158687114715576e-05, -1.6174279153347015e-05, -1.5189871191978455e-05, -1.4205463230609894e-05, -1.3221055269241333e-05, -1.2236647307872772e-05, -1.1252239346504211e-05, -1.026783138513565e-05, -9.28342342376709e-06, -8.299015462398529e-06, -7.314607501029968e-06, -6.3301995396614075e-06, -5.345791578292847e-06, -4.361383616924286e-06, -3.376975655555725e-06, -2.3925676941871643e-06, -1.4081597328186035e-06, -4.237517714500427e-07, 5.606561899185181e-07, 1.5450641512870789e-06, 2.5294721126556396e-06, 3.5138800740242004e-06, 4.498288035392761e-06, 5.482695996761322e-06, 6.467103958129883e-06, 7.451511919498444e-06, 8.435919880867004e-06, 9.420327842235565e-06, 1.0404735803604126e-05, 1.1389143764972687e-05, 1.2373551726341248e-05, 1.3357959687709808e-05, 1.4342367649078369e-05, 1.532677561044693e-05, 1.631118357181549e-05, 1.729559153318405e-05, 1.8279999494552612e-05, 1.9264407455921173e-05, 2.0248815417289734e-05, 2.1233223378658295e-05, 2.2217631340026855e-05, 2.3202039301395416e-05, 2.4186447262763977e-05, 2.5170855224132538e-05, 2.61552631855011e-05, 2.713967114686966e-05, 2.812407910823822e-05, 2.910848706960678e-05, 3.0092895030975342e-05, 3.10773029923439e-05, 3.206171095371246e-05, 3.3046118915081024e-05, 3.4030526876449585e-05, 3.5014934837818146e-05, 3.5999342799186707e-05, 3.698375076055527e-05, 3.796815872192383e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 9.0, 7.0, 12.0, 12.0, 17.0, 16.0, 25.0, 35.0, 33.0, 40.0, 59.0, 70.0, 68.0, 91.0, 75.0, 89.0, 72.0, 45.0, 41.0, 24.0, 35.0, 26.0, 22.0, 17.0, 9.0, 7.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0003416316758375615, -0.00033181466278620064, -0.00032199762063100934, -0.0003121806075796485, -0.00030236359452828765, -0.0002925465814769268, -0.00028272956842556596, -0.00027291252627037466, -0.0002630955132190138, -0.00025327850016765296, -0.0002434614725643769, -0.00023364444496110082, -0.00022382743190973997, -0.00021401041885837913, -0.00020419339125510305, -0.00019437636365182698, -0.00018455935060046613, -0.0001747423375491053, -0.0001649253099458292, -0.00015510828234255314, -0.0001452912692911923, -0.00013547425623983145, -0.00012565722863655537, -0.00011584020830923691, -0.00010602318798191845, -9.62061676546e-05, -8.638914732728153e-05, -7.657212699996307e-05, -6.675510667264462e-05, -5.6938086345326155e-05, -4.7121066018007696e-05, -3.7304045690689236e-05, -2.748699625954032e-05, -1.766997593222186e-05, -7.8529556049034e-06, 1.96406472241506e-06, 1.178108504973352e-05, 2.159810537705198e-05, 3.141512570437044e-05, 4.12321460316889e-05, 5.104916635900736e-05, 6.086618668632582e-05, 7.068320701364428e-05, 8.050022734096274e-05, 9.03172476682812e-05, 0.00010013426799559966, 0.00010995128832291812, 0.00011976830865023658, 0.00012958532897755504, 0.00013940234202891588, 0.00014921936963219196, 0.00015903639723546803, 0.00016885341028682888, 0.00017867042333818972, 0.0001884874509414658, 0.00019830447854474187, 0.00020812149159610271, 0.00021793850464746356, 0.00022775553225073963, 0.0002375725598540157, 0.00024738957290537655, 0.0002572065859567374, 0.0002670236281119287, 0.00027684064116328955, 0.0002866576542146504]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 2.0, 8.0, 6.0, 9.0, 14.0, 9.0, 17.0, 15.0, 19.0, 19.0, 17.0, 26.0, 34.0, 34.0, 30.0, 31.0, 30.0, 42.0, 37.0, 35.0, 37.0, 35.0, 31.0, 31.0, 41.0, 45.0, 46.0, 25.0, 26.0, 26.0, 29.0, 26.0, 17.0, 22.0, 20.0, 20.0, 11.0, 11.0, 10.0, 11.0, 10.0, 10.0, 6.0, 3.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00023243452596943825, -0.00022555378382094204, -0.00021867304167244583, -0.00021179229952394962, -0.0002049115573754534, -0.0001980308152269572, -0.00019115005852654576, -0.00018426933092996478, -0.00017738857422955334, -0.00017050783208105713, -0.00016362708993256092, -0.0001567463477840647, -0.0001498656056355685, -0.0001429848634870723, -0.00013610412133857608, -0.00012922336463816464, -0.00012234263704158366, -0.00011546189489308745, -0.00010858115274459124, -0.00010170041059609503, -9.481966844759881e-05, -8.79389262991026e-05, -8.105817687464878e-05, -7.417743472615257e-05, -6.729669257765636e-05, -6.041595042916015e-05, -5.353520828066394e-05, -4.665446249418892e-05, -3.977372034569271e-05, -3.28929781971965e-05, -2.601223241072148e-05, -1.913149026222527e-05, -1.2250733561813831e-05, -5.369990503822919e-06, 1.5107525541679934e-06, 8.391496521653607e-06, 1.5272238670149818e-05, 2.215298081864603e-05, 2.9033726605121046e-05, 3.591446875361726e-05, 4.279521090211347e-05, 4.967595305060968e-05, 5.655669519910589e-05, 6.343744462355971e-05, 7.031818677205592e-05, 7.719892892055213e-05, 8.407967106904835e-05, 9.096041321754456e-05, 9.784115536604077e-05, 0.00010472189751453698, 0.00011160263966303319, 0.0001184833818115294, 0.0001253641239600256, 0.00013224486610852182, 0.00013912562280893326, 0.00014600635040551424, 0.00015288710710592568, 0.0001597678492544219, 0.0001666485914029181, 0.0001735293335514143, 0.00018041007569991052, 0.00018729081784840673, 0.00019417155999690294, 0.00020105231669731438, 0.00020793304429389536]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 5.0, 12.0, 17.0, 35.0, 33.0, 48.0, 62.0, 114.0, 138.0, 180.0, 258.0, 355.0, 546.0, 696.0, 1001.0, 1444.0, 1909.0, 2715.0, 3708.0, 5258.0, 7138.0, 10367.0, 14543.0, 21198.0, 30364.0, 45420.0, 67450.0, 101662.0, 146587.0, 169525.0, 133569.0, 90139.0, 60009.0, 40202.0, 27135.0, 18989.0, 13234.0, 9264.0, 6484.0, 4773.0, 3336.0, 2426.0, 1673.0, 1329.0, 933.0, 663.0, 512.0, 316.0, 220.0, 166.0, 112.0, 89.0, 67.0, 51.0, 35.0, 20.0, 11.0, 13.0, 4.0, 4.0, 2.0], "bins": [-0.0003173351287841797, -0.00030752643942832947, -0.00029771775007247925, -0.00028790906071662903, -0.0002781003713607788, -0.0002682916820049286, -0.00025848299264907837, -0.00024867430329322815, -0.00023886561393737793, -0.0002290569245815277, -0.0002192482352256775, -0.00020943954586982727, -0.00019963085651397705, -0.00018982216715812683, -0.0001800134778022766, -0.0001702047884464264, -0.00016039609909057617, -0.00015058740973472595, -0.00014077872037887573, -0.0001309700310230255, -0.00012116134166717529, -0.00011135265231132507, -0.00010154396295547485, -9.173527359962463e-05, -8.192658424377441e-05, -7.21178948879242e-05, -6.230920553207397e-05, -5.2500516176223755e-05, -4.2691826820373535e-05, -3.2883137464523315e-05, -2.3074448108673096e-05, -1.3265758752822876e-05, -3.4570693969726562e-06, 6.3516199588775635e-06, 1.6160309314727783e-05, 2.5968998670578003e-05, 3.577768802642822e-05, 4.558637738227844e-05, 5.539506673812866e-05, 6.520375609397888e-05, 7.50124454498291e-05, 8.482113480567932e-05, 9.462982416152954e-05, 0.00010443851351737976, 0.00011424720287322998, 0.0001240558922290802, 0.00013386458158493042, 0.00014367327094078064, 0.00015348196029663086, 0.00016329064965248108, 0.0001730993390083313, 0.00018290802836418152, 0.00019271671772003174, 0.00020252540707588196, 0.00021233409643173218, 0.0002221427857875824, 0.00023195147514343262, 0.00024176016449928284, 0.00025156885385513306, 0.0002613775432109833, 0.0002711862325668335, 0.0002809949219226837, 0.00029080361127853394, 0.00030061230063438416, 0.0003104209899902344]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 3.0, 12.0, 5.0, 14.0, 11.0, 14.0, 14.0, 12.0, 22.0, 30.0, 26.0, 27.0, 45.0, 29.0, 32.0, 44.0, 39.0, 38.0, 46.0, 36.0, 44.0, 31.0, 54.0, 36.0, 34.0, 45.0, 29.0, 25.0, 35.0, 23.0, 23.0, 22.0, 18.0, 10.0, 11.0, 6.0, 17.0, 10.0, 8.0, 6.0, 5.0, 8.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020694732666015625, -0.0002005062997341156, -0.00019406527280807495, -0.0001876242458820343, -0.00018118321895599365, -0.000174742192029953, -0.00016830116510391235, -0.0001618601381778717, -0.00015541911125183105, -0.0001489780843257904, -0.00014253705739974976, -0.0001360960304737091, -0.00012965500354766846, -0.0001232139766216278, -0.00011677294969558716, -0.00011033192276954651, -0.00010389089584350586, -9.744986891746521e-05, -9.100884199142456e-05, -8.456781506538391e-05, -7.812678813934326e-05, -7.168576121330261e-05, -6.524473428726196e-05, -5.8803707361221313e-05, -5.2362680435180664e-05, -4.5921653509140015e-05, -3.9480626583099365e-05, -3.3039599657058716e-05, -2.6598572731018066e-05, -2.0157545804977417e-05, -1.3716518878936768e-05, -7.275491952896118e-06, -8.344650268554688e-07, 5.606561899185181e-06, 1.204758882522583e-05, 1.848861575126648e-05, 2.492964267730713e-05, 3.137066960334778e-05, 3.781169652938843e-05, 4.425272345542908e-05, 5.0693750381469727e-05, 5.7134777307510376e-05, 6.357580423355103e-05, 7.001683115959167e-05, 7.645785808563232e-05, 8.289888501167297e-05, 8.933991193771362e-05, 9.578093886375427e-05, 0.00010222196578979492, 0.00010866299271583557, 0.00011510401964187622, 0.00012154504656791687, 0.00012798607349395752, 0.00013442710041999817, 0.00014086812734603882, 0.00014730915427207947, 0.00015375018119812012, 0.00016019120812416077, 0.00016663223505020142, 0.00017307326197624207, 0.00017951428890228271, 0.00018595531582832336, 0.00019239634275436401, 0.00019883736968040466, 0.0002052783966064453]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 4.0, 9.0, 13.0, 18.0, 33.0, 48.0, 54.0, 90.0, 116.0, 175.0, 229.0, 368.0, 521.0, 817.0, 1182.0, 1729.0, 2742.0, 4255.0, 6896.0, 10750.0, 17135.0, 27855.0, 46017.0, 75889.0, 126003.0, 198284.0, 200965.0, 127943.0, 76448.0, 46229.0, 28088.0, 17262.0, 10929.0, 6816.0, 4347.0, 2755.0, 1843.0, 1184.0, 825.0, 520.0, 351.0, 244.0, 183.0, 114.0, 87.0, 53.0, 42.0, 29.0, 23.0, 19.0, 8.0, 2.0, 10.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.0003821849822998047, -0.00037024542689323425, -0.0003583058714866638, -0.0003463663160800934, -0.00033442676067352295, -0.0003224872052669525, -0.0003105476498603821, -0.00029860809445381165, -0.0002866685390472412, -0.0002747289836406708, -0.00026278942823410034, -0.0002508498728275299, -0.00023891031742095947, -0.00022697076201438904, -0.0002150312066078186, -0.00020309165120124817, -0.00019115209579467773, -0.0001792125403881073, -0.00016727298498153687, -0.00015533342957496643, -0.000143393874168396, -0.00013145431876182556, -0.00011951476335525513, -0.00010757520794868469, -9.563565254211426e-05, -8.369609713554382e-05, -7.175654172897339e-05, -5.9816986322402954e-05, -4.787743091583252e-05, -3.5937875509262085e-05, -2.399832010269165e-05, -1.2058764696121216e-05, -1.1920928955078125e-07, 1.1820346117019653e-05, 2.3759901523590088e-05, 3.569945693016052e-05, 4.763901233673096e-05, 5.957856774330139e-05, 7.151812314987183e-05, 8.345767855644226e-05, 9.53972339630127e-05, 0.00010733678936958313, 0.00011927634477615356, 0.000131215900182724, 0.00014315545558929443, 0.00015509501099586487, 0.0001670345664024353, 0.00017897412180900574, 0.00019091367721557617, 0.0002028532326221466, 0.00021479278802871704, 0.00022673234343528748, 0.0002386718988418579, 0.00025061145424842834, 0.0002625510096549988, 0.0002744905650615692, 0.00028643012046813965, 0.0002983696758747101, 0.0003103092312812805, 0.00032224878668785095, 0.0003341883420944214, 0.0003461278975009918, 0.00035806745290756226, 0.0003700070083141327, 0.0003819465637207031]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 8.0, 7.0, 6.0, 13.0, 13.0, 10.0, 20.0, 18.0, 21.0, 19.0, 28.0, 34.0, 35.0, 30.0, 42.0, 35.0, 24.0, 37.0, 30.0, 39.0, 50.0, 34.0, 43.0, 37.0, 37.0, 44.0, 30.0, 39.0, 29.0, 28.0, 21.0, 29.0, 15.0, 23.0, 10.0, 12.0, 7.0, 7.0, 7.0, 4.0, 6.0, 6.0, 1.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00013756752014160156, -0.0001335740089416504, -0.00012958049774169922, -0.00012558698654174805, -0.00012159347534179688, -0.0001175999641418457, -0.00011360645294189453, -0.00010961294174194336, -0.00010561943054199219, -0.00010162591934204102, -9.763240814208984e-05, -9.363889694213867e-05, -8.96453857421875e-05, -8.565187454223633e-05, -8.165836334228516e-05, -7.766485214233398e-05, -7.367134094238281e-05, -6.967782974243164e-05, -6.568431854248047e-05, -6.16908073425293e-05, -5.7697296142578125e-05, -5.370378494262695e-05, -4.971027374267578e-05, -4.571676254272461e-05, -4.172325134277344e-05, -3.7729740142822266e-05, -3.3736228942871094e-05, -2.9742717742919922e-05, -2.574920654296875e-05, -2.1755695343017578e-05, -1.7762184143066406e-05, -1.3768672943115234e-05, -9.775161743164062e-06, -5.781650543212891e-06, -1.7881393432617188e-06, 2.205371856689453e-06, 6.198883056640625e-06, 1.0192394256591797e-05, 1.4185905456542969e-05, 1.817941665649414e-05, 2.2172927856445312e-05, 2.6166439056396484e-05, 3.0159950256347656e-05, 3.415346145629883e-05, 3.814697265625e-05, 4.214048385620117e-05, 4.6133995056152344e-05, 5.0127506256103516e-05, 5.412101745605469e-05, 5.811452865600586e-05, 6.210803985595703e-05, 6.61015510559082e-05, 7.009506225585938e-05, 7.408857345581055e-05, 7.808208465576172e-05, 8.207559585571289e-05, 8.606910705566406e-05, 9.006261825561523e-05, 9.40561294555664e-05, 9.804964065551758e-05, 0.00010204315185546875, 0.00010603666305541992, 0.0001100301742553711, 0.00011402368545532227, 0.00011801719665527344]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 10.0, 4.0, 10.0, 10.0, 24.0, 26.0, 29.0, 51.0, 77.0, 90.0, 135.0, 202.0, 248.0, 441.0, 670.0, 1014.0, 1584.0, 2471.0, 4504.0, 8555.0, 19616.0, 66238.0, 859586.0, 48481.0, 16481.0, 7465.0, 3997.0, 2317.0, 1396.0, 954.0, 590.0, 403.0, 279.0, 169.0, 113.0, 100.0, 47.0, 45.0, 40.0, 17.0, 20.0, 12.0, 8.0, 10.0, 2.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00013959407806396484, -0.00013528577983379364, -0.00013097748160362244, -0.00012666918337345123, -0.00012236088514328003, -0.00011805258691310883, -0.00011374428868293762, -0.00010943599045276642, -0.00010512769222259521, -0.00010081939399242401, -9.651109576225281e-05, -9.22027975320816e-05, -8.78944993019104e-05, -8.35862010717392e-05, -7.927790284156799e-05, -7.496960461139679e-05, -7.066130638122559e-05, -6.635300815105438e-05, -6.204470992088318e-05, -5.7736411690711975e-05, -5.342811346054077e-05, -4.911981523036957e-05, -4.4811517000198364e-05, -4.050321877002716e-05, -3.619492053985596e-05, -3.1886622309684753e-05, -2.757832407951355e-05, -2.3270025849342346e-05, -1.8961727619171143e-05, -1.4653429388999939e-05, -1.0345131158828735e-05, -6.036832928657532e-06, -1.7285346984863281e-06, 2.5797635316848755e-06, 6.888061761856079e-06, 1.1196359992027283e-05, 1.5504658222198486e-05, 1.981295645236969e-05, 2.4121254682540894e-05, 2.8429552912712097e-05, 3.27378511428833e-05, 3.7046149373054504e-05, 4.135444760322571e-05, 4.566274583339691e-05, 4.9971044063568115e-05, 5.427934229373932e-05, 5.858764052391052e-05, 6.289593875408173e-05, 6.720423698425293e-05, 7.151253521442413e-05, 7.582083344459534e-05, 8.012913167476654e-05, 8.443742990493774e-05, 8.874572813510895e-05, 9.305402636528015e-05, 9.736232459545135e-05, 0.00010167062282562256, 0.00010597892105579376, 0.00011028721928596497, 0.00011459551751613617, 0.00011890381574630737, 0.00012321211397647858, 0.00012752041220664978, 0.00013182871043682098, 0.0001361370086669922]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 13.0, 0.0, 12.0, 29.0, 39.0, 64.0, 92.0, 158.0, 151.0, 145.0, 0.0, 86.0, 59.0, 43.0, 29.0, 16.0, 12.0, 9.0, 6.0, 0.0, 5.0, 5.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8477439880371094e-06, -1.794658601284027e-06, -1.7415732145309448e-06, -1.6884878277778625e-06, -1.6354024410247803e-06, -1.582317054271698e-06, -1.5292316675186157e-06, -1.4761462807655334e-06, -1.4230608940124512e-06, -1.369975507259369e-06, -1.3168901205062866e-06, -1.2638047337532043e-06, -1.210719347000122e-06, -1.1576339602470398e-06, -1.1045485734939575e-06, -1.0514631867408752e-06, -9.98377799987793e-07, -9.452924132347107e-07, -8.922070264816284e-07, -8.391216397285461e-07, -7.860362529754639e-07, -7.329508662223816e-07, -6.798654794692993e-07, -6.26780092716217e-07, -5.736947059631348e-07, -5.206093192100525e-07, -4.675239324569702e-07, -4.1443854570388794e-07, -3.6135315895080566e-07, -3.082677721977234e-07, -2.551823854446411e-07, -2.0209699869155884e-07, -1.4901161193847656e-07, -9.592622518539429e-08, -4.284083843231201e-08, 1.0244548320770264e-08, 6.332993507385254e-08, 1.1641532182693481e-07, 1.695007085800171e-07, 2.2258609533309937e-07, 2.7567148208618164e-07, 3.287568688392639e-07, 3.818422555923462e-07, 4.3492764234542847e-07, 4.880130290985107e-07, 5.41098415851593e-07, 5.941838026046753e-07, 6.472691893577576e-07, 7.003545761108398e-07, 7.534399628639221e-07, 8.065253496170044e-07, 8.596107363700867e-07, 9.126961231231689e-07, 9.657815098762512e-07, 1.0188668966293335e-06, 1.0719522833824158e-06, 1.125037670135498e-06, 1.1781230568885803e-06, 1.2312084436416626e-06, 1.2842938303947449e-06, 1.3373792171478271e-06, 1.3904646039009094e-06, 1.4435499906539917e-06, 1.496635377407074e-06, 1.5497207641601562e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 10.0, 8.0, 14.0, 16.0, 29.0, 35.0, 40.0, 43.0, 42.0, 69.0, 98.0, 144.0, 172.0, 247.0, 302.0, 347.0, 474.0, 629.0, 889.0, 1274.0, 1626.0, 2285.0, 3464.0, 5070.0, 8060.0, 13315.0, 24947.0, 63680.0, 803549.0, 57118.0, 23326.0, 12705.0, 7675.0, 5089.0, 3167.0, 2325.0, 1591.0, 1140.0, 881.0, 628.0, 433.0, 350.0, 275.0, 304.0, 212.0, 116.0, 80.0, 55.0, 44.0, 45.0, 38.0, 20.0, 22.0, 6.0, 19.0, 5.0, 11.0, 10.0, 0.0, 2.0], "bins": [-0.00011903047561645508, -0.00011536292731761932, -0.00011169537901878357, -0.00010802783071994781, -0.00010436028242111206, -0.0001006927341222763, -9.702518582344055e-05, -9.33576375246048e-05, -8.969008922576904e-05, -8.602254092693329e-05, -8.235499262809753e-05, -7.868744432926178e-05, -7.501989603042603e-05, -7.135234773159027e-05, -6.768479943275452e-05, -6.401725113391876e-05, -6.034970283508301e-05, -5.6682154536247253e-05, -5.30146062374115e-05, -4.9347057938575745e-05, -4.567950963973999e-05, -4.2011961340904236e-05, -3.834441304206848e-05, -3.467686474323273e-05, -3.100931644439697e-05, -2.7341768145561218e-05, -2.3674219846725464e-05, -2.000667154788971e-05, -1.6339123249053955e-05, -1.26715749502182e-05, -9.004026651382446e-06, -5.336478352546692e-06, -1.6689300537109375e-06, 1.998618245124817e-06, 5.666166543960571e-06, 9.333714842796326e-06, 1.300126314163208e-05, 1.6668811440467834e-05, 2.033635973930359e-05, 2.4003908038139343e-05, 2.7671456336975098e-05, 3.133900463581085e-05, 3.5006552934646606e-05, 3.867410123348236e-05, 4.2341649532318115e-05, 4.600919783115387e-05, 4.9676746129989624e-05, 5.334429442882538e-05, 5.701184272766113e-05, 6.067939102649689e-05, 6.434693932533264e-05, 6.80144876241684e-05, 7.168203592300415e-05, 7.53495842218399e-05, 7.901713252067566e-05, 8.268468081951141e-05, 8.635222911834717e-05, 9.001977741718292e-05, 9.368732571601868e-05, 9.735487401485443e-05, 0.00010102242231369019, 0.00010468997061252594, 0.0001083575189113617, 0.00011202506721019745, 0.0001156926155090332]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 5.0, 7.0, 12.0, 11.0, 6.0, 9.0, 18.0, 16.0, 26.0, 27.0, 89.0, 571.0, 63.0, 20.0, 17.0, 14.0, 15.0, 12.0, 3.0, 7.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4749507904052734e-05, -3.360491245985031e-05, -3.246031701564789e-05, -3.1315721571445465e-05, -3.0171126127243042e-05, -2.902653068304062e-05, -2.7881935238838196e-05, -2.6737339794635773e-05, -2.559274435043335e-05, -2.4448148906230927e-05, -2.3303553462028503e-05, -2.215895801782608e-05, -2.1014362573623657e-05, -1.9869767129421234e-05, -1.872517168521881e-05, -1.7580576241016388e-05, -1.6435980796813965e-05, -1.5291385352611542e-05, -1.4146789908409119e-05, -1.3002194464206696e-05, -1.1857599020004272e-05, -1.071300357580185e-05, -9.568408131599426e-06, -8.423812687397003e-06, -7.27921724319458e-06, -6.134621798992157e-06, -4.990026354789734e-06, -3.845430910587311e-06, -2.7008354663848877e-06, -1.5562400221824646e-06, -4.116445779800415e-07, 7.329508662223816e-07, 1.8775463104248047e-06, 3.0221417546272278e-06, 4.166737198829651e-06, 5.311332643032074e-06, 6.455928087234497e-06, 7.60052353143692e-06, 8.745118975639343e-06, 9.889714419841766e-06, 1.103430986404419e-05, 1.2178905308246613e-05, 1.3323500752449036e-05, 1.4468096196651459e-05, 1.5612691640853882e-05, 1.6757287085056305e-05, 1.7901882529258728e-05, 1.904647797346115e-05, 2.0191073417663574e-05, 2.1335668861865997e-05, 2.248026430606842e-05, 2.3624859750270844e-05, 2.4769455194473267e-05, 2.591405063867569e-05, 2.7058646082878113e-05, 2.8203241527080536e-05, 2.934783697128296e-05, 3.0492432415485382e-05, 3.1637027859687805e-05, 3.278162330389023e-05, 3.392621874809265e-05, 3.5070814192295074e-05, 3.62154096364975e-05, 3.736000508069992e-05, 3.8504600524902344e-05]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 10.0, 10.0, 12.0, 11.0, 12.0, 21.0, 24.0, 38.0, 48.0, 66.0, 87.0, 100.0, 103.0, 78.0, 67.0, 71.0, 49.0, 38.0, 47.0, 26.0, 10.0, 6.0, 11.0, 7.0, 6.0, 8.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0003639767237473279, -0.00035393895814195275, -0.00034390122164040804, -0.00033386345603503287, -0.0003238256904296577, -0.0003137879248242825, -0.00030375015921890736, -0.00029371242271736264, -0.00028367465711198747, -0.0002736368915066123, -0.0002635991550050676, -0.0002535613893996924, -0.00024352362379431725, -0.00023348585818894207, -0.00022344810713548213, -0.0002134103560820222, -0.00020337259047664702, -0.00019333482487127185, -0.0001832970738178119, -0.00017325932276435196, -0.0001632215571589768, -0.00015318379155360162, -0.00014314604050014168, -0.00013310828944668174, -0.00012307052384130657, -0.00011303276551188901, -0.00010299500718247145, -9.29572488530539e-05, -8.291949052363634e-05, -7.288173219421878e-05, -6.284397386480123e-05, -5.280621553538367e-05, -4.276842810213566e-05, -3.27306697727181e-05, -2.2692911443300545e-05, -1.2655153113882989e-05, -2.617394784465432e-06, 7.420363544952124e-06, 1.745812187436968e-05, 2.7495880203787237e-05, 3.7533638533204794e-05, 4.757139686262235e-05, 5.760915519203991e-05, 6.764691352145746e-05, 7.768467185087502e-05, 8.772243018029258e-05, 9.776018850971013e-05, 0.00010779794683912769, 0.00011783570516854525, 0.00012787347077392042, 0.00013791122182738036, 0.0001479489728808403, 0.00015798673848621547, 0.00016802450409159064, 0.00017806225514505059, 0.00018810000619851053, 0.0001981377718038857, 0.00020817553740926087, 0.0002182132884627208, 0.00022825103951618075, 0.00023828880512155592, 0.0002483265707269311, 0.0002583643072284758, 0.000268402072833851, 0.00027843983843922615]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 1.0, 9.0, 7.0, 5.0, 7.0, 14.0, 11.0, 17.0, 26.0, 18.0, 19.0, 26.0, 35.0, 29.0, 29.0, 41.0, 29.0, 32.0, 33.0, 52.0, 42.0, 45.0, 44.0, 31.0, 39.0, 38.0, 32.0, 32.0, 34.0, 27.0, 30.0, 24.0, 28.0, 22.0, 17.0, 16.0, 10.0, 8.0, 12.0, 4.0, 7.0, 6.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00021589358220808208, -0.00020922219846397638, -0.0002025508147198707, -0.000195879430975765, -0.00018920806178357452, -0.00018253667803946882, -0.00017586529429536313, -0.00016919391055125743, -0.00016252254135906696, -0.00015585115761496127, -0.00014917977387085557, -0.00014250839012674987, -0.0001358370209345594, -0.0001291656371904537, -0.000122494253446348, -0.00011582286970224231, -0.00010915148595813662, -0.00010248010221403092, -9.580872574588284e-05, -8.913734200177714e-05, -8.246596553362906e-05, -7.579458178952336e-05, -6.912319804541767e-05, -6.245181430131197e-05, -5.578043783316389e-05, -4.9109057727037e-05, -4.243767762091011e-05, -3.576629387680441e-05, -2.9094913770677522e-05, -2.2423533664550632e-05, -1.5752149920444936e-05, -9.080769814318046e-06, -2.4093897081911564e-06, 4.261991307430435e-06, 1.0933372323052026e-05, 1.760475424816832e-05, 2.427613435429521e-05, 3.09475144604221e-05, 3.7618898204527795e-05, 4.4290278310654685e-05, 5.0961658416781574e-05, 5.7633038522908464e-05, 6.430441862903535e-05, 7.097580237314105e-05, 7.764718611724675e-05, 8.431856258539483e-05, 9.098994632950053e-05, 9.766132279764861e-05, 0.0001043327065417543, 0.00011100409028586, 0.00011767546675400808, 0.00012434684322215617, 0.00013101822696626186, 0.00013768961071036756, 0.00014436099445447326, 0.00015103237819857895, 0.00015770376194268465, 0.00016437514568679035, 0.00017104652943089604, 0.00017771791317500174, 0.0001843892823671922, 0.0001910606661112979, 0.0001977320498554036, 0.0002044034335995093, 0.00021107480279169977]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 5.0, 5.0, 8.0, 11.0, 14.0, 25.0, 35.0, 55.0, 51.0, 110.0, 133.0, 192.0, 299.0, 423.0, 571.0, 833.0, 1212.0, 1691.0, 2499.0, 3671.0, 5356.0, 8032.0, 12088.0, 18259.0, 28315.0, 44858.0, 73105.0, 125162.0, 230084.0, 534736.0, 1285427.0, 990603.0, 375935.0, 179828.0, 101126.0, 60526.0, 37651.0, 24136.0, 15232.0, 10165.0, 6777.0, 4659.0, 3089.0, 2232.0, 1510.0, 1070.0, 746.0, 551.0, 362.0, 259.0, 167.0, 119.0, 110.0, 61.0, 38.0, 26.0, 27.0, 15.0, 7.0, 1.0, 3.0], "bins": [-0.00024008750915527344, -0.00023298710584640503, -0.00022588670253753662, -0.0002187862992286682, -0.0002116858959197998, -0.0002045854926109314, -0.000197485089302063, -0.00019038468599319458, -0.00018328428268432617, -0.00017618387937545776, -0.00016908347606658936, -0.00016198307275772095, -0.00015488266944885254, -0.00014778226613998413, -0.00014068186283111572, -0.00013358145952224731, -0.0001264810562133789, -0.0001193806529045105, -0.00011228024959564209, -0.00010517984628677368, -9.807944297790527e-05, -9.097903966903687e-05, -8.387863636016846e-05, -7.677823305130005e-05, -6.967782974243164e-05, -6.257742643356323e-05, -5.5477023124694824e-05, -4.8376619815826416e-05, -4.127621650695801e-05, -3.41758131980896e-05, -2.707540988922119e-05, -1.9975006580352783e-05, -1.2874603271484375e-05, -5.774199962615967e-06, 1.3262033462524414e-06, 8.42660665512085e-06, 1.5527009963989258e-05, 2.2627413272857666e-05, 2.9727816581726074e-05, 3.682821989059448e-05, 4.392862319946289e-05, 5.10290265083313e-05, 5.812942981719971e-05, 6.522983312606812e-05, 7.233023643493652e-05, 7.943063974380493e-05, 8.653104305267334e-05, 9.363144636154175e-05, 0.00010073184967041016, 0.00010783225297927856, 0.00011493265628814697, 0.00012203305959701538, 0.0001291334629058838, 0.0001362338662147522, 0.0001433342695236206, 0.00015043467283248901, 0.00015753507614135742, 0.00016463547945022583, 0.00017173588275909424, 0.00017883628606796265, 0.00018593668937683105, 0.00019303709268569946, 0.00020013749599456787, 0.00020723789930343628, 0.0002143383026123047]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 4.0, 12.0, 9.0, 11.0, 15.0, 10.0, 17.0, 18.0, 18.0, 22.0, 28.0, 31.0, 14.0, 38.0, 30.0, 33.0, 37.0, 40.0, 47.0, 47.0, 30.0, 33.0, 39.0, 41.0, 29.0, 41.0, 32.0, 28.0, 27.0, 32.0, 22.0, 20.0, 27.0, 19.0, 15.0, 16.0, 8.0, 8.0, 8.0, 11.0, 7.0, 4.0, 3.0, 3.0, 1.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011134147644042969, -0.0001075640320777893, -0.00010378658771514893, -0.00010000914335250854, -9.623169898986816e-05, -9.245425462722778e-05, -8.86768102645874e-05, -8.489936590194702e-05, -8.112192153930664e-05, -7.734447717666626e-05, -7.356703281402588e-05, -6.97895884513855e-05, -6.601214408874512e-05, -6.223469972610474e-05, -5.8457255363464355e-05, -5.4679811000823975e-05, -5.0902366638183594e-05, -4.712492227554321e-05, -4.334747791290283e-05, -3.957003355026245e-05, -3.579258918762207e-05, -3.201514482498169e-05, -2.823770046234131e-05, -2.4460256099700928e-05, -2.0682811737060547e-05, -1.6905367374420166e-05, -1.3127923011779785e-05, -9.350478649139404e-06, -5.5730342864990234e-06, -1.7955899238586426e-06, 1.9818544387817383e-06, 5.759298801422119e-06, 9.5367431640625e-06, 1.3314187526702881e-05, 1.7091631889343262e-05, 2.0869076251983643e-05, 2.4646520614624023e-05, 2.8423964977264404e-05, 3.2201409339904785e-05, 3.5978853702545166e-05, 3.975629806518555e-05, 4.353374242782593e-05, 4.731118679046631e-05, 5.108863115310669e-05, 5.486607551574707e-05, 5.864351987838745e-05, 6.242096424102783e-05, 6.619840860366821e-05, 6.99758529663086e-05, 7.375329732894897e-05, 7.753074169158936e-05, 8.130818605422974e-05, 8.508563041687012e-05, 8.88630747795105e-05, 9.264051914215088e-05, 9.641796350479126e-05, 0.00010019540786743164, 0.00010397285223007202, 0.0001077502965927124, 0.00011152774095535278, 0.00011530518531799316, 0.00011908262968063354, 0.00012286007404327393, 0.0001266375184059143, 0.0001304149627685547]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 7.0, 10.0, 12.0, 15.0, 37.0, 60.0, 42.0, 86.0, 149.0, 188.0, 310.0, 486.0, 677.0, 1012.0, 1645.0, 2525.0, 3776.0, 6075.0, 9606.0, 15733.0, 25531.0, 42646.0, 71562.0, 127239.0, 237039.0, 502610.0, 1193080.0, 1026507.0, 434528.0, 212070.0, 112773.0, 65469.0, 38761.0, 22973.0, 14271.0, 9002.0, 5471.0, 3524.0, 2405.0, 1480.0, 943.0, 645.0, 413.0, 298.0, 194.0, 122.0, 86.0, 76.0, 40.0, 32.0, 12.0, 14.0, 6.0, 5.0, 6.0, 4.0, 2.0], "bins": [-0.0002256631851196289, -0.0002190079540014267, -0.0002123527228832245, -0.00020569749176502228, -0.00019904226064682007, -0.00019238702952861786, -0.00018573179841041565, -0.00017907656729221344, -0.00017242133617401123, -0.00016576610505580902, -0.0001591108739376068, -0.0001524556428194046, -0.0001458004117012024, -0.00013914518058300018, -0.00013248994946479797, -0.00012583471834659576, -0.00011917948722839355, -0.00011252425611019135, -0.00010586902499198914, -9.921379387378693e-05, -9.255856275558472e-05, -8.590333163738251e-05, -7.92481005191803e-05, -7.259286940097809e-05, -6.593763828277588e-05, -5.928240716457367e-05, -5.262717604637146e-05, -4.597194492816925e-05, -3.931671380996704e-05, -3.266148269176483e-05, -2.6006251573562622e-05, -1.9351020455360413e-05, -1.2695789337158203e-05, -6.040558218955994e-06, 6.146728992462158e-07, 7.269904017448425e-06, 1.3925135135650635e-05, 2.0580366253852844e-05, 2.7235597372055054e-05, 3.389082849025726e-05, 4.054605960845947e-05, 4.720129072666168e-05, 5.385652184486389e-05, 6.05117529630661e-05, 6.716698408126831e-05, 7.382221519947052e-05, 8.047744631767273e-05, 8.713267743587494e-05, 9.378790855407715e-05, 0.00010044313967227936, 0.00010709837079048157, 0.00011375360190868378, 0.00012040883302688599, 0.0001270640641450882, 0.0001337192952632904, 0.00014037452638149261, 0.00014702975749969482, 0.00015368498861789703, 0.00016034021973609924, 0.00016699545085430145, 0.00017365068197250366, 0.00018030591309070587, 0.00018696114420890808, 0.0001936163753271103, 0.0002002716064453125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 11.0, 14.0, 20.0, 20.0, 25.0, 33.0, 33.0, 66.0, 72.0, 79.0, 92.0, 100.0, 109.0, 138.0, 175.0, 203.0, 218.0, 225.0, 240.0, 252.0, 242.0, 248.0, 216.0, 205.0, 177.0, 135.0, 113.0, 96.0, 92.0, 79.0, 58.0, 52.0, 56.0, 45.0, 30.0, 26.0, 20.0, 11.0, 10.0, 6.0, 7.0, 3.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.216764450073242e-05, -6.006751209497452e-05, -5.7967379689216614e-05, -5.586724728345871e-05, -5.3767114877700806e-05, -5.16669824719429e-05, -4.9566850066185e-05, -4.7466717660427094e-05, -4.536658525466919e-05, -4.3266452848911285e-05, -4.116632044315338e-05, -3.906618803739548e-05, -3.696605563163757e-05, -3.486592322587967e-05, -3.2765790820121765e-05, -3.066565841436386e-05, -2.8565526008605957e-05, -2.6465393602848053e-05, -2.436526119709015e-05, -2.2265128791332245e-05, -2.016499638557434e-05, -1.8064863979816437e-05, -1.5964731574058533e-05, -1.3864599168300629e-05, -1.1764466762542725e-05, -9.66433435678482e-06, -7.5642019510269165e-06, -5.4640695452690125e-06, -3.3639371395111084e-06, -1.2638047337532043e-06, 8.363276720046997e-07, 2.9364600777626038e-06, 5.036592483520508e-06, 7.136724889278412e-06, 9.236857295036316e-06, 1.133698970079422e-05, 1.3437122106552124e-05, 1.5537254512310028e-05, 1.7637386918067932e-05, 1.9737519323825836e-05, 2.183765172958374e-05, 2.3937784135341644e-05, 2.603791654109955e-05, 2.8138048946857452e-05, 3.0238181352615356e-05, 3.233831375837326e-05, 3.4438446164131165e-05, 3.653857856988907e-05, 3.863871097564697e-05, 4.073884338140488e-05, 4.283897578716278e-05, 4.4939108192920685e-05, 4.703924059867859e-05, 4.913937300443649e-05, 5.12395054101944e-05, 5.33396378159523e-05, 5.5439770221710205e-05, 5.753990262746811e-05, 5.964003503322601e-05, 6.174016743898392e-05, 6.384029984474182e-05, 6.594043225049973e-05, 6.804056465625763e-05, 7.014069706201553e-05, 7.224082946777344e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 5.0, 6.0, 5.0, 9.0, 5.0, 11.0, 12.0, 15.0, 24.0, 17.0, 33.0, 40.0, 43.0, 59.0, 62.0, 97.0, 92.0, 73.0, 66.0, 55.0, 55.0, 35.0, 33.0, 24.0, 27.0, 21.0, 9.0, 10.0, 15.0, 4.0, 6.0, 6.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.00020644454343710095, -0.00020093427156098187, -0.0001954239996848628, -0.00018991372780874372, -0.00018440347048453987, -0.0001788931986084208, -0.0001733829267323017, -0.00016787265485618263, -0.00016236238298006356, -0.00015685211110394448, -0.0001513418392278254, -0.00014583156735170633, -0.00014032129547558725, -0.0001348110381513834, -0.00012930076627526432, -0.00012379049439914525, -0.00011828022252302617, -0.00011276995064690709, -0.00010725967877078801, -0.00010174941417062655, -9.623914229450747e-05, -9.07288704183884e-05, -8.521860581822693e-05, -7.970833394210786e-05, -7.419806206598878e-05, -6.86877901898697e-05, -6.317751831375062e-05, -5.766725371358916e-05, -5.2156981837470084e-05, -4.664670996135101e-05, -4.113644172321074e-05, -3.562617348507047e-05, -3.011590160895139e-05, -2.4605631551821716e-05, -1.9095361494692042e-05, -1.3585091437562369e-05, -8.074821380432695e-06, -2.5645513233030215e-06, 2.945718733826652e-06, 8.455986971966922e-06, 1.3966258848086e-05, 1.9476528905215673e-05, 2.4986798962345347e-05, 3.049706901947502e-05, 3.6007339076604694e-05, 4.151761095272377e-05, 4.702787919086404e-05, 5.253814742900431e-05, 5.804841930512339e-05, 6.355869118124247e-05, 6.906896305736154e-05, 7.4579227657523e-05, 8.008949953364208e-05, 8.559977140976116e-05, 9.111003600992262e-05, 9.66203078860417e-05, 0.00010213057976216078, 0.00010764085163827986, 0.00011315112351439893, 0.0001186613881145604, 0.0001241716672666371, 0.00012968192459084094, 0.00013519219646696, 0.0001407024683430791, 0.00014621274021919817]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 3.0, 2.0, 1.0, 5.0, 13.0, 11.0, 15.0, 11.0, 27.0, 10.0, 21.0, 36.0, 21.0, 25.0, 25.0, 25.0, 43.0, 29.0, 42.0, 41.0, 36.0, 29.0, 32.0, 35.0, 37.0, 46.0, 37.0, 43.0, 39.0, 26.0, 23.0, 32.0, 22.0, 16.0, 26.0, 16.0, 13.0, 15.0, 11.0, 13.0, 11.0, 9.0, 9.0, 8.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00013573053001891822, -0.0001316455309279263, -0.00012756051728501916, -0.00012347551819402725, -0.00011939051910303533, -0.0001153055127360858, -0.00011122050636913627, -0.00010713550727814436, -0.00010305050091119483, -9.89654945442453e-05, -9.488049545325339e-05, -9.079548908630386e-05, -8.671048271935433e-05, -8.262548362836242e-05, -7.854047726141289e-05, -7.445547089446336e-05, -7.037047180347145e-05, -6.628546543652192e-05, -6.220046634553e-05, -5.8115459978580475e-05, -5.4030457249609753e-05, -4.994545452063903e-05, -4.5860448153689504e-05, -4.177544542471878e-05, -3.769044269574806e-05, -3.360543996677734e-05, -2.9520435418817215e-05, -2.543543087085709e-05, -2.135042814188637e-05, -1.7265425412915647e-05, -1.3180420864955522e-05, -9.095416316995397e-06, -5.010428139939904e-06, -9.254245014744811e-07, 3.159579136990942e-06, 7.244582775456365e-06, 1.1329586413921788e-05, 1.541458914289251e-05, 1.9499593690852635e-05, 2.358459823881276e-05, 2.766960096778348e-05, 3.17546036967542e-05, 3.5839606425724924e-05, 3.992461279267445e-05, 4.4009615521645173e-05, 4.8094618250615895e-05, 5.217962461756542e-05, 5.6264627346536145e-05, 6.0349630075506866e-05, 6.44346364424564e-05, 6.851963553344831e-05, 7.260464190039784e-05, 7.668964099138975e-05, 8.077464735833928e-05, 8.485965372528881e-05, 8.894465281628072e-05, 9.302965918323025e-05, 9.711466555017978e-05, 0.0001011996646411717, 0.00010528467100812122, 0.00010936967737507075, 0.00011345467646606266, 0.0001175396828330122, 0.00012162468919996172, 0.00012570968829095364]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 10.0, 11.0, 24.0, 26.0, 37.0, 63.0, 78.0, 109.0, 176.0, 232.0, 402.0, 507.0, 755.0, 1157.0, 1803.0, 2663.0, 4248.0, 6503.0, 10066.0, 16250.0, 25526.0, 41279.0, 66340.0, 106496.0, 168104.0, 199094.0, 147659.0, 93098.0, 58326.0, 35523.0, 21961.0, 14363.0, 9078.0, 5779.0, 3696.0, 2393.0, 1620.0, 1023.0, 688.0, 480.0, 254.0, 201.0, 151.0, 104.0, 70.0, 44.0, 30.0, 22.0, 15.0, 8.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0], "bins": [-0.00021314620971679688, -0.00020675547420978546, -0.00020036473870277405, -0.00019397400319576263, -0.00018758326768875122, -0.0001811925321817398, -0.0001748017966747284, -0.00016841106116771698, -0.00016202032566070557, -0.00015562959015369415, -0.00014923885464668274, -0.00014284811913967133, -0.0001364573836326599, -0.0001300666481256485, -0.00012367591261863708, -0.00011728517711162567, -0.00011089444160461426, -0.00010450370609760284, -9.811297059059143e-05, -9.172223508358002e-05, -8.53314995765686e-05, -7.894076406955719e-05, -7.255002856254578e-05, -6.615929305553436e-05, -5.976855754852295e-05, -5.3377822041511536e-05, -4.698708653450012e-05, -4.059635102748871e-05, -3.4205615520477295e-05, -2.781488001346588e-05, -2.1424144506454468e-05, -1.5033408999443054e-05, -8.64267349243164e-06, -2.251937985420227e-06, 4.1387975215911865e-06, 1.05295330286026e-05, 1.6920268535614014e-05, 2.3311004042625427e-05, 2.970173954963684e-05, 3.6092475056648254e-05, 4.248321056365967e-05, 4.887394607067108e-05, 5.5264681577682495e-05, 6.165541708469391e-05, 6.804615259170532e-05, 7.443688809871674e-05, 8.082762360572815e-05, 8.721835911273956e-05, 9.360909461975098e-05, 9.999983012676239e-05, 0.0001063905656337738, 0.00011278130114078522, 0.00011917203664779663, 0.00012556277215480804, 0.00013195350766181946, 0.00013834424316883087, 0.00014473497867584229, 0.0001511257141828537, 0.0001575164496898651, 0.00016390718519687653, 0.00017029792070388794, 0.00017668865621089935, 0.00018307939171791077, 0.00018947012722492218, 0.0001958608627319336]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 5.0, 5.0, 3.0, 5.0, 6.0, 11.0, 11.0, 20.0, 23.0, 20.0, 29.0, 21.0, 19.0, 27.0, 25.0, 37.0, 30.0, 28.0, 35.0, 30.0, 39.0, 37.0, 25.0, 29.0, 46.0, 46.0, 39.0, 43.0, 39.0, 38.0, 23.0, 24.0, 26.0, 26.0, 22.0, 22.0, 11.0, 13.0, 15.0, 6.0, 12.0, 13.0, 10.0, 1.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.00011938810348510742, -0.00011594314128160477, -0.00011249817907810211, -0.00010905321687459946, -0.0001056082546710968, -0.00010216329246759415, -9.871833026409149e-05, -9.527336806058884e-05, -9.182840585708618e-05, -8.838344365358353e-05, -8.493848145008087e-05, -8.149351924657822e-05, -7.804855704307556e-05, -7.46035948395729e-05, -7.115863263607025e-05, -6.77136704325676e-05, -6.426870822906494e-05, -6.0823746025562286e-05, -5.737878382205963e-05, -5.3933821618556976e-05, -5.048885941505432e-05, -4.7043897211551666e-05, -4.359893500804901e-05, -4.0153972804546356e-05, -3.67090106010437e-05, -3.3264048397541046e-05, -2.981908619403839e-05, -2.6374123990535736e-05, -2.292916178703308e-05, -1.9484199583530426e-05, -1.603923738002777e-05, -1.2594275176525116e-05, -9.149312973022461e-06, -5.704350769519806e-06, -2.259388566017151e-06, 1.1855736374855042e-06, 4.630535840988159e-06, 8.075498044490814e-06, 1.152046024799347e-05, 1.4965422451496124e-05, 1.841038465499878e-05, 2.1855346858501434e-05, 2.530030906200409e-05, 2.8745271265506744e-05, 3.21902334690094e-05, 3.5635195672512054e-05, 3.908015787601471e-05, 4.2525120079517365e-05, 4.597008228302002e-05, 4.9415044486522675e-05, 5.286000669002533e-05, 5.6304968893527985e-05, 5.974993109703064e-05, 6.31948933005333e-05, 6.663985550403595e-05, 7.00848177075386e-05, 7.352977991104126e-05, 7.697474211454391e-05, 8.041970431804657e-05, 8.386466652154922e-05, 8.730962872505188e-05, 9.075459092855453e-05, 9.419955313205719e-05, 9.764451533555984e-05, 0.0001010894775390625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 10.0, 7.0, 10.0, 26.0, 34.0, 56.0, 87.0, 146.0, 216.0, 323.0, 492.0, 845.0, 1381.0, 2404.0, 4314.0, 8626.0, 18867.0, 52660.0, 271766.0, 541612.0, 92389.0, 27401.0, 11524.0, 5808.0, 3082.0, 1779.0, 1005.0, 597.0, 378.0, 251.0, 160.0, 109.0, 61.0, 40.0, 17.0, 17.0, 8.0, 13.0, 10.0, 2.0, 9.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003447532653808594, -0.0003310739994049072, -0.0003173947334289551, -0.00030371546745300293, -0.0002900362014770508, -0.00027635693550109863, -0.0002626776695251465, -0.00024899840354919434, -0.0002353191375732422, -0.00022163987159729004, -0.0002079606056213379, -0.00019428133964538574, -0.0001806020736694336, -0.00016692280769348145, -0.0001532435417175293, -0.00013956427574157715, -0.000125885009765625, -0.00011220574378967285, -9.85264778137207e-05, -8.484721183776855e-05, -7.11679458618164e-05, -5.748867988586426e-05, -4.380941390991211e-05, -3.013014793395996e-05, -1.6450881958007812e-05, -2.771615982055664e-06, 1.0907649993896484e-05, 2.4586915969848633e-05, 3.826618194580078e-05, 5.194544792175293e-05, 6.562471389770508e-05, 7.930397987365723e-05, 9.298324584960938e-05, 0.00010666251182556152, 0.00012034177780151367, 0.00013402104377746582, 0.00014770030975341797, 0.00016137957572937012, 0.00017505884170532227, 0.00018873810768127441, 0.00020241737365722656, 0.0002160966396331787, 0.00022977590560913086, 0.000243455171585083, 0.00025713443756103516, 0.0002708137035369873, 0.00028449296951293945, 0.0002981722354888916, 0.00031185150146484375, 0.0003255307674407959, 0.00033921003341674805, 0.0003528892993927002, 0.00036656856536865234, 0.0003802478313446045, 0.00039392709732055664, 0.0004076063632965088, 0.00042128562927246094, 0.0004349648952484131, 0.00044864416122436523, 0.0004623234272003174, 0.00047600269317626953, 0.0004896819591522217, 0.0005033612251281738, 0.000517040491104126, 0.0005307197570800781]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 2.0, 4.0, 9.0, 6.0, 9.0, 10.0, 20.0, 11.0, 21.0, 24.0, 16.0, 24.0, 23.0, 29.0, 28.0, 30.0, 33.0, 41.0, 42.0, 48.0, 37.0, 41.0, 38.0, 52.0, 36.0, 45.0, 37.0, 23.0, 34.0, 25.0, 28.0, 22.0, 24.0, 27.0, 14.0, 14.0, 12.0, 16.0, 12.0, 5.0, 8.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.514787673950195e-05, -6.292946636676788e-05, -6.0711055994033813e-05, -5.8492645621299744e-05, -5.6274235248565674e-05, -5.4055824875831604e-05, -5.1837414503097534e-05, -4.9619004130363464e-05, -4.7400593757629395e-05, -4.5182183384895325e-05, -4.2963773012161255e-05, -4.0745362639427185e-05, -3.8526952266693115e-05, -3.6308541893959045e-05, -3.4090131521224976e-05, -3.1871721148490906e-05, -2.9653310775756836e-05, -2.7434900403022766e-05, -2.5216490030288696e-05, -2.2998079657554626e-05, -2.0779669284820557e-05, -1.8561258912086487e-05, -1.6342848539352417e-05, -1.4124438166618347e-05, -1.1906027793884277e-05, -9.687617421150208e-06, -7.469207048416138e-06, -5.250796675682068e-06, -3.032386302947998e-06, -8.139759302139282e-07, 1.4044344425201416e-06, 3.6228448152542114e-06, 5.841255187988281e-06, 8.059665560722351e-06, 1.0278075933456421e-05, 1.249648630619049e-05, 1.471489667892456e-05, 1.693330705165863e-05, 1.91517174243927e-05, 2.137012779712677e-05, 2.358853816986084e-05, 2.580694854259491e-05, 2.802535891532898e-05, 3.024376928806305e-05, 3.246217966079712e-05, 3.468059003353119e-05, 3.689900040626526e-05, 3.911741077899933e-05, 4.13358211517334e-05, 4.355423152446747e-05, 4.577264189720154e-05, 4.799105226993561e-05, 5.020946264266968e-05, 5.242787301540375e-05, 5.464628338813782e-05, 5.686469376087189e-05, 5.908310413360596e-05, 6.130151450634003e-05, 6.35199248790741e-05, 6.573833525180817e-05, 6.795674562454224e-05, 7.01751559972763e-05, 7.239356637001038e-05, 7.461197674274445e-05, 7.683038711547852e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 8.0, 5.0, 7.0, 22.0, 22.0, 34.0, 52.0, 77.0, 106.0, 175.0, 267.0, 412.0, 720.0, 1070.0, 2055.0, 3864.0, 8797.0, 26136.0, 154172.0, 744522.0, 74652.0, 17431.0, 6601.0, 3120.0, 1664.0, 937.0, 547.0, 369.0, 246.0, 144.0, 112.0, 66.0, 44.0, 33.0, 15.0, 12.0, 14.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.0001652240753173828, -0.00016079843044281006, -0.0001563727855682373, -0.00015194714069366455, -0.0001475214958190918, -0.00014309585094451904, -0.0001386702060699463, -0.00013424456119537354, -0.00012981891632080078, -0.00012539327144622803, -0.00012096762657165527, -0.00011654198169708252, -0.00011211633682250977, -0.00010769069194793701, -0.00010326504707336426, -9.88394021987915e-05, -9.441375732421875e-05, -8.9988112449646e-05, -8.556246757507324e-05, -8.113682270050049e-05, -7.671117782592773e-05, -7.228553295135498e-05, -6.785988807678223e-05, -6.343424320220947e-05, -5.900859832763672e-05, -5.4582953453063965e-05, -5.015730857849121e-05, -4.573166370391846e-05, -4.13060188293457e-05, -3.688037395477295e-05, -3.2454729080200195e-05, -2.802908420562744e-05, -2.3603439331054688e-05, -1.9177794456481934e-05, -1.475214958190918e-05, -1.0326504707336426e-05, -5.900859832763672e-06, -1.475214958190918e-06, 2.950429916381836e-06, 7.37607479095459e-06, 1.1801719665527344e-05, 1.6227364540100098e-05, 2.065300941467285e-05, 2.5078654289245605e-05, 2.950429916381836e-05, 3.392994403839111e-05, 3.835558891296387e-05, 4.278123378753662e-05, 4.7206878662109375e-05, 5.163252353668213e-05, 5.605816841125488e-05, 6.048381328582764e-05, 6.490945816040039e-05, 6.933510303497314e-05, 7.37607479095459e-05, 7.818639278411865e-05, 8.26120376586914e-05, 8.703768253326416e-05, 9.146332740783691e-05, 9.588897228240967e-05, 0.00010031461715698242, 0.00010474026203155518, 0.00010916590690612793, 0.00011359155178070068, 0.00011801719665527344]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 3.0, 2.0, 2.0, 7.0, 5.0, 2.0, 10.0, 6.0, 11.0, 16.0, 13.0, 21.0, 16.0, 25.0, 39.0, 50.0, 57.0, 92.0, 98.0, 147.0, 95.0, 56.0, 31.0, 37.0, 36.0, 19.0, 17.0, 10.0, 11.0, 14.0, 9.0, 7.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.496906280517578e-06, -6.305985152721405e-06, -6.115064024925232e-06, -5.924142897129059e-06, -5.733221769332886e-06, -5.542300641536713e-06, -5.3513795137405396e-06, -5.1604583859443665e-06, -4.969537258148193e-06, -4.77861613035202e-06, -4.587695002555847e-06, -4.396773874759674e-06, -4.205852746963501e-06, -4.014931619167328e-06, -3.824010491371155e-06, -3.6330893635749817e-06, -3.4421682357788086e-06, -3.2512471079826355e-06, -3.0603259801864624e-06, -2.8694048523902893e-06, -2.678483724594116e-06, -2.487562596797943e-06, -2.29664146900177e-06, -2.105720341205597e-06, -1.914799213409424e-06, -1.7238780856132507e-06, -1.5329569578170776e-06, -1.3420358300209045e-06, -1.1511147022247314e-06, -9.601935744285583e-07, -7.692724466323853e-07, -5.783513188362122e-07, -3.8743019104003906e-07, -1.9650906324386597e-07, -5.587935447692871e-09, 1.8533319234848022e-07, 3.762543201446533e-07, 5.671754479408264e-07, 7.580965757369995e-07, 9.490177035331726e-07, 1.1399388313293457e-06, 1.3308599591255188e-06, 1.521781086921692e-06, 1.712702214717865e-06, 1.903623342514038e-06, 2.094544470310211e-06, 2.2854655981063843e-06, 2.4763867259025574e-06, 2.6673078536987305e-06, 2.8582289814949036e-06, 3.0491501092910767e-06, 3.2400712370872498e-06, 3.430992364883423e-06, 3.621913492679596e-06, 3.812834620475769e-06, 4.003755748271942e-06, 4.194676876068115e-06, 4.385598003864288e-06, 4.5765191316604614e-06, 4.7674402594566345e-06, 4.958361387252808e-06, 5.149282515048981e-06, 5.340203642845154e-06, 5.531124770641327e-06, 5.7220458984375e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 9.0, 8.0, 25.0, 27.0, 33.0, 45.0, 72.0, 98.0, 144.0, 157.0, 306.0, 390.0, 614.0, 820.0, 1193.0, 1924.0, 2672.0, 4293.0, 7299.0, 12138.0, 22276.0, 44072.0, 107047.0, 307508.0, 321510.0, 112182.0, 45593.0, 22982.0, 12422.0, 7576.0, 4403.0, 2860.0, 1831.0, 1164.0, 826.0, 630.0, 425.0, 278.0, 204.0, 133.0, 108.0, 74.0, 51.0, 40.0, 31.0, 19.0, 12.0, 5.0, 9.0, 4.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.0650367736816406e-05, -3.938097506761551e-05, -3.811158239841461e-05, -3.6842189729213715e-05, -3.557279706001282e-05, -3.430340439081192e-05, -3.303401172161102e-05, -3.1764619052410126e-05, -3.049522638320923e-05, -2.922583371400833e-05, -2.7956441044807434e-05, -2.6687048375606537e-05, -2.541765570640564e-05, -2.4148263037204742e-05, -2.2878870368003845e-05, -2.1609477698802948e-05, -2.034008502960205e-05, -1.9070692360401154e-05, -1.7801299691200256e-05, -1.653190702199936e-05, -1.5262514352798462e-05, -1.3993121683597565e-05, -1.2723729014396667e-05, -1.145433634519577e-05, -1.0184943675994873e-05, -8.915551006793976e-06, -7.646158337593079e-06, -6.376765668392181e-06, -5.107372999191284e-06, -3.837980329990387e-06, -2.5685876607894897e-06, -1.2991949915885925e-06, -2.9802322387695312e-08, 1.239590346813202e-06, 2.508983016014099e-06, 3.7783756852149963e-06, 5.0477683544158936e-06, 6.317161023616791e-06, 7.586553692817688e-06, 8.855946362018585e-06, 1.0125339031219482e-05, 1.139473170042038e-05, 1.2664124369621277e-05, 1.3933517038822174e-05, 1.5202909708023071e-05, 1.647230237722397e-05, 1.7741695046424866e-05, 1.9011087715625763e-05, 2.028048038482666e-05, 2.1549873054027557e-05, 2.2819265723228455e-05, 2.4088658392429352e-05, 2.535805106163025e-05, 2.6627443730831146e-05, 2.7896836400032043e-05, 2.916622906923294e-05, 3.0435621738433838e-05, 3.1705014407634735e-05, 3.297440707683563e-05, 3.424379974603653e-05, 3.551319241523743e-05, 3.6782585084438324e-05, 3.805197775363922e-05, 3.932137042284012e-05, 4.0590763092041016e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 10.0, 6.0, 4.0, 6.0, 9.0, 2.0, 12.0, 11.0, 19.0, 28.0, 27.0, 35.0, 26.0, 48.0, 54.0, 49.0, 64.0, 54.0, 68.0, 69.0, 50.0, 62.0, 48.0, 43.0, 36.0, 22.0, 28.0, 20.0, 18.0, 8.0, 11.0, 12.0, 7.0, 5.0, 5.0, 4.0, 7.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0192394256591797e-05, -9.858980774879456e-06, -9.525567293167114e-06, -9.192153811454773e-06, -8.858740329742432e-06, -8.52532684803009e-06, -8.191913366317749e-06, -7.858499884605408e-06, -7.525086402893066e-06, -7.191672921180725e-06, -6.858259439468384e-06, -6.5248459577560425e-06, -6.191432476043701e-06, -5.85801899433136e-06, -5.5246055126190186e-06, -5.191192030906677e-06, -4.857778549194336e-06, -4.524365067481995e-06, -4.190951585769653e-06, -3.857538104057312e-06, -3.5241246223449707e-06, -3.1907111406326294e-06, -2.857297658920288e-06, -2.5238841772079468e-06, -2.1904706954956055e-06, -1.8570572137832642e-06, -1.5236437320709229e-06, -1.1902302503585815e-06, -8.568167686462402e-07, -5.234032869338989e-07, -1.8998980522155762e-07, 1.434236764907837e-07, 4.76837158203125e-07, 8.102506399154663e-07, 1.1436641216278076e-06, 1.477077603340149e-06, 1.8104910850524902e-06, 2.1439045667648315e-06, 2.477318048477173e-06, 2.810731530189514e-06, 3.1441450119018555e-06, 3.4775584936141968e-06, 3.810971975326538e-06, 4.144385457038879e-06, 4.477798938751221e-06, 4.811212420463562e-06, 5.144625902175903e-06, 5.478039383888245e-06, 5.811452865600586e-06, 6.144866347312927e-06, 6.4782798290252686e-06, 6.81169331073761e-06, 7.145106792449951e-06, 7.4785202741622925e-06, 7.811933755874634e-06, 8.145347237586975e-06, 8.478760719299316e-06, 8.812174201011658e-06, 9.145587682723999e-06, 9.47900116443634e-06, 9.812414646148682e-06, 1.0145828127861023e-05, 1.0479241609573364e-05, 1.0812655091285706e-05, 1.1146068572998047e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 7.0, 11.0, 6.0, 22.0, 29.0, 24.0, 44.0, 38.0, 59.0, 65.0, 110.0, 97.0, 85.0, 77.0, 55.0, 57.0, 46.0, 25.0, 24.0, 18.0, 20.0, 11.0, 7.0, 9.0, 9.0, 4.0, 4.0, 4.0, 6.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018325835117138922, -0.00017826180555857718, -0.00017326525994576514, -0.00016826872888486832, -0.00016327218327205628, -0.00015827563765924424, -0.00015327910659834743, -0.00014828256098553538, -0.00014328601537272334, -0.0001382894697599113, -0.00013329292414709926, -0.00012829639308620244, -0.0001232998474733904, -0.00011830330186057836, -0.00011330676352372393, -0.0001083102251868695, -0.00010331367957405746, -9.831713396124542e-05, -9.332059562439099e-05, -8.832405728753656e-05, -8.332751167472452e-05, -7.833096606191248e-05, -7.333442772505805e-05, -6.833788938820362e-05, -6.334134377539158e-05, -5.8344801800558344e-05, -5.334825982572511e-05, -4.835171785089187e-05, -4.335517587605864e-05, -3.83586339012254e-05, -3.336209192639217e-05, -2.8365549951558933e-05, -2.336899342481047e-05, -1.8372451449977234e-05, -1.3375909475143999e-05, -8.379367500310764e-06, -3.3828255254775286e-06, 1.6137164493557066e-06, 6.610258424188942e-06, 1.1606800399022177e-05, 1.6603342373855412e-05, 2.1599884348688647e-05, 2.6596426323521882e-05, 3.159296829835512e-05, 3.658951027318835e-05, 4.158605224802159e-05, 4.658259422285482e-05, 5.157913619768806e-05, 5.657567817252129e-05, 6.157222378533334e-05, 6.656876212218776e-05, 7.156530045904219e-05, 7.656184607185423e-05, 8.155839168466628e-05, 8.65549300215207e-05, 9.155146835837513e-05, 9.654801397118717e-05, 0.00010154455958399922, 0.00010654109792085364, 0.00011153763625770807, 0.00011653418187052011, 0.00012153072748333216, 0.0001265272730961442, 0.000131523804157041, 0.00013652034976985306]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 4.0, 11.0, 13.0, 18.0, 16.0, 26.0, 18.0, 28.0, 23.0, 24.0, 25.0, 24.0, 44.0, 35.0, 36.0, 45.0, 39.0, 26.0, 28.0, 39.0, 41.0, 45.0, 39.0, 47.0, 39.0, 28.0, 29.0, 22.0, 28.0, 24.0, 14.0, 16.0, 22.0, 12.0, 10.0, 12.0, 14.0, 11.0, 7.0, 4.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001153466000687331, -0.0001119141816161573, -0.0001084817704395391, -0.0001050493519869633, -0.0001016169335343875, -9.818452235776931e-05, -9.475210390519351e-05, -9.13196854526177e-05, -8.78872670000419e-05, -8.44548485474661e-05, -8.102243737084791e-05, -7.759001891827211e-05, -7.41576004656963e-05, -7.072518928907812e-05, -6.729277083650231e-05, -6.386035238392651e-05, -6.0427937569329515e-05, -5.699552275473252e-05, -5.3563104302156717e-05, -5.013068948755972e-05, -4.669827103498392e-05, -4.326585622038692e-05, -3.983343776781112e-05, -3.6401022953214124e-05, -3.296860813861713e-05, -2.953619150503073e-05, -2.610377487144433e-05, -2.2671360056847334e-05, -1.923894160427153e-05, -1.5806526789674535e-05, -1.2374110156088136e-05, -8.941693522501737e-06, -5.509275069925934e-06, -2.0768586637132103e-06, 1.3555577424995136e-06, 4.787973921338562e-06, 8.220390554924961e-06, 1.1652806279016659e-05, 1.5085222912603058e-05, 1.8517639546189457e-05, 2.1950056179775856e-05, 2.5382472813362256e-05, 2.8814889446948655e-05, 3.2247306080535054e-05, 3.567972089513205e-05, 3.9112135709729046e-05, 4.254455416230485e-05, 4.597697261488065e-05, 4.940938742947765e-05, 5.284180224407464e-05, 5.6274220696650445e-05, 5.970663551124744e-05, 6.313905032584444e-05, 6.657146877842024e-05, 7.000388723099604e-05, 7.343629840761423e-05, 7.686871686019003e-05, 8.030113531276584e-05, 8.373354648938403e-05, 8.716596494195983e-05, 9.059838339453563e-05, 9.403079457115382e-05, 9.746321302372962e-05, 0.00010089563147630543, 0.00010432804992888123]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 9.0, 8.0, 9.0, 21.0, 28.0, 42.0, 56.0, 93.0, 106.0, 174.0, 240.0, 336.0, 461.0, 670.0, 913.0, 1231.0, 1754.0, 2547.0, 3458.0, 4993.0, 7266.0, 10607.0, 15761.0, 23774.0, 36322.0, 57349.0, 92725.0, 154794.0, 206365.0, 159073.0, 95782.0, 58381.0, 37398.0, 23964.0, 16346.0, 10776.0, 7453.0, 5029.0, 3547.0, 2494.0, 1776.0, 1287.0, 936.0, 641.0, 434.0, 344.0, 261.0, 157.0, 113.0, 86.0, 57.0, 36.0, 27.0, 27.0, 7.0, 11.0, 5.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.00017762184143066406, -0.00017198733985424042, -0.00016635283827781677, -0.00016071833670139313, -0.00015508383512496948, -0.00014944933354854584, -0.0001438148319721222, -0.00013818033039569855, -0.0001325458288192749, -0.00012691132724285126, -0.00012127682566642761, -0.00011564232409000397, -0.00011000782251358032, -0.00010437332093715668, -9.873881936073303e-05, -9.310431778430939e-05, -8.746981620788574e-05, -8.18353146314621e-05, -7.620081305503845e-05, -7.056631147861481e-05, -6.493180990219116e-05, -5.929730832576752e-05, -5.366280674934387e-05, -4.802830517292023e-05, -4.239380359649658e-05, -3.675930202007294e-05, -3.112480044364929e-05, -2.5490298867225647e-05, -1.9855797290802002e-05, -1.4221295714378357e-05, -8.586794137954712e-06, -2.952292561531067e-06, 2.682209014892578e-06, 8.316710591316223e-06, 1.3951212167739868e-05, 1.9585713744163513e-05, 2.5220215320587158e-05, 3.08547168970108e-05, 3.648921847343445e-05, 4.212372004985809e-05, 4.775822162628174e-05, 5.339272320270538e-05, 5.902722477912903e-05, 6.466172635555267e-05, 7.029622793197632e-05, 7.593072950839996e-05, 8.156523108482361e-05, 8.719973266124725e-05, 9.28342342376709e-05, 9.846873581409454e-05, 0.00010410323739051819, 0.00010973773896694183, 0.00011537224054336548, 0.00012100674211978912, 0.00012664124369621277, 0.00013227574527263641, 0.00013791024684906006, 0.0001435447484254837, 0.00014917925000190735, 0.000154813751578331, 0.00016044825315475464, 0.00016608275473117828, 0.00017171725630760193, 0.00017735175788402557, 0.00018298625946044922]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 6.0, 7.0, 9.0, 5.0, 10.0, 19.0, 28.0, 13.0, 21.0, 22.0, 32.0, 24.0, 30.0, 29.0, 28.0, 37.0, 37.0, 38.0, 43.0, 31.0, 40.0, 37.0, 36.0, 38.0, 38.0, 43.0, 28.0, 42.0, 29.0, 14.0, 23.0, 30.0, 22.0, 22.0, 11.0, 12.0, 11.0, 13.0, 11.0, 5.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 5.0], "bins": [-0.00010061264038085938, -9.786803275346756e-05, -9.512342512607574e-05, -9.237881749868393e-05, -8.963420987129211e-05, -8.68896022439003e-05, -8.414499461650848e-05, -8.140038698911667e-05, -7.865577936172485e-05, -7.591117173433304e-05, -7.316656410694122e-05, -7.042195647954941e-05, -6.767734885215759e-05, -6.493274122476578e-05, -6.218813359737396e-05, -5.944352596998215e-05, -5.669891834259033e-05, -5.395431071519852e-05, -5.12097030878067e-05, -4.8465095460414886e-05, -4.572048783302307e-05, -4.2975880205631256e-05, -4.023127257823944e-05, -3.7486664950847626e-05, -3.474205732345581e-05, -3.1997449696063995e-05, -2.925284206867218e-05, -2.6508234441280365e-05, -2.376362681388855e-05, -2.1019019186496735e-05, -1.827441155910492e-05, -1.5529803931713104e-05, -1.2785196304321289e-05, -1.0040588676929474e-05, -7.295981049537659e-06, -4.5513734221458435e-06, -1.8067657947540283e-06, 9.378418326377869e-07, 3.682449460029602e-06, 6.427057087421417e-06, 9.171664714813232e-06, 1.1916272342205048e-05, 1.4660879969596863e-05, 1.7405487596988678e-05, 2.0150095224380493e-05, 2.289470285177231e-05, 2.5639310479164124e-05, 2.838391810655594e-05, 3.1128525733947754e-05, 3.387313336133957e-05, 3.6617740988731384e-05, 3.93623486161232e-05, 4.2106956243515015e-05, 4.485156387090683e-05, 4.7596171498298645e-05, 5.034077912569046e-05, 5.3085386753082275e-05, 5.582999438047409e-05, 5.8574602007865906e-05, 6.131920963525772e-05, 6.406381726264954e-05, 6.680842489004135e-05, 6.955303251743317e-05, 7.229764014482498e-05, 7.50422477722168e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 1.0, 13.0, 10.0, 15.0, 31.0, 39.0, 69.0, 85.0, 137.0, 178.0, 267.0, 422.0, 616.0, 850.0, 1254.0, 2016.0, 3010.0, 4503.0, 7285.0, 11207.0, 17937.0, 28947.0, 48321.0, 80771.0, 141551.0, 226418.0, 194051.0, 110301.0, 64490.0, 38978.0, 23500.0, 14703.0, 9288.0, 5966.0, 3779.0, 2465.0, 1626.0, 1087.0, 777.0, 482.0, 367.0, 237.0, 149.0, 116.0, 83.0, 57.0, 34.0, 14.0, 19.0, 8.0, 10.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.00018525123596191406, -0.0001794230192899704, -0.00017359480261802673, -0.00016776658594608307, -0.0001619383692741394, -0.00015611015260219574, -0.00015028193593025208, -0.0001444537192583084, -0.00013862550258636475, -0.00013279728591442108, -0.00012696906924247742, -0.00012114085257053375, -0.00011531263589859009, -0.00010948441922664642, -0.00010365620255470276, -9.78279858827591e-05, -9.199976921081543e-05, -8.617155253887177e-05, -8.03433358669281e-05, -7.451511919498444e-05, -6.868690252304077e-05, -6.285868585109711e-05, -5.703046917915344e-05, -5.120225250720978e-05, -4.537403583526611e-05, -3.954581916332245e-05, -3.3717602491378784e-05, -2.788938581943512e-05, -2.2061169147491455e-05, -1.623295247554779e-05, -1.0404735803604126e-05, -4.5765191316604614e-06, 1.2516975402832031e-06, 7.079914212226868e-06, 1.2908130884170532e-05, 1.8736347556114197e-05, 2.456456422805786e-05, 3.0392780900001526e-05, 3.622099757194519e-05, 4.2049214243888855e-05, 4.787743091583252e-05, 5.3705647587776184e-05, 5.953386425971985e-05, 6.536208093166351e-05, 7.119029760360718e-05, 7.701851427555084e-05, 8.284673094749451e-05, 8.867494761943817e-05, 9.450316429138184e-05, 0.0001003313809633255, 0.00010615959763526917, 0.00011198781430721283, 0.0001178160309791565, 0.00012364424765110016, 0.00012947246432304382, 0.0001353006809949875, 0.00014112889766693115, 0.00014695711433887482, 0.00015278533101081848, 0.00015861354768276215, 0.0001644417643547058, 0.00017026998102664948, 0.00017609819769859314, 0.0001819264143705368, 0.00018775463104248047]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 5.0, 6.0, 8.0, 6.0, 10.0, 12.0, 15.0, 17.0, 18.0, 25.0, 17.0, 26.0, 19.0, 37.0, 34.0, 27.0, 36.0, 37.0, 32.0, 35.0, 43.0, 44.0, 52.0, 38.0, 49.0, 39.0, 35.0, 31.0, 26.0, 27.0, 22.0, 16.0, 29.0, 15.0, 9.0, 13.0, 14.0, 14.0, 3.0, 11.0, 11.0, 2.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0], "bins": [-5.704164505004883e-05, -5.539972335100174e-05, -5.375780165195465e-05, -5.211587995290756e-05, -5.0473958253860474e-05, -4.8832036554813385e-05, -4.7190114855766296e-05, -4.554819315671921e-05, -4.390627145767212e-05, -4.226434975862503e-05, -4.062242805957794e-05, -3.898050636053085e-05, -3.7338584661483765e-05, -3.5696662962436676e-05, -3.405474126338959e-05, -3.24128195643425e-05, -3.077089786529541e-05, -2.912897616624832e-05, -2.7487054467201233e-05, -2.5845132768154144e-05, -2.4203211069107056e-05, -2.2561289370059967e-05, -2.091936767101288e-05, -1.927744597196579e-05, -1.76355242729187e-05, -1.5993602573871613e-05, -1.4351680874824524e-05, -1.2709759175777435e-05, -1.1067837476730347e-05, -9.425915777683258e-06, -7.78399407863617e-06, -6.142072379589081e-06, -4.500150680541992e-06, -2.8582289814949036e-06, -1.216307282447815e-06, 4.256144165992737e-07, 2.0675361156463623e-06, 3.709457814693451e-06, 5.3513795137405396e-06, 6.993301212787628e-06, 8.635222911834717e-06, 1.0277144610881805e-05, 1.1919066309928894e-05, 1.3560988008975983e-05, 1.5202909708023071e-05, 1.684483140707016e-05, 1.848675310611725e-05, 2.0128674805164337e-05, 2.1770596504211426e-05, 2.3412518203258514e-05, 2.5054439902305603e-05, 2.669636160135269e-05, 2.833828330039978e-05, 2.998020499944687e-05, 3.162212669849396e-05, 3.3264048397541046e-05, 3.4905970096588135e-05, 3.6547891795635223e-05, 3.818981349468231e-05, 3.98317351937294e-05, 4.147365689277649e-05, 4.311557859182358e-05, 4.4757500290870667e-05, 4.6399421989917755e-05, 4.8041343688964844e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 9.0, 7.0, 13.0, 22.0, 22.0, 22.0, 53.0, 56.0, 61.0, 101.0, 124.0, 161.0, 227.0, 322.0, 432.0, 623.0, 927.0, 1503.0, 2458.0, 4500.0, 11471.0, 70354.0, 919330.0, 20653.0, 6447.0, 3133.0, 1759.0, 1154.0, 707.0, 554.0, 364.0, 245.0, 181.0, 136.0, 102.0, 79.0, 58.0, 43.0, 29.0, 30.0, 24.0, 14.0, 9.0, 9.0, 13.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.412101745605469e-05, -5.2440911531448364e-05, -5.076080560684204e-05, -4.908069968223572e-05, -4.7400593757629395e-05, -4.572048783302307e-05, -4.404038190841675e-05, -4.2360275983810425e-05, -4.06801700592041e-05, -3.900006413459778e-05, -3.7319958209991455e-05, -3.563985228538513e-05, -3.395974636077881e-05, -3.2279640436172485e-05, -3.059953451156616e-05, -2.891942858695984e-05, -2.7239322662353516e-05, -2.5559216737747192e-05, -2.387911081314087e-05, -2.2199004888534546e-05, -2.0518898963928223e-05, -1.88387930393219e-05, -1.7158687114715576e-05, -1.5478581190109253e-05, -1.379847526550293e-05, -1.2118369340896606e-05, -1.0438263416290283e-05, -8.75815749168396e-06, -7.078051567077637e-06, -5.3979456424713135e-06, -3.7178397178649902e-06, -2.037733793258667e-06, -3.5762786865234375e-07, 1.3224780559539795e-06, 3.0025839805603027e-06, 4.682689905166626e-06, 6.362795829772949e-06, 8.042901754379272e-06, 9.723007678985596e-06, 1.1403113603591919e-05, 1.3083219528198242e-05, 1.4763325452804565e-05, 1.644343137741089e-05, 1.8123537302017212e-05, 1.9803643226623535e-05, 2.148374915122986e-05, 2.316385507583618e-05, 2.4843961000442505e-05, 2.6524066925048828e-05, 2.820417284965515e-05, 2.9884278774261475e-05, 3.15643846988678e-05, 3.324449062347412e-05, 3.4924596548080444e-05, 3.660470247268677e-05, 3.828480839729309e-05, 3.9964914321899414e-05, 4.164502024650574e-05, 4.332512617111206e-05, 4.5005232095718384e-05, 4.668533802032471e-05, 4.836544394493103e-05, 5.0045549869537354e-05, 5.172565579414368e-05, 5.340576171875e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 0.0, 34.0, 0.0, 0.0, 41.0, 0.0, 0.0, 79.0, 0.0, 0.0, 0.0, 178.0, 0.0, 0.0, 330.0, 0.0, 0.0, 166.0, 0.0, 0.0, 85.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 33.0, 0.0, 0.0, 15.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.370246410369873e-07, -6.183981895446777e-07, -5.997717380523682e-07, -5.811452865600586e-07, -5.62518835067749e-07, -5.438923835754395e-07, -5.252659320831299e-07, -5.066394805908203e-07, -4.880130290985107e-07, -4.6938657760620117e-07, -4.507601261138916e-07, -4.3213367462158203e-07, -4.1350722312927246e-07, -3.948807716369629e-07, -3.762543201446533e-07, -3.5762786865234375e-07, -3.390014171600342e-07, -3.203749656677246e-07, -3.0174851417541504e-07, -2.8312206268310547e-07, -2.644956111907959e-07, -2.4586915969848633e-07, -2.2724270820617676e-07, -2.086162567138672e-07, -1.8998980522155762e-07, -1.7136335372924805e-07, -1.5273690223693848e-07, -1.341104507446289e-07, -1.1548399925231934e-07, -9.685754776000977e-08, -7.82310962677002e-08, -5.960464477539063e-08, -4.0978193283081055e-08, -2.2351741790771484e-08, -3.725290298461914e-09, 1.4901161193847656e-08, 3.3527612686157227e-08, 5.21540641784668e-08, 7.078051567077637e-08, 8.940696716308594e-08, 1.0803341865539551e-07, 1.2665987014770508e-07, 1.4528632164001465e-07, 1.6391277313232422e-07, 1.825392246246338e-07, 2.0116567611694336e-07, 2.1979212760925293e-07, 2.384185791015625e-07, 2.5704503059387207e-07, 2.7567148208618164e-07, 2.942979335784912e-07, 3.129243850708008e-07, 3.3155083656311035e-07, 3.501772880554199e-07, 3.688037395477295e-07, 3.8743019104003906e-07, 4.0605664253234863e-07, 4.246830940246582e-07, 4.4330954551696777e-07, 4.6193599700927734e-07, 4.805624485015869e-07, 4.991888999938965e-07, 5.178153514862061e-07, 5.364418029785156e-07]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 7.0, 5.0, 13.0, 19.0, 16.0, 18.0, 28.0, 40.0, 73.0, 80.0, 87.0, 132.0, 230.0, 282.0, 392.0, 548.0, 827.0, 1171.0, 1740.0, 2388.0, 3520.0, 6334.0, 26153.0, 958920.0, 27348.0, 6408.0, 3693.0, 2427.0, 1661.0, 1176.0, 791.0, 582.0, 392.0, 290.0, 212.0, 156.0, 115.0, 74.0, 55.0, 40.0, 32.0, 27.0, 20.0, 10.0, 4.0, 6.0, 3.0, 7.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.071826934814453e-05, -8.774455636739731e-05, -8.477084338665009e-05, -8.179713040590286e-05, -7.882341742515564e-05, -7.584970444440842e-05, -7.28759914636612e-05, -6.990227848291397e-05, -6.692856550216675e-05, -6.395485252141953e-05, -6.09811395406723e-05, -5.800742655992508e-05, -5.5033713579177856e-05, -5.2060000598430634e-05, -4.908628761768341e-05, -4.611257463693619e-05, -4.3138861656188965e-05, -4.016514867544174e-05, -3.719143569469452e-05, -3.4217722713947296e-05, -3.124400973320007e-05, -2.827029675245285e-05, -2.5296583771705627e-05, -2.2322870790958405e-05, -1.934915781021118e-05, -1.637544482946396e-05, -1.3401731848716736e-05, -1.0428018867969513e-05, -7.45430588722229e-06, -4.480592906475067e-06, -1.5068799257278442e-06, 1.4668330550193787e-06, 4.4405460357666016e-06, 7.4142590165138245e-06, 1.0387971997261047e-05, 1.336168497800827e-05, 1.6335397958755493e-05, 1.9309110939502716e-05, 2.228282392024994e-05, 2.5256536900997162e-05, 2.8230249881744385e-05, 3.120396286249161e-05, 3.417767584323883e-05, 3.7151388823986053e-05, 4.0125101804733276e-05, 4.30988147854805e-05, 4.607252776622772e-05, 4.9046240746974945e-05, 5.201995372772217e-05, 5.499366670846939e-05, 5.7967379689216614e-05, 6.094109266996384e-05, 6.391480565071106e-05, 6.688851863145828e-05, 6.98622316122055e-05, 7.283594459295273e-05, 7.580965757369995e-05, 7.878337055444717e-05, 8.17570835351944e-05, 8.473079651594162e-05, 8.770450949668884e-05, 9.067822247743607e-05, 9.365193545818329e-05, 9.662564843893051e-05, 9.959936141967773e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 12.0, 23.0, 63.0, 777.0, 55.0, 20.0, 15.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.045797348022461e-05, -2.960115671157837e-05, -2.874433994293213e-05, -2.788752317428589e-05, -2.703070640563965e-05, -2.6173889636993408e-05, -2.5317072868347168e-05, -2.4460256099700928e-05, -2.3603439331054688e-05, -2.2746622562408447e-05, -2.1889805793762207e-05, -2.1032989025115967e-05, -2.0176172256469727e-05, -1.9319355487823486e-05, -1.8462538719177246e-05, -1.7605721950531006e-05, -1.6748905181884766e-05, -1.5892088413238525e-05, -1.5035271644592285e-05, -1.4178454875946045e-05, -1.3321638107299805e-05, -1.2464821338653564e-05, -1.1608004570007324e-05, -1.0751187801361084e-05, -9.894371032714844e-06, -9.037554264068604e-06, -8.180737495422363e-06, -7.323920726776123e-06, -6.467103958129883e-06, -5.610287189483643e-06, -4.753470420837402e-06, -3.896653652191162e-06, -3.039836883544922e-06, -2.1830201148986816e-06, -1.3262033462524414e-06, -4.6938657760620117e-07, 3.8743019104003906e-07, 1.2442469596862793e-06, 2.1010637283325195e-06, 2.9578804969787598e-06, 3.814697265625e-06, 4.67151403427124e-06, 5.5283308029174805e-06, 6.385147571563721e-06, 7.241964340209961e-06, 8.098781108856201e-06, 8.955597877502441e-06, 9.812414646148682e-06, 1.0669231414794922e-05, 1.1526048183441162e-05, 1.2382864952087402e-05, 1.3239681720733643e-05, 1.4096498489379883e-05, 1.4953315258026123e-05, 1.5810132026672363e-05, 1.6666948795318604e-05, 1.7523765563964844e-05, 1.8380582332611084e-05, 1.9237399101257324e-05, 2.0094215869903564e-05, 2.0951032638549805e-05, 2.1807849407196045e-05, 2.2664666175842285e-05, 2.3521482944488525e-05, 2.4378299713134766e-05]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 11.0, 5.0, 6.0, 7.0, 12.0, 13.0, 20.0, 20.0, 22.0, 30.0, 34.0, 48.0, 55.0, 78.0, 80.0, 80.0, 79.0, 66.0, 45.0, 44.0, 37.0, 33.0, 34.0, 19.0, 16.0, 21.0, 15.0, 8.0, 6.0, 6.0, 7.0, 4.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00012496898125391454, -0.0001214294316014275, -0.00011788987467298284, -0.00011435031774453819, -0.00011081076809205115, -0.00010727121843956411, -0.00010373166151111946, -0.0001001921045826748, -9.665255493018776e-05, -9.311300527770072e-05, -8.957344834925607e-05, -8.603389142081141e-05, -8.249434176832438e-05, -7.895479211583734e-05, -7.541523518739268e-05, -7.187567825894803e-05, -6.833612860646099e-05, -6.479657895397395e-05, -6.12570220255293e-05, -5.771746873506345e-05, -5.41779154445976e-05, -5.0638362154131755e-05, -4.709880886366591e-05, -4.355925557320006e-05, -4.0019702282734215e-05, -3.648014899226837e-05, -3.294059570180252e-05, -2.9401042411336675e-05, -2.586148912087083e-05, -2.2321935830404982e-05, -1.8782382539939135e-05, -1.5242829249473289e-05, -1.1703268683049828e-05, -8.163715392583981e-06, -4.6241621021181345e-06, -1.0846088116522878e-06, 2.454944478813559e-06, 5.9944977692794055e-06, 9.534051059745252e-06, 1.3073604350211099e-05, 1.6613157640676945e-05, 2.0152710931142792e-05, 2.369226422160864e-05, 2.7231817512074485e-05, 3.077137080254033e-05, 3.431092409300618e-05, 3.7850477383472025e-05, 4.139003067393787e-05, 4.492958396440372e-05, 4.8469137254869565e-05, 5.200869054533541e-05, 5.554824383580126e-05, 5.9087797126267105e-05, 6.262735405471176e-05, 6.61669037071988e-05, 6.970645335968584e-05, 7.324601028813049e-05, 7.678556721657515e-05, 8.032511686906219e-05, 8.386466652154922e-05, 8.740422344999388e-05, 9.094378037843853e-05, 9.448333003092557e-05, 9.802287968341261e-05, 0.00010156243661185727]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 7.0, 8.0, 10.0, 14.0, 13.0, 12.0, 14.0, 17.0, 28.0, 21.0, 27.0, 33.0, 32.0, 31.0, 43.0, 39.0, 31.0, 32.0, 34.0, 37.0, 41.0, 45.0, 49.0, 46.0, 40.0, 42.0, 29.0, 35.0, 27.0, 22.0, 26.0, 11.0, 10.0, 17.0, 15.0, 14.0, 14.0, 4.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.777162631507963e-05, -9.47269654716365e-05, -9.168231190415099e-05, -8.863765106070787e-05, -8.559299021726474e-05, -8.254832937382162e-05, -7.95036758063361e-05, -7.645901496289298e-05, -7.341435411944985e-05, -7.036969327600673e-05, -6.732503970852122e-05, -6.428037886507809e-05, -6.123571802163497e-05, -5.819106081617065e-05, -5.514640361070633e-05, -5.2101742767263204e-05, -4.905708919977769e-05, -4.6012431994313374e-05, -4.296777115087025e-05, -3.992311394540593e-05, -3.6878453101962805e-05, -3.3833795896498486e-05, -3.078913869103417e-05, -2.7744479666580446e-05, -2.4699820642126724e-05, -2.1655161617673002e-05, -1.861050259321928e-05, -1.5565845387754962e-05, -1.252118636330124e-05, -9.476527338847518e-06, -6.4318701333831996e-06, -3.3872111089294776e-06, -3.425593604333699e-07, 2.702099209273001e-06, 5.746757778979372e-06, 8.791415893938392e-06, 1.1836074918392114e-05, 1.4880733942845836e-05, 1.7925391148310155e-05, 2.0970050172763877e-05, 2.40147091972176e-05, 2.705936822167132e-05, 3.0104027246125042e-05, 3.314868445158936e-05, 3.619334165705368e-05, 3.9238002500496805e-05, 4.228265970596112e-05, 4.532731691142544e-05, 4.837197775486857e-05, 5.1416634960332885e-05, 5.446129580377601e-05, 5.750595300924033e-05, 6.0550613852683455e-05, 6.359527469612658e-05, 6.663992826361209e-05, 6.968458910705522e-05, 7.272924995049834e-05, 7.577391079394147e-05, 7.881856436142698e-05, 8.18632252048701e-05, 8.490788604831323e-05, 8.795254689175636e-05, 9.099720045924187e-05, 9.404186130268499e-05, 9.70865148701705e-05]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [2.0, 6.0, 2.0, 6.0, 8.0, 22.0, 31.0, 46.0, 51.0, 101.0, 113.0, 185.0, 292.0, 527.0, 779.0, 1200.0, 2011.0, 3146.0, 5257.0, 8683.0, 14960.0, 25937.0, 47633.0, 93130.0, 201264.0, 562645.0, 1765120.0, 932110.0, 277785.0, 119536.0, 59012.0, 30790.0, 17244.0, 9708.0, 5663.0, 3407.0, 2153.0, 1295.0, 815.0, 504.0, 362.0, 215.0, 168.0, 107.0, 68.0, 56.0, 28.0, 28.0, 22.0, 17.0, 14.0, 7.0, 9.0, 5.0, 5.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.00012069940567016602, -0.0001161741092801094, -0.0001116488128900528, -0.00010712351649999619, -0.00010259822010993958, -9.807292371988297e-05, -9.354762732982635e-05, -8.902233093976974e-05, -8.449703454971313e-05, -7.997173815965652e-05, -7.544644176959991e-05, -7.09211453795433e-05, -6.63958489894867e-05, -6.187055259943008e-05, -5.7345256209373474e-05, -5.2819959819316864e-05, -4.8294663429260254e-05, -4.3769367039203644e-05, -3.9244070649147034e-05, -3.4718774259090424e-05, -3.0193477869033813e-05, -2.5668181478977203e-05, -2.1142885088920593e-05, -1.6617588698863983e-05, -1.2092292308807373e-05, -7.566995918750763e-06, -3.041699528694153e-06, 1.4835968613624573e-06, 6.008893251419067e-06, 1.0534189641475677e-05, 1.5059486031532288e-05, 1.9584782421588898e-05, 2.4110078811645508e-05, 2.8635375201702118e-05, 3.316067159175873e-05, 3.768596798181534e-05, 4.221126437187195e-05, 4.673656076192856e-05, 5.126185715198517e-05, 5.578715354204178e-05, 6.031244993209839e-05, 6.4837746322155e-05, 6.936304271221161e-05, 7.388833910226822e-05, 7.841363549232483e-05, 8.293893188238144e-05, 8.746422827243805e-05, 9.198952466249466e-05, 9.651482105255127e-05, 0.00010104011744260788, 0.00010556541383266449, 0.0001100907102227211, 0.00011461600661277771, 0.00011914130300283432, 0.00012366659939289093, 0.00012819189578294754, 0.00013271719217300415, 0.00013724248856306076, 0.00014176778495311737, 0.00014629308134317398, 0.0001508183777332306, 0.0001553436741232872, 0.0001598689705133438, 0.00016439426690340042, 0.00016891956329345703]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 5.0, 8.0, 8.0, 18.0, 8.0, 16.0, 10.0, 16.0, 30.0, 26.0, 25.0, 33.0, 37.0, 37.0, 45.0, 31.0, 45.0, 31.0, 35.0, 46.0, 52.0, 44.0, 38.0, 35.0, 46.0, 35.0, 42.0, 27.0, 31.0, 24.0, 17.0, 12.0, 21.0, 12.0, 11.0, 11.0, 6.0, 8.0, 9.0, 4.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.079673767089844e-05, -5.8867037296295166e-05, -5.6937336921691895e-05, -5.500763654708862e-05, -5.307793617248535e-05, -5.114823579788208e-05, -4.921853542327881e-05, -4.728883504867554e-05, -4.5359134674072266e-05, -4.3429434299468994e-05, -4.149973392486572e-05, -3.957003355026245e-05, -3.764033317565918e-05, -3.571063280105591e-05, -3.378093242645264e-05, -3.1851232051849365e-05, -2.9921531677246094e-05, -2.7991831302642822e-05, -2.606213092803955e-05, -2.413243055343628e-05, -2.2202730178833008e-05, -2.0273029804229736e-05, -1.8343329429626465e-05, -1.6413629055023193e-05, -1.4483928680419922e-05, -1.255422830581665e-05, -1.0624527931213379e-05, -8.694827556610107e-06, -6.765127182006836e-06, -4.8354268074035645e-06, -2.905726432800293e-06, -9.760260581970215e-07, 9.5367431640625e-07, 2.8833746910095215e-06, 4.813075065612793e-06, 6.7427754402160645e-06, 8.672475814819336e-06, 1.0602176189422607e-05, 1.2531876564025879e-05, 1.446157693862915e-05, 1.6391277313232422e-05, 1.8320977687835693e-05, 2.0250678062438965e-05, 2.2180378437042236e-05, 2.4110078811645508e-05, 2.603977918624878e-05, 2.796947956085205e-05, 2.9899179935455322e-05, 3.1828880310058594e-05, 3.3758580684661865e-05, 3.568828105926514e-05, 3.761798143386841e-05, 3.954768180847168e-05, 4.147738218307495e-05, 4.340708255767822e-05, 4.5336782932281494e-05, 4.7266483306884766e-05, 4.919618368148804e-05, 5.112588405609131e-05, 5.305558443069458e-05, 5.498528480529785e-05, 5.691498517990112e-05, 5.8844685554504395e-05, 6.0774385929107666e-05, 6.270408630371094e-05]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 12.0, 14.0, 26.0, 36.0, 39.0, 64.0, 92.0, 125.0, 211.0, 308.0, 432.0, 671.0, 941.0, 1561.0, 2246.0, 3301.0, 5314.0, 7887.0, 12489.0, 20105.0, 31472.0, 52158.0, 88877.0, 153873.0, 294876.0, 613988.0, 1289866.0, 807840.0, 353883.0, 187660.0, 104594.0, 59739.0, 36593.0, 22256.0, 14305.0, 9108.0, 5772.0, 3845.0, 2594.0, 1682.0, 1136.0, 758.0, 490.0, 333.0, 226.0, 160.0, 124.0, 74.0, 48.0, 25.0, 19.0, 16.0, 7.0, 8.0, 6.0, 3.0, 0.0, 4.0], "bins": [-9.655952453613281e-05, -9.360164403915405e-05, -9.064376354217529e-05, -8.768588304519653e-05, -8.472800254821777e-05, -8.177012205123901e-05, -7.881224155426025e-05, -7.58543610572815e-05, -7.289648056030273e-05, -6.993860006332397e-05, -6.698071956634521e-05, -6.402283906936646e-05, -6.10649585723877e-05, -5.8107078075408936e-05, -5.5149197578430176e-05, -5.2191317081451416e-05, -4.9233436584472656e-05, -4.6275556087493896e-05, -4.331767559051514e-05, -4.035979509353638e-05, -3.740191459655762e-05, -3.444403409957886e-05, -3.14861536026001e-05, -2.8528273105621338e-05, -2.5570392608642578e-05, -2.261251211166382e-05, -1.965463161468506e-05, -1.66967511177063e-05, -1.3738870620727539e-05, -1.078099012374878e-05, -7.82310962677002e-06, -4.86522912979126e-06, -1.9073486328125e-06, 1.0505318641662598e-06, 4.0084123611450195e-06, 6.966292858123779e-06, 9.924173355102539e-06, 1.2882053852081299e-05, 1.583993434906006e-05, 1.879781484603882e-05, 2.1755695343017578e-05, 2.4713575839996338e-05, 2.7671456336975098e-05, 3.062933683395386e-05, 3.358721733093262e-05, 3.654509782791138e-05, 3.950297832489014e-05, 4.2460858821868896e-05, 4.5418739318847656e-05, 4.8376619815826416e-05, 5.1334500312805176e-05, 5.4292380809783936e-05, 5.7250261306762695e-05, 6.0208141803741455e-05, 6.316602230072021e-05, 6.612390279769897e-05, 6.908178329467773e-05, 7.20396637916565e-05, 7.499754428863525e-05, 7.795542478561401e-05, 8.091330528259277e-05, 8.387118577957153e-05, 8.682906627655029e-05, 8.978694677352905e-05, 9.274482727050781e-05]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 6.0, 7.0, 7.0, 11.0, 14.0, 17.0, 17.0, 19.0, 20.0, 34.0, 36.0, 60.0, 50.0, 71.0, 64.0, 87.0, 104.0, 135.0, 179.0, 177.0, 203.0, 227.0, 250.0, 274.0, 218.0, 242.0, 206.0, 194.0, 168.0, 146.0, 146.0, 108.0, 79.0, 73.0, 77.0, 58.0, 54.0, 32.0, 45.0, 36.0, 23.0, 22.0, 13.0, 8.0, 10.0, 11.0, 6.0, 8.0, 8.0, 3.0, 1.0, 4.0, 2.0, 3.0], "bins": [-3.1113624572753906e-05, -3.019627183675766e-05, -2.9278919100761414e-05, -2.8361566364765167e-05, -2.744421362876892e-05, -2.6526860892772675e-05, -2.5609508156776428e-05, -2.4692155420780182e-05, -2.3774802684783936e-05, -2.285744994878769e-05, -2.1940097212791443e-05, -2.1022744476795197e-05, -2.010539174079895e-05, -1.9188039004802704e-05, -1.8270686268806458e-05, -1.735333353281021e-05, -1.6435980796813965e-05, -1.551862806081772e-05, -1.4601275324821472e-05, -1.3683922588825226e-05, -1.276656985282898e-05, -1.1849217116832733e-05, -1.0931864380836487e-05, -1.001451164484024e-05, -9.097158908843994e-06, -8.179806172847748e-06, -7.2624534368515015e-06, -6.345100700855255e-06, -5.427747964859009e-06, -4.5103952288627625e-06, -3.593042492866516e-06, -2.6756897568702698e-06, -1.7583370208740234e-06, -8.409842848777771e-07, 7.636845111846924e-08, 9.937211871147156e-07, 1.911073923110962e-06, 2.8284266591072083e-06, 3.7457793951034546e-06, 4.663132131099701e-06, 5.580484867095947e-06, 6.497837603092194e-06, 7.41519033908844e-06, 8.332543075084686e-06, 9.249895811080933e-06, 1.0167248547077179e-05, 1.1084601283073425e-05, 1.2001954019069672e-05, 1.2919306755065918e-05, 1.3836659491062164e-05, 1.475401222705841e-05, 1.5671364963054657e-05, 1.6588717699050903e-05, 1.750607043504715e-05, 1.8423423171043396e-05, 1.9340775907039642e-05, 2.025812864303589e-05, 2.1175481379032135e-05, 2.209283411502838e-05, 2.3010186851024628e-05, 2.3927539587020874e-05, 2.484489232301712e-05, 2.5762245059013367e-05, 2.6679597795009613e-05, 2.759695053100586e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 6.0, 1.0, 5.0, 6.0, 6.0, 16.0, 14.0, 24.0, 19.0, 37.0, 36.0, 45.0, 61.0, 75.0, 84.0, 111.0, 91.0, 81.0, 66.0, 48.0, 26.0, 32.0, 21.0, 25.0, 16.0, 15.0, 8.0, 8.0, 4.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00011047763109672815, -0.00010744790779426694, -0.00010441818449180573, -0.00010138846118934453, -9.835873788688332e-05, -9.532901458442211e-05, -9.22992912819609e-05, -8.92695679794997e-05, -8.623984467703849e-05, -8.321012137457728e-05, -8.018039807211608e-05, -7.715067476965487e-05, -7.412095146719366e-05, -7.109122816473246e-05, -6.806150486227125e-05, -6.503178155981004e-05, -6.200205098139122e-05, -5.8972327678930014e-05, -5.594260437646881e-05, -5.29128810740076e-05, -4.9883157771546394e-05, -4.685343446908519e-05, -4.382370752864517e-05, -4.0793984226183966e-05, -3.776426092372276e-05, -3.473453762126155e-05, -3.1704814318800345e-05, -2.8675089197349735e-05, -2.5645365894888528e-05, -2.261564259242732e-05, -1.958591747097671e-05, -1.6556194168515503e-05, -1.3526463590096682e-05, -1.0496740287635475e-05, -7.467016075679567e-06, -4.437291863723658e-06, -1.4075685612624511e-06, 1.6221547411987558e-06, 4.651879862649366e-06, 7.681603165110573e-06, 1.071132646757178e-05, 1.3741049770032987e-05, 1.6770773072494194e-05, 1.9800498193944804e-05, 2.283022149640601e-05, 2.5859944798867218e-05, 2.888966992031783e-05, 3.1919393222779036e-05, 3.494911652524024e-05, 3.797883982770145e-05, 4.1008563130162656e-05, 4.403828643262386e-05, 4.706800973508507e-05, 5.009773303754628e-05, 5.312745997798629e-05, 5.61571832804475e-05, 5.9186906582908705e-05, 6.221663352334872e-05, 6.524635682580993e-05, 6.827608012827113e-05, 7.130580343073234e-05, 7.433552673319355e-05, 7.736525003565475e-05, 8.039497333811596e-05, 8.342469664057717e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 6.0, 8.0, 7.0, 6.0, 10.0, 11.0, 15.0, 20.0, 20.0, 22.0, 21.0, 28.0, 43.0, 21.0, 38.0, 44.0, 34.0, 35.0, 29.0, 50.0, 50.0, 48.0, 40.0, 36.0, 41.0, 35.0, 36.0, 29.0, 24.0, 30.0, 25.0, 13.0, 22.0, 14.0, 18.0, 6.0, 15.0, 15.0, 6.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.92493049427867e-05, -6.719132943544537e-05, -6.513334665214643e-05, -6.30753711448051e-05, -6.1017388361506164e-05, -5.895941285416484e-05, -5.6901433708844706e-05, -5.4843454563524574e-05, -5.278547541820444e-05, -5.072749627288431e-05, -4.866951712756418e-05, -4.6611537982244045e-05, -4.455356247490272e-05, -4.249557969160378e-05, -4.0437604184262455e-05, -3.837962503894232e-05, -3.632164589362219e-05, -3.426366674830206e-05, -3.2205687602981925e-05, -3.0147710276651196e-05, -2.8089731131331064e-05, -2.603175198601093e-05, -2.3973774659680203e-05, -2.191579551436007e-05, -1.9857816369039938e-05, -1.7799837223719805e-05, -1.5741858078399673e-05, -1.3683880752068944e-05, -1.1625901606748812e-05, -9.56792246142868e-06, -7.509944225603249e-06, -5.451965989777818e-06, -3.3939795685000718e-06, -1.3360008779272903e-06, 7.219778126454912e-07, 2.7799565032182727e-06, 4.837935193791054e-06, 6.8959143391111866e-06, 8.953892574936617e-06, 1.1011870810762048e-05, 1.306984995608218e-05, 1.5127829101402313e-05, 1.7185808246722445e-05, 1.9243785573053174e-05, 2.1301764718373306e-05, 2.335974386369344e-05, 2.5417721190024167e-05, 2.74757003353443e-05, 2.9533679480664432e-05, 3.1591658625984564e-05, 3.36496377713047e-05, 3.570761691662483e-05, 3.776559606194496e-05, 3.982357156928629e-05, 4.188155071460642e-05, 4.393952985992655e-05, 4.5997509005246684e-05, 4.8055488150566816e-05, 5.011346729588695e-05, 5.217144644120708e-05, 5.4229421948548406e-05, 5.6287404731847346e-05, 5.834538023918867e-05, 6.0403359384508803e-05, 6.246133852982894e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 12.0, 7.0, 10.0, 22.0, 18.0, 38.0, 49.0, 67.0, 100.0, 150.0, 196.0, 288.0, 384.0, 663.0, 1028.0, 1466.0, 2282.0, 3462.0, 5240.0, 8235.0, 12836.0, 20758.0, 33668.0, 54085.0, 88517.0, 147074.0, 208749.0, 175194.0, 108210.0, 66443.0, 40435.0, 25015.0, 15311.0, 9984.0, 6478.0, 4082.0, 2626.0, 1783.0, 1178.0, 762.0, 515.0, 359.0, 220.0, 164.0, 124.0, 87.0, 56.0, 44.0, 28.0, 21.0, 11.0, 9.0, 5.0, 9.0, 2.0, 0.0, 2.0], "bins": [-0.00010395050048828125, -0.00010086596012115479, -9.778141975402832e-05, -9.469687938690186e-05, -9.161233901977539e-05, -8.852779865264893e-05, -8.544325828552246e-05, -8.2358717918396e-05, -7.927417755126953e-05, -7.618963718414307e-05, -7.31050968170166e-05, -7.002055644989014e-05, -6.693601608276367e-05, -6.385147571563721e-05, -6.076693534851074e-05, -5.768239498138428e-05, -5.459785461425781e-05, -5.151331424713135e-05, -4.842877388000488e-05, -4.534423351287842e-05, -4.225969314575195e-05, -3.917515277862549e-05, -3.6090612411499023e-05, -3.300607204437256e-05, -2.9921531677246094e-05, -2.683699131011963e-05, -2.3752450942993164e-05, -2.06679105758667e-05, -1.7583370208740234e-05, -1.449882984161377e-05, -1.1414289474487305e-05, -8.32974910736084e-06, -5.245208740234375e-06, -2.16066837310791e-06, 9.238719940185547e-07, 4.0084123611450195e-06, 7.092952728271484e-06, 1.017749309539795e-05, 1.3262033462524414e-05, 1.634657382965088e-05, 1.9431114196777344e-05, 2.251565456390381e-05, 2.5600194931030273e-05, 2.8684735298156738e-05, 3.17692756652832e-05, 3.485381603240967e-05, 3.793835639953613e-05, 4.10228967666626e-05, 4.410743713378906e-05, 4.719197750091553e-05, 5.027651786804199e-05, 5.336105823516846e-05, 5.644559860229492e-05, 5.953013896942139e-05, 6.261467933654785e-05, 6.569921970367432e-05, 6.878376007080078e-05, 7.186830043792725e-05, 7.495284080505371e-05, 7.803738117218018e-05, 8.112192153930664e-05, 8.42064619064331e-05, 8.729100227355957e-05, 9.037554264068604e-05, 9.34600830078125e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 9.0, 14.0, 11.0, 11.0, 16.0, 15.0, 26.0, 18.0, 20.0, 15.0, 25.0, 35.0, 29.0, 26.0, 30.0, 41.0, 40.0, 34.0, 36.0, 39.0, 35.0, 33.0, 37.0, 56.0, 22.0, 28.0, 41.0, 21.0, 19.0, 23.0, 27.0, 15.0, 24.0, 17.0, 12.0, 9.0, 12.0, 10.0, 12.0, 9.0, 5.0, 7.0, 1.0, 3.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.364418029785156e-05, -5.2036717534065247e-05, -5.042925477027893e-05, -4.8821792006492615e-05, -4.72143292427063e-05, -4.560686647891998e-05, -4.399940371513367e-05, -4.239194095134735e-05, -4.0784478187561035e-05, -3.917701542377472e-05, -3.75695526599884e-05, -3.596208989620209e-05, -3.435462713241577e-05, -3.2747164368629456e-05, -3.113970160484314e-05, -2.9532238841056824e-05, -2.7924776077270508e-05, -2.6317313313484192e-05, -2.4709850549697876e-05, -2.310238778591156e-05, -2.1494925022125244e-05, -1.9887462258338928e-05, -1.8279999494552612e-05, -1.6672536730766296e-05, -1.506507396697998e-05, -1.3457611203193665e-05, -1.1850148439407349e-05, -1.0242685675621033e-05, -8.635222911834717e-06, -7.027760148048401e-06, -5.420297384262085e-06, -3.812834620475769e-06, -2.205371856689453e-06, -5.979090929031372e-07, 1.0095536708831787e-06, 2.6170164346694946e-06, 4.2244791984558105e-06, 5.8319419622421265e-06, 7.439404726028442e-06, 9.046867489814758e-06, 1.0654330253601074e-05, 1.226179301738739e-05, 1.3869255781173706e-05, 1.5476718544960022e-05, 1.7084181308746338e-05, 1.8691644072532654e-05, 2.029910683631897e-05, 2.1906569600105286e-05, 2.35140323638916e-05, 2.5121495127677917e-05, 2.6728957891464233e-05, 2.833642065525055e-05, 2.9943883419036865e-05, 3.155134618282318e-05, 3.31588089466095e-05, 3.476627171039581e-05, 3.637373447418213e-05, 3.7981197237968445e-05, 3.958866000175476e-05, 4.119612276554108e-05, 4.280358552932739e-05, 4.441104829311371e-05, 4.6018511056900024e-05, 4.762597382068634e-05, 4.9233436584472656e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 7.0, 3.0, 13.0, 11.0, 13.0, 32.0, 30.0, 51.0, 84.0, 155.0, 253.0, 391.0, 624.0, 1070.0, 1986.0, 3498.0, 6685.0, 13549.0, 33817.0, 133602.0, 638637.0, 148077.0, 35970.0, 14525.0, 6936.0, 3652.0, 1981.0, 1149.0, 710.0, 382.0, 237.0, 162.0, 84.0, 54.0, 38.0, 27.0, 22.0, 13.0, 10.0, 9.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019228458404541016, -0.00018577277660369873, -0.0001792609691619873, -0.00017274916172027588, -0.00016623735427856445, -0.00015972554683685303, -0.0001532137393951416, -0.00014670193195343018, -0.00014019012451171875, -0.00013367831707000732, -0.0001271665096282959, -0.00012065470218658447, -0.00011414289474487305, -0.00010763108730316162, -0.0001011192798614502, -9.460747241973877e-05, -8.809566497802734e-05, -8.158385753631592e-05, -7.507205009460449e-05, -6.856024265289307e-05, -6.204843521118164e-05, -5.5536627769470215e-05, -4.902482032775879e-05, -4.251301288604736e-05, -3.600120544433594e-05, -2.9489398002624512e-05, -2.2977590560913086e-05, -1.646578311920166e-05, -9.953975677490234e-06, -3.4421682357788086e-06, 3.069639205932617e-06, 9.581446647644043e-06, 1.609325408935547e-05, 2.2605061531066895e-05, 2.911686897277832e-05, 3.5628676414489746e-05, 4.214048385620117e-05, 4.86522912979126e-05, 5.5164098739624023e-05, 6.167590618133545e-05, 6.818771362304688e-05, 7.46995210647583e-05, 8.121132850646973e-05, 8.772313594818115e-05, 9.423494338989258e-05, 0.000100746750831604, 0.00010725855827331543, 0.00011377036571502686, 0.00012028217315673828, 0.0001267939805984497, 0.00013330578804016113, 0.00013981759548187256, 0.00014632940292358398, 0.0001528412103652954, 0.00015935301780700684, 0.00016586482524871826, 0.0001723766326904297, 0.0001788884401321411, 0.00018540024757385254, 0.00019191205501556396, 0.0001984238624572754, 0.00020493566989898682, 0.00021144747734069824, 0.00021795928478240967, 0.0002244710922241211]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 6.0, 4.0, 10.0, 8.0, 11.0, 13.0, 13.0, 18.0, 22.0, 23.0, 19.0, 25.0, 40.0, 37.0, 41.0, 36.0, 35.0, 45.0, 40.0, 41.0, 59.0, 43.0, 46.0, 40.0, 32.0, 33.0, 41.0, 32.0, 24.0, 27.0, 18.0, 29.0, 11.0, 14.0, 18.0, 7.0, 8.0, 7.0, 3.0, 6.0, 7.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.987550735473633e-05, -3.8702040910720825e-05, -3.752857446670532e-05, -3.635510802268982e-05, -3.5181641578674316e-05, -3.4008175134658813e-05, -3.283470869064331e-05, -3.166124224662781e-05, -3.0487775802612305e-05, -2.9314309358596802e-05, -2.81408429145813e-05, -2.6967376470565796e-05, -2.5793910026550293e-05, -2.462044358253479e-05, -2.3446977138519287e-05, -2.2273510694503784e-05, -2.110004425048828e-05, -1.992657780647278e-05, -1.8753111362457275e-05, -1.7579644918441772e-05, -1.640617847442627e-05, -1.5232712030410767e-05, -1.4059245586395264e-05, -1.288577914237976e-05, -1.1712312698364258e-05, -1.0538846254348755e-05, -9.365379810333252e-06, -8.191913366317749e-06, -7.018446922302246e-06, -5.844980478286743e-06, -4.67151403427124e-06, -3.4980475902557373e-06, -2.3245811462402344e-06, -1.1511147022247314e-06, 2.2351741790771484e-08, 1.1958181858062744e-06, 2.3692846298217773e-06, 3.5427510738372803e-06, 4.716217517852783e-06, 5.889683961868286e-06, 7.063150405883789e-06, 8.236616849899292e-06, 9.410083293914795e-06, 1.0583549737930298e-05, 1.17570161819458e-05, 1.2930482625961304e-05, 1.4103949069976807e-05, 1.527741551399231e-05, 1.6450881958007812e-05, 1.7624348402023315e-05, 1.879781484603882e-05, 1.997128129005432e-05, 2.1144747734069824e-05, 2.2318214178085327e-05, 2.349168062210083e-05, 2.4665147066116333e-05, 2.5838613510131836e-05, 2.701207995414734e-05, 2.8185546398162842e-05, 2.9359012842178345e-05, 3.053247928619385e-05, 3.170594573020935e-05, 3.2879412174224854e-05, 3.4052878618240356e-05, 3.522634506225586e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 4.0, 15.0, 21.0, 37.0, 51.0, 88.0, 121.0, 173.0, 271.0, 402.0, 599.0, 933.0, 1455.0, 2407.0, 4175.0, 7947.0, 17517.0, 48107.0, 244390.0, 594602.0, 77553.0, 24245.0, 10505.0, 5142.0, 2873.0, 1749.0, 1043.0, 715.0, 474.0, 298.0, 216.0, 139.0, 77.0, 53.0, 53.0, 21.0, 19.0, 22.0, 14.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8100948333740234e-05, -4.660617560148239e-05, -4.511140286922455e-05, -4.3616630136966705e-05, -4.212185740470886e-05, -4.062708467245102e-05, -3.9132311940193176e-05, -3.763753920793533e-05, -3.614276647567749e-05, -3.464799374341965e-05, -3.3153221011161804e-05, -3.165844827890396e-05, -3.0163675546646118e-05, -2.8668902814388275e-05, -2.7174130082130432e-05, -2.567935734987259e-05, -2.4184584617614746e-05, -2.2689811885356903e-05, -2.119503915309906e-05, -1.9700266420841217e-05, -1.8205493688583374e-05, -1.671072095632553e-05, -1.5215948224067688e-05, -1.3721175491809845e-05, -1.2226402759552002e-05, -1.0731630027294159e-05, -9.236857295036316e-06, -7.742084562778473e-06, -6.24731183052063e-06, -4.752539098262787e-06, -3.257766366004944e-06, -1.7629936337471008e-06, -2.682209014892578e-07, 1.2265518307685852e-06, 2.7213245630264282e-06, 4.216097295284271e-06, 5.710870027542114e-06, 7.205642759799957e-06, 8.7004154920578e-06, 1.0195188224315643e-05, 1.1689960956573486e-05, 1.318473368883133e-05, 1.4679506421089172e-05, 1.6174279153347015e-05, 1.766905188560486e-05, 1.91638246178627e-05, 2.0658597350120544e-05, 2.2153370082378387e-05, 2.364814281463623e-05, 2.5142915546894073e-05, 2.6637688279151917e-05, 2.813246101140976e-05, 2.9627233743667603e-05, 3.1122006475925446e-05, 3.261677920818329e-05, 3.411155194044113e-05, 3.5606324672698975e-05, 3.710109740495682e-05, 3.859587013721466e-05, 4.0090642869472504e-05, 4.158541560173035e-05, 4.308018833398819e-05, 4.457496106624603e-05, 4.6069733798503876e-05, 4.756450653076172e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 15.0, 8.0, 12.0, 8.0, 10.0, 18.0, 12.0, 25.0, 19.0, 23.0, 94.0, 50.0, 57.0, 60.0, 141.0, 89.0, 58.0, 46.0, 25.0, 48.0, 26.0, 14.0, 17.0, 30.0, 15.0, 9.0, 7.0, 10.0, 11.0, 5.0, 4.0, 0.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.6226043701171875e-06, -2.54996120929718e-06, -2.477318048477173e-06, -2.4046748876571655e-06, -2.332031726837158e-06, -2.259388566017151e-06, -2.1867454051971436e-06, -2.1141022443771362e-06, -2.041459083557129e-06, -1.9688159227371216e-06, -1.8961727619171143e-06, -1.823529601097107e-06, -1.7508864402770996e-06, -1.6782432794570923e-06, -1.605600118637085e-06, -1.5329569578170776e-06, -1.4603137969970703e-06, -1.387670636177063e-06, -1.3150274753570557e-06, -1.2423843145370483e-06, -1.169741153717041e-06, -1.0970979928970337e-06, -1.0244548320770264e-06, -9.51811671257019e-07, -8.791685104370117e-07, -8.065253496170044e-07, -7.338821887969971e-07, -6.612390279769897e-07, -5.885958671569824e-07, -5.159527063369751e-07, -4.4330954551696777e-07, -3.7066638469696045e-07, -2.980232238769531e-07, -2.253800630569458e-07, -1.5273690223693848e-07, -8.009374141693115e-08, -7.450580596923828e-09, 6.51925802230835e-08, 1.3783574104309082e-07, 2.1047890186309814e-07, 2.8312206268310547e-07, 3.557652235031128e-07, 4.284083843231201e-07, 5.010515451431274e-07, 5.736947059631348e-07, 6.463378667831421e-07, 7.189810276031494e-07, 7.916241884231567e-07, 8.642673492431641e-07, 9.369105100631714e-07, 1.0095536708831787e-06, 1.082196831703186e-06, 1.1548399925231934e-06, 1.2274831533432007e-06, 1.300126314163208e-06, 1.3727694749832153e-06, 1.4454126358032227e-06, 1.51805579662323e-06, 1.5906989574432373e-06, 1.6633421182632446e-06, 1.735985279083252e-06, 1.8086284399032593e-06, 1.8812716007232666e-06, 1.953914761543274e-06, 2.0265579223632812e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 7.0, 10.0, 20.0, 18.0, 26.0, 42.0, 49.0, 69.0, 121.0, 164.0, 270.0, 443.0, 767.0, 1328.0, 2468.0, 4667.0, 10858.0, 27850.0, 86573.0, 412678.0, 364394.0, 86615.0, 27684.0, 10988.0, 4864.0, 2368.0, 1205.0, 729.0, 459.0, 288.0, 184.0, 110.0, 70.0, 54.0, 34.0, 22.0, 20.0, 11.0, 8.0, 9.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2067298889160156e-05, -3.1123869121074677e-05, -3.0180439352989197e-05, -2.9237009584903717e-05, -2.8293579816818237e-05, -2.7350150048732758e-05, -2.6406720280647278e-05, -2.5463290512561798e-05, -2.451986074447632e-05, -2.357643097639084e-05, -2.263300120830536e-05, -2.168957144021988e-05, -2.07461416721344e-05, -1.980271190404892e-05, -1.885928213596344e-05, -1.791585236787796e-05, -1.697242259979248e-05, -1.6028992831707e-05, -1.5085563063621521e-05, -1.4142133295536041e-05, -1.3198703527450562e-05, -1.2255273759365082e-05, -1.1311843991279602e-05, -1.0368414223194122e-05, -9.424984455108643e-06, -8.481554687023163e-06, -7.538124918937683e-06, -6.594695150852203e-06, -5.651265382766724e-06, -4.707835614681244e-06, -3.764405846595764e-06, -2.8209760785102844e-06, -1.8775463104248047e-06, -9.34116542339325e-07, 9.313225746154785e-09, 9.527429938316345e-07, 1.8961727619171143e-06, 2.839602530002594e-06, 3.7830322980880737e-06, 4.7264620661735535e-06, 5.669891834259033e-06, 6.613321602344513e-06, 7.556751370429993e-06, 8.500181138515472e-06, 9.443610906600952e-06, 1.0387040674686432e-05, 1.1330470442771912e-05, 1.2273900210857391e-05, 1.3217329978942871e-05, 1.416075974702835e-05, 1.510418951511383e-05, 1.604761928319931e-05, 1.699104905128479e-05, 1.793447881937027e-05, 1.887790858745575e-05, 1.982133835554123e-05, 2.076476812362671e-05, 2.170819789171219e-05, 2.265162765979767e-05, 2.3595057427883148e-05, 2.4538487195968628e-05, 2.5481916964054108e-05, 2.6425346732139587e-05, 2.7368776500225067e-05, 2.8312206268310547e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 4.0, 7.0, 4.0, 8.0, 8.0, 13.0, 7.0, 12.0, 29.0, 31.0, 47.0, 42.0, 56.0, 63.0, 69.0, 77.0, 65.0, 71.0, 73.0, 56.0, 59.0, 49.0, 22.0, 33.0, 21.0, 21.0, 12.0, 10.0, 8.0, 3.0, 2.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.470348358154297e-06, -4.295259714126587e-06, -4.120171070098877e-06, -3.945082426071167e-06, -3.769993782043457e-06, -3.594905138015747e-06, -3.419816493988037e-06, -3.244727849960327e-06, -3.069639205932617e-06, -2.8945505619049072e-06, -2.7194619178771973e-06, -2.5443732738494873e-06, -2.3692846298217773e-06, -2.1941959857940674e-06, -2.0191073417663574e-06, -1.8440186977386475e-06, -1.6689300537109375e-06, -1.4938414096832275e-06, -1.3187527656555176e-06, -1.1436641216278076e-06, -9.685754776000977e-07, -7.934868335723877e-07, -6.183981895446777e-07, -4.4330954551696777e-07, -2.682209014892578e-07, -9.313225746154785e-08, 8.195638656616211e-08, 2.5704503059387207e-07, 4.3213367462158203e-07, 6.07222318649292e-07, 7.82310962677002e-07, 9.57399606704712e-07, 1.1324882507324219e-06, 1.3075768947601318e-06, 1.4826655387878418e-06, 1.6577541828155518e-06, 1.8328428268432617e-06, 2.0079314708709717e-06, 2.1830201148986816e-06, 2.3581087589263916e-06, 2.5331974029541016e-06, 2.7082860469818115e-06, 2.8833746910095215e-06, 3.0584633350372314e-06, 3.2335519790649414e-06, 3.4086406230926514e-06, 3.5837292671203613e-06, 3.7588179111480713e-06, 3.933906555175781e-06, 4.108995199203491e-06, 4.284083843231201e-06, 4.459172487258911e-06, 4.634261131286621e-06, 4.809349775314331e-06, 4.984438419342041e-06, 5.159527063369751e-06, 5.334615707397461e-06, 5.509704351425171e-06, 5.684792995452881e-06, 5.859881639480591e-06, 6.034970283508301e-06, 6.210058927536011e-06, 6.385147571563721e-06, 6.560236215591431e-06, 6.735324859619141e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 4.0, 8.0, 10.0, 25.0, 17.0, 15.0, 28.0, 29.0, 49.0, 55.0, 74.0, 92.0, 105.0, 84.0, 89.0, 53.0, 47.0, 42.0, 32.0, 28.0, 25.0, 11.0, 10.0, 18.0, 7.0, 6.0, 9.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-9.297375800088048e-05, -9.051169763552025e-05, -8.80496299942024e-05, -8.558756962884218e-05, -8.312550198752433e-05, -8.06634416221641e-05, -7.820138125680387e-05, -7.573931361548603e-05, -7.32772532501258e-05, -7.081519288476557e-05, -6.835312524344772e-05, -6.589106487808749e-05, -6.342900451272726e-05, -6.0966936871409416e-05, -5.8504876506049186e-05, -5.604281250271015e-05, -5.358074849937111e-05, -5.1118684496032074e-05, -4.865662049269304e-05, -4.6194560127332807e-05, -4.373249612399377e-05, -4.127043212065473e-05, -3.88083717552945e-05, -3.6346307751955464e-05, -3.388424374861643e-05, -3.142217974527739e-05, -2.8960117560927756e-05, -2.6498055376578122e-05, -2.4035991373239085e-05, -2.1573927369900048e-05, -1.9111865185550414e-05, -1.664980300120078e-05, -1.4187738997861743e-05, -1.1725675904017407e-05, -9.263612810173072e-06, -6.801549716328736e-06, -4.339486622484401e-06, -1.8774235286400653e-06, 5.846395652042702e-07, 3.046701749553904e-06, 5.508765752892941e-06, 7.970828846737277e-06, 1.0432891940581612e-05, 1.2894955034425948e-05, 1.5357018128270283e-05, 1.781908213160932e-05, 2.0281144315958954e-05, 2.2743206500308588e-05, 2.5205270503647625e-05, 2.7667334506986663e-05, 3.0129396691336296e-05, 3.259145887568593e-05, 3.505352287902497e-05, 3.7515586882364005e-05, 3.9977647247724235e-05, 4.243971125106327e-05, 4.490177525440231e-05, 4.736383925774135e-05, 4.9825903261080384e-05, 5.2287963626440614e-05, 5.475002762977965e-05, 5.721209163311869e-05, 5.967415199847892e-05, 6.213621236383915e-05, 6.4598280005157e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 0.0, 5.0, 9.0, 6.0, 5.0, 9.0, 12.0, 16.0, 14.0, 14.0, 20.0, 27.0, 17.0, 32.0, 32.0, 33.0, 31.0, 50.0, 29.0, 35.0, 39.0, 41.0, 58.0, 44.0, 33.0, 46.0, 36.0, 38.0, 30.0, 31.0, 28.0, 27.0, 21.0, 13.0, 23.0, 19.0, 16.0, 9.0, 12.0, 11.0, 8.0, 5.0, 9.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-5.965093441773206e-05, -5.791201692773029e-05, -5.6173099437728524e-05, -5.4434181947726756e-05, -5.269526081974618e-05, -5.0956343329744413e-05, -4.9217425839742646e-05, -4.747850834974088e-05, -4.573959085973911e-05, -4.400067336973734e-05, -4.2261755879735574e-05, -4.0522834751755e-05, -3.878391726175323e-05, -3.7044999771751463e-05, -3.5306082281749696e-05, -3.356716479174793e-05, -3.182824730174616e-05, -3.0089329811744392e-05, -2.835041050275322e-05, -2.6611493012751453e-05, -2.4872575522749685e-05, -2.3133656213758513e-05, -2.1394738723756745e-05, -1.9655821233754978e-05, -1.7916900105774403e-05, -1.6177982615772635e-05, -1.4439064216276165e-05, -1.2700145816779695e-05, -1.0961228326777928e-05, -9.222309927281458e-06, -7.483391527784988e-06, -5.74447403778322e-06, -4.0055565477814525e-06, -2.2666386030323338e-06, -5.277204309095396e-07, 1.2111977412132546e-06, 2.9501156859623734e-06, 4.689033630711492e-06, 6.427952030207962e-06, 8.16686952020973e-06, 9.9057879197062e-06, 1.1644706319202669e-05, 1.3383623809204437e-05, 1.5122542208700906e-05, 1.6861460608197376e-05, 1.8600378098199144e-05, 2.0339295588200912e-05, 2.207821307820268e-05, 2.381713238719385e-05, 2.555604987719562e-05, 2.729496918618679e-05, 2.903388667618856e-05, 3.0772804166190326e-05, 3.2511721656192094e-05, 3.425063914619386e-05, 3.598955663619563e-05, 3.7728477764176205e-05, 3.946739525417797e-05, 4.120631274417974e-05, 4.2945233872160316e-05, 4.468415136216208e-05, 4.642306885216385e-05, 4.816198634216562e-05, 4.990090383216739e-05, 5.1639821322169155e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 3.0, 9.0, 5.0, 14.0, 12.0, 21.0, 36.0, 54.0, 78.0, 127.0, 187.0, 274.0, 426.0, 722.0, 1115.0, 1792.0, 3041.0, 4988.0, 8322.0, 14610.0, 24507.0, 45748.0, 87927.0, 181081.0, 277023.0, 191041.0, 93442.0, 48833.0, 25953.0, 15047.0, 8711.0, 5179.0, 3110.0, 1914.0, 1169.0, 733.0, 433.0, 315.0, 176.0, 117.0, 85.0, 46.0, 43.0, 28.0, 20.0, 14.0, 13.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001099705696105957, -0.00010648369789123535, -0.000102996826171875, -9.950995445251465e-05, -9.60230827331543e-05, -9.253621101379395e-05, -8.90493392944336e-05, -8.556246757507324e-05, -8.207559585571289e-05, -7.858872413635254e-05, -7.510185241699219e-05, -7.161498069763184e-05, -6.812810897827148e-05, -6.464123725891113e-05, -6.115436553955078e-05, -5.766749382019043e-05, -5.418062210083008e-05, -5.0693750381469727e-05, -4.7206878662109375e-05, -4.3720006942749023e-05, -4.023313522338867e-05, -3.674626350402832e-05, -3.325939178466797e-05, -2.9772520065307617e-05, -2.6285648345947266e-05, -2.2798776626586914e-05, -1.9311904907226562e-05, -1.582503318786621e-05, -1.233816146850586e-05, -8.851289749145508e-06, -5.364418029785156e-06, -1.8775463104248047e-06, 1.6093254089355469e-06, 5.0961971282958984e-06, 8.58306884765625e-06, 1.2069940567016602e-05, 1.5556812286376953e-05, 1.9043684005737305e-05, 2.2530555725097656e-05, 2.6017427444458008e-05, 2.950429916381836e-05, 3.299117088317871e-05, 3.647804260253906e-05, 3.9964914321899414e-05, 4.3451786041259766e-05, 4.693865776062012e-05, 5.042552947998047e-05, 5.391240119934082e-05, 5.739927291870117e-05, 6.0886144638061523e-05, 6.437301635742188e-05, 6.785988807678223e-05, 7.134675979614258e-05, 7.483363151550293e-05, 7.832050323486328e-05, 8.180737495422363e-05, 8.529424667358398e-05, 8.878111839294434e-05, 9.226799011230469e-05, 9.575486183166504e-05, 9.924173355102539e-05, 0.00010272860527038574, 0.0001062154769897461, 0.00010970234870910645, 0.0001131892204284668]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 10.0, 3.0, 7.0, 8.0, 12.0, 14.0, 17.0, 15.0, 21.0, 22.0, 36.0, 34.0, 34.0, 45.0, 32.0, 33.0, 46.0, 44.0, 41.0, 51.0, 47.0, 37.0, 45.0, 35.0, 45.0, 39.0, 33.0, 31.0, 16.0, 20.0, 18.0, 25.0, 16.0, 14.0, 10.0, 8.0, 12.0, 9.0, 2.0, 5.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.46574592590332e-05, -5.302019417285919e-05, -5.138292908668518e-05, -4.974566400051117e-05, -4.810839891433716e-05, -4.647113382816315e-05, -4.4833868741989136e-05, -4.3196603655815125e-05, -4.155933856964111e-05, -3.99220734834671e-05, -3.828480839729309e-05, -3.664754331111908e-05, -3.501027822494507e-05, -3.337301313877106e-05, -3.1735748052597046e-05, -3.0098482966423035e-05, -2.8461217880249023e-05, -2.6823952794075012e-05, -2.5186687707901e-05, -2.354942262172699e-05, -2.191215753555298e-05, -2.0274892449378967e-05, -1.8637627363204956e-05, -1.7000362277030945e-05, -1.5363097190856934e-05, -1.3725832104682922e-05, -1.2088567018508911e-05, -1.04513019323349e-05, -8.814036846160889e-06, -7.1767717599868774e-06, -5.539506673812866e-06, -3.902241587638855e-06, -2.2649765014648438e-06, -6.277114152908325e-07, 1.0095536708831787e-06, 2.64681875705719e-06, 4.284083843231201e-06, 5.921348929405212e-06, 7.558614015579224e-06, 9.195879101753235e-06, 1.0833144187927246e-05, 1.2470409274101257e-05, 1.4107674360275269e-05, 1.574493944644928e-05, 1.738220453262329e-05, 1.9019469618797302e-05, 2.0656734704971313e-05, 2.2293999791145325e-05, 2.3931264877319336e-05, 2.5568529963493347e-05, 2.720579504966736e-05, 2.884306013584137e-05, 3.048032522201538e-05, 3.211759030818939e-05, 3.37548553943634e-05, 3.5392120480537415e-05, 3.7029385566711426e-05, 3.866665065288544e-05, 4.030391573905945e-05, 4.194118082523346e-05, 4.357844591140747e-05, 4.521571099758148e-05, 4.685297608375549e-05, 4.8490241169929504e-05, 5.0127506256103516e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 4.0, 10.0, 9.0, 10.0, 15.0, 30.0, 43.0, 72.0, 102.0, 140.0, 237.0, 310.0, 541.0, 765.0, 1091.0, 1704.0, 2643.0, 3897.0, 6134.0, 9281.0, 14347.0, 22249.0, 37046.0, 59850.0, 106360.0, 182853.0, 235029.0, 149170.0, 82442.0, 49410.0, 29272.0, 18682.0, 11984.0, 7793.0, 5071.0, 3326.0, 2164.0, 1509.0, 1008.0, 700.0, 422.0, 271.0, 195.0, 142.0, 68.0, 59.0, 39.0, 20.0, 15.0, 15.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.863210678100586e-05, -8.579995483160019e-05, -8.296780288219452e-05, -8.013565093278885e-05, -7.730349898338318e-05, -7.447134703397751e-05, -7.163919508457184e-05, -6.880704313516617e-05, -6.59748911857605e-05, -6.314273923635483e-05, -6.031058728694916e-05, -5.747843533754349e-05, -5.464628338813782e-05, -5.181413143873215e-05, -4.898197948932648e-05, -4.614982753992081e-05, -4.331767559051514e-05, -4.0485523641109467e-05, -3.7653371691703796e-05, -3.4821219742298126e-05, -3.1989067792892456e-05, -2.9156915843486786e-05, -2.6324763894081116e-05, -2.3492611944675446e-05, -2.0660459995269775e-05, -1.7828308045864105e-05, -1.4996156096458435e-05, -1.2164004147052765e-05, -9.331852197647095e-06, -6.4997002482414246e-06, -3.6675482988357544e-06, -8.353963494300842e-07, 1.996755599975586e-06, 4.828907549381256e-06, 7.661059498786926e-06, 1.0493211448192596e-05, 1.3325363397598267e-05, 1.6157515347003937e-05, 1.8989667296409607e-05, 2.1821819245815277e-05, 2.4653971195220947e-05, 2.7486123144626617e-05, 3.0318275094032288e-05, 3.315042704343796e-05, 3.598257899284363e-05, 3.88147309422493e-05, 4.164688289165497e-05, 4.447903484106064e-05, 4.731118679046631e-05, 5.014333873987198e-05, 5.297549068927765e-05, 5.580764263868332e-05, 5.863979458808899e-05, 6.147194653749466e-05, 6.430409848690033e-05, 6.7136250436306e-05, 6.996840238571167e-05, 7.280055433511734e-05, 7.563270628452301e-05, 7.846485823392868e-05, 8.129701018333435e-05, 8.412916213274002e-05, 8.696131408214569e-05, 8.979346603155136e-05, 9.262561798095703e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 7.0, 3.0, 2.0, 6.0, 7.0, 4.0, 5.0, 12.0, 12.0, 12.0, 13.0, 18.0, 27.0, 32.0, 20.0, 19.0, 32.0, 43.0, 43.0, 30.0, 35.0, 39.0, 52.0, 40.0, 37.0, 32.0, 44.0, 40.0, 43.0, 33.0, 30.0, 33.0, 35.0, 25.0, 26.0, 11.0, 22.0, 22.0, 13.0, 16.0, 7.0, 5.0, 5.0, 6.0, 7.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.2842159271240234e-05, -3.184843808412552e-05, -3.08547168970108e-05, -2.9860995709896088e-05, -2.8867274522781372e-05, -2.7873553335666656e-05, -2.687983214855194e-05, -2.5886110961437225e-05, -2.489238977432251e-05, -2.3898668587207794e-05, -2.290494740009308e-05, -2.1911226212978363e-05, -2.0917505025863647e-05, -1.9923783838748932e-05, -1.8930062651634216e-05, -1.79363414645195e-05, -1.6942620277404785e-05, -1.594889909029007e-05, -1.4955177903175354e-05, -1.3961456716060638e-05, -1.2967735528945923e-05, -1.1974014341831207e-05, -1.0980293154716492e-05, -9.986571967601776e-06, -8.99285078048706e-06, -7.999129593372345e-06, -7.005408406257629e-06, -6.011687219142914e-06, -5.017966032028198e-06, -4.024244844913483e-06, -3.030523657798767e-06, -2.0368024706840515e-06, -1.043081283569336e-06, -4.936009645462036e-08, 9.443610906600952e-07, 1.938082277774811e-06, 2.9318034648895264e-06, 3.925524652004242e-06, 4.9192458391189575e-06, 5.912967026233673e-06, 6.906688213348389e-06, 7.900409400463104e-06, 8.89413058757782e-06, 9.887851774692535e-06, 1.0881572961807251e-05, 1.1875294148921967e-05, 1.2869015336036682e-05, 1.3862736523151398e-05, 1.4856457710266113e-05, 1.585017889738083e-05, 1.6843900084495544e-05, 1.783762127161026e-05, 1.8831342458724976e-05, 1.982506364583969e-05, 2.0818784832954407e-05, 2.1812506020069122e-05, 2.2806227207183838e-05, 2.3799948394298553e-05, 2.479366958141327e-05, 2.5787390768527985e-05, 2.67811119556427e-05, 2.7774833142757416e-05, 2.876855432987213e-05, 2.9762275516986847e-05, 3.075599670410156e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 13.0, 6.0, 32.0, 23.0, 38.0, 46.0, 70.0, 115.0, 156.0, 225.0, 354.0, 506.0, 852.0, 1288.0, 2085.0, 3055.0, 4721.0, 8105.0, 13746.0, 24863.0, 48599.0, 711188.0, 134144.0, 42081.0, 21303.0, 11486.0, 7130.0, 4346.0, 2857.0, 1774.0, 1117.0, 774.0, 472.0, 318.0, 192.0, 141.0, 99.0, 73.0, 49.0, 23.0, 31.0, 16.0, 15.0, 5.0, 10.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.464387893676758e-05, -4.328601062297821e-05, -4.192814230918884e-05, -4.0570273995399475e-05, -3.921240568161011e-05, -3.785453736782074e-05, -3.649666905403137e-05, -3.5138800740242004e-05, -3.378093242645264e-05, -3.242306411266327e-05, -3.10651957988739e-05, -2.9707327485084534e-05, -2.8349459171295166e-05, -2.69915908575058e-05, -2.563372254371643e-05, -2.4275854229927063e-05, -2.2917985916137695e-05, -2.1560117602348328e-05, -2.020224928855896e-05, -1.8844380974769592e-05, -1.7486512660980225e-05, -1.6128644347190857e-05, -1.477077603340149e-05, -1.3412907719612122e-05, -1.2055039405822754e-05, -1.0697171092033386e-05, -9.339302778244019e-06, -7.981434464454651e-06, -6.623566150665283e-06, -5.2656978368759155e-06, -3.907829523086548e-06, -2.54996120929718e-06, -1.1920928955078125e-06, 1.6577541828155518e-07, 1.5236437320709229e-06, 2.8815120458602905e-06, 4.239380359649658e-06, 5.597248673439026e-06, 6.9551169872283936e-06, 8.312985301017761e-06, 9.670853614807129e-06, 1.1028721928596497e-05, 1.2386590242385864e-05, 1.3744458556175232e-05, 1.51023268699646e-05, 1.6460195183753967e-05, 1.7818063497543335e-05, 1.9175931811332703e-05, 2.053380012512207e-05, 2.1891668438911438e-05, 2.3249536752700806e-05, 2.4607405066490173e-05, 2.596527338027954e-05, 2.732314169406891e-05, 2.8681010007858276e-05, 3.0038878321647644e-05, 3.139674663543701e-05, 3.275461494922638e-05, 3.411248326301575e-05, 3.5470351576805115e-05, 3.682821989059448e-05, 3.818608820438385e-05, 3.954395651817322e-05, 4.0901824831962585e-05, 4.225969314575195e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 0.0, 0.0, 9.0, 0.0, 7.0, 0.0, 0.0, 22.0, 0.0, 0.0, 25.0, 0.0, 23.0, 0.0, 0.0, 73.0, 0.0, 92.0, 0.0, 0.0, 485.0, 0.0, 101.0, 0.0, 0.0, 69.0, 0.0, 43.0, 0.0, 0.0, 31.0, 0.0, 0.0, 14.0, 0.0, 7.0, 0.0, 0.0, 6.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.515773177146912e-07, -7.282942533493042e-07, -7.050111889839172e-07, -6.817281246185303e-07, -6.584450602531433e-07, -6.351619958877563e-07, -6.118789315223694e-07, -5.885958671569824e-07, -5.653128027915955e-07, -5.420297384262085e-07, -5.187466740608215e-07, -4.954636096954346e-07, -4.721805453300476e-07, -4.4889748096466064e-07, -4.256144165992737e-07, -4.023313522338867e-07, -3.7904828786849976e-07, -3.557652235031128e-07, -3.3248215913772583e-07, -3.0919909477233887e-07, -2.859160304069519e-07, -2.6263296604156494e-07, -2.39349901676178e-07, -2.1606683731079102e-07, -1.9278377294540405e-07, -1.695007085800171e-07, -1.4621764421463013e-07, -1.2293457984924316e-07, -9.96515154838562e-08, -7.636845111846924e-08, -5.3085386753082275e-08, -2.9802322387695312e-08, -6.51925802230835e-09, 1.6763806343078613e-08, 4.0046870708465576e-08, 6.332993507385254e-08, 8.66129994392395e-08, 1.0989606380462646e-07, 1.3317912817001343e-07, 1.564621925354004e-07, 1.7974525690078735e-07, 2.0302832126617432e-07, 2.2631138563156128e-07, 2.4959444999694824e-07, 2.728775143623352e-07, 2.9616057872772217e-07, 3.1944364309310913e-07, 3.427267074584961e-07, 3.6600977182388306e-07, 3.8929283618927e-07, 4.12575900554657e-07, 4.3585896492004395e-07, 4.591420292854309e-07, 4.824250936508179e-07, 5.057081580162048e-07, 5.289912223815918e-07, 5.522742867469788e-07, 5.755573511123657e-07, 5.988404154777527e-07, 6.221234798431396e-07, 6.454065442085266e-07, 6.686896085739136e-07, 6.919726729393005e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 10.0, 8.0, 10.0, 18.0, 27.0, 42.0, 51.0, 63.0, 98.0, 135.0, 180.0, 320.0, 440.0, 650.0, 1000.0, 1440.0, 2268.0, 3511.0, 5626.0, 9367.0, 14119.0, 25005.0, 40645.0, 102077.0, 717289.0, 49802.0, 28595.0, 17105.0, 10552.0, 6228.0, 4089.0, 2712.0, 1698.0, 1083.0, 676.0, 507.0, 348.0, 223.0, 163.0, 109.0, 79.0, 45.0, 46.0, 33.0, 16.0, 15.0, 10.0, 8.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.060434341430664e-05, -4.903040826320648e-05, -4.745647311210632e-05, -4.5882537961006165e-05, -4.4308602809906006e-05, -4.273466765880585e-05, -4.116073250770569e-05, -3.958679735660553e-05, -3.801286220550537e-05, -3.643892705440521e-05, -3.4864991903305054e-05, -3.3291056752204895e-05, -3.1717121601104736e-05, -3.0143186450004578e-05, -2.856925129890442e-05, -2.699531614780426e-05, -2.54213809967041e-05, -2.3847445845603943e-05, -2.2273510694503784e-05, -2.0699575543403625e-05, -1.9125640392303467e-05, -1.7551705241203308e-05, -1.597777009010315e-05, -1.440383493900299e-05, -1.2829899787902832e-05, -1.1255964636802673e-05, -9.682029485702515e-06, -8.108094334602356e-06, -6.534159183502197e-06, -4.9602240324020386e-06, -3.38628888130188e-06, -1.8123537302017212e-06, -2.384185791015625e-07, 1.3355165719985962e-06, 2.909451723098755e-06, 4.4833868741989136e-06, 6.057322025299072e-06, 7.631257176399231e-06, 9.20519232749939e-06, 1.0779127478599548e-05, 1.2353062629699707e-05, 1.3926997780799866e-05, 1.5500932931900024e-05, 1.7074868083000183e-05, 1.8648803234100342e-05, 2.02227383852005e-05, 2.179667353630066e-05, 2.3370608687400818e-05, 2.4944543838500977e-05, 2.6518478989601135e-05, 2.8092414140701294e-05, 2.9666349291801453e-05, 3.124028444290161e-05, 3.281421959400177e-05, 3.438815474510193e-05, 3.596208989620209e-05, 3.7536025047302246e-05, 3.9109960198402405e-05, 4.0683895349502563e-05, 4.225783050060272e-05, 4.383176565170288e-05, 4.540570080280304e-05, 4.69796359539032e-05, 4.855357110500336e-05, 5.0127506256103516e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 7.0, 5.0, 5.0, 7.0, 13.0, 12.0, 21.0, 14.0, 11.0, 11.0, 21.0, 17.0, 29.0, 501.0, 119.0, 20.0, 25.0, 15.0, 22.0, 20.0, 15.0, 11.0, 13.0, 13.0, 11.0, 7.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5914440155029297e-05, -1.54152512550354e-05, -1.4916062355041504e-05, -1.4416873455047607e-05, -1.3917684555053711e-05, -1.3418495655059814e-05, -1.2919306755065918e-05, -1.2420117855072021e-05, -1.1920928955078125e-05, -1.1421740055084229e-05, -1.0922551155090332e-05, -1.0423362255096436e-05, -9.924173355102539e-06, -9.424984455108643e-06, -8.925795555114746e-06, -8.42660665512085e-06, -7.927417755126953e-06, -7.428228855133057e-06, -6.92903995513916e-06, -6.429851055145264e-06, -5.930662155151367e-06, -5.431473255157471e-06, -4.932284355163574e-06, -4.433095455169678e-06, -3.933906555175781e-06, -3.4347176551818848e-06, -2.9355287551879883e-06, -2.436339855194092e-06, -1.9371509552001953e-06, -1.4379620552062988e-06, -9.387731552124023e-07, -4.3958425521850586e-07, 5.960464477539063e-08, 5.587935447692871e-07, 1.0579824447631836e-06, 1.55717134475708e-06, 2.0563602447509766e-06, 2.555549144744873e-06, 3.0547380447387695e-06, 3.553926944732666e-06, 4.0531158447265625e-06, 4.552304744720459e-06, 5.0514936447143555e-06, 5.550682544708252e-06, 6.0498714447021484e-06, 6.549060344696045e-06, 7.048249244689941e-06, 7.547438144683838e-06, 8.046627044677734e-06, 8.545815944671631e-06, 9.045004844665527e-06, 9.544193744659424e-06, 1.004338264465332e-05, 1.0542571544647217e-05, 1.1041760444641113e-05, 1.154094934463501e-05, 1.2040138244628906e-05, 1.2539327144622803e-05, 1.30385160446167e-05, 1.3537704944610596e-05, 1.4036893844604492e-05, 1.4536082744598389e-05, 1.5035271644592285e-05, 1.553446054458618e-05, 1.6033649444580078e-05]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 3.0, 8.0, 7.0, 9.0, 15.0, 10.0, 12.0, 34.0, 19.0, 45.0, 39.0, 51.0, 70.0, 93.0, 96.0, 103.0, 81.0, 62.0, 49.0, 34.0, 28.0, 24.0, 24.0, 11.0, 17.0, 8.0, 8.0, 3.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.371454557869583e-05, -7.13950939825736e-05, -6.907564238645136e-05, -6.675619079032913e-05, -6.44367391942069e-05, -6.211728032212704e-05, -5.979782872600481e-05, -5.7478377129882574e-05, -5.515892553376034e-05, -5.2839473937638104e-05, -5.052002234151587e-05, -4.820056710741483e-05, -4.588111551129259e-05, -4.356166391517036e-05, -4.1242208681069314e-05, -3.892275708494708e-05, -3.6603305488824844e-05, -3.428385389270261e-05, -3.1964402296580374e-05, -2.9644947062479332e-05, -2.7325495466357097e-05, -2.5006043870234862e-05, -2.2686590455123223e-05, -2.0367137040011585e-05, -1.804768544388935e-05, -1.5728233847767115e-05, -1.3408780432655476e-05, -1.108932792703854e-05, -8.769875421421602e-06, -6.4504229158046655e-06, -4.130970410187729e-06, -1.81151699507609e-06, 5.079418770037591e-07, 2.827394382620696e-06, 5.146846888237633e-06, 7.46629939385457e-06, 9.785751899471506e-06, 1.2105204405088443e-05, 1.442465691070538e-05, 1.674411032581702e-05, 1.9063561921939254e-05, 2.138301351806149e-05, 2.3702466933173127e-05, 2.6021920348284766e-05, 2.8341371944407e-05, 3.0660823540529236e-05, 3.298027877463028e-05, 3.5299730370752513e-05, 3.761918196687475e-05, 3.9938633562996984e-05, 4.225808515911922e-05, 4.457754039322026e-05, 4.6896991989342496e-05, 4.921644358546473e-05, 5.153589881956577e-05, 5.385535041568801e-05, 5.617480201181024e-05, 5.849425360793248e-05, 6.081370520405471e-05, 6.313315680017695e-05, 6.545260839629918e-05, 6.777206726837903e-05, 7.009151886450127e-05, 7.24109704606235e-05, 7.473042205674574e-05]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 6.0, 2.0, 7.0, 6.0, 11.0, 13.0, 23.0, 21.0, 19.0, 33.0, 35.0, 30.0, 36.0, 23.0, 38.0, 42.0, 50.0, 37.0, 43.0, 42.0, 39.0, 38.0, 36.0, 38.0, 43.0, 34.0, 42.0, 39.0, 29.0, 22.0, 18.0, 22.0, 14.0, 13.0, 12.0, 9.0, 6.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.786535646417178e-05, -4.6159148041624576e-05, -4.445293961907737e-05, -4.274673119653016e-05, -4.104052277398296e-05, -3.933431435143575e-05, -3.762810956686735e-05, -3.592189750634134e-05, -3.421569272177294e-05, -3.250948429922573e-05, -3.0803275876678526e-05, -2.909706745413132e-05, -2.7390859031584114e-05, -2.5684650609036908e-05, -2.3978444005479105e-05, -2.22722355829319e-05, -2.056602534139529e-05, -1.8859816918848082e-05, -1.7153608496300876e-05, -1.544740007375367e-05, -1.3741192560701165e-05, -1.2034984138153959e-05, -1.0328776625101455e-05, -8.622568202554248e-06, -6.916359780007042e-06, -5.210151357459836e-06, -3.5039433896599803e-06, -1.797735421860125e-06, -9.152699931291863e-08, 1.6146814232342876e-06, 3.320888936286792e-06, 5.0270973588339984e-06, 6.733302143402398e-06, 8.439510565949604e-06, 1.014571898849681e-05, 1.1851926501549315e-05, 1.3558134924096521e-05, 1.526434425613843e-05, 1.6970550859696232e-05, 1.8676759282243438e-05, 2.0382967704790644e-05, 2.208917612733785e-05, 2.3795384549885057e-05, 2.550159115344286e-05, 2.7207799575990066e-05, 2.8914007998537272e-05, 3.062021642108448e-05, 3.2326424843631685e-05, 3.403263326617889e-05, 3.57388416887261e-05, 3.7445050111273304e-05, 3.915125853382051e-05, 4.0857466956367716e-05, 4.256367537891492e-05, 4.426988016348332e-05, 4.5976092224009335e-05, 4.7682297008577734e-05, 4.938850543112494e-05, 5.109471385367215e-05, 5.280092227621935e-05, 5.450713069876656e-05, 5.6213339121313766e-05, 5.791954754386097e-05, 5.962575232842937e-05, 6.133196438895538e-05]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 9.0, 24.0, 18.0, 41.0, 51.0, 68.0, 81.0, 97.0, 158.0, 204.0, 261.0, 362.0, 529.0, 716.0, 922.0, 1235.0, 1695.0, 2557.0, 3385.0, 4839.0, 7377.0, 10520.0, 15529.0, 24669.0, 37985.0, 61462.0, 105845.0, 207905.0, 467538.0, 1224320.0, 1150603.0, 415739.0, 188022.0, 99411.0, 58874.0, 34422.0, 21937.0, 14667.0, 9325.0, 6327.0, 4373.0, 2979.0, 1992.0, 1501.0, 1051.0, 720.0, 580.0, 412.0, 250.0, 219.0, 165.0, 90.0, 82.0, 50.0, 42.0, 20.0, 14.0, 15.0, 3.0, 5.0, 2.0], "bins": [-5.751848220825195e-05, -5.577225238084793e-05, -5.402602255344391e-05, -5.2279792726039886e-05, -5.0533562898635864e-05, -4.878733307123184e-05, -4.704110324382782e-05, -4.52948734164238e-05, -4.3548643589019775e-05, -4.180241376161575e-05, -4.005618393421173e-05, -3.830995410680771e-05, -3.6563724279403687e-05, -3.4817494451999664e-05, -3.307126462459564e-05, -3.132503479719162e-05, -2.9578804969787598e-05, -2.7832575142383575e-05, -2.6086345314979553e-05, -2.434011548757553e-05, -2.259388566017151e-05, -2.0847655832767487e-05, -1.9101426005363464e-05, -1.7355196177959442e-05, -1.560896635055542e-05, -1.3862736523151398e-05, -1.2116506695747375e-05, -1.0370276868343353e-05, -8.624047040939331e-06, -6.877817213535309e-06, -5.131587386131287e-06, -3.3853575587272644e-06, -1.6391277313232422e-06, 1.0710209608078003e-07, 1.8533319234848022e-06, 3.5995617508888245e-06, 5.345791578292847e-06, 7.092021405696869e-06, 8.838251233100891e-06, 1.0584481060504913e-05, 1.2330710887908936e-05, 1.4076940715312958e-05, 1.582317054271698e-05, 1.7569400370121002e-05, 1.9315630197525024e-05, 2.1061860024929047e-05, 2.280808985233307e-05, 2.455431967973709e-05, 2.6300549507141113e-05, 2.8046779334545135e-05, 2.9793009161949158e-05, 3.153923898935318e-05, 3.32854688167572e-05, 3.5031698644161224e-05, 3.6777928471565247e-05, 3.852415829896927e-05, 4.027038812637329e-05, 4.201661795377731e-05, 4.3762847781181335e-05, 4.550907760858536e-05, 4.725530743598938e-05, 4.90015372633934e-05, 5.0747767090797424e-05, 5.2493996918201447e-05, 5.424022674560547e-05]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 2.0, 7.0, 8.0, 4.0, 3.0, 9.0, 7.0, 7.0, 13.0, 16.0, 14.0, 24.0, 28.0, 28.0, 26.0, 29.0, 29.0, 26.0, 38.0, 31.0, 45.0, 45.0, 22.0, 36.0, 38.0, 34.0, 41.0, 29.0, 35.0, 44.0, 30.0, 29.0, 30.0, 29.0, 21.0, 23.0, 20.0, 18.0, 9.0, 16.0, 12.0, 3.0, 10.0, 9.0, 9.0, 5.0, 0.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.8073787689208984e-05, -2.7192756533622742e-05, -2.63117253780365e-05, -2.5430694222450256e-05, -2.4549663066864014e-05, -2.366863191127777e-05, -2.278760075569153e-05, -2.1906569600105286e-05, -2.1025538444519043e-05, -2.01445072889328e-05, -1.9263476133346558e-05, -1.8382444977760315e-05, -1.7501413822174072e-05, -1.662038266658783e-05, -1.5739351511001587e-05, -1.4858320355415344e-05, -1.3977289199829102e-05, -1.3096258044242859e-05, -1.2215226888656616e-05, -1.1334195733070374e-05, -1.0453164577484131e-05, -9.572133421897888e-06, -8.691102266311646e-06, -7.810071110725403e-06, -6.92903995513916e-06, -6.0480087995529175e-06, -5.166977643966675e-06, -4.285946488380432e-06, -3.4049153327941895e-06, -2.5238841772079468e-06, -1.642853021621704e-06, -7.618218660354614e-07, 1.1920928955078125e-07, 1.000240445137024e-06, 1.8812716007232666e-06, 2.7623027563095093e-06, 3.643333911895752e-06, 4.524365067481995e-06, 5.405396223068237e-06, 6.28642737865448e-06, 7.167458534240723e-06, 8.048489689826965e-06, 8.929520845413208e-06, 9.81055200099945e-06, 1.0691583156585693e-05, 1.1572614312171936e-05, 1.2453645467758179e-05, 1.3334676623344421e-05, 1.4215707778930664e-05, 1.5096738934516907e-05, 1.597777009010315e-05, 1.6858801245689392e-05, 1.7739832401275635e-05, 1.8620863556861877e-05, 1.950189471244812e-05, 2.0382925868034363e-05, 2.1263957023620605e-05, 2.2144988179206848e-05, 2.302601933479309e-05, 2.3907050490379333e-05, 2.4788081645965576e-05, 2.566911280155182e-05, 2.655014395713806e-05, 2.7431175112724304e-05, 2.8312206268310547e-05]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 3.0, 11.0, 17.0, 21.0, 36.0, 50.0, 68.0, 108.0, 189.0, 275.0, 421.0, 730.0, 1099.0, 1604.0, 2620.0, 4056.0, 6557.0, 10616.0, 17910.0, 29770.0, 48684.0, 89235.0, 164465.0, 334428.0, 800351.0, 1402656.0, 657052.0, 279523.0, 147266.0, 80268.0, 45636.0, 26638.0, 15846.0, 9657.0, 5971.0, 3821.0, 2405.0, 1498.0, 958.0, 621.0, 394.0, 261.0, 178.0, 104.0, 66.0, 61.0, 31.0, 18.0, 11.0, 12.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.745887756347656e-05, -5.5738724768161774e-05, -5.4018571972846985e-05, -5.2298419177532196e-05, -5.057826638221741e-05, -4.885811358690262e-05, -4.713796079158783e-05, -4.541780799627304e-05, -4.369765520095825e-05, -4.197750240564346e-05, -4.0257349610328674e-05, -3.8537196815013885e-05, -3.68170440196991e-05, -3.509689122438431e-05, -3.337673842906952e-05, -3.165658563375473e-05, -2.993643283843994e-05, -2.8216280043125153e-05, -2.6496127247810364e-05, -2.4775974452495575e-05, -2.3055821657180786e-05, -2.1335668861865997e-05, -1.961551606655121e-05, -1.789536327123642e-05, -1.617521047592163e-05, -1.4455057680606842e-05, -1.2734904885292053e-05, -1.1014752089977264e-05, -9.294599294662476e-06, -7.574446499347687e-06, -5.854293704032898e-06, -4.134140908718109e-06, -2.4139881134033203e-06, -6.938353180885315e-07, 1.0263174772262573e-06, 2.746470272541046e-06, 4.466623067855835e-06, 6.186775863170624e-06, 7.906928658485413e-06, 9.627081453800201e-06, 1.134723424911499e-05, 1.3067387044429779e-05, 1.4787539839744568e-05, 1.6507692635059357e-05, 1.8227845430374146e-05, 1.9947998225688934e-05, 2.1668151021003723e-05, 2.3388303816318512e-05, 2.51084566116333e-05, 2.682860940694809e-05, 2.854876220226288e-05, 3.0268914997577667e-05, 3.1989067792892456e-05, 3.3709220588207245e-05, 3.5429373383522034e-05, 3.714952617883682e-05, 3.886967897415161e-05, 4.05898317694664e-05, 4.230998456478119e-05, 4.403013736009598e-05, 4.5750290155410767e-05, 4.7470442950725555e-05, 4.9190595746040344e-05, 5.091074854135513e-05, 5.263090133666992e-05]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 10.0, 2.0, 17.0, 8.0, 7.0, 27.0, 30.0, 26.0, 39.0, 47.0, 55.0, 75.0, 115.0, 115.0, 128.0, 137.0, 201.0, 206.0, 235.0, 276.0, 268.0, 283.0, 238.0, 224.0, 213.0, 207.0, 157.0, 131.0, 112.0, 86.0, 69.0, 70.0, 47.0, 26.0, 43.0, 32.0, 23.0, 18.0, 17.0, 17.0, 10.0, 6.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.537799835205078e-05, -1.484900712966919e-05, -1.4320015907287598e-05, -1.3791024684906006e-05, -1.3262033462524414e-05, -1.2733042240142822e-05, -1.220405101776123e-05, -1.1675059795379639e-05, -1.1146068572998047e-05, -1.0617077350616455e-05, -1.0088086128234863e-05, -9.559094905853271e-06, -9.03010368347168e-06, -8.501112461090088e-06, -7.972121238708496e-06, -7.443130016326904e-06, -6.9141387939453125e-06, -6.385147571563721e-06, -5.856156349182129e-06, -5.327165126800537e-06, -4.798173904418945e-06, -4.2691826820373535e-06, -3.7401914596557617e-06, -3.21120023727417e-06, -2.682209014892578e-06, -2.1532177925109863e-06, -1.6242265701293945e-06, -1.0952353477478027e-06, -5.662441253662109e-07, -3.725290298461914e-08, 4.917383193969727e-07, 1.0207295417785645e-06, 1.5497207641601562e-06, 2.078711986541748e-06, 2.60770320892334e-06, 3.1366944313049316e-06, 3.6656856536865234e-06, 4.194676876068115e-06, 4.723668098449707e-06, 5.252659320831299e-06, 5.781650543212891e-06, 6.310641765594482e-06, 6.839632987976074e-06, 7.368624210357666e-06, 7.897615432739258e-06, 8.42660665512085e-06, 8.955597877502441e-06, 9.484589099884033e-06, 1.0013580322265625e-05, 1.0542571544647217e-05, 1.1071562767028809e-05, 1.16005539894104e-05, 1.2129545211791992e-05, 1.2658536434173584e-05, 1.3187527656555176e-05, 1.3716518878936768e-05, 1.424551010131836e-05, 1.4774501323699951e-05, 1.5303492546081543e-05, 1.5832483768463135e-05, 1.6361474990844727e-05, 1.689046621322632e-05, 1.741945743560791e-05, 1.7948448657989502e-05, 1.8477439880371094e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 7.0, 10.0, 9.0, 9.0, 21.0, 28.0, 24.0, 31.0, 38.0, 63.0, 73.0, 82.0, 115.0, 84.0, 83.0, 66.0, 55.0, 36.0, 36.0, 32.0, 16.0, 6.0, 10.0, 11.0, 6.0, 15.0, 7.0, 2.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.281666381051764e-05, -5.1207873184466735e-05, -4.959908619639464e-05, -4.799029557034373e-05, -4.638150494429283e-05, -4.4772714318241924e-05, -4.316392733016983e-05, -4.155513670411892e-05, -3.994634607806802e-05, -3.8337555452017114e-05, -3.6728768463945016e-05, -3.511997783789411e-05, -3.351118721184321e-05, -3.19023965857923e-05, -3.0293609597720206e-05, -2.86848189716693e-05, -2.70760301646078e-05, -2.54672413575463e-05, -2.3858450731495395e-05, -2.2249661924433894e-05, -2.064087129838299e-05, -1.903208249132149e-05, -1.7423291865270585e-05, -1.5814503058209084e-05, -1.4205713341652881e-05, -1.2596923625096679e-05, -1.0988133908540476e-05, -9.379344191984273e-06, -7.770555384922773e-06, -6.16176566836657e-06, -4.552975951810367e-06, -2.9441862352541648e-06, -1.3353965186979622e-06, 2.7339308417140273e-07, 1.8821826870407676e-06, 3.490972176223295e-06, 5.0997618927794974e-06, 6.708551154588349e-06, 8.317340871144552e-06, 9.926130587700754e-06, 1.1534920304256957e-05, 1.314371002081316e-05, 1.4752499737369362e-05, 1.6361289453925565e-05, 1.7970078260987066e-05, 1.9578867068048567e-05, 2.118765769409947e-05, 2.2796448320150375e-05, 2.4405237127211876e-05, 2.6014025934273377e-05, 2.762281656032428e-05, 2.9231605367385782e-05, 3.084039417444728e-05, 3.244918480049819e-05, 3.405797542654909e-05, 3.5666766052599996e-05, 3.7275553040672094e-05, 3.8884343666723e-05, 4.0493130654795095e-05, 4.2101921280846e-05, 4.3710711906896904e-05, 4.531950253294781e-05, 4.6928289521019906e-05, 4.853708014707081e-05, 5.0145870773121715e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 12.0, 11.0, 20.0, 14.0, 16.0, 22.0, 22.0, 31.0, 38.0, 30.0, 34.0, 39.0, 36.0, 44.0, 44.0, 54.0, 40.0, 41.0, 45.0, 46.0, 37.0, 41.0, 30.0, 34.0, 40.0, 32.0, 28.0, 18.0, 23.0, 15.0, 13.0, 11.0, 5.0, 8.0, 3.0, 9.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.7627090932801366e-05, -3.642652518465184e-05, -3.52259557985235e-05, -3.402539005037397e-05, -3.2824820664245635e-05, -3.1624254916096106e-05, -3.0423689167946577e-05, -2.9223121600807644e-05, -2.8022554033668712e-05, -2.682198646652978e-05, -2.5621418899390846e-05, -2.4420853151241317e-05, -2.3220285584102385e-05, -2.2019718016963452e-05, -2.0819152268813923e-05, -1.961858470167499e-05, -1.8418017134536058e-05, -1.7217449567397125e-05, -1.6016882000258192e-05, -1.4816316252108663e-05, -1.361574868496973e-05, -1.2415181117830798e-05, -1.1214614460186567e-05, -1.0014047802542336e-05, -8.813480235403404e-06, -7.612913123011822e-06, -6.41234601062024e-06, -5.211778898228658e-06, -4.011211785837077e-06, -2.810644673445495e-06, -1.610077561053913e-06, -4.095109034096822e-07, 7.910603017080575e-07, 1.9916274140996393e-06, 3.192194526491221e-06, 4.392761638882803e-06, 5.5933287512743846e-06, 6.793895863665966e-06, 7.994462976057548e-06, 9.195029633701779e-06, 1.0395597200840712e-05, 1.1596164767979644e-05, 1.2796731425623875e-05, 1.3997298083268106e-05, 1.5197865650407039e-05, 1.639843321754597e-05, 1.75989989656955e-05, 1.8799566532834433e-05, 2.0000134099973366e-05, 2.12007016671123e-05, 2.240126923425123e-05, 2.360183498240076e-05, 2.4802402549539693e-05, 2.6002970116678625e-05, 2.7203535864828154e-05, 2.8404103431967087e-05, 2.960467099910602e-05, 3.080523674725555e-05, 3.2005806133383885e-05, 3.3206371881533414e-05, 3.440694126766175e-05, 3.560750701581128e-05, 3.680807276396081e-05, 3.8008642150089145e-05, 3.9209207898238674e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 12.0, 16.0, 20.0, 27.0, 43.0, 73.0, 121.0, 182.0, 270.0, 428.0, 590.0, 1006.0, 1523.0, 2489.0, 3773.0, 5954.0, 9899.0, 15412.0, 24616.0, 42086.0, 65961.0, 108068.0, 168712.0, 209830.0, 147233.0, 91476.0, 57446.0, 34031.0, 21123.0, 13127.0, 8579.0, 5238.0, 3263.0, 2133.0, 1360.0, 866.0, 589.0, 314.0, 239.0, 135.0, 83.0, 71.0, 38.0, 37.0, 13.0, 16.0, 10.0, 9.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.392862319946289e-05, -4.248041659593582e-05, -4.103220999240875e-05, -3.958400338888168e-05, -3.8135796785354614e-05, -3.6687590181827545e-05, -3.5239383578300476e-05, -3.379117697477341e-05, -3.234297037124634e-05, -3.089476376771927e-05, -2.94465571641922e-05, -2.799835056066513e-05, -2.655014395713806e-05, -2.5101937353610992e-05, -2.3653730750083923e-05, -2.2205524146556854e-05, -2.0757317543029785e-05, -1.9309110939502716e-05, -1.7860904335975647e-05, -1.6412697732448578e-05, -1.4964491128921509e-05, -1.351628452539444e-05, -1.206807792186737e-05, -1.0619871318340302e-05, -9.171664714813232e-06, -7.723458111286163e-06, -6.275251507759094e-06, -4.827044904232025e-06, -3.378838300704956e-06, -1.930631697177887e-06, -4.824250936508179e-07, 9.657815098762512e-07, 2.4139881134033203e-06, 3.862194716930389e-06, 5.3104013204574585e-06, 6.758607923984528e-06, 8.206814527511597e-06, 9.655021131038666e-06, 1.1103227734565735e-05, 1.2551434338092804e-05, 1.3999640941619873e-05, 1.5447847545146942e-05, 1.689605414867401e-05, 1.834426075220108e-05, 1.979246735572815e-05, 2.124067395925522e-05, 2.2688880562782288e-05, 2.4137087166309357e-05, 2.5585293769836426e-05, 2.7033500373363495e-05, 2.8481706976890564e-05, 2.9929913580417633e-05, 3.13781201839447e-05, 3.282632678747177e-05, 3.427453339099884e-05, 3.572273999452591e-05, 3.717094659805298e-05, 3.861915320158005e-05, 4.006735980510712e-05, 4.1515566408634186e-05, 4.2963773012161255e-05, 4.4411979615688324e-05, 4.586018621921539e-05, 4.730839282274246e-05, 4.875659942626953e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 12.0, 9.0, 18.0, 22.0, 7.0, 28.0, 31.0, 39.0, 33.0, 39.0, 35.0, 33.0, 45.0, 53.0, 46.0, 46.0, 41.0, 37.0, 49.0, 34.0, 45.0, 36.0, 34.0, 43.0, 31.0, 30.0, 20.0, 16.0, 15.0, 11.0, 16.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.272294998168945e-05, -3.168173134326935e-05, -3.064051270484924e-05, -2.9599294066429138e-05, -2.8558075428009033e-05, -2.7516856789588928e-05, -2.6475638151168823e-05, -2.5434419512748718e-05, -2.4393200874328613e-05, -2.3351982235908508e-05, -2.2310763597488403e-05, -2.12695449590683e-05, -2.0228326320648193e-05, -1.918710768222809e-05, -1.8145889043807983e-05, -1.710467040538788e-05, -1.6063451766967773e-05, -1.5022233128547668e-05, -1.3981014490127563e-05, -1.2939795851707458e-05, -1.1898577213287354e-05, -1.0857358574867249e-05, -9.816139936447144e-06, -8.774921298027039e-06, -7.733702659606934e-06, -6.692484021186829e-06, -5.651265382766724e-06, -4.610046744346619e-06, -3.5688281059265137e-06, -2.5276094675064087e-06, -1.4863908290863037e-06, -4.4517219066619873e-07, 5.960464477539062e-07, 1.6372650861740112e-06, 2.678483724594116e-06, 3.719702363014221e-06, 4.760921001434326e-06, 5.802139639854431e-06, 6.843358278274536e-06, 7.884576916694641e-06, 8.925795555114746e-06, 9.967014193534851e-06, 1.1008232831954956e-05, 1.2049451470375061e-05, 1.3090670108795166e-05, 1.4131888747215271e-05, 1.5173107385635376e-05, 1.621432602405548e-05, 1.7255544662475586e-05, 1.829676330089569e-05, 1.9337981939315796e-05, 2.03792005777359e-05, 2.1420419216156006e-05, 2.246163785457611e-05, 2.3502856492996216e-05, 2.454407513141632e-05, 2.5585293769836426e-05, 2.662651240825653e-05, 2.7667731046676636e-05, 2.870894968509674e-05, 2.9750168323516846e-05, 3.079138696193695e-05, 3.1832605600357056e-05, 3.287382423877716e-05, 3.3915042877197266e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 2.0, 7.0, 9.0, 8.0, 14.0, 29.0, 44.0, 62.0, 81.0, 147.0, 263.0, 397.0, 647.0, 946.0, 1464.0, 2497.0, 4007.0, 6966.0, 12780.0, 28314.0, 92998.0, 506871.0, 287918.0, 56366.0, 20995.0, 10301.0, 5530.0, 3342.0, 2023.0, 1292.0, 832.0, 514.0, 302.0, 210.0, 147.0, 89.0, 48.0, 35.0, 25.0, 7.0, 9.0, 6.0, 2.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.456541061401367e-05, -7.197819650173187e-05, -6.939098238945007e-05, -6.680376827716827e-05, -6.421655416488647e-05, -6.162934005260468e-05, -5.9042125940322876e-05, -5.645491182804108e-05, -5.386769771575928e-05, -5.128048360347748e-05, -4.869326949119568e-05, -4.610605537891388e-05, -4.351884126663208e-05, -4.093162715435028e-05, -3.834441304206848e-05, -3.575719892978668e-05, -3.316998481750488e-05, -3.0582770705223083e-05, -2.7995556592941284e-05, -2.5408342480659485e-05, -2.2821128368377686e-05, -2.0233914256095886e-05, -1.7646700143814087e-05, -1.5059486031532288e-05, -1.2472271919250488e-05, -9.885057806968689e-06, -7.29784369468689e-06, -4.71062958240509e-06, -2.123415470123291e-06, 4.637986421585083e-07, 3.0510127544403076e-06, 5.638226866722107e-06, 8.225440979003906e-06, 1.0812655091285706e-05, 1.3399869203567505e-05, 1.5987083315849304e-05, 1.8574297428131104e-05, 2.1161511540412903e-05, 2.3748725652694702e-05, 2.63359397649765e-05, 2.89231538772583e-05, 3.15103679895401e-05, 3.40975821018219e-05, 3.66847962141037e-05, 3.92720103263855e-05, 4.18592244386673e-05, 4.44464385509491e-05, 4.7033652663230896e-05, 4.9620866775512695e-05, 5.2208080887794495e-05, 5.4795295000076294e-05, 5.738250911235809e-05, 5.996972322463989e-05, 6.255693733692169e-05, 6.514415144920349e-05, 6.773136556148529e-05, 7.031857967376709e-05, 7.290579378604889e-05, 7.549300789833069e-05, 7.808022201061249e-05, 8.066743612289429e-05, 8.325465023517609e-05, 8.584186434745789e-05, 8.842907845973969e-05, 9.101629257202148e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 9.0, 4.0, 7.0, 7.0, 10.0, 6.0, 7.0, 7.0, 15.0, 18.0, 20.0, 19.0, 26.0, 29.0, 39.0, 50.0, 32.0, 40.0, 36.0, 45.0, 37.0, 48.0, 34.0, 54.0, 37.0, 32.0, 34.0, 37.0, 31.0, 26.0, 31.0, 17.0, 23.0, 20.0, 19.0, 17.0, 11.0, 6.0, 11.0, 6.0, 12.0, 6.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-1.6868114471435547e-05, -1.6351230442523956e-05, -1.5834346413612366e-05, -1.5317462384700775e-05, -1.4800578355789185e-05, -1.4283694326877594e-05, -1.3766810297966003e-05, -1.3249926269054413e-05, -1.2733042240142822e-05, -1.2216158211231232e-05, -1.1699274182319641e-05, -1.118239015340805e-05, -1.066550612449646e-05, -1.014862209558487e-05, -9.631738066673279e-06, -9.114854037761688e-06, -8.597970008850098e-06, -8.081085979938507e-06, -7.5642019510269165e-06, -7.047317922115326e-06, -6.530433893203735e-06, -6.013549864292145e-06, -5.496665835380554e-06, -4.979781806468964e-06, -4.462897777557373e-06, -3.9460137486457825e-06, -3.429129719734192e-06, -2.9122456908226013e-06, -2.3953616619110107e-06, -1.8784776329994202e-06, -1.3615936040878296e-06, -8.44709575176239e-07, -3.2782554626464844e-07, 1.8905848264694214e-07, 7.059425115585327e-07, 1.2228265404701233e-06, 1.7397105693817139e-06, 2.2565945982933044e-06, 2.773478627204895e-06, 3.2903626561164856e-06, 3.807246685028076e-06, 4.324130713939667e-06, 4.841014742851257e-06, 5.357898771762848e-06, 5.8747828006744385e-06, 6.391666829586029e-06, 6.90855085849762e-06, 7.42543488740921e-06, 7.9423189163208e-06, 8.459202945232391e-06, 8.976086974143982e-06, 9.492971003055573e-06, 1.0009855031967163e-05, 1.0526739060878754e-05, 1.1043623089790344e-05, 1.1560507118701935e-05, 1.2077391147613525e-05, 1.2594275176525116e-05, 1.3111159205436707e-05, 1.3628043234348297e-05, 1.4144927263259888e-05, 1.4661811292171478e-05, 1.5178695321083069e-05, 1.569557934999466e-05, 1.621246337890625e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 4.0, 3.0, 9.0, 14.0, 13.0, 31.0, 37.0, 52.0, 78.0, 82.0, 154.0, 200.0, 308.0, 536.0, 866.0, 1361.0, 2396.0, 4256.0, 10062.0, 26558.0, 148652.0, 728765.0, 85305.0, 21789.0, 7699.0, 3875.0, 2068.0, 1251.0, 733.0, 474.0, 282.0, 206.0, 121.0, 91.0, 70.0, 53.0, 48.0, 17.0, 8.0, 13.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.8967857360839844e-05, -2.8044916689395905e-05, -2.7121976017951965e-05, -2.6199035346508026e-05, -2.5276094675064087e-05, -2.4353154003620148e-05, -2.343021333217621e-05, -2.250727266073227e-05, -2.158433198928833e-05, -2.066139131784439e-05, -1.973845064640045e-05, -1.8815509974956512e-05, -1.7892569303512573e-05, -1.6969628632068634e-05, -1.6046687960624695e-05, -1.5123747289180756e-05, -1.4200806617736816e-05, -1.3277865946292877e-05, -1.2354925274848938e-05, -1.1431984603404999e-05, -1.050904393196106e-05, -9.58610326051712e-06, -8.663162589073181e-06, -7.740221917629242e-06, -6.817281246185303e-06, -5.8943405747413635e-06, -4.971399903297424e-06, -4.048459231853485e-06, -3.125518560409546e-06, -2.2025778889656067e-06, -1.2796372175216675e-06, -3.5669654607772827e-07, 5.662441253662109e-07, 1.4891847968101501e-06, 2.4121254682540894e-06, 3.3350661396980286e-06, 4.258006811141968e-06, 5.180947482585907e-06, 6.103888154029846e-06, 7.026828825473785e-06, 7.949769496917725e-06, 8.872710168361664e-06, 9.795650839805603e-06, 1.0718591511249542e-05, 1.1641532182693481e-05, 1.256447285413742e-05, 1.348741352558136e-05, 1.4410354197025299e-05, 1.5333294868469238e-05, 1.6256235539913177e-05, 1.7179176211357117e-05, 1.8102116882801056e-05, 1.9025057554244995e-05, 1.9947998225688934e-05, 2.0870938897132874e-05, 2.1793879568576813e-05, 2.2716820240020752e-05, 2.363976091146469e-05, 2.456270158290863e-05, 2.548564225435257e-05, 2.640858292579651e-05, 2.7331523597240448e-05, 2.8254464268684387e-05, 2.9177404940128326e-05, 3.0100345611572266e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 3.0, 2.0, 10.0, 3.0, 10.0, 10.0, 29.0, 17.0, 33.0, 19.0, 67.0, 29.0, 74.0, 72.0, 155.0, 73.0, 116.0, 38.0, 68.0, 30.0, 62.0, 17.0, 21.0, 21.0, 5.0, 7.0, 5.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.9206275939941406e-06, -2.8312206268310547e-06, -2.7418136596679688e-06, -2.652406692504883e-06, -2.562999725341797e-06, -2.473592758178711e-06, -2.384185791015625e-06, -2.294778823852539e-06, -2.205371856689453e-06, -2.115964889526367e-06, -2.0265579223632812e-06, -1.9371509552001953e-06, -1.8477439880371094e-06, -1.7583370208740234e-06, -1.6689300537109375e-06, -1.5795230865478516e-06, -1.4901161193847656e-06, -1.4007091522216797e-06, -1.3113021850585938e-06, -1.2218952178955078e-06, -1.1324882507324219e-06, -1.043081283569336e-06, -9.5367431640625e-07, -8.642673492431641e-07, -7.748603820800781e-07, -6.854534149169922e-07, -5.960464477539062e-07, -5.066394805908203e-07, -4.172325134277344e-07, -3.2782554626464844e-07, -2.384185791015625e-07, -1.4901161193847656e-07, -5.960464477539063e-08, 2.9802322387695312e-08, 1.1920928955078125e-07, 2.086162567138672e-07, 2.980232238769531e-07, 3.8743019104003906e-07, 4.76837158203125e-07, 5.662441253662109e-07, 6.556510925292969e-07, 7.450580596923828e-07, 8.344650268554688e-07, 9.238719940185547e-07, 1.0132789611816406e-06, 1.1026859283447266e-06, 1.1920928955078125e-06, 1.2814998626708984e-06, 1.3709068298339844e-06, 1.4603137969970703e-06, 1.5497207641601562e-06, 1.6391277313232422e-06, 1.7285346984863281e-06, 1.817941665649414e-06, 1.9073486328125e-06, 1.996755599975586e-06, 2.086162567138672e-06, 2.175569534301758e-06, 2.2649765014648438e-06, 2.3543834686279297e-06, 2.4437904357910156e-06, 2.5331974029541016e-06, 2.6226043701171875e-06, 2.7120113372802734e-06, 2.8014183044433594e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 4.0, 7.0, 9.0, 10.0, 15.0, 22.0, 24.0, 39.0, 62.0, 87.0, 132.0, 247.0, 352.0, 605.0, 1076.0, 2051.0, 4169.0, 9269.0, 18968.0, 59388.0, 235265.0, 516556.0, 134443.0, 36034.0, 16070.0, 6664.0, 3072.0, 1574.0, 905.0, 474.0, 333.0, 227.0, 122.0, 92.0, 49.0, 22.0, 27.0, 24.0, 7.0, 9.0, 8.0, 2.0, 2.0, 6.0, 5.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.5079975128173828e-05, -1.4613382518291473e-05, -1.4146789908409119e-05, -1.3680197298526764e-05, -1.321360468864441e-05, -1.2747012078762054e-05, -1.22804194688797e-05, -1.1813826858997345e-05, -1.134723424911499e-05, -1.0880641639232635e-05, -1.041404902935028e-05, -9.947456419467926e-06, -9.480863809585571e-06, -9.014271199703217e-06, -8.547678589820862e-06, -8.081085979938507e-06, -7.614493370056152e-06, -7.147900760173798e-06, -6.681308150291443e-06, -6.214715540409088e-06, -5.748122930526733e-06, -5.281530320644379e-06, -4.814937710762024e-06, -4.348345100879669e-06, -3.8817524909973145e-06, -3.4151598811149597e-06, -2.948567271232605e-06, -2.4819746613502502e-06, -2.0153820514678955e-06, -1.5487894415855408e-06, -1.082196831703186e-06, -6.156042218208313e-07, -1.4901161193847656e-07, 3.175809979438782e-07, 7.841736078262329e-07, 1.2507662177085876e-06, 1.7173588275909424e-06, 2.183951437473297e-06, 2.650544047355652e-06, 3.1171366572380066e-06, 3.5837292671203613e-06, 4.050321877002716e-06, 4.516914486885071e-06, 4.9835070967674255e-06, 5.45009970664978e-06, 5.916692316532135e-06, 6.38328492641449e-06, 6.8498775362968445e-06, 7.316470146179199e-06, 7.783062756061554e-06, 8.249655365943909e-06, 8.716247975826263e-06, 9.182840585708618e-06, 9.649433195590973e-06, 1.0116025805473328e-05, 1.0582618415355682e-05, 1.1049211025238037e-05, 1.1515803635120392e-05, 1.1982396245002747e-05, 1.2448988854885101e-05, 1.2915581464767456e-05, 1.338217407464981e-05, 1.3848766684532166e-05, 1.431535929441452e-05, 1.4781951904296875e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 3.0, 6.0, 13.0, 8.0, 9.0, 18.0, 40.0, 53.0, 47.0, 72.0, 80.0, 94.0, 87.0, 130.0, 84.0, 71.0, 58.0, 32.0, 20.0, 20.0, 21.0, 6.0, 8.0, 5.0, 4.0, 7.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4570693969726562e-06, -3.3294782042503357e-06, -3.201887011528015e-06, -3.0742958188056946e-06, -2.946704626083374e-06, -2.8191134333610535e-06, -2.691522240638733e-06, -2.5639310479164124e-06, -2.436339855194092e-06, -2.3087486624717712e-06, -2.1811574697494507e-06, -2.05356627702713e-06, -1.9259750843048096e-06, -1.798383891582489e-06, -1.6707926988601685e-06, -1.543201506137848e-06, -1.4156103134155273e-06, -1.2880191206932068e-06, -1.1604279279708862e-06, -1.0328367352485657e-06, -9.052455425262451e-07, -7.776543498039246e-07, -6.50063157081604e-07, -5.224719643592834e-07, -3.948807716369629e-07, -2.6728957891464233e-07, -1.3969838619232178e-07, -1.210719347000122e-08, 1.1548399925231934e-07, 2.430751919746399e-07, 3.7066638469696045e-07, 4.98257577419281e-07, 6.258487701416016e-07, 7.534399628639221e-07, 8.810311555862427e-07, 1.0086223483085632e-06, 1.1362135410308838e-06, 1.2638047337532043e-06, 1.391395926475525e-06, 1.5189871191978455e-06, 1.646578311920166e-06, 1.7741695046424866e-06, 1.9017606973648071e-06, 2.0293518900871277e-06, 2.1569430828094482e-06, 2.284534275531769e-06, 2.4121254682540894e-06, 2.53971666097641e-06, 2.6673078536987305e-06, 2.794899046421051e-06, 2.9224902391433716e-06, 3.050081431865692e-06, 3.1776726245880127e-06, 3.3052638173103333e-06, 3.432855010032654e-06, 3.5604462027549744e-06, 3.688037395477295e-06, 3.8156285881996155e-06, 3.943219780921936e-06, 4.070810973644257e-06, 4.198402166366577e-06, 4.325993359088898e-06, 4.453584551811218e-06, 4.581175744533539e-06, 4.708766937255859e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 15.0, 6.0, 9.0, 17.0, 21.0, 17.0, 38.0, 54.0, 55.0, 76.0, 106.0, 121.0, 110.0, 85.0, 58.0, 52.0, 28.0, 29.0, 31.0, 14.0, 6.0, 11.0, 5.0, 10.0, 6.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.824843199457973e-05, -4.671978240367025e-05, -4.519113281276077e-05, -4.366248322185129e-05, -4.213383363094181e-05, -4.060518404003233e-05, -3.9076534449122846e-05, -3.7547884858213365e-05, -3.6019235267303884e-05, -3.44905856763944e-05, -3.296193608548492e-05, -3.143328649457544e-05, -2.990463690366596e-05, -2.837598731275648e-05, -2.6847335902857594e-05, -2.5318686311948113e-05, -2.379003490204923e-05, -2.2261385311139748e-05, -2.0732735720230266e-05, -1.9204086129320785e-05, -1.7675436538411304e-05, -1.6146786947501823e-05, -1.4618135537602939e-05, -1.3089485946693458e-05, -1.1560836355783977e-05, -1.0032186764874496e-05, -8.503537173965015e-06, -6.974886673560832e-06, -5.446237082651351e-06, -3.91758749174187e-06, -2.3889369913376868e-06, -8.602874004282057e-07, 6.683621904812753e-07, 2.197012008764432e-06, 3.7256618270475883e-06, 5.25431187270442e-06, 6.782961463613901e-06, 8.311611054523382e-06, 9.840261554927565e-06, 1.1368911145837046e-05, 1.2897560736746527e-05, 1.4426210327656008e-05, 1.595485991856549e-05, 1.7483511328464374e-05, 1.9012160919373855e-05, 2.0540810510283336e-05, 2.2069460101192817e-05, 2.3598109692102298e-05, 2.512675928301178e-05, 2.665540887392126e-05, 2.818405846483074e-05, 2.9712708055740222e-05, 3.12413576466497e-05, 3.2770007237559184e-05, 3.429866046644747e-05, 3.5827310057356954e-05, 3.7355959648266435e-05, 3.8884609239175916e-05, 4.04132588300854e-05, 4.194190842099488e-05, 4.347055801190436e-05, 4.499920760281384e-05, 4.652785719372332e-05, 4.80565067846328e-05, 4.958515637554228e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 0.0, 5.0, 7.0, 6.0, 11.0, 15.0, 18.0, 17.0, 21.0, 19.0, 23.0, 32.0, 37.0, 37.0, 31.0, 36.0, 48.0, 37.0, 49.0, 50.0, 45.0, 43.0, 46.0, 35.0, 39.0, 34.0, 48.0, 30.0, 36.0, 30.0, 26.0, 19.0, 14.0, 16.0, 8.0, 10.0, 6.0, 9.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.128805474261753e-05, -3.0275081371655688e-05, -2.9262109819683246e-05, -2.82491364487214e-05, -2.723616489674896e-05, -2.6223191525787115e-05, -2.521021815482527e-05, -2.419724660285283e-05, -2.3184275050880387e-05, -2.2171301679918543e-05, -2.11583301279461e-05, -2.0145356756984256e-05, -1.9132385205011815e-05, -1.811941183404997e-05, -1.7106438463088125e-05, -1.6093466911115684e-05, -1.5080493540153839e-05, -1.4067521078686696e-05, -1.3054548617219552e-05, -1.2041575246257707e-05, -1.1028603694285266e-05, -1.0015630323323421e-05, -9.002657861856278e-06, -7.989685400389135e-06, -6.976712938921992e-06, -5.963740477454849e-06, -4.9507680159877054e-06, -3.937795099773211e-06, -2.9248226383060683e-06, -1.911850176838925e-06, -8.988772606244311e-07, 1.1409520084271207e-07, 1.1270676623098552e-06, 2.1400401237769984e-06, 3.153012812617817e-06, 4.1659855014586356e-06, 5.178957962925779e-06, 6.191930424392922e-06, 7.204903340607416e-06, 8.217875802074559e-06, 9.230848263541702e-06, 1.0243820725008845e-05, 1.1256793186475988e-05, 1.2269765647943132e-05, 1.3282739018904977e-05, 1.4295710570877418e-05, 1.5308683941839263e-05, 1.6321657312801108e-05, 1.733462886477355e-05, 1.8347602235735394e-05, 1.9360573787707835e-05, 2.037354715866968e-05, 2.1386518710642122e-05, 2.2399492081603967e-05, 2.3412463633576408e-05, 2.4425437004538253e-05, 2.5438410375500098e-05, 2.6451383746461943e-05, 2.7464355298434384e-05, 2.847732866939623e-05, 2.949030022136867e-05, 3.0503273592330515e-05, 3.151624696329236e-05, 3.2529220334254205e-05, 3.354219006723724e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 3.0, 9.0, 4.0, 6.0, 7.0, 21.0, 23.0, 36.0, 79.0, 106.0, 142.0, 239.0, 324.0, 499.0, 772.0, 1155.0, 1590.0, 2363.0, 3610.0, 5724.0, 8588.0, 14238.0, 23511.0, 38211.0, 69388.0, 124405.0, 234629.0, 223908.0, 127781.0, 67965.0, 37351.0, 23263.0, 13361.0, 8697.0, 5618.0, 3545.0, 2470.0, 1565.0, 1095.0, 723.0, 495.0, 342.0, 236.0, 153.0, 116.0, 70.0, 46.0, 30.0, 21.0, 13.0, 8.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9114227294921875e-05, -4.752911627292633e-05, -4.5944005250930786e-05, -4.435889422893524e-05, -4.27737832069397e-05, -4.118867218494415e-05, -3.960356116294861e-05, -3.8018450140953064e-05, -3.643333911895752e-05, -3.4848228096961975e-05, -3.326311707496643e-05, -3.1678006052970886e-05, -3.0092895030975342e-05, -2.8507784008979797e-05, -2.6922672986984253e-05, -2.533756196498871e-05, -2.3752450942993164e-05, -2.216733992099762e-05, -2.0582228899002075e-05, -1.899711787700653e-05, -1.7412006855010986e-05, -1.5826895833015442e-05, -1.4241784811019897e-05, -1.2656673789024353e-05, -1.1071562767028809e-05, -9.486451745033264e-06, -7.90134072303772e-06, -6.316229701042175e-06, -4.731118679046631e-06, -3.1460076570510864e-06, -1.560896635055542e-06, 2.421438694000244e-08, 1.6093254089355469e-06, 3.1944364309310913e-06, 4.779547452926636e-06, 6.36465847492218e-06, 7.949769496917725e-06, 9.534880518913269e-06, 1.1119991540908813e-05, 1.2705102562904358e-05, 1.4290213584899902e-05, 1.5875324606895447e-05, 1.746043562889099e-05, 1.9045546650886536e-05, 2.063065767288208e-05, 2.2215768694877625e-05, 2.380087971687317e-05, 2.5385990738868713e-05, 2.6971101760864258e-05, 2.8556212782859802e-05, 3.0141323804855347e-05, 3.172643482685089e-05, 3.3311545848846436e-05, 3.489665687084198e-05, 3.6481767892837524e-05, 3.806687891483307e-05, 3.965198993682861e-05, 4.123710095882416e-05, 4.28222119808197e-05, 4.4407323002815247e-05, 4.599243402481079e-05, 4.7577545046806335e-05, 4.916265606880188e-05, 5.0747767090797424e-05, 5.233287811279297e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 6.0, 2.0, 1.0, 4.0, 4.0, 2.0, 7.0, 8.0, 9.0, 9.0, 10.0, 19.0, 14.0, 12.0, 27.0, 20.0, 30.0, 25.0, 31.0, 42.0, 42.0, 30.0, 33.0, 43.0, 43.0, 53.0, 40.0, 40.0, 46.0, 26.0, 50.0, 30.0, 30.0, 38.0, 25.0, 33.0, 25.0, 22.0, 15.0, 17.0, 8.0, 9.0, 10.0, 8.0, 6.0, 1.0, 8.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.187490463256836e-05, -2.105720341205597e-05, -2.023950219154358e-05, -1.942180097103119e-05, -1.86040997505188e-05, -1.778639853000641e-05, -1.696869730949402e-05, -1.615099608898163e-05, -1.5333294868469238e-05, -1.4515593647956848e-05, -1.3697892427444458e-05, -1.2880191206932068e-05, -1.2062489986419678e-05, -1.1244788765907288e-05, -1.0427087545394897e-05, -9.609386324882507e-06, -8.791685104370117e-06, -7.973983883857727e-06, -7.156282663345337e-06, -6.338581442832947e-06, -5.520880222320557e-06, -4.7031790018081665e-06, -3.885477781295776e-06, -3.0677765607833862e-06, -2.250075340270996e-06, -1.432374119758606e-06, -6.146728992462158e-07, 2.0302832126617432e-07, 1.0207295417785645e-06, 1.8384307622909546e-06, 2.6561319828033447e-06, 3.473833203315735e-06, 4.291534423828125e-06, 5.109235644340515e-06, 5.926936864852905e-06, 6.744638085365295e-06, 7.5623393058776855e-06, 8.380040526390076e-06, 9.197741746902466e-06, 1.0015442967414856e-05, 1.0833144187927246e-05, 1.1650845408439636e-05, 1.2468546628952026e-05, 1.3286247849464417e-05, 1.4103949069976807e-05, 1.4921650290489197e-05, 1.5739351511001587e-05, 1.6557052731513977e-05, 1.7374753952026367e-05, 1.8192455172538757e-05, 1.9010156393051147e-05, 1.9827857613563538e-05, 2.0645558834075928e-05, 2.1463260054588318e-05, 2.2280961275100708e-05, 2.3098662495613098e-05, 2.3916363716125488e-05, 2.473406493663788e-05, 2.555176615715027e-05, 2.636946737766266e-05, 2.718716859817505e-05, 2.800486981868744e-05, 2.882257103919983e-05, 2.964027225971222e-05, 3.045797348022461e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 5.0, 9.0, 15.0, 21.0, 22.0, 42.0, 55.0, 88.0, 97.0, 122.0, 210.0, 320.0, 439.0, 630.0, 943.0, 1267.0, 1813.0, 2661.0, 3934.0, 5955.0, 8855.0, 13833.0, 21776.0, 35961.0, 60551.0, 105699.0, 184174.0, 214663.0, 154649.0, 90221.0, 52445.0, 31033.0, 19047.0, 12083.0, 7858.0, 5354.0, 3569.0, 2397.0, 1732.0, 1177.0, 870.0, 566.0, 440.0, 289.0, 195.0, 158.0, 91.0, 67.0, 45.0, 36.0, 23.0, 21.0, 10.0, 6.0, 5.0, 6.0, 7.0, 3.0], "bins": [-4.38690185546875e-05, -4.2553991079330444e-05, -4.123896360397339e-05, -3.992393612861633e-05, -3.860890865325928e-05, -3.729388117790222e-05, -3.5978853702545166e-05, -3.466382622718811e-05, -3.3348798751831055e-05, -3.2033771276474e-05, -3.071874380111694e-05, -2.9403716325759888e-05, -2.8088688850402832e-05, -2.6773661375045776e-05, -2.545863389968872e-05, -2.4143606424331665e-05, -2.282857894897461e-05, -2.1513551473617554e-05, -2.0198523998260498e-05, -1.8883496522903442e-05, -1.7568469047546387e-05, -1.625344157218933e-05, -1.4938414096832275e-05, -1.362338662147522e-05, -1.2308359146118164e-05, -1.0993331670761108e-05, -9.678304195404053e-06, -8.363276720046997e-06, -7.048249244689941e-06, -5.733221769332886e-06, -4.41819429397583e-06, -3.1031668186187744e-06, -1.7881393432617188e-06, -4.731118679046631e-07, 8.419156074523926e-07, 2.1569430828094482e-06, 3.471970558166504e-06, 4.7869980335235596e-06, 6.102025508880615e-06, 7.417052984237671e-06, 8.732080459594727e-06, 1.0047107934951782e-05, 1.1362135410308838e-05, 1.2677162885665894e-05, 1.399219036102295e-05, 1.5307217836380005e-05, 1.662224531173706e-05, 1.7937272787094116e-05, 1.9252300262451172e-05, 2.0567327737808228e-05, 2.1882355213165283e-05, 2.319738268852234e-05, 2.4512410163879395e-05, 2.582743763923645e-05, 2.7142465114593506e-05, 2.845749258995056e-05, 2.9772520065307617e-05, 3.108754754066467e-05, 3.240257501602173e-05, 3.3717602491378784e-05, 3.503262996673584e-05, 3.6347657442092896e-05, 3.766268491744995e-05, 3.897771239280701e-05, 4.029273986816406e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 7.0, 12.0, 9.0, 10.0, 9.0, 18.0, 14.0, 21.0, 32.0, 26.0, 40.0, 29.0, 45.0, 50.0, 42.0, 39.0, 38.0, 43.0, 51.0, 46.0, 43.0, 37.0, 33.0, 39.0, 35.0, 36.0, 26.0, 29.0, 23.0, 15.0, 15.0, 18.0, 11.0, 20.0, 10.0, 9.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8537044525146484e-05, -1.7977319657802582e-05, -1.741759479045868e-05, -1.6857869923114777e-05, -1.6298145055770874e-05, -1.573842018842697e-05, -1.5178695321083069e-05, -1.4618970453739166e-05, -1.4059245586395264e-05, -1.3499520719051361e-05, -1.2939795851707458e-05, -1.2380070984363556e-05, -1.1820346117019653e-05, -1.126062124967575e-05, -1.0700896382331848e-05, -1.0141171514987946e-05, -9.581446647644043e-06, -9.02172178030014e-06, -8.461996912956238e-06, -7.902272045612335e-06, -7.342547178268433e-06, -6.78282231092453e-06, -6.2230974435806274e-06, -5.663372576236725e-06, -5.103647708892822e-06, -4.54392284154892e-06, -3.984197974205017e-06, -3.4244731068611145e-06, -2.864748239517212e-06, -2.3050233721733093e-06, -1.7452985048294067e-06, -1.1855736374855042e-06, -6.258487701416016e-07, -6.612390279769897e-08, 4.936009645462036e-07, 1.0533258318901062e-06, 1.6130506992340088e-06, 2.1727755665779114e-06, 2.732500433921814e-06, 3.2922253012657166e-06, 3.851950168609619e-06, 4.411675035953522e-06, 4.971399903297424e-06, 5.531124770641327e-06, 6.0908496379852295e-06, 6.650574505329132e-06, 7.210299372673035e-06, 7.770024240016937e-06, 8.32974910736084e-06, 8.889473974704742e-06, 9.449198842048645e-06, 1.0008923709392548e-05, 1.056864857673645e-05, 1.1128373444080353e-05, 1.1688098311424255e-05, 1.2247823178768158e-05, 1.280754804611206e-05, 1.3367272913455963e-05, 1.3926997780799866e-05, 1.4486722648143768e-05, 1.5046447515487671e-05, 1.5606172382831573e-05, 1.6165897250175476e-05, 1.672562211751938e-05, 1.728534698486328e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 13.0, 16.0, 25.0, 32.0, 52.0, 72.0, 80.0, 101.0, 115.0, 212.0, 274.0, 362.0, 538.0, 641.0, 914.0, 1216.0, 1669.0, 2295.0, 3594.0, 4890.0, 7220.0, 11399.0, 21261.0, 38268.0, 92675.0, 658884.0, 101729.0, 42761.0, 20046.0, 11962.0, 7578.0, 5306.0, 3431.0, 2451.0, 1631.0, 1326.0, 944.0, 692.0, 477.0, 374.0, 256.0, 203.0, 152.0, 119.0, 94.0, 56.0, 38.0, 39.0, 22.0, 16.0, 12.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0], "bins": [-2.372264862060547e-05, -2.299342304468155e-05, -2.226419746875763e-05, -2.153497189283371e-05, -2.080574631690979e-05, -2.007652074098587e-05, -1.934729516506195e-05, -1.861806958913803e-05, -1.788884401321411e-05, -1.715961843729019e-05, -1.6430392861366272e-05, -1.5701167285442352e-05, -1.4971941709518433e-05, -1.4242716133594513e-05, -1.3513490557670593e-05, -1.2784264981746674e-05, -1.2055039405822754e-05, -1.1325813829898834e-05, -1.0596588253974915e-05, -9.867362678050995e-06, -9.138137102127075e-06, -8.408911526203156e-06, -7.679685950279236e-06, -6.950460374355316e-06, -6.2212347984313965e-06, -5.492009222507477e-06, -4.762783646583557e-06, -4.0335580706596375e-06, -3.3043324947357178e-06, -2.575106918811798e-06, -1.8458813428878784e-06, -1.1166557669639587e-06, -3.8743019104003906e-07, 3.417953848838806e-07, 1.0710209608078003e-06, 1.80024653673172e-06, 2.5294721126556396e-06, 3.2586976885795593e-06, 3.987923264503479e-06, 4.717148840427399e-06, 5.446374416351318e-06, 6.175599992275238e-06, 6.904825568199158e-06, 7.634051144123077e-06, 8.363276720046997e-06, 9.092502295970917e-06, 9.821727871894836e-06, 1.0550953447818756e-05, 1.1280179023742676e-05, 1.2009404599666595e-05, 1.2738630175590515e-05, 1.3467855751514435e-05, 1.4197081327438354e-05, 1.4926306903362274e-05, 1.5655532479286194e-05, 1.6384758055210114e-05, 1.7113983631134033e-05, 1.7843209207057953e-05, 1.8572434782981873e-05, 1.9301660358905792e-05, 2.0030885934829712e-05, 2.076011151075363e-05, 2.148933708667755e-05, 2.221856266260147e-05, 2.294778823852539e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 40.0, 0.0, 0.0, 0.0, 0.0, 153.0, 0.0, 0.0, 0.0, 0.0, 587.0, 0.0, 0.0, 0.0, 133.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 11.0, 8.0, 12.0, 19.0, 27.0, 43.0, 70.0, 73.0, 120.0, 195.0, 234.0, 375.0, 512.0, 852.0, 1187.0, 1710.0, 2654.0, 3837.0, 6119.0, 9748.0, 16397.0, 34439.0, 86535.0, 710536.0, 91765.0, 34554.0, 18125.0, 9774.0, 6419.0, 3938.0, 2795.0, 1749.0, 1152.0, 795.0, 557.0, 407.0, 240.0, 161.0, 144.0, 83.0, 45.0, 47.0, 34.0, 20.0, 9.0, 10.0, 11.0, 2.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7670135498046875e-05, -3.639422357082367e-05, -3.5118311643600464e-05, -3.384239971637726e-05, -3.256648778915405e-05, -3.129057586193085e-05, -3.001466393470764e-05, -2.8738752007484436e-05, -2.746284008026123e-05, -2.6186928153038025e-05, -2.491101622581482e-05, -2.3635104298591614e-05, -2.2359192371368408e-05, -2.1083280444145203e-05, -1.9807368516921997e-05, -1.853145658969879e-05, -1.7255544662475586e-05, -1.597963273525238e-05, -1.4703720808029175e-05, -1.342780888080597e-05, -1.2151896953582764e-05, -1.0875985026359558e-05, -9.600073099136353e-06, -8.324161171913147e-06, -7.048249244689941e-06, -5.772337317466736e-06, -4.49642539024353e-06, -3.2205134630203247e-06, -1.944601535797119e-06, -6.686896085739136e-07, 6.07222318649292e-07, 1.8831342458724976e-06, 3.159046173095703e-06, 4.434958100318909e-06, 5.710870027542114e-06, 6.98678195476532e-06, 8.262693881988525e-06, 9.538605809211731e-06, 1.0814517736434937e-05, 1.2090429663658142e-05, 1.3366341590881348e-05, 1.4642253518104553e-05, 1.591816544532776e-05, 1.7194077372550964e-05, 1.846998929977417e-05, 1.9745901226997375e-05, 2.102181315422058e-05, 2.2297725081443787e-05, 2.3573637008666992e-05, 2.4849548935890198e-05, 2.6125460863113403e-05, 2.740137279033661e-05, 2.8677284717559814e-05, 2.995319664478302e-05, 3.1229108572006226e-05, 3.250502049922943e-05, 3.378093242645264e-05, 3.505684435367584e-05, 3.633275628089905e-05, 3.7608668208122253e-05, 3.888458013534546e-05, 4.0160492062568665e-05, 4.143640398979187e-05, 4.2712315917015076e-05, 4.398822784423828e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 3.0, 9.0, 8.0, 22.0, 9.0, 22.0, 34.0, 38.0, 54.0, 119.0, 388.0, 60.0, 45.0, 39.0, 23.0, 16.0, 16.0, 13.0, 9.0, 7.0, 6.0, 7.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3828277587890625e-05, -1.3423152267932892e-05, -1.3018026947975159e-05, -1.2612901628017426e-05, -1.2207776308059692e-05, -1.180265098810196e-05, -1.1397525668144226e-05, -1.0992400348186493e-05, -1.058727502822876e-05, -1.0182149708271027e-05, -9.777024388313293e-06, -9.37189906835556e-06, -8.966773748397827e-06, -8.561648428440094e-06, -8.15652310848236e-06, -7.751397788524628e-06, -7.3462724685668945e-06, -6.941147148609161e-06, -6.536021828651428e-06, -6.130896508693695e-06, -5.725771188735962e-06, -5.320645868778229e-06, -4.915520548820496e-06, -4.5103952288627625e-06, -4.105269908905029e-06, -3.700144588947296e-06, -3.295019268989563e-06, -2.88989394903183e-06, -2.4847686290740967e-06, -2.0796433091163635e-06, -1.6745179891586304e-06, -1.2693926692008972e-06, -8.642673492431641e-07, -4.591420292854309e-07, -5.4016709327697754e-08, 3.511086106300354e-07, 7.562339305877686e-07, 1.1613592505455017e-06, 1.5664845705032349e-06, 1.971609890460968e-06, 2.376735210418701e-06, 2.7818605303764343e-06, 3.1869858503341675e-06, 3.5921111702919006e-06, 3.997236490249634e-06, 4.402361810207367e-06, 4.8074871301651e-06, 5.212612450122833e-06, 5.617737770080566e-06, 6.0228630900382996e-06, 6.427988409996033e-06, 6.833113729953766e-06, 7.238239049911499e-06, 7.643364369869232e-06, 8.048489689826965e-06, 8.453615009784698e-06, 8.858740329742432e-06, 9.263865649700165e-06, 9.668990969657898e-06, 1.0074116289615631e-05, 1.0479241609573364e-05, 1.0884366929531097e-05, 1.128949224948883e-05, 1.1694617569446564e-05, 1.2099742889404297e-05]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 7.0, 4.0, 9.0, 8.0, 15.0, 22.0, 17.0, 22.0, 31.0, 46.0, 62.0, 80.0, 109.0, 104.0, 98.0, 85.0, 67.0, 41.0, 26.0, 27.0, 15.0, 26.0, 17.0, 12.0, 11.0, 8.0, 6.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.858188938465901e-05, -3.728336378117092e-05, -3.598483817768283e-05, -3.4686312574194744e-05, -3.3387786970706657e-05, -3.208926136721857e-05, -3.0790732125751674e-05, -2.949220834125299e-05, -2.8193682737764902e-05, -2.6895157134276815e-05, -2.5596631530788727e-05, -2.4298104108311236e-05, -2.2999578504823148e-05, -2.170105290133506e-05, -2.0402527297846973e-05, -1.9104001694358885e-05, -1.7805476090870798e-05, -1.650695048738271e-05, -1.5208424883894622e-05, -1.3909898370911833e-05, -1.2611372767423745e-05, -1.1312847163935658e-05, -1.0014320650952868e-05, -8.71579504746478e-06, -7.417269443976693e-06, -6.118743840488605e-06, -4.820217782253167e-06, -3.521691724017728e-06, -2.2231661205296405e-06, -9.246405170415528e-07, 3.738859959412366e-07, 1.6724115994293243e-06, 2.970940840896219e-06, 4.269466444384307e-06, 5.567992502619745e-06, 6.866518560855184e-06, 8.165044164343271e-06, 9.463569767831359e-06, 1.0762096280814148e-05, 1.2060621884302236e-05, 1.3359147487790324e-05, 1.4657673091278411e-05, 1.59561986947665e-05, 1.725472611724399e-05, 1.8553251720732078e-05, 1.9851777324220166e-05, 2.1150302927708253e-05, 2.244882853119634e-05, 2.374735413468443e-05, 2.5045879738172516e-05, 2.6344405341660604e-05, 2.764293094514869e-05, 2.894145654863678e-05, 3.0239982152124867e-05, 3.153851139359176e-05, 3.283703699707985e-05, 3.413556260056794e-05, 3.5434088204056025e-05, 3.673261380754411e-05, 3.80311394110322e-05, 3.932966501452029e-05, 4.0628190618008375e-05, 4.192671622149646e-05, 4.322524182498455e-05, 4.452376742847264e-05]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 14.0, 18.0, 16.0, 15.0, 11.0, 16.0, 18.0, 29.0, 27.0, 31.0, 38.0, 41.0, 38.0, 37.0, 37.0, 49.0, 36.0, 45.0, 54.0, 41.0, 38.0, 41.0, 43.0, 38.0, 31.0, 32.0, 34.0, 28.0, 21.0, 19.0, 8.0, 21.0, 4.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.628840047691483e-05, -2.534960185585078e-05, -2.4410803234786727e-05, -2.347200279473327e-05, -2.253320417366922e-05, -2.1594405552605167e-05, -2.0655606931541115e-05, -1.9716808310477063e-05, -1.877800968941301e-05, -1.783921106834896e-05, -1.6900412447284907e-05, -1.5961613826220855e-05, -1.50228133861674e-05, -1.4084014765103348e-05, -1.3145216144039296e-05, -1.2206417522975244e-05, -1.1267617082921788e-05, -1.0328818461857736e-05, -9.390018931298982e-06, -8.45122031023493e-06, -7.5124212344235275e-06, -6.573622158612125e-06, -5.634823537548073e-06, -4.69602446173667e-06, -3.757225385925267e-06, -2.818426310113864e-06, -1.8796274616761366e-06, -9.408286132384092e-07, -2.0295374270062894e-09, 9.367695383843966e-07, 1.8755681594484486e-06, 2.8143672352598514e-06, 3.7531644920818508e-06, 4.691963567893254e-06, 5.6307626437046565e-06, 6.5695612647687085e-06, 7.508360340580111e-06, 8.447159416391514e-06, 9.385958037455566e-06, 1.0324756658519618e-05, 1.1263556189078372e-05, 1.2202354810142424e-05, 1.3141154340701178e-05, 1.407995296176523e-05, 1.5018751582829282e-05, 1.5957550203893334e-05, 1.6896348824957386e-05, 1.783514926501084e-05, 1.8773947886074893e-05, 1.9712746507138945e-05, 2.0651545128202997e-05, 2.1590345568256453e-05, 2.2529144189320505e-05, 2.3467942810384557e-05, 2.440674143144861e-05, 2.534554005251266e-05, 2.6284338673576713e-05, 2.7223137294640765e-05, 2.8161935915704817e-05, 2.910073453676887e-05, 3.0039534976822324e-05, 3.097833541687578e-05, 3.1917130399961025e-05, 3.2855932659003884e-05, 3.3794731280067936e-05]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 14.0, 25.0, 31.0, 65.0, 121.0, 182.0, 232.0, 425.0, 629.0, 883.0, 1377.0, 2153.0, 3554.0, 5777.0, 9184.0, 15144.0, 26534.0, 44451.0, 88216.0, 191944.0, 535385.0, 1719538.0, 988165.0, 288242.0, 124036.0, 62714.0, 34412.0, 19101.0, 11844.0, 7478.0, 4439.0, 2913.0, 1855.0, 1045.0, 690.0, 453.0, 309.0, 223.0, 138.0, 104.0, 68.0, 46.0, 27.0, 23.0, 19.0, 20.0, 11.0, 15.0, 16.0, 7.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.0517578125e-05, -2.933107316493988e-05, -2.814456820487976e-05, -2.695806324481964e-05, -2.577155828475952e-05, -2.4585053324699402e-05, -2.3398548364639282e-05, -2.2212043404579163e-05, -2.1025538444519043e-05, -1.9839033484458923e-05, -1.8652528524398804e-05, -1.7466023564338684e-05, -1.6279518604278564e-05, -1.5093013644218445e-05, -1.3906508684158325e-05, -1.2720003724098206e-05, -1.1533498764038086e-05, -1.0346993803977966e-05, -9.160488843917847e-06, -7.973983883857727e-06, -6.787478923797607e-06, -5.600973963737488e-06, -4.414469003677368e-06, -3.2279640436172485e-06, -2.041459083557129e-06, -8.549541234970093e-07, 3.3155083656311035e-07, 1.51805579662323e-06, 2.7045607566833496e-06, 3.891065716743469e-06, 5.077570676803589e-06, 6.2640756368637085e-06, 7.450580596923828e-06, 8.637085556983948e-06, 9.823590517044067e-06, 1.1010095477104187e-05, 1.2196600437164307e-05, 1.3383105397224426e-05, 1.4569610357284546e-05, 1.5756115317344666e-05, 1.6942620277404785e-05, 1.8129125237464905e-05, 1.9315630197525024e-05, 2.0502135157585144e-05, 2.1688640117645264e-05, 2.2875145077705383e-05, 2.4061650037765503e-05, 2.5248154997825623e-05, 2.6434659957885742e-05, 2.7621164917945862e-05, 2.880766987800598e-05, 2.99941748380661e-05, 3.118067979812622e-05, 3.236718475818634e-05, 3.355368971824646e-05, 3.474019467830658e-05, 3.59266996383667e-05, 3.711320459842682e-05, 3.829970955848694e-05, 3.948621451854706e-05, 4.067271947860718e-05, 4.18592244386673e-05, 4.304572939872742e-05, 4.423223435878754e-05, 4.5418739318847656e-05]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 13.0, 16.0, 12.0, 14.0, 14.0, 18.0, 23.0, 21.0, 37.0, 41.0, 33.0, 52.0, 51.0, 49.0, 44.0, 44.0, 38.0, 53.0, 46.0, 39.0, 39.0, 51.0, 38.0, 38.0, 43.0, 23.0, 30.0, 21.0, 12.0, 14.0, 11.0, 7.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5854835510253906e-05, -1.5251338481903076e-05, -1.4647841453552246e-05, -1.4044344425201416e-05, -1.3440847396850586e-05, -1.2837350368499756e-05, -1.2233853340148926e-05, -1.1630356311798096e-05, -1.1026859283447266e-05, -1.0423362255096436e-05, -9.819865226745605e-06, -9.216368198394775e-06, -8.612871170043945e-06, -8.009374141693115e-06, -7.405877113342285e-06, -6.802380084991455e-06, -6.198883056640625e-06, -5.595386028289795e-06, -4.991888999938965e-06, -4.388391971588135e-06, -3.7848949432373047e-06, -3.1813979148864746e-06, -2.5779008865356445e-06, -1.9744038581848145e-06, -1.3709068298339844e-06, -7.674098014831543e-07, -1.6391277313232422e-07, 4.3958425521850586e-07, 1.043081283569336e-06, 1.646578311920166e-06, 2.250075340270996e-06, 2.853572368621826e-06, 3.4570693969726562e-06, 4.060566425323486e-06, 4.664063453674316e-06, 5.2675604820251465e-06, 5.8710575103759766e-06, 6.474554538726807e-06, 7.078051567077637e-06, 7.681548595428467e-06, 8.285045623779297e-06, 8.888542652130127e-06, 9.492039680480957e-06, 1.0095536708831787e-05, 1.0699033737182617e-05, 1.1302530765533447e-05, 1.1906027793884277e-05, 1.2509524822235107e-05, 1.3113021850585938e-05, 1.3716518878936768e-05, 1.4320015907287598e-05, 1.4923512935638428e-05, 1.5527009963989258e-05, 1.6130506992340088e-05, 1.6734004020690918e-05, 1.7337501049041748e-05, 1.7940998077392578e-05, 1.8544495105743408e-05, 1.9147992134094238e-05, 1.975148916244507e-05, 2.03549861907959e-05, 2.095848321914673e-05, 2.156198024749756e-05, 2.216547727584839e-05, 2.276897430419922e-05]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 1.0, 0.0, 4.0, 5.0, 6.0, 18.0, 23.0, 35.0, 52.0, 71.0, 113.0, 188.0, 251.0, 353.0, 492.0, 733.0, 1033.0, 1804.0, 2688.0, 4237.0, 7439.0, 11706.0, 19524.0, 35878.0, 61995.0, 117496.0, 247413.0, 683074.0, 1573772.0, 806578.0, 317840.0, 135674.0, 69329.0, 37657.0, 22581.0, 12629.0, 7637.0, 5002.0, 2988.0, 2068.0, 1403.0, 851.0, 545.0, 367.0, 247.0, 163.0, 96.0, 55.0, 54.0, 37.0, 24.0, 30.0, 18.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.069639205932617e-05, -2.9725022614002228e-05, -2.8753653168678284e-05, -2.778228372335434e-05, -2.6810914278030396e-05, -2.583954483270645e-05, -2.4868175387382507e-05, -2.3896805942058563e-05, -2.292543649673462e-05, -2.1954067051410675e-05, -2.098269760608673e-05, -2.0011328160762787e-05, -1.9039958715438843e-05, -1.80685892701149e-05, -1.7097219824790955e-05, -1.612585037946701e-05, -1.5154480934143066e-05, -1.4183111488819122e-05, -1.3211742043495178e-05, -1.2240372598171234e-05, -1.126900315284729e-05, -1.0297633707523346e-05, -9.326264262199402e-06, -8.354894816875458e-06, -7.383525371551514e-06, -6.41215592622757e-06, -5.4407864809036255e-06, -4.469417035579681e-06, -3.4980475902557373e-06, -2.5266781449317932e-06, -1.5553086996078491e-06, -5.83939254283905e-07, 3.8743019104003906e-07, 1.3587996363639832e-06, 2.3301690816879272e-06, 3.3015385270118713e-06, 4.2729079723358154e-06, 5.2442774176597595e-06, 6.215646862983704e-06, 7.187016308307648e-06, 8.158385753631592e-06, 9.129755198955536e-06, 1.010112464427948e-05, 1.1072494089603424e-05, 1.2043863534927368e-05, 1.3015232980251312e-05, 1.3986602425575256e-05, 1.49579718708992e-05, 1.5929341316223145e-05, 1.690071076154709e-05, 1.7872080206871033e-05, 1.8843449652194977e-05, 1.981481909751892e-05, 2.0786188542842865e-05, 2.175755798816681e-05, 2.2728927433490753e-05, 2.3700296878814697e-05, 2.467166632413864e-05, 2.5643035769462585e-05, 2.661440521478653e-05, 2.7585774660110474e-05, 2.8557144105434418e-05, 2.9528513550758362e-05, 3.0499882996082306e-05, 3.147125244140625e-05]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 12.0, 6.0, 13.0, 19.0, 18.0, 16.0, 44.0, 35.0, 35.0, 65.0, 67.0, 81.0, 117.0, 125.0, 156.0, 196.0, 211.0, 218.0, 319.0, 295.0, 263.0, 276.0, 285.0, 181.0, 209.0, 157.0, 120.0, 118.0, 96.0, 48.0, 58.0, 37.0, 18.0, 34.0, 29.0, 10.0, 13.0, 14.0, 8.0, 5.0, 12.0, 4.0, 8.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-9.179115295410156e-06, -8.900649845600128e-06, -8.6221843957901e-06, -8.343718945980072e-06, -8.065253496170044e-06, -7.786788046360016e-06, -7.508322596549988e-06, -7.22985714673996e-06, -6.951391696929932e-06, -6.6729262471199036e-06, -6.3944607973098755e-06, -6.115995347499847e-06, -5.837529897689819e-06, -5.559064447879791e-06, -5.280598998069763e-06, -5.002133548259735e-06, -4.723668098449707e-06, -4.445202648639679e-06, -4.166737198829651e-06, -3.888271749019623e-06, -3.6098062992095947e-06, -3.3313408493995667e-06, -3.0528753995895386e-06, -2.7744099497795105e-06, -2.4959444999694824e-06, -2.2174790501594543e-06, -1.9390136003494263e-06, -1.6605481505393982e-06, -1.3820827007293701e-06, -1.103617250919342e-06, -8.25151801109314e-07, -5.466863512992859e-07, -2.682209014892578e-07, 1.0244548320770264e-08, 2.8870999813079834e-07, 5.671754479408264e-07, 8.456408977508545e-07, 1.1241063475608826e-06, 1.4025717973709106e-06, 1.6810372471809387e-06, 1.959502696990967e-06, 2.237968146800995e-06, 2.516433596611023e-06, 2.794899046421051e-06, 3.073364496231079e-06, 3.351829946041107e-06, 3.6302953958511353e-06, 3.908760845661163e-06, 4.187226295471191e-06, 4.4656917452812195e-06, 4.7441571950912476e-06, 5.022622644901276e-06, 5.301088094711304e-06, 5.579553544521332e-06, 5.85801899433136e-06, 6.136484444141388e-06, 6.414949893951416e-06, 6.693415343761444e-06, 6.971880793571472e-06, 7.2503462433815e-06, 7.528811693191528e-06, 7.807277143001556e-06, 8.085742592811584e-06, 8.364208042621613e-06, 8.64267349243164e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 5.0, 10.0, 7.0, 13.0, 15.0, 16.0, 28.0, 27.0, 41.0, 61.0, 85.0, 78.0, 119.0, 93.0, 93.0, 64.0, 48.0, 43.0, 22.0, 32.0, 22.0, 19.0, 16.0, 13.0, 9.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4628623577882536e-05, -2.3752902052365243e-05, -2.2877178707858548e-05, -2.2001457182341255e-05, -2.1125735656823963e-05, -2.0250012312317267e-05, -1.9374290786799975e-05, -1.8498569261282682e-05, -1.7622845916775987e-05, -1.6747124391258694e-05, -1.5871401046752e-05, -1.4995679521234706e-05, -1.4119957995717414e-05, -1.324423556070542e-05, -1.2368513125693426e-05, -1.1492791600176133e-05, -1.0617070074658841e-05, -9.741347639646847e-06, -8.865626114129554e-06, -7.98990367911756e-06, -7.114181698852917e-06, -6.238459718588274e-06, -5.36273728357628e-06, -4.487015303311637e-06, -3.6112933230469935e-06, -2.7355713427823503e-06, -1.8598491351440316e-06, -9.84126927505713e-07, -1.0840494724106975e-07, 7.673170330235735e-07, 1.6430394680355676e-06, 2.5187614483002108e-06, 3.3944852475542575e-06, 4.270207227818901e-06, 5.145929208083544e-06, 6.021651643095538e-06, 6.897373623360181e-06, 7.773095603624824e-06, 8.648818038636819e-06, 9.524539564154111e-06, 1.0400261999166105e-05, 1.1275984434178099e-05, 1.2151705959695391e-05, 1.3027428394707385e-05, 1.390315082971938e-05, 1.4778872355236672e-05, 1.5654593880753964e-05, 1.653031722526066e-05, 1.7406038750777952e-05, 1.8281760276295245e-05, 1.915748362080194e-05, 2.0033205146319233e-05, 2.0908926671836525e-05, 2.178465001634322e-05, 2.2660371541860513e-05, 2.3536093067377806e-05, 2.44118164118845e-05, 2.5287537937401794e-05, 2.616326128190849e-05, 2.7038982807425782e-05, 2.7914704332943074e-05, 2.8790425858460367e-05, 2.9666149202967063e-05, 3.054187254747376e-05, 3.141759225400165e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 9.0, 4.0, 7.0, 4.0, 12.0, 16.0, 12.0, 15.0, 28.0, 11.0, 26.0, 21.0, 26.0, 34.0, 33.0, 34.0, 45.0, 27.0, 39.0, 40.0, 33.0, 43.0, 47.0, 36.0, 37.0, 35.0, 31.0, 34.0, 43.0, 32.0, 28.0, 27.0, 26.0, 21.0, 18.0, 17.0, 8.0, 8.0, 10.0, 6.0, 9.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6537234841962345e-05, -1.5993147826520726e-05, -1.544906263006851e-05, -1.4904975614626892e-05, -1.4360889508679975e-05, -1.3816803402733058e-05, -1.3272716387291439e-05, -1.2728630281344522e-05, -1.2184544175397605e-05, -1.1640458069450688e-05, -1.109637196350377e-05, -1.0552284948062152e-05, -1.0008198842115235e-05, -9.464112736168317e-06, -8.920025720726699e-06, -8.375939614779782e-06, -7.831853508832864e-06, -7.287767402885947e-06, -6.743680842191679e-06, -6.1995942814974114e-06, -5.655508175550494e-06, -5.111422069603577e-06, -4.567335508909309e-06, -4.023248948215041e-06, -3.4791628422681242e-06, -2.9350765089475317e-06, -2.390990175626939e-06, -1.8469038423063466e-06, -1.302817508985754e-06, -7.587311756651616e-07, -2.1464484234456904e-07, 3.294414909760235e-07, 8.735296432860196e-07, 1.417615976606612e-06, 1.9617023099272046e-06, 2.505788643247797e-06, 3.0498749765683897e-06, 3.5939613098889822e-06, 4.138047643209575e-06, 4.682134203903843e-06, 5.22622030985076e-06, 5.770306415797677e-06, 6.314392976491945e-06, 6.858479537186213e-06, 7.40256564313313e-06, 7.946651749080047e-06, 8.490738764521666e-06, 9.034824870468583e-06, 9.5789109764155e-06, 1.0122997082362417e-05, 1.0667083188309334e-05, 1.1211170203750953e-05, 1.175525630969787e-05, 1.2299342415644787e-05, 1.2843429431086406e-05, 1.3387515537033323e-05, 1.393160164298024e-05, 1.4475687748927157e-05, 1.5019773854874074e-05, 1.5563860870315693e-05, 1.6107947885757312e-05, 1.6652033082209527e-05, 1.7196120097651146e-05, 1.774020529410336e-05, 1.828429230954498e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 19.0, 13.0, 38.0, 54.0, 86.0, 111.0, 180.0, 252.0, 428.0, 659.0, 875.0, 1649.0, 2378.0, 4022.0, 5888.0, 10667.0, 16235.0, 29081.0, 46631.0, 86411.0, 136760.0, 208006.0, 205043.0, 116602.0, 74123.0, 39673.0, 25075.0, 13906.0, 9138.0, 5211.0, 3456.0, 2007.0, 1362.0, 944.0, 507.0, 411.0, 234.0, 154.0, 93.0, 50.0, 42.0, 24.0, 16.0, 15.0, 9.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.6345252990722656e-05, -2.554338425397873e-05, -2.4741515517234802e-05, -2.3939646780490875e-05, -2.3137778043746948e-05, -2.233590930700302e-05, -2.1534040570259094e-05, -2.0732171833515167e-05, -1.993030309677124e-05, -1.9128434360027313e-05, -1.8326565623283386e-05, -1.752469688653946e-05, -1.6722828149795532e-05, -1.5920959413051605e-05, -1.5119090676307678e-05, -1.4317221939563751e-05, -1.3515353202819824e-05, -1.2713484466075897e-05, -1.191161572933197e-05, -1.1109746992588043e-05, -1.0307878255844116e-05, -9.50600951910019e-06, -8.704140782356262e-06, -7.902272045612335e-06, -7.100403308868408e-06, -6.298534572124481e-06, -5.496665835380554e-06, -4.694797098636627e-06, -3.8929283618927e-06, -3.091059625148773e-06, -2.289190888404846e-06, -1.4873221516609192e-06, -6.854534149169922e-07, 1.1641532182693481e-07, 9.182840585708618e-07, 1.7201527953147888e-06, 2.522021532058716e-06, 3.323890268802643e-06, 4.12575900554657e-06, 4.927627742290497e-06, 5.729496479034424e-06, 6.531365215778351e-06, 7.333233952522278e-06, 8.135102689266205e-06, 8.936971426010132e-06, 9.738840162754059e-06, 1.0540708899497986e-05, 1.1342577636241913e-05, 1.214444637298584e-05, 1.2946315109729767e-05, 1.3748183846473694e-05, 1.4550052583217621e-05, 1.5351921319961548e-05, 1.6153790056705475e-05, 1.6955658793449402e-05, 1.775752753019333e-05, 1.8559396266937256e-05, 1.9361265003681183e-05, 2.016313374042511e-05, 2.0965002477169037e-05, 2.1766871213912964e-05, 2.256873995065689e-05, 2.3370608687400818e-05, 2.4172477424144745e-05, 2.4974346160888672e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 8.0, 4.0, 4.0, 2.0, 5.0, 8.0, 9.0, 12.0, 19.0, 13.0, 18.0, 18.0, 22.0, 28.0, 32.0, 20.0, 29.0, 25.0, 35.0, 23.0, 40.0, 54.0, 42.0, 42.0, 45.0, 41.0, 31.0, 34.0, 40.0, 36.0, 24.0, 30.0, 25.0, 25.0, 28.0, 28.0, 24.0, 13.0, 7.0, 11.0, 8.0, 14.0, 8.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-1.5079975128173828e-05, -1.4619901776313782e-05, -1.4159828424453735e-05, -1.3699755072593689e-05, -1.3239681720733643e-05, -1.2779608368873596e-05, -1.231953501701355e-05, -1.1859461665153503e-05, -1.1399388313293457e-05, -1.093931496143341e-05, -1.0479241609573364e-05, -1.0019168257713318e-05, -9.559094905853271e-06, -9.099021553993225e-06, -8.638948202133179e-06, -8.178874850273132e-06, -7.718801498413086e-06, -7.2587281465530396e-06, -6.798654794692993e-06, -6.338581442832947e-06, -5.8785080909729e-06, -5.418434739112854e-06, -4.958361387252808e-06, -4.498288035392761e-06, -4.038214683532715e-06, -3.5781413316726685e-06, -3.118067979812622e-06, -2.6579946279525757e-06, -2.1979212760925293e-06, -1.737847924232483e-06, -1.2777745723724365e-06, -8.177012205123901e-07, -3.5762786865234375e-07, 1.0244548320770264e-07, 5.62518835067749e-07, 1.0225921869277954e-06, 1.4826655387878418e-06, 1.942738890647888e-06, 2.4028122425079346e-06, 2.862885594367981e-06, 3.3229589462280273e-06, 3.7830322980880737e-06, 4.24310564994812e-06, 4.7031790018081665e-06, 5.163252353668213e-06, 5.623325705528259e-06, 6.083399057388306e-06, 6.543472409248352e-06, 7.0035457611083984e-06, 7.463619112968445e-06, 7.923692464828491e-06, 8.383765816688538e-06, 8.843839168548584e-06, 9.30391252040863e-06, 9.763985872268677e-06, 1.0224059224128723e-05, 1.068413257598877e-05, 1.1144205927848816e-05, 1.1604279279708862e-05, 1.2064352631568909e-05, 1.2524425983428955e-05, 1.2984499335289001e-05, 1.3444572687149048e-05, 1.3904646039009094e-05, 1.436471939086914e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 7.0, 4.0, 7.0, 10.0, 15.0, 26.0, 34.0, 45.0, 69.0, 121.0, 144.0, 211.0, 390.0, 546.0, 876.0, 1385.0, 2306.0, 3601.0, 6266.0, 11513.0, 23713.0, 61198.0, 249049.0, 509453.0, 106345.0, 35271.0, 15658.0, 7814.0, 4710.0, 2874.0, 1744.0, 1117.0, 721.0, 449.0, 279.0, 175.0, 134.0, 94.0, 56.0, 39.0, 28.0, 22.0, 15.0, 5.0, 8.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.236532211303711e-05, -3.117695450782776e-05, -2.9988586902618408e-05, -2.8800219297409058e-05, -2.7611851692199707e-05, -2.6423484086990356e-05, -2.5235116481781006e-05, -2.4046748876571655e-05, -2.2858381271362305e-05, -2.1670013666152954e-05, -2.0481646060943604e-05, -1.9293278455734253e-05, -1.8104910850524902e-05, -1.6916543245315552e-05, -1.57281756401062e-05, -1.453980803489685e-05, -1.33514404296875e-05, -1.216307282447815e-05, -1.0974705219268799e-05, -9.786337614059448e-06, -8.597970008850098e-06, -7.409602403640747e-06, -6.2212347984313965e-06, -5.032867193222046e-06, -3.844499588012695e-06, -2.6561319828033447e-06, -1.4677643775939941e-06, -2.7939677238464355e-07, 9.08970832824707e-07, 2.0973384380340576e-06, 3.285706043243408e-06, 4.474073648452759e-06, 5.662441253662109e-06, 6.85080885887146e-06, 8.03917646408081e-06, 9.227544069290161e-06, 1.0415911674499512e-05, 1.1604279279708862e-05, 1.2792646884918213e-05, 1.3981014490127563e-05, 1.5169382095336914e-05, 1.6357749700546265e-05, 1.7546117305755615e-05, 1.8734484910964966e-05, 1.9922852516174316e-05, 2.1111220121383667e-05, 2.2299587726593018e-05, 2.3487955331802368e-05, 2.467632293701172e-05, 2.586469054222107e-05, 2.705305814743042e-05, 2.824142575263977e-05, 2.942979335784912e-05, 3.061816096305847e-05, 3.180652856826782e-05, 3.299489617347717e-05, 3.4183263778686523e-05, 3.5371631383895874e-05, 3.6559998989105225e-05, 3.7748366594314575e-05, 3.8936734199523926e-05, 4.0125101804733276e-05, 4.131346940994263e-05, 4.250183701515198e-05, 4.369020462036133e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 2.0, 8.0, 4.0, 2.0, 12.0, 9.0, 10.0, 11.0, 11.0, 26.0, 17.0, 20.0, 22.0, 25.0, 26.0, 47.0, 36.0, 42.0, 43.0, 69.0, 53.0, 79.0, 41.0, 47.0, 34.0, 36.0, 36.0, 30.0, 27.0, 19.0, 19.0, 16.0, 20.0, 10.0, 23.0, 10.0, 14.0, 4.0, 10.0, 6.0, 2.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.046627044677734e-06, -7.776543498039246e-06, -7.506459951400757e-06, -7.236376404762268e-06, -6.966292858123779e-06, -6.6962093114852905e-06, -6.426125764846802e-06, -6.156042218208313e-06, -5.885958671569824e-06, -5.6158751249313354e-06, -5.345791578292847e-06, -5.075708031654358e-06, -4.805624485015869e-06, -4.53554093837738e-06, -4.265457391738892e-06, -3.995373845100403e-06, -3.725290298461914e-06, -3.4552067518234253e-06, -3.1851232051849365e-06, -2.9150396585464478e-06, -2.644956111907959e-06, -2.3748725652694702e-06, -2.1047890186309814e-06, -1.8347054719924927e-06, -1.564621925354004e-06, -1.2945383787155151e-06, -1.0244548320770264e-06, -7.543712854385376e-07, -4.842877388000488e-07, -2.1420419216156006e-07, 5.587935447692871e-08, 3.259629011154175e-07, 5.960464477539062e-07, 8.66129994392395e-07, 1.1362135410308838e-06, 1.4062970876693726e-06, 1.6763806343078613e-06, 1.94646418094635e-06, 2.216547727584839e-06, 2.4866312742233276e-06, 2.7567148208618164e-06, 3.026798367500305e-06, 3.296881914138794e-06, 3.5669654607772827e-06, 3.8370490074157715e-06, 4.10713255405426e-06, 4.377216100692749e-06, 4.647299647331238e-06, 4.9173831939697266e-06, 5.187466740608215e-06, 5.457550287246704e-06, 5.727633833885193e-06, 5.997717380523682e-06, 6.26780092716217e-06, 6.537884473800659e-06, 6.807968020439148e-06, 7.078051567077637e-06, 7.3481351137161255e-06, 7.618218660354614e-06, 7.888302206993103e-06, 8.158385753631592e-06, 8.42846930027008e-06, 8.69855284690857e-06, 8.968636393547058e-06, 9.238719940185547e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 6.0, 6.0, 7.0, 8.0, 9.0, 15.0, 20.0, 36.0, 38.0, 68.0, 56.0, 119.0, 139.0, 159.0, 290.0, 301.0, 480.0, 514.0, 989.0, 1202.0, 2366.0, 3141.0, 7388.0, 13032.0, 44013.0, 143998.0, 672857.0, 106734.0, 24437.0, 12489.0, 4639.0, 3196.0, 1586.0, 1323.0, 792.0, 580.0, 335.0, 353.0, 208.0, 187.0, 128.0, 99.0, 57.0, 43.0, 35.0, 23.0, 21.0, 17.0, 10.0, 6.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.344650268554688e-06, -8.07829201221466e-06, -7.811933755874634e-06, -7.545575499534607e-06, -7.27921724319458e-06, -7.012858986854553e-06, -6.746500730514526e-06, -6.4801424741744995e-06, -6.213784217834473e-06, -5.947425961494446e-06, -5.681067705154419e-06, -5.414709448814392e-06, -5.148351192474365e-06, -4.881992936134338e-06, -4.6156346797943115e-06, -4.349276423454285e-06, -4.082918167114258e-06, -3.816559910774231e-06, -3.550201654434204e-06, -3.2838433980941772e-06, -3.0174851417541504e-06, -2.7511268854141235e-06, -2.4847686290740967e-06, -2.21841037273407e-06, -1.952052116394043e-06, -1.6856938600540161e-06, -1.4193356037139893e-06, -1.1529773473739624e-06, -8.866190910339355e-07, -6.202608346939087e-07, -3.5390257835388184e-07, -8.754432201385498e-08, 1.7881393432617188e-07, 4.4517219066619873e-07, 7.115304470062256e-07, 9.778887033462524e-07, 1.2442469596862793e-06, 1.5106052160263062e-06, 1.776963472366333e-06, 2.04332172870636e-06, 2.3096799850463867e-06, 2.5760382413864136e-06, 2.8423964977264404e-06, 3.1087547540664673e-06, 3.375113010406494e-06, 3.641471266746521e-06, 3.907829523086548e-06, 4.174187779426575e-06, 4.4405460357666016e-06, 4.706904292106628e-06, 4.973262548446655e-06, 5.239620804786682e-06, 5.505979061126709e-06, 5.772337317466736e-06, 6.038695573806763e-06, 6.3050538301467896e-06, 6.571412086486816e-06, 6.837770342826843e-06, 7.10412859916687e-06, 7.370486855506897e-06, 7.636845111846924e-06, 7.90320336818695e-06, 8.169561624526978e-06, 8.435919880867004e-06, 8.702278137207031e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 4.0, 6.0, 0.0, 7.0, 0.0, 10.0, 0.0, 11.0, 0.0, 19.0, 0.0, 40.0, 58.0, 0.0, 92.0, 0.0, 109.0, 0.0, 264.0, 0.0, 128.0, 0.0, 96.0, 70.0, 0.0, 32.0, 0.0, 20.0, 0.0, 12.0, 0.0, 10.0, 0.0, 8.0, 8.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2191012501716614e-06, -1.1865049600601196e-06, -1.1539086699485779e-06, -1.1213123798370361e-06, -1.0887160897254944e-06, -1.0561197996139526e-06, -1.0235235095024109e-06, -9.909272193908691e-07, -9.583309292793274e-07, -9.257346391677856e-07, -8.931383490562439e-07, -8.605420589447021e-07, -8.279457688331604e-07, -7.953494787216187e-07, -7.627531886100769e-07, -7.301568984985352e-07, -6.975606083869934e-07, -6.649643182754517e-07, -6.323680281639099e-07, -5.997717380523682e-07, -5.671754479408264e-07, -5.345791578292847e-07, -5.019828677177429e-07, -4.6938657760620117e-07, -4.367902874946594e-07, -4.041939973831177e-07, -3.7159770727157593e-07, -3.390014171600342e-07, -3.0640512704849243e-07, -2.738088369369507e-07, -2.4121254682540894e-07, -2.086162567138672e-07, -1.7601996660232544e-07, -1.434236764907837e-07, -1.1082738637924194e-07, -7.82310962677002e-08, -4.563480615615845e-08, -1.30385160446167e-08, 1.955777406692505e-08, 5.21540641784668e-08, 8.475035429000854e-08, 1.1734664440155029e-07, 1.4994293451309204e-07, 1.825392246246338e-07, 2.1513551473617554e-07, 2.477318048477173e-07, 2.8032809495925903e-07, 3.129243850708008e-07, 3.4552067518234253e-07, 3.781169652938843e-07, 4.10713255405426e-07, 4.4330954551696777e-07, 4.759058356285095e-07, 5.085021257400513e-07, 5.41098415851593e-07, 5.736947059631348e-07, 6.062909960746765e-07, 6.388872861862183e-07, 6.7148357629776e-07, 7.040798664093018e-07, 7.366761565208435e-07, 7.692724466323853e-07, 8.01868736743927e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 9.0, 13.0, 23.0, 23.0, 37.0, 52.0, 63.0, 83.0, 117.0, 165.0, 204.0, 350.0, 536.0, 1365.0, 2131.0, 4000.0, 8129.0, 17927.0, 45624.0, 159385.0, 567741.0, 180381.0, 32851.0, 13616.0, 6306.0, 3191.0, 1650.0, 911.0, 543.0, 428.0, 181.0, 151.0, 90.0, 70.0, 50.0, 40.0, 34.0, 37.0, 14.0, 10.0, 12.0, 3.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.841255187988281e-06, -5.6549906730651855e-06, -5.46872615814209e-06, -5.282461643218994e-06, -5.0961971282958984e-06, -4.909932613372803e-06, -4.723668098449707e-06, -4.537403583526611e-06, -4.351139068603516e-06, -4.16487455368042e-06, -3.978610038757324e-06, -3.7923455238342285e-06, -3.606081008911133e-06, -3.419816493988037e-06, -3.2335519790649414e-06, -3.0472874641418457e-06, -2.86102294921875e-06, -2.6747584342956543e-06, -2.4884939193725586e-06, -2.302229404449463e-06, -2.115964889526367e-06, -1.9297003746032715e-06, -1.7434358596801758e-06, -1.55717134475708e-06, -1.3709068298339844e-06, -1.1846423149108887e-06, -9.98377799987793e-07, -8.121132850646973e-07, -6.258487701416016e-07, -4.3958425521850586e-07, -2.5331974029541016e-07, -6.705522537231445e-08, 1.1920928955078125e-07, 3.0547380447387695e-07, 4.917383193969727e-07, 6.780028343200684e-07, 8.642673492431641e-07, 1.0505318641662598e-06, 1.2367963790893555e-06, 1.4230608940124512e-06, 1.6093254089355469e-06, 1.7955899238586426e-06, 1.9818544387817383e-06, 2.168118953704834e-06, 2.3543834686279297e-06, 2.5406479835510254e-06, 2.726912498474121e-06, 2.913177013397217e-06, 3.0994415283203125e-06, 3.285706043243408e-06, 3.471970558166504e-06, 3.6582350730895996e-06, 3.844499588012695e-06, 4.030764102935791e-06, 4.217028617858887e-06, 4.403293132781982e-06, 4.589557647705078e-06, 4.775822162628174e-06, 4.9620866775512695e-06, 5.148351192474365e-06, 5.334615707397461e-06, 5.520880222320557e-06, 5.707144737243652e-06, 5.893409252166748e-06, 6.079673767089844e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 4.0, 16.0, 0.0, 20.0, 29.0, 51.0, 0.0, 62.0, 90.0, 138.0, 0.0, 163.0, 129.0, 0.0, 99.0, 69.0, 50.0, 0.0, 25.0, 26.0, 15.0, 0.0, 5.0, 3.0, 2.0, 0.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-06, -1.3271346688270569e-06, -1.2833625078201294e-06, -1.239590346813202e-06, -1.1958181858062744e-06, -1.152046024799347e-06, -1.1082738637924194e-06, -1.064501702785492e-06, -1.0207295417785645e-06, -9.76957380771637e-07, -9.331852197647095e-07, -8.89413058757782e-07, -8.456408977508545e-07, -8.01868736743927e-07, -7.580965757369995e-07, -7.14324414730072e-07, -6.705522537231445e-07, -6.26780092716217e-07, -5.830079317092896e-07, -5.392357707023621e-07, -4.954636096954346e-07, -4.516914486885071e-07, -4.079192876815796e-07, -3.641471266746521e-07, -3.203749656677246e-07, -2.766028046607971e-07, -2.3283064365386963e-07, -1.8905848264694214e-07, -1.4528632164001465e-07, -1.0151416063308716e-07, -5.774199962615967e-08, -1.3969838619232178e-08, 2.9802322387695312e-08, 7.35744833946228e-08, 1.1734664440155029e-07, 1.6111880540847778e-07, 2.0489096641540527e-07, 2.4866312742233276e-07, 2.9243528842926025e-07, 3.3620744943618774e-07, 3.7997961044311523e-07, 4.237517714500427e-07, 4.675239324569702e-07, 5.112960934638977e-07, 5.550682544708252e-07, 5.988404154777527e-07, 6.426125764846802e-07, 6.863847374916077e-07, 7.301568984985352e-07, 7.739290595054626e-07, 8.177012205123901e-07, 8.614733815193176e-07, 9.052455425262451e-07, 9.490177035331726e-07, 9.927898645401e-07, 1.0365620255470276e-06, 1.080334186553955e-06, 1.1241063475608826e-06, 1.16787850856781e-06, 1.2116506695747375e-06, 1.255422830581665e-06, 1.2991949915885925e-06, 1.34296715259552e-06, 1.3867393136024475e-06, 1.430511474609375e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 6.0, 5.0, 6.0, 8.0, 6.0, 17.0, 15.0, 19.0, 27.0, 31.0, 49.0, 59.0, 98.0, 117.0, 119.0, 103.0, 68.0, 57.0, 43.0, 40.0, 19.0, 21.0, 16.0, 13.0, 14.0, 12.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.040502477029804e-05, -1.960353802132886e-05, -1.8802051272359677e-05, -1.8000564523390494e-05, -1.7199079593410715e-05, -1.6397592844441533e-05, -1.559610609547235e-05, -1.4794619346503168e-05, -1.3993132597533986e-05, -1.3191645848564804e-05, -1.2390159099595621e-05, -1.158867326012114e-05, -1.0787186511151958e-05, -9.985699762182776e-06, -9.184213922708295e-06, -8.382727173739113e-06, -7.5812404247699305e-06, -6.779753675800748e-06, -5.978267381578917e-06, -5.176781087357085e-06, -4.375294338387903e-06, -3.5738075894187205e-06, -2.772321295196889e-06, -1.9708350009750575e-06, -1.1693482520058751e-06, -3.678617304103682e-07, 4.3362479118513875e-07, 1.2351113127806457e-06, 2.0365978343761526e-06, 2.838084583345335e-06, 3.6395708775671665e-06, 4.441057171788998e-06, 5.242542101768777e-06, 6.044028850737959e-06, 6.845515144959791e-06, 7.647001439181622e-06, 8.448488188150804e-06, 9.249974937119987e-06, 1.0051460776594467e-05, 1.085294752556365e-05, 1.1654434274532832e-05, 1.2455921023502015e-05, 1.3257407772471197e-05, 1.4058893611945678e-05, 1.486038036091486e-05, 1.566186620038934e-05, 1.6463352949358523e-05, 1.7264839698327705e-05, 1.8066326447296888e-05, 1.886781319626607e-05, 1.9669299945235252e-05, 2.0470786694204435e-05, 2.1272273443173617e-05, 2.20737601921428e-05, 2.287524512212258e-05, 2.367673187109176e-05, 2.4478218620060943e-05, 2.5279705369030125e-05, 2.6081192117999308e-05, 2.688267886696849e-05, 2.768416379694827e-05, 2.848565054591745e-05, 2.9287137294886634e-05, 3.0088624043855816e-05, 3.0890110792825e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 8.0, 4.0, 6.0, 8.0, 4.0, 9.0, 16.0, 10.0, 18.0, 17.0, 23.0, 19.0, 19.0, 25.0, 39.0, 31.0, 29.0, 38.0, 37.0, 29.0, 45.0, 41.0, 36.0, 42.0, 43.0, 36.0, 33.0, 29.0, 43.0, 27.0, 32.0, 31.0, 31.0, 22.0, 32.0, 14.0, 21.0, 12.0, 7.0, 7.0, 8.0, 10.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3696160749532282e-05, -1.3234711332188454e-05, -1.2773261914844625e-05, -1.2311812497500796e-05, -1.1850363080156967e-05, -1.1388913662813138e-05, -1.092746424546931e-05, -1.0466013918630779e-05, -1.0004565410781652e-05, -9.543115993437823e-06, -9.081666576093994e-06, -8.620217158750165e-06, -8.158767741406336e-06, -7.697318324062508e-06, -7.235868451971328e-06, -6.774419034627499e-06, -6.312969162536319e-06, -5.8515197451924905e-06, -5.390070327848662e-06, -4.928620910504833e-06, -4.467171493161004e-06, -4.005722075817175e-06, -3.5442722037259955e-06, -3.0828227863821667e-06, -2.621373369038338e-06, -2.159923951694509e-06, -1.6984744206638425e-06, -1.237024889633176e-06, -7.755754722893471e-07, -3.1412605494551826e-07, 1.47323589771986e-07, 6.087730071158148e-07, 1.0702224244596437e-06, 1.5316718418034725e-06, 1.9931212591473013e-06, 2.4545709038648056e-06, 2.9160203212086344e-06, 3.3774697385524632e-06, 3.8389193832699675e-06, 4.300368800613796e-06, 4.761818217957625e-06, 5.223267635301454e-06, 5.684717052645283e-06, 6.1461669247364625e-06, 6.607616342080291e-06, 7.06906575942412e-06, 7.530515176767949e-06, 7.991964594111778e-06, 8.453414011455607e-06, 8.914863428799435e-06, 9.376312846143264e-06, 9.837762263487093e-06, 1.0299211680830922e-05, 1.076066109817475e-05, 1.1222111425013281e-05, 1.1683559932862408e-05, 1.2145010259700939e-05, 1.2606459677044768e-05, 1.3067909094388597e-05, 1.3529358511732426e-05, 1.3990807929076254e-05, 1.4452257346420083e-05, 1.4913706763763912e-05, 1.5375157090602443e-05, 1.583660559845157e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 1.0, 6.0, 7.0, 10.0, 14.0, 16.0, 32.0, 45.0, 55.0, 88.0, 117.0, 157.0, 252.0, 373.0, 507.0, 784.0, 1073.0, 1700.0, 2671.0, 3771.0, 6207.0, 9388.0, 16496.0, 27792.0, 45380.0, 87877.0, 154773.0, 265550.0, 184334.0, 103954.0, 55780.0, 29562.0, 18770.0, 10635.0, 7261.0, 4507.0, 2726.0, 1977.0, 1187.0, 866.0, 595.0, 396.0, 275.0, 177.0, 149.0, 79.0, 63.0, 42.0, 25.0, 24.0, 10.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.664327621459961e-05, -2.5773420929908752e-05, -2.4903565645217896e-05, -2.403371036052704e-05, -2.316385507583618e-05, -2.2293999791145325e-05, -2.1424144506454468e-05, -2.055428922176361e-05, -1.9684433937072754e-05, -1.8814578652381897e-05, -1.794472336769104e-05, -1.7074868083000183e-05, -1.6205012798309326e-05, -1.533515751361847e-05, -1.4465302228927612e-05, -1.3595446944236755e-05, -1.2725591659545898e-05, -1.1855736374855042e-05, -1.0985881090164185e-05, -1.0116025805473328e-05, -9.24617052078247e-06, -8.376315236091614e-06, -7.506459951400757e-06, -6.6366046667099e-06, -5.766749382019043e-06, -4.896894097328186e-06, -4.027038812637329e-06, -3.157183527946472e-06, -2.2873282432556152e-06, -1.4174729585647583e-06, -5.476176738739014e-07, 3.2223761081695557e-07, 1.1920928955078125e-06, 2.0619481801986694e-06, 2.9318034648895264e-06, 3.8016587495803833e-06, 4.67151403427124e-06, 5.541369318962097e-06, 6.411224603652954e-06, 7.281079888343811e-06, 8.150935173034668e-06, 9.020790457725525e-06, 9.890645742416382e-06, 1.0760501027107239e-05, 1.1630356311798096e-05, 1.2500211596488953e-05, 1.337006688117981e-05, 1.4239922165870667e-05, 1.5109777450561523e-05, 1.597963273525238e-05, 1.6849488019943237e-05, 1.7719343304634094e-05, 1.858919858932495e-05, 1.9459053874015808e-05, 2.0328909158706665e-05, 2.1198764443397522e-05, 2.206861972808838e-05, 2.2938475012779236e-05, 2.3808330297470093e-05, 2.467818558216095e-05, 2.5548040866851807e-05, 2.6417896151542664e-05, 2.728775143623352e-05, 2.8157606720924377e-05, 2.9027462005615234e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 8.0, 5.0, 4.0, 7.0, 7.0, 8.0, 17.0, 21.0, 16.0, 19.0, 19.0, 19.0, 33.0, 32.0, 24.0, 39.0, 37.0, 37.0, 43.0, 36.0, 40.0, 45.0, 37.0, 33.0, 40.0, 43.0, 43.0, 28.0, 40.0, 29.0, 25.0, 24.0, 32.0, 17.0, 14.0, 16.0, 13.0, 9.0, 10.0, 10.0, 3.0, 7.0, 5.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.233816146850586e-05, -1.192186027765274e-05, -1.1505559086799622e-05, -1.1089257895946503e-05, -1.0672956705093384e-05, -1.0256655514240265e-05, -9.840354323387146e-06, -9.424053132534027e-06, -9.007751941680908e-06, -8.59145075082779e-06, -8.17514955997467e-06, -7.758848369121552e-06, -7.342547178268433e-06, -6.926245987415314e-06, -6.509944796562195e-06, -6.093643605709076e-06, -5.677342414855957e-06, -5.261041224002838e-06, -4.844740033149719e-06, -4.4284388422966e-06, -4.0121376514434814e-06, -3.5958364605903625e-06, -3.1795352697372437e-06, -2.7632340788841248e-06, -2.346932888031006e-06, -1.930631697177887e-06, -1.514330506324768e-06, -1.0980293154716492e-06, -6.817281246185303e-07, -2.654269337654114e-07, 1.5087425708770752e-07, 5.671754479408264e-07, 9.834766387939453e-07, 1.3997778296470642e-06, 1.816079020500183e-06, 2.232380211353302e-06, 2.648681402206421e-06, 3.06498259305954e-06, 3.4812837839126587e-06, 3.897584974765778e-06, 4.3138861656188965e-06, 4.730187356472015e-06, 5.146488547325134e-06, 5.562789738178253e-06, 5.979090929031372e-06, 6.395392119884491e-06, 6.81169331073761e-06, 7.227994501590729e-06, 7.644295692443848e-06, 8.060596883296967e-06, 8.476898074150085e-06, 8.893199265003204e-06, 9.309500455856323e-06, 9.725801646709442e-06, 1.0142102837562561e-05, 1.055840402841568e-05, 1.0974705219268799e-05, 1.1391006410121918e-05, 1.1807307600975037e-05, 1.2223608791828156e-05, 1.2639909982681274e-05, 1.3056211173534393e-05, 1.3472512364387512e-05, 1.3888813555240631e-05, 1.430511474609375e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 7.0, 4.0, 14.0, 28.0, 20.0, 29.0, 40.0, 85.0, 106.0, 163.0, 204.0, 298.0, 423.0, 675.0, 917.0, 1350.0, 2019.0, 2933.0, 4324.0, 6503.0, 10134.0, 15747.0, 24171.0, 38709.0, 64225.0, 97657.0, 183123.0, 230525.0, 144317.0, 83158.0, 49524.0, 30379.0, 19247.0, 12281.0, 8245.0, 5409.0, 3730.0, 2481.0, 1663.0, 1134.0, 817.0, 526.0, 391.0, 258.0, 195.0, 119.0, 82.0, 58.0, 43.0, 27.0, 16.0, 9.0, 2.0, 8.0, 6.0, 8.0, 2.0, 1.0], "bins": [-2.372264862060547e-05, -2.3009255528450012e-05, -2.2295862436294556e-05, -2.15824693441391e-05, -2.0869076251983643e-05, -2.0155683159828186e-05, -1.944229006767273e-05, -1.8728896975517273e-05, -1.8015503883361816e-05, -1.730211079120636e-05, -1.6588717699050903e-05, -1.5875324606895447e-05, -1.516193151473999e-05, -1.4448538422584534e-05, -1.3735145330429077e-05, -1.302175223827362e-05, -1.2308359146118164e-05, -1.1594966053962708e-05, -1.0881572961807251e-05, -1.0168179869651794e-05, -9.454786777496338e-06, -8.741393685340881e-06, -8.028000593185425e-06, -7.314607501029968e-06, -6.601214408874512e-06, -5.887821316719055e-06, -5.174428224563599e-06, -4.461035132408142e-06, -3.7476420402526855e-06, -3.034248948097229e-06, -2.3208558559417725e-06, -1.607462763786316e-06, -8.940696716308594e-07, -1.8067657947540283e-07, 5.327165126800537e-07, 1.2461096048355103e-06, 1.959502696990967e-06, 2.6728957891464233e-06, 3.38628888130188e-06, 4.0996819734573364e-06, 4.813075065612793e-06, 5.5264681577682495e-06, 6.239861249923706e-06, 6.953254342079163e-06, 7.666647434234619e-06, 8.380040526390076e-06, 9.093433618545532e-06, 9.806826710700989e-06, 1.0520219802856445e-05, 1.1233612895011902e-05, 1.1947005987167358e-05, 1.2660399079322815e-05, 1.3373792171478271e-05, 1.4087185263633728e-05, 1.4800578355789185e-05, 1.551397144794464e-05, 1.6227364540100098e-05, 1.6940757632255554e-05, 1.765415072441101e-05, 1.8367543816566467e-05, 1.9080936908721924e-05, 1.979433000087738e-05, 2.0507723093032837e-05, 2.1221116185188293e-05, 2.193450927734375e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 3.0, 3.0, 7.0, 5.0, 12.0, 19.0, 15.0, 23.0, 23.0, 19.0, 19.0, 35.0, 33.0, 33.0, 26.0, 32.0, 32.0, 33.0, 35.0, 55.0, 31.0, 35.0, 36.0, 58.0, 32.0, 38.0, 38.0, 46.0, 30.0, 26.0, 21.0, 22.0, 22.0, 16.0, 13.0, 19.0, 8.0, 11.0, 8.0, 9.0, 7.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.179115295410156e-06, -8.910894393920898e-06, -8.64267349243164e-06, -8.374452590942383e-06, -8.106231689453125e-06, -7.838010787963867e-06, -7.569789886474609e-06, -7.3015689849853516e-06, -7.033348083496094e-06, -6.765127182006836e-06, -6.496906280517578e-06, -6.22868537902832e-06, -5.9604644775390625e-06, -5.692243576049805e-06, -5.424022674560547e-06, -5.155801773071289e-06, -4.887580871582031e-06, -4.6193599700927734e-06, -4.351139068603516e-06, -4.082918167114258e-06, -3.814697265625e-06, -3.546476364135742e-06, -3.2782554626464844e-06, -3.0100345611572266e-06, -2.7418136596679688e-06, -2.473592758178711e-06, -2.205371856689453e-06, -1.9371509552001953e-06, -1.6689300537109375e-06, -1.4007091522216797e-06, -1.1324882507324219e-06, -8.642673492431641e-07, -5.960464477539062e-07, -3.2782554626464844e-07, -5.960464477539063e-08, 2.086162567138672e-07, 4.76837158203125e-07, 7.450580596923828e-07, 1.0132789611816406e-06, 1.2814998626708984e-06, 1.5497207641601562e-06, 1.817941665649414e-06, 2.086162567138672e-06, 2.3543834686279297e-06, 2.6226043701171875e-06, 2.8908252716064453e-06, 3.159046173095703e-06, 3.427267074584961e-06, 3.6954879760742188e-06, 3.9637088775634766e-06, 4.231929779052734e-06, 4.500150680541992e-06, 4.76837158203125e-06, 5.036592483520508e-06, 5.304813385009766e-06, 5.5730342864990234e-06, 5.841255187988281e-06, 6.109476089477539e-06, 6.377696990966797e-06, 6.645917892456055e-06, 6.9141387939453125e-06, 7.18235969543457e-06, 7.450580596923828e-06, 7.718801498413086e-06, 7.987022399902344e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 2.0, 11.0, 6.0, 8.0, 10.0, 25.0, 18.0, 43.0, 49.0, 77.0, 93.0, 124.0, 231.0, 254.0, 410.0, 582.0, 953.0, 1359.0, 2492.0, 3719.0, 6046.0, 13092.0, 23439.0, 66083.0, 653638.0, 182930.0, 45350.0, 20563.0, 11833.0, 5497.0, 3835.0, 1899.0, 1418.0, 734.0, 570.0, 304.0, 225.0, 175.0, 137.0, 79.0, 56.0, 61.0, 27.0, 29.0, 30.0, 17.0, 10.0, 3.0, 6.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1086463928222656e-05, -1.0702759027481079e-05, -1.0319054126739502e-05, -9.935349225997925e-06, -9.551644325256348e-06, -9.16793942451477e-06, -8.784234523773193e-06, -8.400529623031616e-06, -8.016824722290039e-06, -7.633119821548462e-06, -7.249414920806885e-06, -6.865710020065308e-06, -6.4820051193237305e-06, -6.098300218582153e-06, -5.714595317840576e-06, -5.330890417098999e-06, -4.947185516357422e-06, -4.563480615615845e-06, -4.179775714874268e-06, -3.7960708141326904e-06, -3.4123659133911133e-06, -3.028661012649536e-06, -2.644956111907959e-06, -2.261251211166382e-06, -1.8775463104248047e-06, -1.4938414096832275e-06, -1.1101365089416504e-06, -7.264316082000732e-07, -3.427267074584961e-07, 4.0978193283081055e-08, 4.246830940246582e-07, 8.083879947662354e-07, 1.1920928955078125e-06, 1.5757977962493896e-06, 1.959502696990967e-06, 2.343207597732544e-06, 2.726912498474121e-06, 3.1106173992156982e-06, 3.4943222999572754e-06, 3.8780272006988525e-06, 4.26173210144043e-06, 4.645437002182007e-06, 5.029141902923584e-06, 5.412846803665161e-06, 5.796551704406738e-06, 6.1802566051483154e-06, 6.563961505889893e-06, 6.94766640663147e-06, 7.331371307373047e-06, 7.715076208114624e-06, 8.098781108856201e-06, 8.482486009597778e-06, 8.866190910339355e-06, 9.249895811080933e-06, 9.63360071182251e-06, 1.0017305612564087e-05, 1.0401010513305664e-05, 1.0784715414047241e-05, 1.1168420314788818e-05, 1.1552125215530396e-05, 1.1935830116271973e-05, 1.231953501701355e-05, 1.2703239917755127e-05, 1.3086944818496704e-05, 1.3470649719238281e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 0.0, 796.0, 0.0, 0.0, 0.0, 0.0, 73.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.172325134277344e-07, -4.0512531995773315e-07, -3.9301812648773193e-07, -3.809109330177307e-07, -3.688037395477295e-07, -3.5669654607772827e-07, -3.4458935260772705e-07, -3.3248215913772583e-07, -3.203749656677246e-07, -3.082677721977234e-07, -2.9616057872772217e-07, -2.8405338525772095e-07, -2.7194619178771973e-07, -2.598389983177185e-07, -2.477318048477173e-07, -2.3562461137771606e-07, -2.2351741790771484e-07, -2.1141022443771362e-07, -1.993030309677124e-07, -1.8719583749771118e-07, -1.7508864402770996e-07, -1.6298145055770874e-07, -1.5087425708770752e-07, -1.387670636177063e-07, -1.2665987014770508e-07, -1.1455267667770386e-07, -1.0244548320770264e-07, -9.033828973770142e-08, -7.82310962677002e-08, -6.612390279769897e-08, -5.4016709327697754e-08, -4.190951585769653e-08, -2.9802322387695312e-08, -1.7695128917694092e-08, -5.587935447692871e-09, 6.51925802230835e-09, 1.862645149230957e-08, 3.073364496231079e-08, 4.284083843231201e-08, 5.494803190231323e-08, 6.705522537231445e-08, 7.916241884231567e-08, 9.12696123123169e-08, 1.0337680578231812e-07, 1.1548399925231934e-07, 1.2759119272232056e-07, 1.3969838619232178e-07, 1.51805579662323e-07, 1.6391277313232422e-07, 1.7601996660232544e-07, 1.8812716007232666e-07, 2.0023435354232788e-07, 2.123415470123291e-07, 2.2444874048233032e-07, 2.3655593395233154e-07, 2.4866312742233276e-07, 2.60770320892334e-07, 2.728775143623352e-07, 2.849847078323364e-07, 2.9709190130233765e-07, 3.0919909477233887e-07, 3.213062882423401e-07, 3.334134817123413e-07, 3.4552067518234253e-07, 3.5762786865234375e-07]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 5.0, 15.0, 7.0, 12.0, 36.0, 24.0, 35.0, 60.0, 91.0, 121.0, 214.0, 260.0, 365.0, 599.0, 765.0, 1088.0, 1855.0, 2463.0, 4290.0, 5936.0, 9882.0, 19907.0, 38841.0, 121056.0, 720820.0, 58409.0, 24899.0, 14330.0, 7476.0, 5248.0, 2863.0, 2033.0, 1479.0, 943.0, 658.0, 468.0, 300.0, 209.0, 134.0, 102.0, 82.0, 59.0, 32.0, 44.0, 19.0, 6.0, 4.0, 4.0, 5.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.8537044525146484e-05, -1.7979182302951813e-05, -1.742132008075714e-05, -1.686345785856247e-05, -1.6305595636367798e-05, -1.5747733414173126e-05, -1.5189871191978455e-05, -1.4632008969783783e-05, -1.4074146747589111e-05, -1.351628452539444e-05, -1.2958422303199768e-05, -1.2400560081005096e-05, -1.1842697858810425e-05, -1.1284835636615753e-05, -1.0726973414421082e-05, -1.016911119222641e-05, -9.611248970031738e-06, -9.053386747837067e-06, -8.495524525642395e-06, -7.937662303447723e-06, -7.379800081253052e-06, -6.82193785905838e-06, -6.2640756368637085e-06, -5.706213414669037e-06, -5.148351192474365e-06, -4.590488970279694e-06, -4.032626748085022e-06, -3.4747645258903503e-06, -2.9169023036956787e-06, -2.359040081501007e-06, -1.8011778593063354e-06, -1.2433156371116638e-06, -6.854534149169922e-07, -1.2759119272232056e-07, 4.302710294723511e-07, 9.881332516670227e-07, 1.5459954738616943e-06, 2.103857696056366e-06, 2.6617199182510376e-06, 3.2195821404457092e-06, 3.777444362640381e-06, 4.3353065848350525e-06, 4.893168807029724e-06, 5.451031029224396e-06, 6.008893251419067e-06, 6.566755473613739e-06, 7.124617695808411e-06, 7.682479918003082e-06, 8.240342140197754e-06, 8.798204362392426e-06, 9.356066584587097e-06, 9.913928806781769e-06, 1.047179102897644e-05, 1.1029653251171112e-05, 1.1587515473365784e-05, 1.2145377695560455e-05, 1.2703239917755127e-05, 1.3261102139949799e-05, 1.381896436214447e-05, 1.4376826584339142e-05, 1.4934688806533813e-05, 1.5492551028728485e-05, 1.6050413250923157e-05, 1.660827547311783e-05, 1.71661376953125e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 2.0, 4.0, 9.0, 5.0, 6.0, 6.0, 13.0, 8.0, 22.0, 37.0, 39.0, 56.0, 57.0, 444.0, 88.0, 40.0, 28.0, 18.0, 16.0, 20.0, 19.0, 11.0, 5.0, 5.0, 3.0, 3.0, 6.0, 8.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.9604644775390625e-06, -5.791895091533661e-06, -5.623325705528259e-06, -5.454756319522858e-06, -5.286186933517456e-06, -5.1176175475120544e-06, -4.949048161506653e-06, -4.780478775501251e-06, -4.61190938949585e-06, -4.443340003490448e-06, -4.274770617485046e-06, -4.106201231479645e-06, -3.937631845474243e-06, -3.7690624594688416e-06, -3.60049307346344e-06, -3.4319236874580383e-06, -3.2633543014526367e-06, -3.094784915447235e-06, -2.9262155294418335e-06, -2.757646143436432e-06, -2.5890767574310303e-06, -2.4205073714256287e-06, -2.251937985420227e-06, -2.0833685994148254e-06, -1.914799213409424e-06, -1.7462298274040222e-06, -1.5776604413986206e-06, -1.409091055393219e-06, -1.2405216693878174e-06, -1.0719522833824158e-06, -9.033828973770142e-07, -7.348135113716125e-07, -5.662441253662109e-07, -3.976747393608093e-07, -2.2910535335540771e-07, -6.05359673500061e-08, 1.0803341865539551e-07, 2.766028046607971e-07, 4.4517219066619873e-07, 6.137415766716003e-07, 7.82310962677002e-07, 9.508803486824036e-07, 1.1194497346878052e-06, 1.2880191206932068e-06, 1.4565885066986084e-06, 1.62515789270401e-06, 1.7937272787094116e-06, 1.9622966647148132e-06, 2.130866050720215e-06, 2.2994354367256165e-06, 2.468004822731018e-06, 2.6365742087364197e-06, 2.8051435947418213e-06, 2.973712980747223e-06, 3.1422823667526245e-06, 3.310851752758026e-06, 3.4794211387634277e-06, 3.6479905247688293e-06, 3.816559910774231e-06, 3.9851292967796326e-06, 4.153698682785034e-06, 4.322268068790436e-06, 4.490837454795837e-06, 4.659406840801239e-06, 4.827976226806641e-06]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 14.0, 14.0, 7.0, 18.0, 26.0, 37.0, 45.0, 60.0, 78.0, 132.0, 128.0, 107.0, 78.0, 50.0, 46.0, 32.0, 25.0, 22.0, 13.0, 12.0, 15.0, 5.0, 6.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1122672478668392e-05, -2.0349685655673966e-05, -1.957669883267954e-05, -1.8803712009685114e-05, -1.8030725186690688e-05, -1.7257738363696262e-05, -1.6484751540701836e-05, -1.571176471770741e-05, -1.4938776985218283e-05, -1.4165790162223857e-05, -1.3392803339229431e-05, -1.2619815606740303e-05, -1.1846828783745877e-05, -1.1073841960751452e-05, -1.0300855137757026e-05, -9.5278683147626e-06, -8.754881491768174e-06, -7.981894668773748e-06, -7.208907845779322e-06, -6.435920568037545e-06, -5.662933745043119e-06, -4.8899469220486935e-06, -4.116959644306917e-06, -3.343972821312491e-06, -2.570985998318065e-06, -1.7979990616368013e-06, -1.0250121249555377e-06, -2.520250745874364e-07, 5.209617484069895e-07, 1.2939485714014154e-06, 2.066935849143192e-06, 2.839922672137618e-06, 3.612909495132044e-06, 4.38589631812647e-06, 5.158883141120896e-06, 5.9318704188626725e-06, 6.704857241857098e-06, 7.477844064851524e-06, 8.250831342593301e-06, 9.023818165587727e-06, 9.796804988582153e-06, 1.0569791811576579e-05, 1.1342778634571005e-05, 1.2115766367060132e-05, 1.2888753190054558e-05, 1.3661740013048984e-05, 1.443472683604341e-05, 1.5207713659037836e-05, 1.5980700482032262e-05, 1.6753687305026688e-05, 1.7526674128021114e-05, 1.829966095101554e-05, 1.9072647774009965e-05, 1.984563459700439e-05, 2.061862323898822e-05, 2.1391610061982647e-05, 2.2164596884977072e-05, 2.29375837079715e-05, 2.3710570530965924e-05, 2.448355735396035e-05, 2.5256544176954776e-05, 2.6029530999949202e-05, 2.6802517822943628e-05, 2.7575504645938054e-05, 2.834849146893248e-05]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 3.0, 10.0, 7.0, 8.0, 9.0, 12.0, 12.0, 17.0, 16.0, 21.0, 26.0, 30.0, 28.0, 29.0, 39.0, 28.0, 25.0, 35.0, 38.0, 36.0, 33.0, 37.0, 37.0, 40.0, 45.0, 44.0, 35.0, 36.0, 29.0, 27.0, 20.0, 34.0, 18.0, 23.0, 22.0, 16.0, 17.0, 11.0, 8.0, 11.0, 5.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1791449651354924e-05, -1.1374974747013766e-05, -1.0958499842672609e-05, -1.0542024938331451e-05, -1.0125550033990294e-05, -9.709076039143838e-06, -9.29260113480268e-06, -8.876126230461523e-06, -8.459651326120365e-06, -8.043176421779208e-06, -7.62670151743805e-06, -7.210227067844244e-06, -6.793752163503086e-06, -6.377277259161929e-06, -5.960802809568122e-06, -5.5443279052269645e-06, -5.127853000885807e-06, -4.7113780965446495e-06, -4.294903192203492e-06, -3.878428742609685e-06, -3.4619538382685278e-06, -3.0454789339273702e-06, -2.629004256959888e-06, -2.212529579992406e-06, -1.7960546756512485e-06, -1.3795798849969287e-06, -9.63105094342609e-07, -5.466303036882891e-07, -1.3015551303396933e-07, 2.863193913071882e-07, 7.027940682746703e-07, 1.1192687452421524e-06, 1.5357445590780117e-06, 1.952219463419169e-06, 2.3686941403866513e-06, 2.7851688173541334e-06, 3.201643721695291e-06, 3.6181186260364484e-06, 4.034593075630255e-06, 4.4510679799714126e-06, 4.86754288431257e-06, 5.284017788653728e-06, 5.700492692994885e-06, 6.116967142588692e-06, 6.533442046929849e-06, 6.949916951271007e-06, 7.3663914008648135e-06, 7.782866305205971e-06, 8.199341209547129e-06, 8.615816113888286e-06, 9.032291018229444e-06, 9.448765922570601e-06, 9.865239917417057e-06, 1.0281715731252916e-05, 1.0698189726099372e-05, 1.111466463044053e-05, 1.1531139534781687e-05, 1.1947614439122844e-05, 1.2364089343464002e-05, 1.278056424780516e-05, 1.3197039152146317e-05, 1.3613513146992773e-05, 1.402998805133393e-05, 1.4446462955675088e-05, 1.4862937860016245e-05]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 10.0, 11.0, 19.0, 32.0, 43.0, 85.0, 126.0, 222.0, 321.0, 418.0, 726.0, 1006.0, 1569.0, 2541.0, 3727.0, 6007.0, 9453.0, 15772.0, 26008.0, 45119.0, 93337.0, 175944.0, 453918.0, 1562150.0, 1147052.0, 334804.0, 143343.0, 72033.0, 38946.0, 22619.0, 13589.0, 8151.0, 5346.0, 3636.0, 2107.0, 1347.0, 878.0, 621.0, 382.0, 279.0, 188.0, 116.0, 91.0, 65.0, 33.0, 27.0, 25.0, 11.0, 9.0, 10.0, 6.0, 3.0, 8.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7344951629638672e-05, -1.6744248569011688e-05, -1.6143545508384705e-05, -1.554284244775772e-05, -1.4942139387130737e-05, -1.4341436326503754e-05, -1.374073326587677e-05, -1.3140030205249786e-05, -1.2539327144622803e-05, -1.1938624083995819e-05, -1.1337921023368835e-05, -1.0737217962741852e-05, -1.0136514902114868e-05, -9.535811841487885e-06, -8.935108780860901e-06, -8.334405720233917e-06, -7.733702659606934e-06, -7.13299959897995e-06, -6.532296538352966e-06, -5.931593477725983e-06, -5.330890417098999e-06, -4.730187356472015e-06, -4.129484295845032e-06, -3.528781235218048e-06, -2.9280781745910645e-06, -2.327375113964081e-06, -1.7266720533370972e-06, -1.1259689927101135e-06, -5.252659320831299e-07, 7.543712854385376e-08, 6.761401891708374e-07, 1.276843249797821e-06, 1.8775463104248047e-06, 2.4782493710517883e-06, 3.078952431678772e-06, 3.6796554923057556e-06, 4.280358552932739e-06, 4.881061613559723e-06, 5.4817646741867065e-06, 6.08246773481369e-06, 6.683170795440674e-06, 7.2838738560676575e-06, 7.884576916694641e-06, 8.485279977321625e-06, 9.085983037948608e-06, 9.686686098575592e-06, 1.0287389159202576e-05, 1.088809221982956e-05, 1.1488795280456543e-05, 1.2089498341083527e-05, 1.269020140171051e-05, 1.3290904462337494e-05, 1.3891607522964478e-05, 1.4492310583591461e-05, 1.5093013644218445e-05, 1.569371670484543e-05, 1.6294419765472412e-05, 1.6895122826099396e-05, 1.749582588672638e-05, 1.8096528947353363e-05, 1.8697232007980347e-05, 1.929793506860733e-05, 1.9898638129234314e-05, 2.0499341189861298e-05, 2.110004425048828e-05]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 6.0, 0.0, 6.0, 8.0, 15.0, 8.0, 20.0, 20.0, 25.0, 23.0, 21.0, 34.0, 30.0, 37.0, 14.0, 40.0, 45.0, 32.0, 38.0, 35.0, 43.0, 40.0, 48.0, 43.0, 37.0, 26.0, 27.0, 38.0, 38.0, 30.0, 28.0, 22.0, 25.0, 16.0, 16.0, 10.0, 9.0, 5.0, 14.0, 4.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.62939453125e-06, -7.379800081253052e-06, -7.1302056312561035e-06, -6.880611181259155e-06, -6.631016731262207e-06, -6.381422281265259e-06, -6.1318278312683105e-06, -5.882233381271362e-06, -5.632638931274414e-06, -5.383044481277466e-06, -5.133450031280518e-06, -4.883855581283569e-06, -4.634261131286621e-06, -4.384666681289673e-06, -4.135072231292725e-06, -3.885477781295776e-06, -3.635883331298828e-06, -3.38628888130188e-06, -3.1366944313049316e-06, -2.8870999813079834e-06, -2.637505531311035e-06, -2.387911081314087e-06, -2.1383166313171387e-06, -1.8887221813201904e-06, -1.6391277313232422e-06, -1.389533281326294e-06, -1.1399388313293457e-06, -8.903443813323975e-07, -6.407499313354492e-07, -3.91155481338501e-07, -1.4156103134155273e-07, 1.0803341865539551e-07, 3.5762786865234375e-07, 6.07222318649292e-07, 8.568167686462402e-07, 1.1064112186431885e-06, 1.3560056686401367e-06, 1.605600118637085e-06, 1.8551945686340332e-06, 2.1047890186309814e-06, 2.3543834686279297e-06, 2.603977918624878e-06, 2.853572368621826e-06, 3.1031668186187744e-06, 3.3527612686157227e-06, 3.602355718612671e-06, 3.851950168609619e-06, 4.101544618606567e-06, 4.351139068603516e-06, 4.600733518600464e-06, 4.850327968597412e-06, 5.09992241859436e-06, 5.349516868591309e-06, 5.599111318588257e-06, 5.848705768585205e-06, 6.098300218582153e-06, 6.3478946685791016e-06, 6.59748911857605e-06, 6.847083568572998e-06, 7.096678018569946e-06, 7.3462724685668945e-06, 7.595866918563843e-06, 7.845461368560791e-06, 8.09505581855774e-06, 8.344650268554688e-06]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 7.0, 12.0, 25.0, 26.0, 48.0, 73.0, 87.0, 151.0, 192.0, 254.0, 379.0, 634.0, 823.0, 1453.0, 1769.0, 3106.0, 4049.0, 7216.0, 9866.0, 17918.0, 25940.0, 49405.0, 75747.0, 161020.0, 283354.0, 629105.0, 1504193.0, 713200.0, 343076.0, 146892.0, 90347.0, 45061.0, 30699.0, 16317.0, 11582.0, 6486.0, 4829.0, 2728.0, 2031.0, 1232.0, 996.0, 577.0, 431.0, 310.0, 203.0, 156.0, 82.0, 74.0, 50.0, 20.0, 25.0, 15.0, 7.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.4483928680419922e-05, -1.4038756489753723e-05, -1.3593584299087524e-05, -1.3148412108421326e-05, -1.2703239917755127e-05, -1.2258067727088928e-05, -1.181289553642273e-05, -1.136772334575653e-05, -1.0922551155090332e-05, -1.0477378964424133e-05, -1.0032206773757935e-05, -9.587034583091736e-06, -9.141862392425537e-06, -8.696690201759338e-06, -8.25151801109314e-06, -7.806345820426941e-06, -7.361173629760742e-06, -6.9160014390945435e-06, -6.470829248428345e-06, -6.025657057762146e-06, -5.580484867095947e-06, -5.1353126764297485e-06, -4.69014048576355e-06, -4.244968295097351e-06, -3.7997961044311523e-06, -3.3546239137649536e-06, -2.909451723098755e-06, -2.464279532432556e-06, -2.0191073417663574e-06, -1.5739351511001587e-06, -1.12876296043396e-06, -6.835907697677612e-07, -2.384185791015625e-07, 2.0675361156463623e-07, 6.51925802230835e-07, 1.0970979928970337e-06, 1.5422701835632324e-06, 1.987442374229431e-06, 2.43261456489563e-06, 2.8777867555618286e-06, 3.3229589462280273e-06, 3.768131136894226e-06, 4.213303327560425e-06, 4.6584755182266235e-06, 5.103647708892822e-06, 5.548819899559021e-06, 5.99399209022522e-06, 6.4391642808914185e-06, 6.884336471557617e-06, 7.329508662223816e-06, 7.774680852890015e-06, 8.219853043556213e-06, 8.665025234222412e-06, 9.11019742488861e-06, 9.55536961555481e-06, 1.0000541806221008e-05, 1.0445713996887207e-05, 1.0890886187553406e-05, 1.1336058378219604e-05, 1.1781230568885803e-05, 1.2226402759552002e-05, 1.26715749502182e-05, 1.31167471408844e-05, 1.3561919331550598e-05, 1.4007091522216797e-05]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 6.0, 3.0, 2.0, 10.0, 8.0, 10.0, 8.0, 17.0, 27.0, 23.0, 44.0, 68.0, 49.0, 75.0, 71.0, 132.0, 167.0, 139.0, 207.0, 165.0, 323.0, 233.0, 396.0, 339.0, 197.0, 259.0, 171.0, 220.0, 164.0, 92.0, 119.0, 55.0, 66.0, 46.0, 36.0, 32.0, 14.0, 24.0, 14.0, 7.0, 12.0, 8.0, 9.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.0067901611328125e-06, -4.852190613746643e-06, -4.697591066360474e-06, -4.542991518974304e-06, -4.388391971588135e-06, -4.233792424201965e-06, -4.079192876815796e-06, -3.9245933294296265e-06, -3.769993782043457e-06, -3.6153942346572876e-06, -3.460794687271118e-06, -3.3061951398849487e-06, -3.1515955924987793e-06, -2.99699604511261e-06, -2.8423964977264404e-06, -2.687796950340271e-06, -2.5331974029541016e-06, -2.378597855567932e-06, -2.2239983081817627e-06, -2.0693987607955933e-06, -1.914799213409424e-06, -1.7601996660232544e-06, -1.605600118637085e-06, -1.4510005712509155e-06, -1.296401023864746e-06, -1.1418014764785767e-06, -9.872019290924072e-07, -8.326023817062378e-07, -6.780028343200684e-07, -5.234032869338989e-07, -3.688037395477295e-07, -2.1420419216156006e-07, -5.960464477539063e-08, 9.499490261077881e-08, 2.4959444999694824e-07, 4.041939973831177e-07, 5.587935447692871e-07, 7.133930921554565e-07, 8.67992639541626e-07, 1.0225921869277954e-06, 1.1771917343139648e-06, 1.3317912817001343e-06, 1.4863908290863037e-06, 1.6409903764724731e-06, 1.7955899238586426e-06, 1.950189471244812e-06, 2.1047890186309814e-06, 2.259388566017151e-06, 2.4139881134033203e-06, 2.5685876607894897e-06, 2.723187208175659e-06, 2.8777867555618286e-06, 3.032386302947998e-06, 3.1869858503341675e-06, 3.341585397720337e-06, 3.4961849451065063e-06, 3.6507844924926758e-06, 3.8053840398788452e-06, 3.959983587265015e-06, 4.114583134651184e-06, 4.2691826820373535e-06, 4.423782229423523e-06, 4.578381776809692e-06, 4.732981324195862e-06, 4.887580871582031e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 5.0, 4.0, 9.0, 17.0, 15.0, 22.0, 26.0, 31.0, 54.0, 64.0, 74.0, 87.0, 122.0, 103.0, 93.0, 73.0, 43.0, 34.0, 27.0, 29.0, 16.0, 8.0, 10.0, 8.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3004626453039236e-05, -1.2517227332864422e-05, -1.2029828212689608e-05, -1.1542430002009496e-05, -1.1055030881834682e-05, -1.0567631761659868e-05, -1.0080233550979756e-05, -9.592834430804942e-06, -9.105435310630128e-06, -8.618036190455314e-06, -8.1306370702805e-06, -7.643238859600388e-06, -7.1558397394255735e-06, -6.6684406192507595e-06, -6.181041953823296e-06, -5.693643288395833e-06, -5.206244168221019e-06, -4.718845048046205e-06, -4.231446382618742e-06, -3.7440474898176035e-06, -3.256648597016465e-06, -2.7692497042153263e-06, -2.2818508114141878e-06, -1.7944519186130492e-06, -1.3070530258119106e-06, -8.196541330107721e-07, -3.322552402096335e-07, 1.551436525915051e-07, 6.425425453926437e-07, 1.1299414381937822e-06, 1.6173403309949208e-06, 2.1047392237960594e-06, 2.5921362976077944e-06, 3.079535190408933e-06, 3.5669340832100715e-06, 4.054332748637535e-06, 4.541731868812349e-06, 5.029130988987163e-06, 5.516529654414626e-06, 6.003928319842089e-06, 6.491327440016903e-06, 6.978726560191717e-06, 7.46612522561918e-06, 7.953523891046643e-06, 8.440923011221457e-06, 8.928322131396271e-06, 9.415720342076384e-06, 9.903119462251198e-06, 1.0390518582426012e-05, 1.0877917702600826e-05, 1.136531682277564e-05, 1.1852715033455752e-05, 1.2340114153630566e-05, 1.282751327380538e-05, 1.3314911484485492e-05, 1.3802310604660306e-05, 1.428970972483512e-05, 1.4777108845009934e-05, 1.5264507965184748e-05, 1.575190617586486e-05, 1.6239304386544973e-05, 1.672670441621449e-05, 1.72141026268946e-05, 1.7701502656564116e-05, 1.818890086724423e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 7.0, 4.0, 3.0, 3.0, 6.0, 6.0, 3.0, 11.0, 8.0, 10.0, 15.0, 13.0, 12.0, 28.0, 24.0, 24.0, 27.0, 21.0, 26.0, 32.0, 36.0, 24.0, 35.0, 25.0, 28.0, 35.0, 40.0, 40.0, 36.0, 40.0, 40.0, 33.0, 26.0, 21.0, 30.0, 31.0, 20.0, 19.0, 25.0, 21.0, 19.0, 15.0, 14.0, 10.0, 13.0, 10.0, 8.0, 8.0, 9.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-7.083381660777377e-06, -6.84416545482236e-06, -6.604949248867342e-06, -6.365733042912325e-06, -6.1265168369573075e-06, -5.88730063100229e-06, -5.648083970299922e-06, -5.4088677643449046e-06, -5.169651558389887e-06, -4.93043535243487e-06, -4.6912191464798525e-06, -4.452002940524835e-06, -4.212786734569818e-06, -3.9735705286148e-06, -3.7343540952861076e-06, -3.4951378893310903e-06, -3.2559219107497483e-06, -3.016705704794731e-06, -2.7774894988397136e-06, -2.5382732928846963e-06, -2.299057086929679e-06, -2.0598408809746616e-06, -1.8206244476459688e-06, -1.5814082416909514e-06, -1.342192035735934e-06, -1.1029758297809167e-06, -8.637595669824805e-07, -6.245433041840442e-07, -3.853270982290269e-07, -1.4611089227400953e-07, 9.310542736784555e-08, 3.323216333228629e-07, 5.715382940252312e-07, 8.107544999802485e-07, 1.0499707059352659e-06, 1.289187025577121e-06, 1.5284032315321383e-06, 1.7676194374871557e-06, 2.0068357571290107e-06, 2.246051963084028e-06, 2.4852681690390455e-06, 2.724484374994063e-06, 2.96370058094908e-06, 3.202917014277773e-06, 3.4421332202327903e-06, 3.6813494261878077e-06, 3.920565632142825e-06, 4.159781838097842e-06, 4.39899804405286e-06, 4.638214250007877e-06, 4.8774304559628945e-06, 5.116646661917912e-06, 5.355862867872929e-06, 5.5950790738279466e-06, 5.834295734530315e-06, 6.073511940485332e-06, 6.3127281464403495e-06, 6.551944352395367e-06, 6.791160558350384e-06, 7.030376764305402e-06, 7.269592970260419e-06, 7.508809176215436e-06, 7.748025382170454e-06, 7.987241588125471e-06, 8.226457794080488e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 9.0, 9.0, 14.0, 25.0, 41.0, 51.0, 89.0, 139.0, 142.0, 286.0, 434.0, 604.0, 1108.0, 1811.0, 2397.0, 4491.0, 7385.0, 10229.0, 19616.0, 27305.0, 54789.0, 98647.0, 145079.0, 235461.0, 188798.0, 96398.0, 64608.0, 36438.0, 18582.0, 13343.0, 6796.0, 5238.0, 3114.0, 1727.0, 1283.0, 757.0, 442.0, 307.0, 198.0, 106.0, 87.0, 56.0, 43.0, 23.0, 11.0, 16.0, 8.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2516975402832031e-05, -1.2121163308620453e-05, -1.1725351214408875e-05, -1.1329539120197296e-05, -1.0933727025985718e-05, -1.053791493177414e-05, -1.0142102837562561e-05, -9.746290743350983e-06, -9.350478649139404e-06, -8.954666554927826e-06, -8.558854460716248e-06, -8.16304236650467e-06, -7.76723027229309e-06, -7.3714181780815125e-06, -6.975606083869934e-06, -6.579793989658356e-06, -6.183981895446777e-06, -5.788169801235199e-06, -5.392357707023621e-06, -4.996545612812042e-06, -4.600733518600464e-06, -4.2049214243888855e-06, -3.809109330177307e-06, -3.4132972359657288e-06, -3.0174851417541504e-06, -2.621673047542572e-06, -2.2258609533309937e-06, -1.8300488591194153e-06, -1.434236764907837e-06, -1.0384246706962585e-06, -6.426125764846802e-07, -2.468004822731018e-07, 1.4901161193847656e-07, 5.448237061500549e-07, 9.406358003616333e-07, 1.3364478945732117e-06, 1.73225998878479e-06, 2.1280720829963684e-06, 2.5238841772079468e-06, 2.919696271419525e-06, 3.3155083656311035e-06, 3.711320459842682e-06, 4.10713255405426e-06, 4.502944648265839e-06, 4.898756742477417e-06, 5.294568836688995e-06, 5.690380930900574e-06, 6.086193025112152e-06, 6.4820051193237305e-06, 6.877817213535309e-06, 7.273629307746887e-06, 7.669441401958466e-06, 8.065253496170044e-06, 8.461065590381622e-06, 8.8568776845932e-06, 9.252689778804779e-06, 9.648501873016357e-06, 1.0044313967227936e-05, 1.0440126061439514e-05, 1.0835938155651093e-05, 1.1231750249862671e-05, 1.162756234407425e-05, 1.2023374438285828e-05, 1.2419186532497406e-05, 1.2814998626708984e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 6.0, 7.0, 5.0, 8.0, 7.0, 9.0, 10.0, 9.0, 14.0, 23.0, 20.0, 36.0, 23.0, 17.0, 26.0, 27.0, 29.0, 22.0, 26.0, 43.0, 44.0, 31.0, 36.0, 33.0, 47.0, 47.0, 46.0, 31.0, 26.0, 35.0, 19.0, 33.0, 21.0, 24.0, 14.0, 19.0, 12.0, 16.0, 21.0, 5.0, 11.0, 9.0, 15.0, 9.0, 5.0, 7.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-7.331371307373047e-06, -7.095746695995331e-06, -6.860122084617615e-06, -6.624497473239899e-06, -6.388872861862183e-06, -6.1532482504844666e-06, -5.9176236391067505e-06, -5.6819990277290344e-06, -5.446374416351318e-06, -5.210749804973602e-06, -4.975125193595886e-06, -4.73950058221817e-06, -4.503875970840454e-06, -4.268251359462738e-06, -4.032626748085022e-06, -3.797002136707306e-06, -3.56137752532959e-06, -3.3257529139518738e-06, -3.0901283025741577e-06, -2.8545036911964417e-06, -2.6188790798187256e-06, -2.3832544684410095e-06, -2.1476298570632935e-06, -1.9120052456855774e-06, -1.6763806343078613e-06, -1.4407560229301453e-06, -1.2051314115524292e-06, -9.695068001747131e-07, -7.338821887969971e-07, -4.98257577419281e-07, -2.6263296604156494e-07, -2.7008354663848877e-08, 2.086162567138672e-07, 4.4424086809158325e-07, 6.798654794692993e-07, 9.154900908470154e-07, 1.1511147022247314e-06, 1.3867393136024475e-06, 1.6223639249801636e-06, 1.8579885363578796e-06, 2.0936131477355957e-06, 2.3292377591133118e-06, 2.564862370491028e-06, 2.800486981868744e-06, 3.03611159324646e-06, 3.271736204624176e-06, 3.507360816001892e-06, 3.742985427379608e-06, 3.978610038757324e-06, 4.21423465013504e-06, 4.449859261512756e-06, 4.685483872890472e-06, 4.9211084842681885e-06, 5.1567330956459045e-06, 5.392357707023621e-06, 5.627982318401337e-06, 5.863606929779053e-06, 6.099231541156769e-06, 6.334856152534485e-06, 6.570480763912201e-06, 6.806105375289917e-06, 7.041729986667633e-06, 7.277354598045349e-06, 7.512979209423065e-06, 7.748603820800781e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 12.0, 16.0, 6.0, 21.0, 27.0, 40.0, 66.0, 98.0, 165.0, 240.0, 425.0, 632.0, 1118.0, 1708.0, 3545.0, 7321.0, 17710.0, 51995.0, 206307.0, 627110.0, 84056.0, 25506.0, 9585.0, 4916.0, 2467.0, 1369.0, 763.0, 475.0, 294.0, 183.0, 113.0, 87.0, 55.0, 45.0, 22.0, 17.0, 9.0, 8.0, 6.0, 2.0, 6.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2590160369873047e-05, -2.1948479115962982e-05, -2.1306797862052917e-05, -2.0665116608142853e-05, -2.0023435354232788e-05, -1.9381754100322723e-05, -1.874007284641266e-05, -1.8098391592502594e-05, -1.745671033859253e-05, -1.6815029084682465e-05, -1.61733478307724e-05, -1.5531666576862335e-05, -1.488998532295227e-05, -1.4248304069042206e-05, -1.3606622815132141e-05, -1.2964941561222076e-05, -1.2323260307312012e-05, -1.1681579053401947e-05, -1.1039897799491882e-05, -1.0398216545581818e-05, -9.756535291671753e-06, -9.114854037761688e-06, -8.473172783851624e-06, -7.831491529941559e-06, -7.189810276031494e-06, -6.5481290221214294e-06, -5.906447768211365e-06, -5.2647665143013e-06, -4.623085260391235e-06, -3.981404006481171e-06, -3.339722752571106e-06, -2.6980414986610413e-06, -2.0563602447509766e-06, -1.4146789908409119e-06, -7.729977369308472e-07, -1.3131648302078247e-07, 5.103647708892822e-07, 1.152046024799347e-06, 1.7937272787094116e-06, 2.4354085326194763e-06, 3.077089786529541e-06, 3.7187710404396057e-06, 4.36045229434967e-06, 5.002133548259735e-06, 5.6438148021698e-06, 6.2854960560798645e-06, 6.927177309989929e-06, 7.568858563899994e-06, 8.210539817810059e-06, 8.852221071720123e-06, 9.493902325630188e-06, 1.0135583579540253e-05, 1.0777264833450317e-05, 1.1418946087360382e-05, 1.2060627341270447e-05, 1.2702308595180511e-05, 1.3343989849090576e-05, 1.3985671103000641e-05, 1.4627352356910706e-05, 1.526903361082077e-05, 1.5910714864730835e-05, 1.65523961186409e-05, 1.7194077372550964e-05, 1.783575862646103e-05, 1.8477439880371094e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 13.0, 11.0, 12.0, 16.0, 17.0, 20.0, 28.0, 28.0, 28.0, 54.0, 56.0, 46.0, 87.0, 132.0, 105.0, 52.0, 65.0, 42.0, 37.0, 33.0, 17.0, 28.0, 7.0, 13.0, 12.0, 2.0, 6.0, 2.0, 6.0, 7.0, 0.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.410743713378906e-06, -4.257075488567352e-06, -4.103407263755798e-06, -3.949739038944244e-06, -3.7960708141326904e-06, -3.6424025893211365e-06, -3.4887343645095825e-06, -3.3350661396980286e-06, -3.1813979148864746e-06, -3.0277296900749207e-06, -2.8740614652633667e-06, -2.7203932404518127e-06, -2.566725015640259e-06, -2.413056790828705e-06, -2.259388566017151e-06, -2.105720341205597e-06, -1.952052116394043e-06, -1.798383891582489e-06, -1.644715666770935e-06, -1.491047441959381e-06, -1.3373792171478271e-06, -1.1837109923362732e-06, -1.0300427675247192e-06, -8.763745427131653e-07, -7.227063179016113e-07, -5.690380930900574e-07, -4.153698682785034e-07, -2.6170164346694946e-07, -1.0803341865539551e-07, 4.563480615615845e-08, 1.993030309677124e-07, 3.5297125577926636e-07, 5.066394805908203e-07, 6.603077054023743e-07, 8.139759302139282e-07, 9.676441550254822e-07, 1.1213123798370361e-06, 1.27498060464859e-06, 1.428648829460144e-06, 1.582317054271698e-06, 1.735985279083252e-06, 1.889653503894806e-06, 2.04332172870636e-06, 2.196989953517914e-06, 2.3506581783294678e-06, 2.5043264031410217e-06, 2.6579946279525757e-06, 2.8116628527641296e-06, 2.9653310775756836e-06, 3.1189993023872375e-06, 3.2726675271987915e-06, 3.4263357520103455e-06, 3.5800039768218994e-06, 3.7336722016334534e-06, 3.887340426445007e-06, 4.041008651256561e-06, 4.194676876068115e-06, 4.348345100879669e-06, 4.502013325691223e-06, 4.655681550502777e-06, 4.809349775314331e-06, 4.963018000125885e-06, 5.116686224937439e-06, 5.270354449748993e-06, 5.424022674560547e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 12.0, 14.0, 20.0, 43.0, 36.0, 52.0, 84.0, 158.0, 185.0, 417.0, 814.0, 1668.0, 2781.0, 6509.0, 17051.0, 62251.0, 863782.0, 62807.0, 17087.0, 6345.0, 2917.0, 1722.0, 574.0, 513.0, 256.0, 162.0, 84.0, 73.0, 36.0, 43.0, 24.0, 6.0, 8.0, 9.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5299530029296875e-06, -4.353001713752747e-06, -4.176050424575806e-06, -3.999099135398865e-06, -3.822147846221924e-06, -3.645196557044983e-06, -3.468245267868042e-06, -3.291293978691101e-06, -3.11434268951416e-06, -2.9373914003372192e-06, -2.7604401111602783e-06, -2.5834888219833374e-06, -2.4065375328063965e-06, -2.2295862436294556e-06, -2.0526349544525146e-06, -1.8756836652755737e-06, -1.6987323760986328e-06, -1.521781086921692e-06, -1.344829797744751e-06, -1.16787850856781e-06, -9.909272193908691e-07, -8.139759302139282e-07, -6.370246410369873e-07, -4.600733518600464e-07, -2.8312206268310547e-07, -1.0617077350616455e-07, 7.078051567077637e-08, 2.477318048477173e-07, 4.246830940246582e-07, 6.016343832015991e-07, 7.7858567237854e-07, 9.55536961555481e-07, 1.1324882507324219e-06, 1.3094395399093628e-06, 1.4863908290863037e-06, 1.6633421182632446e-06, 1.8402934074401855e-06, 2.0172446966171265e-06, 2.1941959857940674e-06, 2.3711472749710083e-06, 2.5480985641479492e-06, 2.72504985332489e-06, 2.902001142501831e-06, 3.078952431678772e-06, 3.255903720855713e-06, 3.432855010032654e-06, 3.6098062992095947e-06, 3.7867575883865356e-06, 3.9637088775634766e-06, 4.1406601667404175e-06, 4.317611455917358e-06, 4.494562745094299e-06, 4.67151403427124e-06, 4.848465323448181e-06, 5.025416612625122e-06, 5.202367901802063e-06, 5.379319190979004e-06, 5.556270480155945e-06, 5.733221769332886e-06, 5.910173058509827e-06, 6.087124347686768e-06, 6.2640756368637085e-06, 6.441026926040649e-06, 6.61797821521759e-06, 6.794929504394531e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 10.0, 0.0, 0.0, 10.0, 0.0, 0.0, 17.0, 0.0, 0.0, 24.0, 0.0, 0.0, 84.0, 0.0, 0.0, 116.0, 0.0, 506.0, 0.0, 0.0, 106.0, 0.0, 0.0, 76.0, 0.0, 0.0, 33.0, 0.0, 0.0, 13.0, 0.0, 0.0, 9.0, 0.0, 0.0, 10.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.152557373046875e-07, -6.94766640663147e-07, -6.742775440216064e-07, -6.537884473800659e-07, -6.332993507385254e-07, -6.128102540969849e-07, -5.923211574554443e-07, -5.718320608139038e-07, -5.513429641723633e-07, -5.308538675308228e-07, -5.103647708892822e-07, -4.898756742477417e-07, -4.6938657760620117e-07, -4.4889748096466064e-07, -4.284083843231201e-07, -4.079192876815796e-07, -3.8743019104003906e-07, -3.6694109439849854e-07, -3.46451997756958e-07, -3.259629011154175e-07, -3.0547380447387695e-07, -2.849847078323364e-07, -2.644956111907959e-07, -2.4400651454925537e-07, -2.2351741790771484e-07, -2.0302832126617432e-07, -1.825392246246338e-07, -1.6205012798309326e-07, -1.4156103134155273e-07, -1.210719347000122e-07, -1.0058283805847168e-07, -8.009374141693115e-08, -5.960464477539063e-08, -3.91155481338501e-08, -1.862645149230957e-08, 1.862645149230957e-09, 2.2351741790771484e-08, 4.284083843231201e-08, 6.332993507385254e-08, 8.381903171539307e-08, 1.043081283569336e-07, 1.2479722499847412e-07, 1.4528632164001465e-07, 1.6577541828155518e-07, 1.862645149230957e-07, 2.0675361156463623e-07, 2.2724270820617676e-07, 2.477318048477173e-07, 2.682209014892578e-07, 2.8870999813079834e-07, 3.0919909477233887e-07, 3.296881914138794e-07, 3.501772880554199e-07, 3.7066638469696045e-07, 3.91155481338501e-07, 4.116445779800415e-07, 4.3213367462158203e-07, 4.5262277126312256e-07, 4.731118679046631e-07, 4.936009645462036e-07, 5.140900611877441e-07, 5.345791578292847e-07, 5.550682544708252e-07, 5.755573511123657e-07, 5.960464477539062e-07]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 4.0, 10.0, 14.0, 17.0, 40.0, 26.0, 25.0, 62.0, 72.0, 78.0, 122.0, 353.0, 225.0, 360.0, 466.0, 627.0, 891.0, 3475.0, 3261.0, 5299.0, 8518.0, 14734.0, 25110.0, 51492.0, 710481.0, 107666.0, 51461.0, 25342.0, 14400.0, 8449.0, 8525.0, 1971.0, 1466.0, 957.0, 650.0, 492.0, 611.0, 198.0, 146.0, 113.0, 90.0, 59.0, 48.0, 57.0, 31.0, 18.0, 12.0, 8.0, 9.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-2.2649765014648438e-06, -2.1960586309432983e-06, -2.127140760421753e-06, -2.0582228899002075e-06, -1.989305019378662e-06, -1.9203871488571167e-06, -1.8514692783355713e-06, -1.7825514078140259e-06, -1.7136335372924805e-06, -1.644715666770935e-06, -1.5757977962493896e-06, -1.5068799257278442e-06, -1.4379620552062988e-06, -1.3690441846847534e-06, -1.300126314163208e-06, -1.2312084436416626e-06, -1.1622905731201172e-06, -1.0933727025985718e-06, -1.0244548320770264e-06, -9.55536961555481e-07, -8.866190910339355e-07, -8.177012205123901e-07, -7.487833499908447e-07, -6.798654794692993e-07, -6.109476089477539e-07, -5.420297384262085e-07, -4.731118679046631e-07, -4.041939973831177e-07, -3.3527612686157227e-07, -2.6635825634002686e-07, -1.9744038581848145e-07, -1.2852251529693604e-07, -5.960464477539063e-08, 9.313225746154785e-09, 7.82310962677002e-08, 1.471489667892456e-07, 2.1606683731079102e-07, 2.849847078323364e-07, 3.5390257835388184e-07, 4.2282044887542725e-07, 4.917383193969727e-07, 5.606561899185181e-07, 6.295740604400635e-07, 6.984919309616089e-07, 7.674098014831543e-07, 8.363276720046997e-07, 9.052455425262451e-07, 9.741634130477905e-07, 1.043081283569336e-06, 1.1119991540908813e-06, 1.1809170246124268e-06, 1.2498348951339722e-06, 1.3187527656555176e-06, 1.387670636177063e-06, 1.4565885066986084e-06, 1.5255063772201538e-06, 1.5944242477416992e-06, 1.6633421182632446e-06, 1.73225998878479e-06, 1.8011778593063354e-06, 1.8700957298278809e-06, 1.9390136003494263e-06, 2.0079314708709717e-06, 2.076849341392517e-06, 2.1457672119140625e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 11.0, 0.0, 0.0, 10.0, 0.0, 0.0, 18.0, 0.0, 0.0, 34.0, 0.0, 0.0, 77.0, 0.0, 118.0, 0.0, 0.0, 477.0, 0.0, 0.0, 118.0, 0.0, 0.0, 65.0, 0.0, 27.0, 0.0, 0.0, 24.0, 0.0, 0.0, 18.0, 0.0, 0.0, 8.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.342306733131409e-07, -6.128102540969849e-07, -5.913898348808289e-07, -5.699694156646729e-07, -5.485489964485168e-07, -5.271285772323608e-07, -5.057081580162048e-07, -4.842877388000488e-07, -4.628673195838928e-07, -4.414469003677368e-07, -4.200264811515808e-07, -3.986060619354248e-07, -3.771856427192688e-07, -3.557652235031128e-07, -3.343448042869568e-07, -3.129243850708008e-07, -2.915039658546448e-07, -2.7008354663848877e-07, -2.4866312742233276e-07, -2.2724270820617676e-07, -2.0582228899002075e-07, -1.8440186977386475e-07, -1.6298145055770874e-07, -1.4156103134155273e-07, -1.2014061212539673e-07, -9.872019290924072e-08, -7.729977369308472e-08, -5.587935447692871e-08, -3.4458935260772705e-08, -1.30385160446167e-08, 8.381903171539307e-09, 2.9802322387695312e-08, 5.122274160385132e-08, 7.264316082000732e-08, 9.406358003616333e-08, 1.1548399925231934e-07, 1.3690441846847534e-07, 1.5832483768463135e-07, 1.7974525690078735e-07, 2.0116567611694336e-07, 2.2258609533309937e-07, 2.4400651454925537e-07, 2.654269337654114e-07, 2.868473529815674e-07, 3.082677721977234e-07, 3.296881914138794e-07, 3.511086106300354e-07, 3.725290298461914e-07, 3.939494490623474e-07, 4.153698682785034e-07, 4.367902874946594e-07, 4.5821070671081543e-07, 4.796311259269714e-07, 5.010515451431274e-07, 5.224719643592834e-07, 5.438923835754395e-07, 5.653128027915955e-07, 5.867332220077515e-07, 6.081536412239075e-07, 6.295740604400635e-07, 6.509944796562195e-07, 6.724148988723755e-07, 6.938353180885315e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 3.0, 8.0, 3.0, 9.0, 13.0, 15.0, 22.0, 31.0, 44.0, 40.0, 74.0, 96.0, 124.0, 128.0, 97.0, 77.0, 49.0, 45.0, 31.0, 20.0, 18.0, 8.0, 8.0, 11.0, 10.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2005237294943072e-05, -1.1527798051247373e-05, -1.1050358807551675e-05, -1.0572919563855976e-05, -1.0095480320160277e-05, -9.618041076464579e-06, -9.140602742263582e-06, -8.663163498567883e-06, -8.185724254872184e-06, -7.708285011176486e-06, -7.230845767480787e-06, -6.753406978532439e-06, -6.27596773483674e-06, -5.798528491141042e-06, -5.321089702192694e-06, -4.843650458496995e-06, -4.366211214801297e-06, -3.888771971105598e-06, -3.4113329547835747e-06, -2.9338939384615514e-06, -2.4564546947658528e-06, -1.979015451070154e-06, -1.5015764347481309e-06, -1.0241374184261076e-06, -5.466981747304089e-07, -6.925904472154798e-08, 4.08180085287313e-07, 8.856192152961739e-07, 1.3630583453050349e-06, 1.8404975890007336e-06, 2.317936605322757e-06, 2.79537562164478e-06, 3.2728166843298823e-06, 3.750255928025581e-06, 4.22769517172128e-06, 4.705133960669627e-06, 5.182573204365326e-06, 5.660012448061025e-06, 6.1374512370093726e-06, 6.614890480705071e-06, 7.09232972440077e-06, 7.569768968096469e-06, 8.047208211792167e-06, 8.524647455487866e-06, 9.002085789688863e-06, 9.479525033384562e-06, 9.95696427708026e-06, 1.0434403520775959e-05, 1.0911842764471658e-05, 1.1389282008167356e-05, 1.1866721251863055e-05, 1.2344160495558754e-05, 1.2821599739254452e-05, 1.3299038982950151e-05, 1.3776477317151148e-05, 1.4253916560846847e-05, 1.4731355804542545e-05, 1.5208795048238244e-05, 1.568623338243924e-05, 1.616367262613494e-05, 1.6641111869830638e-05, 1.7118551113526337e-05, 1.7595990357222036e-05, 1.8073429600917734e-05, 1.8550868844613433e-05]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 4.0, 8.0, 6.0, 3.0, 5.0, 2.0, 4.0, 6.0, 5.0, 13.0, 8.0, 14.0, 11.0, 13.0, 14.0, 24.0, 26.0, 30.0, 19.0, 24.0, 26.0, 38.0, 25.0, 37.0, 29.0, 24.0, 27.0, 46.0, 30.0, 37.0, 48.0, 39.0, 33.0, 31.0, 28.0, 20.0, 32.0, 25.0, 28.0, 16.0, 22.0, 18.0, 20.0, 19.0, 7.0, 14.0, 12.0, 7.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-6.648672297160374e-06, -6.422322258003987e-06, -6.195972218847601e-06, -5.969622179691214e-06, -5.7432721405348275e-06, -5.516922101378441e-06, -5.290572062222054e-06, -5.064222023065668e-06, -4.837871983909281e-06, -4.611521944752894e-06, -4.385171905596508e-06, -4.158821866440121e-06, -3.9324718272837345e-06, -3.706121788127348e-06, -3.479771748970961e-06, -3.2534217098145746e-06, -3.027071670658188e-06, -2.8007216315018013e-06, -2.5743715923454147e-06, -2.348021553189028e-06, -2.1216715140326414e-06, -1.8953214748762548e-06, -1.6689714357198682e-06, -1.4426213965634815e-06, -1.216271357407095e-06, -9.899213182507083e-07, -7.635712790943217e-07, -5.37221239937935e-07, -3.108712007815484e-07, -8.452116162516177e-08, 1.4182887753122486e-07, 3.681789166876115e-07, 5.945285010966472e-07, 8.208785402530339e-07, 1.0472285794094205e-06, 1.2735786185658071e-06, 1.4999286577221937e-06, 1.7262786968785804e-06, 1.952628736034967e-06, 2.1789787751913536e-06, 2.4053288143477403e-06, 2.631678853504127e-06, 2.8580288926605135e-06, 3.0843789318169e-06, 3.3107289709732868e-06, 3.5370790101296734e-06, 3.76342904928606e-06, 3.989779088442447e-06, 4.216129127598833e-06, 4.44247916675522e-06, 4.6688292059116066e-06, 4.895179245067993e-06, 5.12152928422438e-06, 5.3478793233807664e-06, 5.574229362537153e-06, 5.80057940169354e-06, 6.026929440849926e-06, 6.253279480006313e-06, 6.4796295191627e-06, 6.705979558319086e-06, 6.932329597475473e-06, 7.1586796366318595e-06, 7.385029675788246e-06, 7.611379714944633e-06, 7.83772975410102e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 6.0, 4.0, 5.0, 7.0, 9.0, 12.0, 17.0, 23.0, 37.0, 59.0, 77.0, 115.0, 182.0, 222.0, 335.0, 362.0, 657.0, 745.0, 1284.0, 1813.0, 2259.0, 3799.0, 4707.0, 8047.0, 12480.0, 17087.0, 31894.0, 47359.0, 100602.0, 169043.0, 272479.0, 170874.0, 76940.0, 48606.0, 25040.0, 17871.0, 10981.0, 6589.0, 4938.0, 3090.0, 2358.0, 1743.0, 1031.0, 841.0, 523.0, 418.0, 292.0, 191.0, 153.0, 88.0, 81.0, 52.0, 40.0, 33.0, 21.0, 20.0, 11.0, 6.0, 5.0, 4.0, 1.0, 1.0], "bins": [-1.4662742614746094e-05, -1.4210119843482971e-05, -1.3757497072219849e-05, -1.3304874300956726e-05, -1.2852251529693604e-05, -1.2399628758430481e-05, -1.1947005987167358e-05, -1.1494383215904236e-05, -1.1041760444641113e-05, -1.058913767337799e-05, -1.0136514902114868e-05, -9.683892130851746e-06, -9.231269359588623e-06, -8.7786465883255e-06, -8.326023817062378e-06, -7.873401045799255e-06, -7.420778274536133e-06, -6.96815550327301e-06, -6.515532732009888e-06, -6.062909960746765e-06, -5.610287189483643e-06, -5.15766441822052e-06, -4.7050416469573975e-06, -4.252418875694275e-06, -3.7997961044311523e-06, -3.3471733331680298e-06, -2.8945505619049072e-06, -2.4419277906417847e-06, -1.989305019378662e-06, -1.5366822481155396e-06, -1.084059476852417e-06, -6.314367055892944e-07, -1.7881393432617188e-07, 2.738088369369507e-07, 7.264316082000732e-07, 1.1790543794631958e-06, 1.6316771507263184e-06, 2.084299921989441e-06, 2.5369226932525635e-06, 2.989545464515686e-06, 3.4421682357788086e-06, 3.894791007041931e-06, 4.347413778305054e-06, 4.800036549568176e-06, 5.252659320831299e-06, 5.705282092094421e-06, 6.157904863357544e-06, 6.6105276346206665e-06, 7.063150405883789e-06, 7.515773177146912e-06, 7.968395948410034e-06, 8.421018719673157e-06, 8.87364149093628e-06, 9.326264262199402e-06, 9.778887033462524e-06, 1.0231509804725647e-05, 1.068413257598877e-05, 1.1136755347251892e-05, 1.1589378118515015e-05, 1.2042000889778137e-05, 1.249462366104126e-05, 1.2947246432304382e-05, 1.3399869203567505e-05, 1.3852491974830627e-05, 1.430511474609375e-05]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 3.0, 2.0, 7.0, 9.0, 3.0, 5.0, 12.0, 14.0, 13.0, 19.0, 29.0, 18.0, 36.0, 28.0, 34.0, 25.0, 32.0, 35.0, 38.0, 47.0, 39.0, 50.0, 43.0, 25.0, 49.0, 46.0, 37.0, 44.0, 34.0, 22.0, 26.0, 20.0, 24.0, 21.0, 19.0, 17.0, 11.0, 15.0, 14.0, 9.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.973743438720703e-06, -6.7427754402160645e-06, -6.511807441711426e-06, -6.280839443206787e-06, -6.0498714447021484e-06, -5.81890344619751e-06, -5.587935447692871e-06, -5.356967449188232e-06, -5.125999450683594e-06, -4.895031452178955e-06, -4.664063453674316e-06, -4.433095455169678e-06, -4.202127456665039e-06, -3.9711594581604e-06, -3.7401914596557617e-06, -3.509223461151123e-06, -3.2782554626464844e-06, -3.0472874641418457e-06, -2.816319465637207e-06, -2.5853514671325684e-06, -2.3543834686279297e-06, -2.123415470123291e-06, -1.8924474716186523e-06, -1.6614794731140137e-06, -1.430511474609375e-06, -1.1995434761047363e-06, -9.685754776000977e-07, -7.37607479095459e-07, -5.066394805908203e-07, -2.7567148208618164e-07, -4.470348358154297e-08, 1.862645149230957e-07, 4.172325134277344e-07, 6.48200511932373e-07, 8.791685104370117e-07, 1.1101365089416504e-06, 1.341104507446289e-06, 1.5720725059509277e-06, 1.8030405044555664e-06, 2.034008502960205e-06, 2.2649765014648438e-06, 2.4959444999694824e-06, 2.726912498474121e-06, 2.9578804969787598e-06, 3.1888484954833984e-06, 3.419816493988037e-06, 3.6507844924926758e-06, 3.8817524909973145e-06, 4.112720489501953e-06, 4.343688488006592e-06, 4.5746564865112305e-06, 4.805624485015869e-06, 5.036592483520508e-06, 5.2675604820251465e-06, 5.498528480529785e-06, 5.729496479034424e-06, 5.9604644775390625e-06, 6.191432476043701e-06, 6.42240047454834e-06, 6.6533684730529785e-06, 6.884336471557617e-06, 7.115304470062256e-06, 7.3462724685668945e-06, 7.577240467071533e-06, 7.808208465576172e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 10.0, 19.0, 23.0, 36.0, 46.0, 72.0, 136.0, 183.0, 272.0, 407.0, 572.0, 881.0, 1496.0, 1891.0, 3191.0, 5232.0, 6800.0, 12726.0, 21308.0, 31627.0, 65459.0, 131836.0, 221101.0, 259014.0, 132033.0, 59054.0, 37822.0, 21181.0, 11374.0, 8311.0, 5182.0, 2961.0, 2296.0, 1371.0, 784.0, 636.0, 403.0, 235.0, 194.0, 154.0, 77.0, 65.0, 33.0, 20.0, 14.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4185905456542969e-05, -1.3728626072406769e-05, -1.3271346688270569e-05, -1.2814067304134369e-05, -1.2356787919998169e-05, -1.1899508535861969e-05, -1.1442229151725769e-05, -1.0984949767589569e-05, -1.0527670383453369e-05, -1.007039099931717e-05, -9.61311161518097e-06, -9.15583223104477e-06, -8.69855284690857e-06, -8.24127346277237e-06, -7.78399407863617e-06, -7.3267146944999695e-06, -6.8694353103637695e-06, -6.41215592622757e-06, -5.95487654209137e-06, -5.49759715795517e-06, -5.04031777381897e-06, -4.58303838968277e-06, -4.12575900554657e-06, -3.66847962141037e-06, -3.21120023727417e-06, -2.75392085313797e-06, -2.29664146900177e-06, -1.83936208486557e-06, -1.3820827007293701e-06, -9.248033165931702e-07, -4.675239324569702e-07, -1.0244548320770264e-08, 4.470348358154297e-07, 9.043142199516296e-07, 1.3615936040878296e-06, 1.8188729882240295e-06, 2.2761523723602295e-06, 2.7334317564964294e-06, 3.1907111406326294e-06, 3.6479905247688293e-06, 4.105269908905029e-06, 4.562549293041229e-06, 5.019828677177429e-06, 5.477108061313629e-06, 5.934387445449829e-06, 6.391666829586029e-06, 6.848946213722229e-06, 7.306225597858429e-06, 7.763504981994629e-06, 8.220784366130829e-06, 8.678063750267029e-06, 9.135343134403229e-06, 9.592622518539429e-06, 1.0049901902675629e-05, 1.0507181286811829e-05, 1.0964460670948029e-05, 1.1421740055084229e-05, 1.1879019439220428e-05, 1.2336298823356628e-05, 1.2793578207492828e-05, 1.3250857591629028e-05, 1.3708136975765228e-05, 1.4165416359901428e-05, 1.4622695744037628e-05, 1.5079975128173828e-05]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 6.0, 6.0, 3.0, 2.0, 4.0, 5.0, 13.0, 15.0, 3.0, 17.0, 20.0, 21.0, 16.0, 32.0, 28.0, 39.0, 30.0, 50.0, 29.0, 45.0, 41.0, 42.0, 30.0, 34.0, 50.0, 28.0, 51.0, 30.0, 47.0, 22.0, 41.0, 22.0, 21.0, 28.0, 30.0, 13.0, 20.0, 10.0, 20.0, 13.0, 3.0, 8.0, 4.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.5299530029296875e-06, -4.382804036140442e-06, -4.235655069351196e-06, -4.088506102561951e-06, -3.941357135772705e-06, -3.7942081689834595e-06, -3.647059202194214e-06, -3.4999102354049683e-06, -3.3527612686157227e-06, -3.205612301826477e-06, -3.0584633350372314e-06, -2.911314368247986e-06, -2.7641654014587402e-06, -2.6170164346694946e-06, -2.469867467880249e-06, -2.3227185010910034e-06, -2.175569534301758e-06, -2.028420567512512e-06, -1.8812716007232666e-06, -1.734122633934021e-06, -1.5869736671447754e-06, -1.4398247003555298e-06, -1.2926757335662842e-06, -1.1455267667770386e-06, -9.98377799987793e-07, -8.512288331985474e-07, -7.040798664093018e-07, -5.569308996200562e-07, -4.0978193283081055e-07, -2.6263296604156494e-07, -1.1548399925231934e-07, 3.166496753692627e-08, 1.7881393432617188e-07, 3.259629011154175e-07, 4.731118679046631e-07, 6.202608346939087e-07, 7.674098014831543e-07, 9.145587682723999e-07, 1.0617077350616455e-06, 1.2088567018508911e-06, 1.3560056686401367e-06, 1.5031546354293823e-06, 1.650303602218628e-06, 1.7974525690078735e-06, 1.944601535797119e-06, 2.0917505025863647e-06, 2.2388994693756104e-06, 2.386048436164856e-06, 2.5331974029541016e-06, 2.680346369743347e-06, 2.8274953365325928e-06, 2.9746443033218384e-06, 3.121793270111084e-06, 3.2689422369003296e-06, 3.416091203689575e-06, 3.563240170478821e-06, 3.7103891372680664e-06, 3.857538104057312e-06, 4.004687070846558e-06, 4.151836037635803e-06, 4.298985004425049e-06, 4.4461339712142944e-06, 4.59328293800354e-06, 4.740431904792786e-06, 4.887580871582031e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 10.0, 21.0, 33.0, 22.0, 41.0, 74.0, 89.0, 141.0, 187.0, 275.0, 412.0, 583.0, 846.0, 1242.0, 1699.0, 3446.0, 4039.0, 5995.0, 9383.0, 16970.0, 38302.0, 134167.0, 720431.0, 55934.0, 21151.0, 11324.0, 6944.0, 4380.0, 4069.0, 1923.0, 1333.0, 935.0, 686.0, 434.0, 336.0, 211.0, 144.0, 105.0, 78.0, 58.0, 26.0, 38.0, 21.0, 11.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-5.900859832763672e-06, -5.717389285564423e-06, -5.533918738365173e-06, -5.350448191165924e-06, -5.166977643966675e-06, -4.9835070967674255e-06, -4.800036549568176e-06, -4.616566002368927e-06, -4.433095455169678e-06, -4.2496249079704285e-06, -4.066154360771179e-06, -3.88268381357193e-06, -3.6992132663726807e-06, -3.5157427191734314e-06, -3.332272171974182e-06, -3.148801624774933e-06, -2.9653310775756836e-06, -2.7818605303764343e-06, -2.598389983177185e-06, -2.414919435977936e-06, -2.2314488887786865e-06, -2.0479783415794373e-06, -1.864507794380188e-06, -1.6810372471809387e-06, -1.4975666999816895e-06, -1.3140961527824402e-06, -1.130625605583191e-06, -9.471550583839417e-07, -7.636845111846924e-07, -5.802139639854431e-07, -3.9674341678619385e-07, -2.1327286958694458e-07, -2.9802322387695312e-08, 1.5366822481155396e-07, 3.371387720108032e-07, 5.206093192100525e-07, 7.040798664093018e-07, 8.87550413608551e-07, 1.0710209608078003e-06, 1.2544915080070496e-06, 1.4379620552062988e-06, 1.621432602405548e-06, 1.8049031496047974e-06, 1.9883736968040466e-06, 2.171844244003296e-06, 2.355314791202545e-06, 2.5387853384017944e-06, 2.7222558856010437e-06, 2.905726432800293e-06, 3.0891969799995422e-06, 3.2726675271987915e-06, 3.4561380743980408e-06, 3.63960862159729e-06, 3.823079168796539e-06, 4.0065497159957886e-06, 4.190020263195038e-06, 4.373490810394287e-06, 4.556961357593536e-06, 4.740431904792786e-06, 4.923902451992035e-06, 5.107372999191284e-06, 5.2908435463905334e-06, 5.474314093589783e-06, 5.657784640789032e-06, 5.841255187988281e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 845.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 12.0, 7.0, 15.0, 14.0, 29.0, 39.0, 35.0, 64.0, 66.0, 131.0, 141.0, 199.0, 276.0, 455.0, 529.0, 694.0, 1051.0, 1975.0, 2281.0, 3227.0, 4689.0, 9530.0, 13046.0, 23829.0, 60461.0, 764878.0, 98552.0, 23746.0, 13070.0, 8232.0, 6154.0, 3208.0, 2224.0, 1525.0, 1350.0, 770.0, 538.0, 412.0, 335.0, 185.0, 146.0, 97.0, 82.0, 77.0, 41.0, 43.0, 28.0, 14.0, 18.0, 11.0, 10.0, 6.0, 4.0, 2.0, 1.0, 5.0], "bins": [-8.463859558105469e-06, -8.211471140384674e-06, -7.95908272266388e-06, -7.706694304943085e-06, -7.45430588722229e-06, -7.201917469501495e-06, -6.949529051780701e-06, -6.697140634059906e-06, -6.444752216339111e-06, -6.192363798618317e-06, -5.939975380897522e-06, -5.687586963176727e-06, -5.435198545455933e-06, -5.182810127735138e-06, -4.930421710014343e-06, -4.678033292293549e-06, -4.425644874572754e-06, -4.173256456851959e-06, -3.9208680391311646e-06, -3.66847962141037e-06, -3.416091203689575e-06, -3.1637027859687805e-06, -2.911314368247986e-06, -2.658925950527191e-06, -2.4065375328063965e-06, -2.154149115085602e-06, -1.9017606973648071e-06, -1.6493722796440125e-06, -1.3969838619232178e-06, -1.144595444202423e-06, -8.922070264816284e-07, -6.398186087608337e-07, -3.8743019104003906e-07, -1.3504177331924438e-07, 1.1734664440155029e-07, 3.6973506212234497e-07, 6.221234798431396e-07, 8.745118975639343e-07, 1.126900315284729e-06, 1.3792887330055237e-06, 1.6316771507263184e-06, 1.884065568447113e-06, 2.1364539861679077e-06, 2.3888424038887024e-06, 2.641230821609497e-06, 2.8936192393302917e-06, 3.1460076570510864e-06, 3.398396074771881e-06, 3.6507844924926758e-06, 3.9031729102134705e-06, 4.155561327934265e-06, 4.40794974565506e-06, 4.6603381633758545e-06, 4.912726581096649e-06, 5.165114998817444e-06, 5.4175034165382385e-06, 5.669891834259033e-06, 5.922280251979828e-06, 6.1746686697006226e-06, 6.427057087421417e-06, 6.679445505142212e-06, 6.931833922863007e-06, 7.184222340583801e-06, 7.436610758304596e-06, 7.68899917602539e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 7.0, 4.0, 4.0, 8.0, 7.0, 7.0, 16.0, 5.0, 11.0, 29.0, 19.0, 37.0, 574.0, 70.0, 43.0, 26.0, 32.0, 13.0, 7.0, 19.0, 7.0, 12.0, 7.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.2649765014648438e-06, -2.1867454051971436e-06, -2.1085143089294434e-06, -2.030283212661743e-06, -1.952052116394043e-06, -1.8738210201263428e-06, -1.7955899238586426e-06, -1.7173588275909424e-06, -1.6391277313232422e-06, -1.560896635055542e-06, -1.4826655387878418e-06, -1.4044344425201416e-06, -1.3262033462524414e-06, -1.2479722499847412e-06, -1.169741153717041e-06, -1.0915100574493408e-06, -1.0132789611816406e-06, -9.350478649139404e-07, -8.568167686462402e-07, -7.7858567237854e-07, -7.003545761108398e-07, -6.221234798431396e-07, -5.438923835754395e-07, -4.6566128730773926e-07, -3.8743019104003906e-07, -3.0919909477233887e-07, -2.3096799850463867e-07, -1.5273690223693848e-07, -7.450580596923828e-08, 3.725290298461914e-09, 8.195638656616211e-08, 1.601874828338623e-07, 2.384185791015625e-07, 3.166496753692627e-07, 3.948807716369629e-07, 4.731118679046631e-07, 5.513429641723633e-07, 6.295740604400635e-07, 7.078051567077637e-07, 7.860362529754639e-07, 8.642673492431641e-07, 9.424984455108643e-07, 1.0207295417785645e-06, 1.0989606380462646e-06, 1.1771917343139648e-06, 1.255422830581665e-06, 1.3336539268493652e-06, 1.4118850231170654e-06, 1.4901161193847656e-06, 1.5683472156524658e-06, 1.646578311920166e-06, 1.7248094081878662e-06, 1.8030405044555664e-06, 1.8812716007232666e-06, 1.959502696990967e-06, 2.037733793258667e-06, 2.115964889526367e-06, 2.1941959857940674e-06, 2.2724270820617676e-06, 2.3506581783294678e-06, 2.428889274597168e-06, 2.507120370864868e-06, 2.5853514671325684e-06, 2.6635825634002686e-06, 2.7418136596679688e-06]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 7.0, 9.0, 14.0, 13.0, 26.0, 30.0, 40.0, 66.0, 79.0, 104.0, 124.0, 122.0, 91.0, 73.0, 47.0, 45.0, 28.0, 21.0, 12.0, 9.0, 5.0, 10.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.109410459321225e-05, -1.0663046850822866e-05, -1.0231989108433481e-05, -9.800931366044097e-06, -9.369873623654712e-06, -8.938815881265327e-06, -8.507758138875943e-06, -8.076700396486558e-06, -7.645642654097173e-06, -7.214584911707789e-06, -6.783527169318404e-06, -6.352469426929019e-06, -5.921411684539635e-06, -5.49035394215025e-06, -5.059296199760865e-06, -4.628238457371481e-06, -4.197180714982096e-06, -3.7661229725927114e-06, -3.335065230203327e-06, -2.904007487813942e-06, -2.4729497454245575e-06, -2.041892003035173e-06, -1.6108342606457882e-06, -1.1797765182564035e-06, -7.487187758670188e-07, -3.176610334776342e-07, 1.1339670891175047e-07, 5.444544513011351e-07, 9.755121936905198e-07, 1.4065699360799044e-06, 1.837627678469289e-06, 2.2686854208586738e-06, 2.69974407274276e-06, 3.130801815132145e-06, 3.5618595575215295e-06, 3.992917299910914e-06, 4.423975042300299e-06, 4.8550327846896835e-06, 5.286090527079068e-06, 5.717148269468453e-06, 6.1482060118578374e-06, 6.579263754247222e-06, 7.010321496636607e-06, 7.441379239025991e-06, 7.872436981415376e-06, 8.30349472380476e-06, 8.734552466194145e-06, 9.16561020858353e-06, 9.596667950972915e-06, 1.00277256933623e-05, 1.0458783435751684e-05, 1.0889841178141069e-05, 1.1320898920530453e-05, 1.1751956662919838e-05, 1.2183014405309223e-05, 1.2614072147698607e-05, 1.3045129890087992e-05, 1.3476187632477377e-05, 1.3907245374866761e-05, 1.4338303117256146e-05, 1.476936085964553e-05, 1.5200418602034915e-05, 1.56314763444243e-05, 1.6062534996308386e-05, 1.649359182920307e-05]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 3.0, 7.0, 14.0, 6.0, 7.0, 11.0, 9.0, 16.0, 24.0, 26.0, 26.0, 37.0, 28.0, 26.0, 28.0, 43.0, 36.0, 35.0, 37.0, 35.0, 49.0, 38.0, 37.0, 34.0, 40.0, 45.0, 29.0, 29.0, 35.0, 23.0, 32.0, 25.0, 18.0, 21.0, 14.0, 11.0, 14.0, 14.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.045482107059797e-06, -6.80291623211815e-06, -6.560350357176503e-06, -6.317784936982207e-06, -6.07521906204056e-06, -5.832653187098913e-06, -5.590087312157266e-06, -5.347521437215619e-06, -5.104955562273972e-06, -4.862389687332325e-06, -4.619823812390678e-06, -4.377257937449031e-06, -4.134692517254734e-06, -3.892126642313087e-06, -3.6495607673714403e-06, -3.4069948924297933e-06, -3.164429472235497e-06, -2.92186359729385e-06, -2.6792979497258784e-06, -2.4367320747842314e-06, -2.1941664272162598e-06, -1.9516005522746127e-06, -1.7090346773329657e-06, -1.4664689160781563e-06, -1.223903154823347e-06, -9.813373935685377e-07, -7.387715754703095e-07, -4.962057573720813e-07, -2.5363999611727195e-07, -1.1074234862462617e-08, 2.3149164007918444e-07, 4.7405740133399377e-07, 7.166227078414522e-07, 9.591884690962615e-07, 1.2017542303510709e-06, 1.444320105292718e-06, 1.6868858665475273e-06, 1.9294516278023366e-06, 2.1720175027439836e-06, 2.4145833776856307e-06, 2.6571490252536023e-06, 2.8997149001952494e-06, 3.142280547763221e-06, 3.384846422704868e-06, 3.627412297646515e-06, 3.869978172588162e-06, 4.112544047529809e-06, 4.355109467724105e-06, 4.597675342665752e-06, 4.8402412176073994e-06, 5.0828070925490465e-06, 5.325372512743343e-06, 5.56793838768499e-06, 5.810504262626637e-06, 6.053070137568284e-06, 6.295636012509931e-06, 6.538201887451578e-06, 6.780767762393225e-06, 7.023333637334872e-06, 7.265899512276519e-06, 7.508464932470815e-06, 7.751030352665111e-06, 7.993596227606758e-06, 8.236162102548406e-06, 8.478727977490053e-06]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 6.0, 7.0, 9.0, 18.0, 28.0, 36.0, 67.0, 106.0, 136.0, 217.0, 315.0, 310.0, 556.0, 770.0, 1196.0, 1715.0, 2445.0, 3761.0, 5513.0, 8698.0, 13780.0, 22187.0, 37357.0, 66031.0, 124445.0, 261807.0, 721993.0, 1352812.0, 936899.0, 309103.0, 140609.0, 74275.0, 41325.0, 24167.0, 14940.0, 9126.0, 5912.0, 3884.0, 2522.0, 1647.0, 1157.0, 722.0, 548.0, 282.0, 277.0, 181.0, 132.0, 87.0, 66.0, 43.0, 21.0, 20.0, 20.0, 4.0, 2.0, 2.0, 6.0, 0.0, 0.0, 1.0], "bins": [-9.298324584960938e-06, -9.004026651382446e-06, -8.709728717803955e-06, -8.415430784225464e-06, -8.121132850646973e-06, -7.826834917068481e-06, -7.53253698348999e-06, -7.238239049911499e-06, -6.943941116333008e-06, -6.649643182754517e-06, -6.355345249176025e-06, -6.061047315597534e-06, -5.766749382019043e-06, -5.472451448440552e-06, -5.1781535148620605e-06, -4.883855581283569e-06, -4.589557647705078e-06, -4.295259714126587e-06, -4.000961780548096e-06, -3.7066638469696045e-06, -3.4123659133911133e-06, -3.118067979812622e-06, -2.823770046234131e-06, -2.5294721126556396e-06, -2.2351741790771484e-06, -1.9408762454986572e-06, -1.646578311920166e-06, -1.3522803783416748e-06, -1.0579824447631836e-06, -7.636845111846924e-07, -4.6938657760620117e-07, -1.7508864402770996e-07, 1.1920928955078125e-07, 4.1350722312927246e-07, 7.078051567077637e-07, 1.0021030902862549e-06, 1.296401023864746e-06, 1.5906989574432373e-06, 1.8849968910217285e-06, 2.1792948246002197e-06, 2.473592758178711e-06, 2.767890691757202e-06, 3.0621886253356934e-06, 3.3564865589141846e-06, 3.6507844924926758e-06, 3.945082426071167e-06, 4.239380359649658e-06, 4.533678293228149e-06, 4.827976226806641e-06, 5.122274160385132e-06, 5.416572093963623e-06, 5.710870027542114e-06, 6.0051679611206055e-06, 6.299465894699097e-06, 6.593763828277588e-06, 6.888061761856079e-06, 7.18235969543457e-06, 7.4766576290130615e-06, 7.770955562591553e-06, 8.065253496170044e-06, 8.359551429748535e-06, 8.653849363327026e-06, 8.948147296905518e-06, 9.242445230484009e-06, 9.5367431640625e-06]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 3.0, 6.0, 10.0, 8.0, 6.0, 19.0, 15.0, 22.0, 26.0, 19.0, 22.0, 44.0, 25.0, 29.0, 38.0, 30.0, 37.0, 48.0, 31.0, 43.0, 58.0, 34.0, 38.0, 47.0, 22.0, 48.0, 25.0, 24.0, 49.0, 19.0, 23.0, 31.0, 10.0, 12.0, 12.0, 8.0, 7.0, 10.0, 9.0, 9.0, 10.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.0531158447265625e-06, -3.913417458534241e-06, -3.773719072341919e-06, -3.634020686149597e-06, -3.4943222999572754e-06, -3.3546239137649536e-06, -3.214925527572632e-06, -3.07522714138031e-06, -2.9355287551879883e-06, -2.7958303689956665e-06, -2.6561319828033447e-06, -2.516433596611023e-06, -2.376735210418701e-06, -2.2370368242263794e-06, -2.0973384380340576e-06, -1.957640051841736e-06, -1.817941665649414e-06, -1.6782432794570923e-06, -1.5385448932647705e-06, -1.3988465070724487e-06, -1.259148120880127e-06, -1.1194497346878052e-06, -9.797513484954834e-07, -8.400529623031616e-07, -7.003545761108398e-07, -5.606561899185181e-07, -4.209578037261963e-07, -2.812594175338745e-07, -1.4156103134155273e-07, -1.862645149230957e-09, 1.3783574104309082e-07, 2.775341272354126e-07, 4.172325134277344e-07, 5.569308996200562e-07, 6.966292858123779e-07, 8.363276720046997e-07, 9.760260581970215e-07, 1.1157244443893433e-06, 1.255422830581665e-06, 1.3951212167739868e-06, 1.5348196029663086e-06, 1.6745179891586304e-06, 1.8142163753509521e-06, 1.953914761543274e-06, 2.0936131477355957e-06, 2.2333115339279175e-06, 2.3730099201202393e-06, 2.512708306312561e-06, 2.652406692504883e-06, 2.7921050786972046e-06, 2.9318034648895264e-06, 3.071501851081848e-06, 3.21120023727417e-06, 3.3508986234664917e-06, 3.4905970096588135e-06, 3.6302953958511353e-06, 3.769993782043457e-06, 3.909692168235779e-06, 4.049390554428101e-06, 4.189088940620422e-06, 4.328787326812744e-06, 4.468485713005066e-06, 4.608184099197388e-06, 4.7478824853897095e-06, 4.887580871582031e-06]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 0.0, 4.0, 10.0, 12.0, 22.0, 34.0, 39.0, 67.0, 85.0, 120.0, 175.0, 267.0, 404.0, 584.0, 1142.0, 1448.0, 2096.0, 3203.0, 4943.0, 7716.0, 12055.0, 19257.0, 31278.0, 71029.0, 106472.0, 201963.0, 427783.0, 1016186.0, 1217737.0, 525674.0, 241479.0, 123750.0, 81002.0, 35723.0, 22126.0, 13878.0, 8524.0, 5422.0, 3520.0, 2345.0, 1538.0, 1173.0, 632.0, 414.0, 292.0, 214.0, 159.0, 92.0, 54.0, 52.0, 42.0, 14.0, 21.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-7.867813110351562e-06, -7.622875273227692e-06, -7.377937436103821e-06, -7.13299959897995e-06, -6.888061761856079e-06, -6.643123924732208e-06, -6.398186087608337e-06, -6.1532482504844666e-06, -5.908310413360596e-06, -5.663372576236725e-06, -5.418434739112854e-06, -5.173496901988983e-06, -4.928559064865112e-06, -4.6836212277412415e-06, -4.438683390617371e-06, -4.1937455534935e-06, -3.948807716369629e-06, -3.703869879245758e-06, -3.458932042121887e-06, -3.2139942049980164e-06, -2.9690563678741455e-06, -2.7241185307502747e-06, -2.479180693626404e-06, -2.234242856502533e-06, -1.989305019378662e-06, -1.7443671822547913e-06, -1.4994293451309204e-06, -1.2544915080070496e-06, -1.0095536708831787e-06, -7.646158337593079e-07, -5.19677996635437e-07, -2.7474015951156616e-07, -2.9802322387695312e-08, 2.1513551473617554e-07, 4.600733518600464e-07, 7.050111889839172e-07, 9.499490261077881e-07, 1.194886863231659e-06, 1.4398247003555298e-06, 1.6847625374794006e-06, 1.9297003746032715e-06, 2.1746382117271423e-06, 2.419576048851013e-06, 2.664513885974884e-06, 2.909451723098755e-06, 3.1543895602226257e-06, 3.3993273973464966e-06, 3.6442652344703674e-06, 3.889203071594238e-06, 4.134140908718109e-06, 4.37907874584198e-06, 4.624016582965851e-06, 4.868954420089722e-06, 5.1138922572135925e-06, 5.358830094337463e-06, 5.603767931461334e-06, 5.848705768585205e-06, 6.093643605709076e-06, 6.338581442832947e-06, 6.583519279956818e-06, 6.8284571170806885e-06, 7.073394954204559e-06, 7.31833279132843e-06, 7.563270628452301e-06, 7.808208465576172e-06]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 9.0, 4.0, 8.0, 17.0, 12.0, 8.0, 16.0, 38.0, 28.0, 26.0, 64.0, 39.0, 40.0, 49.0, 125.0, 81.0, 93.0, 116.0, 274.0, 155.0, 171.0, 178.0, 435.0, 211.0, 200.0, 360.0, 193.0, 138.0, 128.0, 231.0, 77.0, 73.0, 56.0, 122.0, 58.0, 50.0, 29.0, 64.0, 16.0, 16.0, 22.0, 9.0, 5.0, 5.0, 10.0, 6.0, 3.0, 2.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.384185791015625e-06, -2.3087486624717712e-06, -2.2333115339279175e-06, -2.1578744053840637e-06, -2.08243727684021e-06, -2.007000148296356e-06, -1.9315630197525024e-06, -1.8561258912086487e-06, -1.780688762664795e-06, -1.7052516341209412e-06, -1.6298145055770874e-06, -1.5543773770332336e-06, -1.4789402484893799e-06, -1.4035031199455261e-06, -1.3280659914016724e-06, -1.2526288628578186e-06, -1.1771917343139648e-06, -1.101754605770111e-06, -1.0263174772262573e-06, -9.508803486824036e-07, -8.754432201385498e-07, -8.00006091594696e-07, -7.245689630508423e-07, -6.491318345069885e-07, -5.736947059631348e-07, -4.98257577419281e-07, -4.2282044887542725e-07, -3.473833203315735e-07, -2.7194619178771973e-07, -1.9650906324386597e-07, -1.210719347000122e-07, -4.563480615615845e-08, 2.9802322387695312e-08, 1.0523945093154907e-07, 1.8067657947540283e-07, 2.561137080192566e-07, 3.3155083656311035e-07, 4.069879651069641e-07, 4.824250936508179e-07, 5.578622221946716e-07, 6.332993507385254e-07, 7.087364792823792e-07, 7.841736078262329e-07, 8.596107363700867e-07, 9.350478649139404e-07, 1.0104849934577942e-06, 1.085922122001648e-06, 1.1613592505455017e-06, 1.2367963790893555e-06, 1.3122335076332092e-06, 1.387670636177063e-06, 1.4631077647209167e-06, 1.5385448932647705e-06, 1.6139820218086243e-06, 1.689419150352478e-06, 1.7648562788963318e-06, 1.8402934074401855e-06, 1.9157305359840393e-06, 1.991167664527893e-06, 2.066604793071747e-06, 2.1420419216156006e-06, 2.2174790501594543e-06, 2.292916178703308e-06, 2.368353307247162e-06, 2.4437904357910156e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 4.0, 8.0, 6.0, 4.0, 17.0, 14.0, 21.0, 28.0, 35.0, 55.0, 59.0, 78.0, 107.0, 120.0, 109.0, 68.0, 58.0, 43.0, 38.0, 21.0, 17.0, 13.0, 18.0, 14.0, 10.0, 8.0, 4.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.703766757709673e-06, -6.4593550632707775e-06, -6.214943368831882e-06, -5.970531674392987e-06, -5.726119525206741e-06, -5.481707830767846e-06, -5.2372961363289505e-06, -4.992884441890055e-06, -4.74847274745116e-06, -4.504061053012265e-06, -4.25964935857337e-06, -4.015237209387124e-06, -3.7708255149482284e-06, -3.526413820509333e-06, -3.282002126070438e-06, -3.0375904316315427e-06, -2.7931782824452966e-06, -2.5487665880064014e-06, -2.3043546661938308e-06, -2.0599429717549356e-06, -1.8155311636292026e-06, -1.5711193555034697e-06, -1.3267076610645745e-06, -1.0822958529388416e-06, -8.378840448131086e-07, -5.934722366873757e-07, -3.4906048540506163e-07, -1.0464873412274756e-07, 1.3976307400298538e-07, 3.841748821287183e-07, 6.285865765676135e-07, 8.729983846933465e-07, 1.1174097380717285e-06, 1.3618215461974614e-06, 1.6062333543231944e-06, 1.8506450487620896e-06, 2.0950569705746602e-06, 2.3394686650135554e-06, 2.5838803594524506e-06, 2.828292053891346e-06, 3.0727039757039165e-06, 3.3171156701428117e-06, 3.5615275919553824e-06, 3.8059392863942776e-06, 4.050350980833173e-06, 4.294763130019419e-06, 4.539174369710963e-06, 4.783586518897209e-06, 5.0279982133361045e-06, 5.272409907775e-06, 5.516821602213895e-06, 5.76123329665279e-06, 6.005645445839036e-06, 6.2500571402779315e-06, 6.494468834716827e-06, 6.738880529155722e-06, 6.983292223594617e-06, 7.227703918033512e-06, 7.4721156124724075e-06, 7.716527761658654e-06, 7.960939001350198e-06, 8.205351150536444e-06, 8.449762390227988e-06, 8.694174539414234e-06, 8.93858668860048e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 5.0, 9.0, 9.0, 15.0, 17.0, 18.0, 20.0, 21.0, 24.0, 33.0, 37.0, 36.0, 35.0, 35.0, 33.0, 43.0, 35.0, 43.0, 57.0, 48.0, 50.0, 40.0, 33.0, 29.0, 26.0, 31.0, 38.0, 30.0, 30.0, 17.0, 20.0, 11.0, 12.0, 12.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.673425337387016e-06, -4.511319275479764e-06, -4.3492132135725114e-06, -4.187107151665259e-06, -4.025001089758007e-06, -3.8628950278507546e-06, -3.7007889659435023e-06, -3.53868290403625e-06, -3.3765768421289977e-06, -3.2144707802217454e-06, -3.052364718314493e-06, -2.8902586564072408e-06, -2.7281525944999885e-06, -2.566046532592736e-06, -2.403940470685484e-06, -2.2418344087782316e-06, -2.0797283468709793e-06, -1.917622284963727e-06, -1.7555162230564747e-06, -1.5934101611492224e-06, -1.4313040992419701e-06, -1.2691980373347178e-06, -1.1070919754274655e-06, -9.449859135202132e-07, -7.828798516129609e-07, -6.207737897057086e-07, -4.586677277984563e-07, -2.9656166589120403e-07, -1.3445560398395173e-07, 2.7650457923300564e-08, 1.8975651983055286e-07, 3.5186258173780516e-07, 5.139686436450575e-07, 6.760747055523098e-07, 8.38180767459562e-07, 1.0002868293668143e-06, 1.1623928912740666e-06, 1.324498953181319e-06, 1.4866050150885712e-06, 1.6487110769958235e-06, 1.8108171389030758e-06, 1.972923200810328e-06, 2.1350292627175804e-06, 2.2971353246248327e-06, 2.459241386532085e-06, 2.6213474484393373e-06, 2.7834535103465896e-06, 2.945559572253842e-06, 3.107665634161094e-06, 3.2697716960683465e-06, 3.431877757975599e-06, 3.593983819882851e-06, 3.7560898817901034e-06, 3.918195943697356e-06, 4.080302005604608e-06, 4.24240806751186e-06, 4.404514129419113e-06, 4.566620191326365e-06, 4.728726253233617e-06, 4.8908323151408695e-06, 5.052938377048122e-06, 5.215044438955374e-06, 5.377150500862626e-06, 5.539256562769879e-06, 5.701362624677131e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 4.0, 5.0, 1.0, 8.0, 7.0, 10.0, 30.0, 41.0, 59.0, 86.0, 109.0, 167.0, 239.0, 322.0, 467.0, 551.0, 1013.0, 1599.0, 2549.0, 4093.0, 6812.0, 11040.0, 18711.0, 22443.0, 49633.0, 89031.0, 161962.0, 250324.0, 187067.0, 103151.0, 56663.0, 25828.0, 21284.0, 12601.0, 7457.0, 4704.0, 2965.0, 1887.0, 1217.0, 626.0, 622.0, 376.0, 249.0, 178.0, 117.0, 88.0, 41.0, 33.0, 25.0, 17.0, 16.0, 14.0, 6.0, 7.0, 2.0, 2.0], "bins": [-8.225440979003906e-06, -7.994472980499268e-06, -7.763504981994629e-06, -7.53253698348999e-06, -7.3015689849853516e-06, -7.070600986480713e-06, -6.839632987976074e-06, -6.6086649894714355e-06, -6.377696990966797e-06, -6.146728992462158e-06, -5.9157609939575195e-06, -5.684792995452881e-06, -5.453824996948242e-06, -5.2228569984436035e-06, -4.991888999938965e-06, -4.760921001434326e-06, -4.5299530029296875e-06, -4.298985004425049e-06, -4.06801700592041e-06, -3.8370490074157715e-06, -3.606081008911133e-06, -3.375113010406494e-06, -3.1441450119018555e-06, -2.913177013397217e-06, -2.682209014892578e-06, -2.4512410163879395e-06, -2.2202730178833008e-06, -1.989305019378662e-06, -1.7583370208740234e-06, -1.5273690223693848e-06, -1.296401023864746e-06, -1.0654330253601074e-06, -8.344650268554688e-07, -6.034970283508301e-07, -3.725290298461914e-07, -1.4156103134155273e-07, 8.940696716308594e-08, 3.203749656677246e-07, 5.513429641723633e-07, 7.82310962677002e-07, 1.0132789611816406e-06, 1.2442469596862793e-06, 1.475214958190918e-06, 1.7061829566955566e-06, 1.9371509552001953e-06, 2.168118953704834e-06, 2.3990869522094727e-06, 2.6300549507141113e-06, 2.86102294921875e-06, 3.0919909477233887e-06, 3.3229589462280273e-06, 3.553926944732666e-06, 3.7848949432373047e-06, 4.015862941741943e-06, 4.246830940246582e-06, 4.477798938751221e-06, 4.708766937255859e-06, 4.939734935760498e-06, 5.170702934265137e-06, 5.401670932769775e-06, 5.632638931274414e-06, 5.863606929779053e-06, 6.094574928283691e-06, 6.32554292678833e-06, 6.556510925292969e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 6.0, 11.0, 5.0, 8.0, 11.0, 13.0, 19.0, 12.0, 24.0, 12.0, 27.0, 25.0, 42.0, 26.0, 28.0, 46.0, 27.0, 38.0, 42.0, 44.0, 46.0, 33.0, 48.0, 48.0, 58.0, 42.0, 20.0, 35.0, 32.0, 26.0, 15.0, 22.0, 26.0, 14.0, 16.0, 7.0, 14.0, 8.0, 5.0, 7.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-4.231929779052734e-06, -4.07826155424118e-06, -3.9245933294296265e-06, -3.7709251046180725e-06, -3.6172568798065186e-06, -3.4635886549949646e-06, -3.3099204301834106e-06, -3.1562522053718567e-06, -3.0025839805603027e-06, -2.8489157557487488e-06, -2.695247530937195e-06, -2.541579306125641e-06, -2.387911081314087e-06, -2.234242856502533e-06, -2.080574631690979e-06, -1.926906406879425e-06, -1.773238182067871e-06, -1.6195699572563171e-06, -1.4659017324447632e-06, -1.3122335076332092e-06, -1.1585652828216553e-06, -1.0048970580101013e-06, -8.512288331985474e-07, -6.975606083869934e-07, -5.438923835754395e-07, -3.902241587638855e-07, -2.3655593395233154e-07, -8.288770914077759e-08, 7.078051567077637e-08, 2.2444874048233032e-07, 3.781169652938843e-07, 5.317851901054382e-07, 6.854534149169922e-07, 8.391216397285461e-07, 9.927898645401e-07, 1.146458089351654e-06, 1.300126314163208e-06, 1.453794538974762e-06, 1.607462763786316e-06, 1.7611309885978699e-06, 1.914799213409424e-06, 2.0684674382209778e-06, 2.2221356630325317e-06, 2.3758038878440857e-06, 2.5294721126556396e-06, 2.6831403374671936e-06, 2.8368085622787476e-06, 2.9904767870903015e-06, 3.1441450119018555e-06, 3.2978132367134094e-06, 3.4514814615249634e-06, 3.6051496863365173e-06, 3.7588179111480713e-06, 3.912486135959625e-06, 4.066154360771179e-06, 4.219822585582733e-06, 4.373490810394287e-06, 4.527159035205841e-06, 4.680827260017395e-06, 4.834495484828949e-06, 4.988163709640503e-06, 5.141831934452057e-06, 5.295500159263611e-06, 5.449168384075165e-06, 5.602836608886719e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 5.0, 9.0, 16.0, 25.0, 40.0, 43.0, 71.0, 106.0, 148.0, 259.0, 417.0, 751.0, 1213.0, 2696.0, 6386.0, 16099.0, 134737.0, 835608.0, 33557.0, 8373.0, 3922.0, 1811.0, 854.0, 557.0, 268.0, 196.0, 139.0, 69.0, 60.0, 33.0, 24.0, 17.0, 14.0, 10.0, 8.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.800060272216797e-05, -1.748930662870407e-05, -1.6978010535240173e-05, -1.6466714441776276e-05, -1.5955418348312378e-05, -1.544412225484848e-05, -1.4932826161384583e-05, -1.4421530067920685e-05, -1.3910233974456787e-05, -1.339893788099289e-05, -1.2887641787528992e-05, -1.2376345694065094e-05, -1.1865049600601196e-05, -1.1353753507137299e-05, -1.0842457413673401e-05, -1.0331161320209503e-05, -9.819865226745605e-06, -9.308569133281708e-06, -8.79727303981781e-06, -8.285976946353912e-06, -7.774680852890015e-06, -7.263384759426117e-06, -6.752088665962219e-06, -6.2407925724983215e-06, -5.729496479034424e-06, -5.218200385570526e-06, -4.706904292106628e-06, -4.195608198642731e-06, -3.684312105178833e-06, -3.1730160117149353e-06, -2.6617199182510376e-06, -2.15042382478714e-06, -1.6391277313232422e-06, -1.1278316378593445e-06, -6.165355443954468e-07, -1.0523945093154907e-07, 4.0605664253234863e-07, 9.173527359962463e-07, 1.428648829460144e-06, 1.9399449229240417e-06, 2.4512410163879395e-06, 2.962537109851837e-06, 3.473833203315735e-06, 3.9851292967796326e-06, 4.49642539024353e-06, 5.007721483707428e-06, 5.519017577171326e-06, 6.030313670635223e-06, 6.541609764099121e-06, 7.052905857563019e-06, 7.5642019510269165e-06, 8.075498044490814e-06, 8.586794137954712e-06, 9.09809023141861e-06, 9.609386324882507e-06, 1.0120682418346405e-05, 1.0631978511810303e-05, 1.11432746052742e-05, 1.1654570698738098e-05, 1.2165866792201996e-05, 1.2677162885665894e-05, 1.3188458979129791e-05, 1.3699755072593689e-05, 1.4211051166057587e-05, 1.4722347259521484e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 4.0, 7.0, 3.0, 6.0, 4.0, 0.0, 7.0, 11.0, 18.0, 15.0, 18.0, 16.0, 24.0, 31.0, 56.0, 77.0, 370.0, 66.0, 55.0, 51.0, 38.0, 24.0, 21.0, 14.0, 18.0, 12.0, 0.0, 8.0, 5.0, 9.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8477439880371094e-06, -1.7909333109855652e-06, -1.734122633934021e-06, -1.6773119568824768e-06, -1.6205012798309326e-06, -1.5636906027793884e-06, -1.5068799257278442e-06, -1.4500692486763e-06, -1.3932585716247559e-06, -1.3364478945732117e-06, -1.2796372175216675e-06, -1.2228265404701233e-06, -1.166015863418579e-06, -1.109205186367035e-06, -1.0523945093154907e-06, -9.955838322639465e-07, -9.387731552124023e-07, -8.819624781608582e-07, -8.25151801109314e-07, -7.683411240577698e-07, -7.115304470062256e-07, -6.547197699546814e-07, -5.979090929031372e-07, -5.41098415851593e-07, -4.842877388000488e-07, -4.2747706174850464e-07, -3.7066638469696045e-07, -3.1385570764541626e-07, -2.5704503059387207e-07, -2.0023435354232788e-07, -1.434236764907837e-07, -8.66129994392395e-08, -2.9802322387695312e-08, 2.7008354663848877e-08, 8.381903171539307e-08, 1.4062970876693726e-07, 1.9744038581848145e-07, 2.5425106287002563e-07, 3.110617399215698e-07, 3.67872416973114e-07, 4.246830940246582e-07, 4.814937710762024e-07, 5.383044481277466e-07, 5.951151251792908e-07, 6.51925802230835e-07, 7.087364792823792e-07, 7.655471563339233e-07, 8.223578333854675e-07, 8.791685104370117e-07, 9.359791874885559e-07, 9.927898645401e-07, 1.0496005415916443e-06, 1.1064112186431885e-06, 1.1632218956947327e-06, 1.2200325727462769e-06, 1.276843249797821e-06, 1.3336539268493652e-06, 1.3904646039009094e-06, 1.4472752809524536e-06, 1.5040859580039978e-06, 1.560896635055542e-06, 1.6177073121070862e-06, 1.6745179891586304e-06, 1.7313286662101746e-06, 1.7881393432617188e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 2.0, 6.0, 5.0, 10.0, 13.0, 20.0, 16.0, 35.0, 57.0, 102.0, 88.0, 225.0, 295.0, 733.0, 721.0, 1817.0, 4585.0, 13609.0, 72576.0, 902274.0, 35388.0, 9342.0, 3231.0, 1043.0, 1047.0, 526.0, 267.0, 148.0, 137.0, 80.0, 72.0, 15.0, 23.0, 18.0, 12.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.662441253662109e-06, -5.49759715795517e-06, -5.33275306224823e-06, -5.16790896654129e-06, -5.003064870834351e-06, -4.838220775127411e-06, -4.673376679420471e-06, -4.5085325837135315e-06, -4.343688488006592e-06, -4.178844392299652e-06, -4.014000296592712e-06, -3.849156200885773e-06, -3.684312105178833e-06, -3.5194680094718933e-06, -3.3546239137649536e-06, -3.189779818058014e-06, -3.0249357223510742e-06, -2.8600916266441345e-06, -2.695247530937195e-06, -2.530403435230255e-06, -2.3655593395233154e-06, -2.2007152438163757e-06, -2.035871148109436e-06, -1.8710270524024963e-06, -1.7061829566955566e-06, -1.541338860988617e-06, -1.3764947652816772e-06, -1.2116506695747375e-06, -1.0468065738677979e-06, -8.819624781608582e-07, -7.171183824539185e-07, -5.522742867469788e-07, -3.8743019104003906e-07, -2.2258609533309937e-07, -5.774199962615967e-08, 1.0710209608078003e-07, 2.7194619178771973e-07, 4.367902874946594e-07, 6.016343832015991e-07, 7.664784789085388e-07, 9.313225746154785e-07, 1.0961666703224182e-06, 1.261010766029358e-06, 1.4258548617362976e-06, 1.5906989574432373e-06, 1.755543053150177e-06, 1.9203871488571167e-06, 2.0852312445640564e-06, 2.250075340270996e-06, 2.414919435977936e-06, 2.5797635316848755e-06, 2.744607627391815e-06, 2.909451723098755e-06, 3.0742958188056946e-06, 3.2391399145126343e-06, 3.403984010219574e-06, 3.5688281059265137e-06, 3.7336722016334534e-06, 3.898516297340393e-06, 4.063360393047333e-06, 4.2282044887542725e-06, 4.393048584461212e-06, 4.557892680168152e-06, 4.7227367758750916e-06, 4.887580871582031e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 112.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 683.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 117.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 8.0, 13.0, 23.0, 26.0, 44.0, 49.0, 88.0, 147.0, 176.0, 266.0, 416.0, 646.0, 0.0, 969.0, 1516.0, 2491.0, 4019.0, 7710.0, 13505.0, 30953.0, 79026.0, 764324.0, 78851.0, 31269.0, 13346.0, 0.0, 7794.0, 4058.0, 2463.0, 1492.0, 962.0, 629.0, 428.0, 278.0, 170.0, 136.0, 91.0, 57.0, 0.0, 44.0, 27.0, 20.0, 9.0, 9.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.9073486328125e-06, -1.8524006009101868e-06, -1.7974525690078735e-06, -1.7425045371055603e-06, -1.687556505203247e-06, -1.6326084733009338e-06, -1.5776604413986206e-06, -1.5227124094963074e-06, -1.4677643775939941e-06, -1.412816345691681e-06, -1.3578683137893677e-06, -1.3029202818870544e-06, -1.2479722499847412e-06, -1.193024218082428e-06, -1.1380761861801147e-06, -1.0831281542778015e-06, -1.0281801223754883e-06, -9.73232090473175e-07, -9.182840585708618e-07, -8.633360266685486e-07, -8.083879947662354e-07, -7.534399628639221e-07, -6.984919309616089e-07, -6.435438990592957e-07, -5.885958671569824e-07, -5.336478352546692e-07, -4.78699803352356e-07, -4.237517714500427e-07, -3.688037395477295e-07, -3.1385570764541626e-07, -2.5890767574310303e-07, -2.039596438407898e-07, -1.4901161193847656e-07, -9.406358003616333e-08, -3.91155481338501e-08, 1.5832483768463135e-08, 7.078051567077637e-08, 1.257285475730896e-07, 1.8067657947540283e-07, 2.3562461137771606e-07, 2.905726432800293e-07, 3.4552067518234253e-07, 4.0046870708465576e-07, 4.55416738986969e-07, 5.103647708892822e-07, 5.653128027915955e-07, 6.202608346939087e-07, 6.752088665962219e-07, 7.301568984985352e-07, 7.851049304008484e-07, 8.400529623031616e-07, 8.950009942054749e-07, 9.499490261077881e-07, 1.0048970580101013e-06, 1.0598450899124146e-06, 1.1147931218147278e-06, 1.169741153717041e-06, 1.2246891856193542e-06, 1.2796372175216675e-06, 1.3345852494239807e-06, 1.389533281326294e-06, 1.4444813132286072e-06, 1.4994293451309204e-06, 1.5543773770332336e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 0.0, 104.0, 0.0, 0.0, 0.0, 0.0, 643.0, 0.0, 0.0, 0.0, 113.0, 0.0, 0.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 2.0, 11.0, 2.0, 11.0, 14.0, 16.0, 18.0, 34.0, 39.0, 54.0, 56.0, 92.0, 123.0, 112.0, 89.0, 82.0, 57.0, 31.0, 34.0, 23.0, 18.0, 18.0, 9.0, 11.0, 14.0, 5.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6234288169653155e-06, -6.388960173353553e-06, -6.15449152974179e-06, -5.9200228861300275e-06, -5.685554697265616e-06, -5.451086053653853e-06, -5.21661741004209e-06, -4.982148766430328e-06, -4.747680577565916e-06, -4.513211933954153e-06, -4.2787432903423905e-06, -4.044274646730628e-06, -3.809806457866216e-06, -3.5753378142544534e-06, -3.3408691706426907e-06, -3.106400527030928e-06, -2.8719318834191654e-06, -2.6374632398074027e-06, -2.4029948235693155e-06, -2.168526179957553e-06, -1.9340577637194656e-06, -1.699589120107703e-06, -1.4651204764959402e-06, -1.2306519465710153e-06, -9.961834166460903e-07, -7.617148867211654e-07, -5.272462999528216e-07, -2.9277771318447776e-07, -5.830918325955281e-08, 1.7615934666537214e-07, 4.106279902771348e-07, 6.450965202020598e-07, 8.795650501269847e-07, 1.1140335800519097e-06, 1.3485021099768346e-06, 1.5829707535885973e-06, 1.8174392835135222e-06, 2.051907813438447e-06, 2.28637645705021e-06, 2.5208451006619725e-06, 2.7553135169000598e-06, 2.9897821605118224e-06, 3.2242505767499097e-06, 3.4587192203616723e-06, 3.693187863973435e-06, 3.927656507585198e-06, 4.16212515119696e-06, 4.396593340061372e-06, 4.631061983673135e-06, 4.8655306272848975e-06, 5.09999927089666e-06, 5.334467459761072e-06, 5.568936103372835e-06, 5.803404746984597e-06, 6.03787339059636e-06, 6.272342034208123e-06, 6.506810677819885e-06, 6.741279321431648e-06, 6.975747965043411e-06, 7.210216608655173e-06, 7.444684797519585e-06, 7.679152986383997e-06, 7.913622539490461e-06, 8.148090273607522e-06, 8.382558917219285e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 6.0, 11.0, 8.0, 16.0, 19.0, 22.0, 23.0, 21.0, 31.0, 35.0, 39.0, 29.0, 42.0, 40.0, 31.0, 34.0, 44.0, 56.0, 51.0, 55.0, 37.0, 37.0, 26.0, 28.0, 38.0, 32.0, 31.0, 31.0, 18.0, 19.0, 14.0, 9.0, 14.0, 9.0, 7.0, 4.0, 6.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.610154519468779e-06, -4.4534726839629e-06, -4.296790848457022e-06, -4.140109012951143e-06, -3.9834271774452645e-06, -3.826745341939386e-06, -3.670063733807183e-06, -3.5133818983013043e-06, -3.3567000627954258e-06, -3.2000182272895472e-06, -3.0433363917836687e-06, -2.88665455627779e-06, -2.729972948145587e-06, -2.5732911126397084e-06, -2.41660927713383e-06, -2.2599274416279513e-06, -2.1032456061220728e-06, -1.9465637706161942e-06, -1.7898819351103157e-06, -1.6332002132912748e-06, -1.4765183777853963e-06, -1.3198365422795177e-06, -1.163154820460477e-06, -1.0064729849545984e-06, -8.497911494487198e-07, -6.931093139428413e-07, -5.364275352803816e-07, -3.7974572819621244e-07, -2.2306392111204332e-07, -6.638208560616476e-08, 9.029969305629493e-08, 2.469814717187546e-07, 4.036628524772823e-07, 5.603446879831608e-07, 7.170264666456205e-07, 8.737082453080802e-07, 1.0303900808139588e-06, 1.1870719163198373e-06, 1.3437536381388782e-06, 1.5004354736447567e-06, 1.6571173091506353e-06, 1.8137991446565138e-06, 1.9704809801623924e-06, 2.127162815668271e-06, 2.283844423800474e-06, 2.4405262593063526e-06, 2.597208094812231e-06, 2.7538899303181097e-06, 2.9105717658239882e-06, 3.067253601329867e-06, 3.2239354368357453e-06, 3.380617272341624e-06, 3.5372991078475025e-06, 3.693980943353381e-06, 3.8506627788592596e-06, 4.007344614365138e-06, 4.164025995123666e-06, 4.320707830629544e-06, 4.477389666135423e-06, 4.6340715016413014e-06, 4.79075333714718e-06, 4.9474351726530585e-06, 5.104117008158937e-06, 5.260798388917465e-06, 5.417480679170694e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 6.0, 18.0, 22.0, 24.0, 49.0, 63.0, 132.0, 137.0, 321.0, 510.0, 643.0, 1366.0, 2099.0, 3417.0, 4251.0, 8211.0, 14053.0, 23608.0, 31679.0, 69043.0, 138340.0, 255752.0, 197650.0, 137869.0, 68849.0, 31356.0, 23851.0, 13771.0, 8567.0, 4205.0, 3413.0, 2114.0, 1297.0, 602.0, 499.0, 310.0, 150.0, 90.0, 81.0, 59.0, 27.0, 19.0, 11.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.463859558105469e-06, -8.181668817996979e-06, -7.899478077888489e-06, -7.617287337779999e-06, -7.335096597671509e-06, -7.052905857563019e-06, -6.770715117454529e-06, -6.488524377346039e-06, -6.206333637237549e-06, -5.924142897129059e-06, -5.641952157020569e-06, -5.359761416912079e-06, -5.077570676803589e-06, -4.795379936695099e-06, -4.513189196586609e-06, -4.230998456478119e-06, -3.948807716369629e-06, -3.666616976261139e-06, -3.384426236152649e-06, -3.102235496044159e-06, -2.820044755935669e-06, -2.537854015827179e-06, -2.255663275718689e-06, -1.973472535610199e-06, -1.691281795501709e-06, -1.409091055393219e-06, -1.126900315284729e-06, -8.44709575176239e-07, -5.62518835067749e-07, -2.8032809495925903e-07, 1.862645149230957e-09, 2.8405338525772095e-07, 5.662441253662109e-07, 8.484348654747009e-07, 1.130625605583191e-06, 1.412816345691681e-06, 1.695007085800171e-06, 1.977197825908661e-06, 2.259388566017151e-06, 2.541579306125641e-06, 2.823770046234131e-06, 3.105960786342621e-06, 3.388151526451111e-06, 3.670342266559601e-06, 3.952533006668091e-06, 4.234723746776581e-06, 4.516914486885071e-06, 4.799105226993561e-06, 5.081295967102051e-06, 5.363486707210541e-06, 5.645677447319031e-06, 5.927868187427521e-06, 6.210058927536011e-06, 6.492249667644501e-06, 6.774440407752991e-06, 7.056631147861481e-06, 7.338821887969971e-06, 7.621012628078461e-06, 7.90320336818695e-06, 8.18539410829544e-06, 8.46758484840393e-06, 8.74977558851242e-06, 9.03196632862091e-06, 9.3141570687294e-06, 9.59634780883789e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 5.0, 5.0, 16.0, 15.0, 17.0, 17.0, 14.0, 19.0, 22.0, 26.0, 33.0, 38.0, 58.0, 32.0, 43.0, 48.0, 32.0, 63.0, 40.0, 47.0, 45.0, 35.0, 55.0, 38.0, 24.0, 26.0, 30.0, 30.0, 18.0, 19.0, 18.0, 6.0, 19.0, 7.0, 3.0, 11.0, 6.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.933906555175781e-06, -3.8025900721549988e-06, -3.6712735891342163e-06, -3.539957106113434e-06, -3.4086406230926514e-06, -3.277324140071869e-06, -3.1460076570510864e-06, -3.014691174030304e-06, -2.8833746910095215e-06, -2.752058207988739e-06, -2.6207417249679565e-06, -2.489425241947174e-06, -2.3581087589263916e-06, -2.226792275905609e-06, -2.0954757928848267e-06, -1.964159309864044e-06, -1.8328428268432617e-06, -1.7015263438224792e-06, -1.5702098608016968e-06, -1.4388933777809143e-06, -1.3075768947601318e-06, -1.1762604117393494e-06, -1.044943928718567e-06, -9.136274456977844e-07, -7.82310962677002e-07, -6.509944796562195e-07, -5.19677996635437e-07, -3.8836151361465454e-07, -2.5704503059387207e-07, -1.257285475730896e-07, 5.587935447692871e-09, 1.3690441846847534e-07, 2.682209014892578e-07, 3.995373845100403e-07, 5.308538675308228e-07, 6.621703505516052e-07, 7.934868335723877e-07, 9.248033165931702e-07, 1.0561197996139526e-06, 1.1874362826347351e-06, 1.3187527656555176e-06, 1.4500692486763e-06, 1.5813857316970825e-06, 1.712702214717865e-06, 1.8440186977386475e-06, 1.97533518075943e-06, 2.1066516637802124e-06, 2.237968146800995e-06, 2.3692846298217773e-06, 2.50060111284256e-06, 2.6319175958633423e-06, 2.7632340788841248e-06, 2.8945505619049072e-06, 3.0258670449256897e-06, 3.157183527946472e-06, 3.2885000109672546e-06, 3.419816493988037e-06, 3.5511329770088196e-06, 3.682449460029602e-06, 3.8137659430503845e-06, 3.945082426071167e-06, 4.0763989090919495e-06, 4.207715392112732e-06, 4.339031875133514e-06, 4.470348358154297e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 9.0, 3.0, 27.0, 23.0, 36.0, 37.0, 91.0, 110.0, 135.0, 246.0, 267.0, 539.0, 546.0, 1176.0, 1731.0, 1969.0, 3966.0, 4471.0, 8888.0, 14562.0, 17473.0, 37615.0, 46217.0, 104669.0, 129997.0, 242306.0, 187208.0, 83463.0, 66765.0, 30176.0, 24778.0, 11779.0, 10163.0, 6201.0, 3102.0, 2773.0, 1377.0, 1280.0, 867.0, 397.0, 396.0, 199.0, 171.0, 80.0, 100.0, 67.0, 39.0, 35.0, 12.0, 6.0, 9.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-6.735324859619141e-06, -6.522051990032196e-06, -6.3087791204452515e-06, -6.095506250858307e-06, -5.882233381271362e-06, -5.668960511684418e-06, -5.455687642097473e-06, -5.2424147725105286e-06, -5.029141902923584e-06, -4.815869033336639e-06, -4.602596163749695e-06, -4.38932329416275e-06, -4.176050424575806e-06, -3.962777554988861e-06, -3.7495046854019165e-06, -3.536231815814972e-06, -3.3229589462280273e-06, -3.1096860766410828e-06, -2.896413207054138e-06, -2.6831403374671936e-06, -2.469867467880249e-06, -2.2565945982933044e-06, -2.04332172870636e-06, -1.8300488591194153e-06, -1.6167759895324707e-06, -1.4035031199455261e-06, -1.1902302503585815e-06, -9.76957380771637e-07, -7.636845111846924e-07, -5.504116415977478e-07, -3.371387720108032e-07, -1.2386590242385864e-07, 8.940696716308594e-08, 3.026798367500305e-07, 5.159527063369751e-07, 7.292255759239197e-07, 9.424984455108643e-07, 1.1557713150978088e-06, 1.3690441846847534e-06, 1.582317054271698e-06, 1.7955899238586426e-06, 2.008862793445587e-06, 2.2221356630325317e-06, 2.4354085326194763e-06, 2.648681402206421e-06, 2.8619542717933655e-06, 3.07522714138031e-06, 3.2885000109672546e-06, 3.5017728805541992e-06, 3.715045750141144e-06, 3.928318619728088e-06, 4.141591489315033e-06, 4.3548643589019775e-06, 4.568137228488922e-06, 4.781410098075867e-06, 4.994682967662811e-06, 5.207955837249756e-06, 5.4212287068367004e-06, 5.634501576423645e-06, 5.84777444601059e-06, 6.061047315597534e-06, 6.274320185184479e-06, 6.487593054771423e-06, 6.700865924358368e-06, 6.9141387939453125e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 4.0, 15.0, 7.0, 10.0, 26.0, 11.0, 44.0, 14.0, 42.0, 28.0, 46.0, 26.0, 57.0, 32.0, 59.0, 42.0, 57.0, 34.0, 42.0, 61.0, 38.0, 61.0, 18.0, 52.0, 19.0, 41.0, 13.0, 31.0, 9.0, 13.0, 4.0, 8.0, 2.0, 7.0, 2.0, 3.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5033950805664062e-06, -2.4158507585525513e-06, -2.3283064365386963e-06, -2.2407621145248413e-06, -2.1532177925109863e-06, -2.0656734704971313e-06, -1.9781291484832764e-06, -1.8905848264694214e-06, -1.8030405044555664e-06, -1.7154961824417114e-06, -1.6279518604278564e-06, -1.5404075384140015e-06, -1.4528632164001465e-06, -1.3653188943862915e-06, -1.2777745723724365e-06, -1.1902302503585815e-06, -1.1026859283447266e-06, -1.0151416063308716e-06, -9.275972843170166e-07, -8.400529623031616e-07, -7.525086402893066e-07, -6.649643182754517e-07, -5.774199962615967e-07, -4.898756742477417e-07, -4.023313522338867e-07, -3.1478703022003174e-07, -2.2724270820617676e-07, -1.3969838619232178e-07, -5.21540641784668e-08, 3.5390257835388184e-08, 1.2293457984924316e-07, 2.1047890186309814e-07, 2.980232238769531e-07, 3.855675458908081e-07, 4.731118679046631e-07, 5.606561899185181e-07, 6.48200511932373e-07, 7.35744833946228e-07, 8.23289155960083e-07, 9.10833477973938e-07, 9.98377799987793e-07, 1.085922122001648e-06, 1.173466444015503e-06, 1.261010766029358e-06, 1.3485550880432129e-06, 1.4360994100570679e-06, 1.5236437320709229e-06, 1.6111880540847778e-06, 1.6987323760986328e-06, 1.7862766981124878e-06, 1.8738210201263428e-06, 1.9613653421401978e-06, 2.0489096641540527e-06, 2.1364539861679077e-06, 2.2239983081817627e-06, 2.3115426301956177e-06, 2.3990869522094727e-06, 2.4866312742233276e-06, 2.5741755962371826e-06, 2.6617199182510376e-06, 2.7492642402648926e-06, 2.8368085622787476e-06, 2.9243528842926025e-06, 3.0118972063064575e-06, 3.0994415283203125e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 9.0, 0.0, 6.0, 18.0, 15.0, 0.0, 35.0, 43.0, 104.0, 140.0, 0.0, 270.0, 336.0, 652.0, 0.0, 1178.0, 1978.0, 3349.0, 0.0, 6717.0, 12400.0, 23181.0, 0.0, 38087.0, 871681.0, 38028.0, 23084.0, 0.0, 12404.0, 6695.0, 3295.0, 0.0, 1980.0, 1194.0, 709.0, 0.0, 349.0, 263.0, 148.0, 0.0, 85.0, 36.0, 31.0, 26.0, 0.0, 9.0, 12.0, 6.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.3848766684532166e-06, -1.339241862297058e-06, -1.2936070561408997e-06, -1.2479722499847412e-06, -1.2023374438285828e-06, -1.1567026376724243e-06, -1.1110678315162659e-06, -1.0654330253601074e-06, -1.019798219203949e-06, -9.741634130477905e-07, -9.285286068916321e-07, -8.828938007354736e-07, -8.372589945793152e-07, -7.916241884231567e-07, -7.459893822669983e-07, -7.003545761108398e-07, -6.547197699546814e-07, -6.09084963798523e-07, -5.634501576423645e-07, -5.178153514862061e-07, -4.721805453300476e-07, -4.2654573917388916e-07, -3.809109330177307e-07, -3.3527612686157227e-07, -2.896413207054138e-07, -2.4400651454925537e-07, -1.9837170839309692e-07, -1.5273690223693848e-07, -1.0710209608078003e-07, -6.146728992462158e-08, -1.5832483768463135e-08, 2.9802322387695312e-08, 7.543712854385376e-08, 1.210719347000122e-07, 1.6670674085617065e-07, 2.123415470123291e-07, 2.5797635316848755e-07, 3.03611159324646e-07, 3.4924596548080444e-07, 3.948807716369629e-07, 4.4051557779312134e-07, 4.861503839492798e-07, 5.317851901054382e-07, 5.774199962615967e-07, 6.230548024177551e-07, 6.686896085739136e-07, 7.14324414730072e-07, 7.599592208862305e-07, 8.055940270423889e-07, 8.512288331985474e-07, 8.968636393547058e-07, 9.424984455108643e-07, 9.881332516670227e-07, 1.0337680578231812e-06, 1.0794028639793396e-06, 1.125037670135498e-06, 1.1706724762916565e-06, 1.216307282447815e-06, 1.2619420886039734e-06, 1.3075768947601318e-06, 1.3532117009162903e-06, 1.3988465070724487e-06, 1.4444813132286072e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 7.0, 2.0, 0.0, 0.0, 2.0, 8.0, 17.0, 0.0, 35.0, 44.0, 79.0, 0.0, 113.0, 180.0, 301.0, 0.0, 446.0, 793.0, 1240.0, 0.0, 1956.0, 3634.0, 6301.0, 0.0, 11484.0, 26430.0, 63141.0, 0.0, 816274.0, 62872.0, 26747.0, 0.0, 11317.0, 6189.0, 3669.0, 0.0, 2046.0, 1247.0, 773.0, 0.0, 423.0, 303.0, 179.0, 0.0, 130.0, 81.0, 31.0, 0.0, 30.0, 21.0, 11.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 0.0, 2.0, 2.0], "bins": [-1.430511474609375e-06, -1.385807991027832e-06, -1.341104507446289e-06, -1.296401023864746e-06, -1.2516975402832031e-06, -1.2069940567016602e-06, -1.1622905731201172e-06, -1.1175870895385742e-06, -1.0728836059570312e-06, -1.0281801223754883e-06, -9.834766387939453e-07, -9.387731552124023e-07, -8.940696716308594e-07, -8.493661880493164e-07, -8.046627044677734e-07, -7.599592208862305e-07, -7.152557373046875e-07, -6.705522537231445e-07, -6.258487701416016e-07, -5.811452865600586e-07, -5.364418029785156e-07, -4.917383193969727e-07, -4.470348358154297e-07, -4.023313522338867e-07, -3.5762786865234375e-07, -3.129243850708008e-07, -2.682209014892578e-07, -2.2351741790771484e-07, -1.7881393432617188e-07, -1.341104507446289e-07, -8.940696716308594e-08, -4.470348358154297e-08, 0.0, 4.470348358154297e-08, 8.940696716308594e-08, 1.341104507446289e-07, 1.7881393432617188e-07, 2.2351741790771484e-07, 2.682209014892578e-07, 3.129243850708008e-07, 3.5762786865234375e-07, 4.023313522338867e-07, 4.470348358154297e-07, 4.917383193969727e-07, 5.364418029785156e-07, 5.811452865600586e-07, 6.258487701416016e-07, 6.705522537231445e-07, 7.152557373046875e-07, 7.599592208862305e-07, 8.046627044677734e-07, 8.493661880493164e-07, 8.940696716308594e-07, 9.387731552124023e-07, 9.834766387939453e-07, 1.0281801223754883e-06, 1.0728836059570312e-06, 1.1175870895385742e-06, 1.1622905731201172e-06, 1.2069940567016602e-06, 1.2516975402832031e-06, 1.296401023864746e-06, 1.341104507446289e-06, 1.385807991027832e-06, 1.430511474609375e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 85.0, 0.0, 0.0, 0.0, 0.0, 0.0, 723.0, 0.0, 0.0, 0.0, 0.0, 72.0, 0.0, 0.0, 0.0, 0.0, 47.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.5762786865234375e-07, -3.46451997756958e-07, -3.3527612686157227e-07, -3.241002559661865e-07, -3.129243850708008e-07, -3.0174851417541504e-07, -2.905726432800293e-07, -2.7939677238464355e-07, -2.682209014892578e-07, -2.5704503059387207e-07, -2.4586915969848633e-07, -2.3469328880310059e-07, -2.2351741790771484e-07, -2.123415470123291e-07, -2.0116567611694336e-07, -1.8998980522155762e-07, -1.7881393432617188e-07, -1.6763806343078613e-07, -1.564621925354004e-07, -1.4528632164001465e-07, -1.341104507446289e-07, -1.2293457984924316e-07, -1.1175870895385742e-07, -1.0058283805847168e-07, -8.940696716308594e-08, -7.82310962677002e-08, -6.705522537231445e-08, -5.587935447692871e-08, -4.470348358154297e-08, -3.3527612686157227e-08, -2.2351741790771484e-08, -1.1175870895385742e-08, 0.0, 1.1175870895385742e-08, 2.2351741790771484e-08, 3.3527612686157227e-08, 4.470348358154297e-08, 5.587935447692871e-08, 6.705522537231445e-08, 7.82310962677002e-08, 8.940696716308594e-08, 1.0058283805847168e-07, 1.1175870895385742e-07, 1.2293457984924316e-07, 1.341104507446289e-07, 1.4528632164001465e-07, 1.564621925354004e-07, 1.6763806343078613e-07, 1.7881393432617188e-07, 1.8998980522155762e-07, 2.0116567611694336e-07, 2.123415470123291e-07, 2.2351741790771484e-07, 2.3469328880310059e-07, 2.4586915969848633e-07, 2.5704503059387207e-07, 2.682209014892578e-07, 2.7939677238464355e-07, 2.905726432800293e-07, 3.0174851417541504e-07, 3.129243850708008e-07, 3.241002559661865e-07, 3.3527612686157227e-07, 3.46451997756958e-07, 3.5762786865234375e-07]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 8.0, 3.0, 5.0, 8.0, 5.0, 16.0, 14.0, 33.0, 29.0, 51.0, 74.0, 86.0, 107.0, 157.0, 110.0, 85.0, 60.0, 25.0, 32.0, 27.0, 21.0, 11.0, 9.0, 7.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.029113021417288e-06, -6.789800409023883e-06, -6.550488251377828e-06, -6.311175638984423e-06, -6.071863026591018e-06, -5.8325504141976126e-06, -5.593238256551558e-06, -5.353925644158153e-06, -5.1146134865120985e-06, -4.875300874118693e-06, -4.635988716472639e-06, -4.3966761040792335e-06, -4.157363491685828e-06, -3.918051334039774e-06, -3.6787387216463685e-06, -3.4394261092529632e-06, -3.200113496859558e-06, -2.960801111839828e-06, -2.721488499446423e-06, -2.482176114426693e-06, -2.2428635020332877e-06, -2.003551117013558e-06, -1.764238731993828e-06, -1.5249262332872604e-06, -1.2856137345806928e-06, -1.0463012358741253e-06, -8.069887940109766e-07, -5.676763521478279e-07, -3.283638534412603e-07, -8.905135473469272e-08, 1.5026103028503712e-07, 3.895735289916047e-07, 6.288855729508214e-07, 8.681980716573889e-07, 1.1075105703639565e-06, 1.3468229553836863e-06, 1.586135454090254e-06, 1.8254479527968215e-06, 2.0647603378165513e-06, 2.3040729502099566e-06, 2.5433853352296865e-06, 2.7826977202494163e-06, 3.0220103326428216e-06, 3.2613227176625514e-06, 3.5006351026822813e-06, 3.7399477150756866e-06, 3.979260327469092e-06, 4.218572485115146e-06, 4.4578850975085516e-06, 4.697197709901957e-06, 4.936509867548011e-06, 5.1758224799414165e-06, 5.415135092334822e-06, 5.654447704728227e-06, 5.8937598623742815e-06, 6.133072474767687e-06, 6.372384632413741e-06, 6.6116972448071465e-06, 6.851009402453201e-06, 7.090322014846606e-06, 7.3296346272400115e-06, 7.568946784886066e-06, 7.808259397279471e-06, 8.047572009672876e-06, 8.286884622066282e-06]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 9.0, 6.0, 6.0, 6.0, 11.0, 9.0, 8.0, 9.0, 20.0, 17.0, 22.0, 22.0, 19.0, 27.0, 22.0, 32.0, 37.0, 32.0, 39.0, 34.0, 35.0, 46.0, 48.0, 40.0, 30.0, 29.0, 37.0, 31.0, 34.0, 39.0, 29.0, 29.0, 29.0, 27.0, 13.0, 22.0, 18.0, 14.0, 15.0, 10.0, 9.0, 6.0, 6.0, 5.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.230051561331493e-06, -3.110239731540787e-06, -2.9904281291237567e-06, -2.870616299333051e-06, -2.750804469542345e-06, -2.6309926397516392e-06, -2.5111808099609334e-06, -2.391369207543903e-06, -2.2715573777531972e-06, -2.1517455479624914e-06, -2.031933945545461e-06, -1.9121221157547552e-06, -1.7923102859640494e-06, -1.6724984561733436e-06, -1.5526867400694755e-06, -1.4328750239656074e-06, -1.3130631941749016e-06, -1.1932513643841958e-06, -1.0734396482803277e-06, -9.536278753330407e-07, -8.338161023857538e-07, -7.140043294384668e-07, -5.941925564911799e-07, -4.743807835438929e-07, -3.5456901059660595e-07, -2.34757237649319e-07, -1.1494546470203204e-07, 4.866308245254913e-09, 1.2467808119254187e-07, 2.444898541398288e-07, 3.643016270871158e-07, 4.841134000344027e-07, 6.039249456080142e-07, 7.237367185553012e-07, 8.435484915025881e-07, 9.633602076064562e-07, 1.083172037397162e-06, 1.2029838671878679e-06, 1.322795583291736e-06, 1.442607299395604e-06, 1.5624191291863099e-06, 1.6822309589770157e-06, 1.8020426750808838e-06, 1.921854391184752e-06, 2.0416662209754577e-06, 2.1614780507661635e-06, 2.281289653183194e-06, 2.4011014829738997e-06, 2.5209133127646055e-06, 2.6407251425553113e-06, 2.760536972346017e-06, 2.8803485747630475e-06, 3.0001604045537533e-06, 3.119972234344459e-06, 3.2397838367614895e-06, 3.3595956665521953e-06, 3.479407496342901e-06, 3.599219326133607e-06, 3.7190311559243128e-06, 3.838842985715019e-06, 3.958654815505724e-06, 4.078466190549079e-06, 4.198278020339785e-06, 4.318089850130491e-06, 4.437901679921197e-06]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 11.0, 24.0, 16.0, 25.0, 48.0, 76.0, 166.0, 205.0, 315.0, 484.0, 1162.0, 1532.0, 2423.0, 3830.0, 5978.0, 14163.0, 19227.0, 34168.0, 64423.0, 134483.0, 555725.0, 1616359.0, 1124084.0, 324154.0, 164720.0, 54082.0, 29507.0, 16855.0, 10008.0, 7289.0, 3226.0, 1923.0, 1262.0, 994.0, 452.0, 328.0, 187.0, 109.0, 120.0, 46.0, 31.0, 24.0, 16.0, 9.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.496906280517578e-06, -6.3050538301467896e-06, -6.113201379776001e-06, -5.921348929405212e-06, -5.729496479034424e-06, -5.537644028663635e-06, -5.345791578292847e-06, -5.153939127922058e-06, -4.9620866775512695e-06, -4.770234227180481e-06, -4.578381776809692e-06, -4.386529326438904e-06, -4.194676876068115e-06, -4.002824425697327e-06, -3.810971975326538e-06, -3.6191195249557495e-06, -3.427267074584961e-06, -3.2354146242141724e-06, -3.043562173843384e-06, -2.8517097234725952e-06, -2.6598572731018066e-06, -2.468004822731018e-06, -2.2761523723602295e-06, -2.084299921989441e-06, -1.8924474716186523e-06, -1.7005950212478638e-06, -1.5087425708770752e-06, -1.3168901205062866e-06, -1.125037670135498e-06, -9.331852197647095e-07, -7.413327693939209e-07, -5.494803190231323e-07, -3.5762786865234375e-07, -1.6577541828155518e-07, 2.60770320892334e-08, 2.1792948246002197e-07, 4.0978193283081055e-07, 6.016343832015991e-07, 7.934868335723877e-07, 9.853392839431763e-07, 1.1771917343139648e-06, 1.3690441846847534e-06, 1.560896635055542e-06, 1.7527490854263306e-06, 1.944601535797119e-06, 2.1364539861679077e-06, 2.3283064365386963e-06, 2.520158886909485e-06, 2.7120113372802734e-06, 2.903863787651062e-06, 3.0957162380218506e-06, 3.287568688392639e-06, 3.4794211387634277e-06, 3.6712735891342163e-06, 3.863126039505005e-06, 4.0549784898757935e-06, 4.246830940246582e-06, 4.438683390617371e-06, 4.630535840988159e-06, 4.822388291358948e-06, 5.014240741729736e-06, 5.206093192100525e-06, 5.3979456424713135e-06, 5.589798092842102e-06, 5.781650543212891e-06]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 1.0, 6.0, 10.0, 4.0, 11.0, 4.0, 10.0, 22.0, 12.0, 14.0, 18.0, 16.0, 16.0, 38.0, 30.0, 22.0, 28.0, 21.0, 71.0, 32.0, 30.0, 44.0, 35.0, 58.0, 28.0, 42.0, 35.0, 33.0, 30.0, 50.0, 27.0, 22.0, 15.0, 8.0, 41.0, 21.0, 16.0, 10.0, 14.0, 21.0, 4.0, 8.0, 2.0, 3.0, 4.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.8477439880371094e-06, -1.776963472366333e-06, -1.7061829566955566e-06, -1.6354024410247803e-06, -1.564621925354004e-06, -1.4938414096832275e-06, -1.4230608940124512e-06, -1.3522803783416748e-06, -1.2814998626708984e-06, -1.210719347000122e-06, -1.1399388313293457e-06, -1.0691583156585693e-06, -9.98377799987793e-07, -9.275972843170166e-07, -8.568167686462402e-07, -7.860362529754639e-07, -7.152557373046875e-07, -6.444752216339111e-07, -5.736947059631348e-07, -5.029141902923584e-07, -4.3213367462158203e-07, -3.6135315895080566e-07, -2.905726432800293e-07, -2.1979212760925293e-07, -1.4901161193847656e-07, -7.82310962677002e-08, -7.450580596923828e-09, 6.332993507385254e-08, 1.341104507446289e-07, 2.0489096641540527e-07, 2.7567148208618164e-07, 3.46451997756958e-07, 4.172325134277344e-07, 4.880130290985107e-07, 5.587935447692871e-07, 6.295740604400635e-07, 7.003545761108398e-07, 7.711350917816162e-07, 8.419156074523926e-07, 9.126961231231689e-07, 9.834766387939453e-07, 1.0542571544647217e-06, 1.125037670135498e-06, 1.1958181858062744e-06, 1.2665987014770508e-06, 1.3373792171478271e-06, 1.4081597328186035e-06, 1.4789402484893799e-06, 1.5497207641601562e-06, 1.6205012798309326e-06, 1.691281795501709e-06, 1.7620623111724854e-06, 1.8328428268432617e-06, 1.903623342514038e-06, 1.9744038581848145e-06, 2.045184373855591e-06, 2.115964889526367e-06, 2.1867454051971436e-06, 2.25752592086792e-06, 2.3283064365386963e-06, 2.3990869522094727e-06, 2.469867467880249e-06, 2.5406479835510254e-06, 2.6114284992218018e-06, 2.682209014892578e-06]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 2.0, 21.0, 19.0, 38.0, 47.0, 48.0, 126.0, 157.0, 202.0, 477.0, 548.0, 1293.0, 1458.0, 2145.0, 5352.0, 5999.0, 9240.0, 24786.0, 29166.0, 83643.0, 109289.0, 200380.0, 745625.0, 1233239.0, 869551.0, 513302.0, 146653.0, 108985.0, 37645.0, 23130.0, 19746.0, 7431.0, 4876.0, 4461.0, 1571.0, 1596.0, 652.0, 432.0, 419.0, 169.0, 112.0, 98.0, 48.0, 48.0, 18.0, 11.0, 17.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.351139068603516e-06, -4.209578037261963e-06, -4.06801700592041e-06, -3.926455974578857e-06, -3.7848949432373047e-06, -3.643333911895752e-06, -3.5017728805541992e-06, -3.3602118492126465e-06, -3.2186508178710938e-06, -3.077089786529541e-06, -2.9355287551879883e-06, -2.7939677238464355e-06, -2.652406692504883e-06, -2.51084566116333e-06, -2.3692846298217773e-06, -2.2277235984802246e-06, -2.086162567138672e-06, -1.944601535797119e-06, -1.8030405044555664e-06, -1.6614794731140137e-06, -1.519918441772461e-06, -1.3783574104309082e-06, -1.2367963790893555e-06, -1.0952353477478027e-06, -9.5367431640625e-07, -8.121132850646973e-07, -6.705522537231445e-07, -5.289912223815918e-07, -3.8743019104003906e-07, -2.4586915969848633e-07, -1.043081283569336e-07, 3.725290298461914e-08, 1.7881393432617188e-07, 3.203749656677246e-07, 4.6193599700927734e-07, 6.034970283508301e-07, 7.450580596923828e-07, 8.866190910339355e-07, 1.0281801223754883e-06, 1.169741153717041e-06, 1.3113021850585938e-06, 1.4528632164001465e-06, 1.5944242477416992e-06, 1.735985279083252e-06, 1.8775463104248047e-06, 2.0191073417663574e-06, 2.16066837310791e-06, 2.302229404449463e-06, 2.4437904357910156e-06, 2.5853514671325684e-06, 2.726912498474121e-06, 2.868473529815674e-06, 3.0100345611572266e-06, 3.1515955924987793e-06, 3.293156623840332e-06, 3.4347176551818848e-06, 3.5762786865234375e-06, 3.7178397178649902e-06, 3.859400749206543e-06, 4.000961780548096e-06, 4.1425228118896484e-06, 4.284083843231201e-06, 4.425644874572754e-06, 4.567205905914307e-06, 4.708766937255859e-06]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 4.0, 8.0, 0.0, 16.0, 13.0, 0.0, 22.0, 0.0, 36.0, 30.0, 0.0, 37.0, 75.0, 0.0, 91.0, 158.0, 0.0, 160.0, 217.0, 0.0, 271.0, 0.0, 308.0, 364.0, 0.0, 432.0, 395.0, 0.0, 329.0, 282.0, 0.0, 203.0, 0.0, 155.0, 129.0, 0.0, 99.0, 63.0, 0.0, 63.0, 32.0, 0.0, 24.0, 23.0, 0.0, 12.0, 0.0, 16.0, 4.0, 0.0, 7.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.1920928955078125e-06, -1.1539086699485779e-06, -1.1157244443893433e-06, -1.0775402188301086e-06, -1.039355993270874e-06, -1.0011717677116394e-06, -9.629875421524048e-07, -9.248033165931702e-07, -8.866190910339355e-07, -8.484348654747009e-07, -8.102506399154663e-07, -7.720664143562317e-07, -7.338821887969971e-07, -6.956979632377625e-07, -6.575137376785278e-07, -6.193295121192932e-07, -5.811452865600586e-07, -5.42961061000824e-07, -5.047768354415894e-07, -4.6659260988235474e-07, -4.284083843231201e-07, -3.902241587638855e-07, -3.520399332046509e-07, -3.1385570764541626e-07, -2.7567148208618164e-07, -2.3748725652694702e-07, -1.993030309677124e-07, -1.6111880540847778e-07, -1.2293457984924316e-07, -8.475035429000854e-08, -4.6566128730773926e-08, -8.381903171539307e-09, 2.9802322387695312e-08, 6.798654794692993e-08, 1.0617077350616455e-07, 1.4435499906539917e-07, 1.825392246246338e-07, 2.207234501838684e-07, 2.5890767574310303e-07, 2.9709190130233765e-07, 3.3527612686157227e-07, 3.734603524208069e-07, 4.116445779800415e-07, 4.498288035392761e-07, 4.880130290985107e-07, 5.261972546577454e-07, 5.6438148021698e-07, 6.025657057762146e-07, 6.407499313354492e-07, 6.789341568946838e-07, 7.171183824539185e-07, 7.553026080131531e-07, 7.934868335723877e-07, 8.316710591316223e-07, 8.698552846908569e-07, 9.080395102500916e-07, 9.462237358093262e-07, 9.844079613685608e-07, 1.0225921869277954e-06, 1.06077641248703e-06, 1.0989606380462646e-06, 1.1371448636054993e-06, 1.1753290891647339e-06, 1.2135133147239685e-06, 1.2516975402832031e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 12.0, 7.0, 10.0, 16.0, 23.0, 24.0, 32.0, 54.0, 50.0, 68.0, 108.0, 118.0, 96.0, 83.0, 61.0, 53.0, 37.0, 29.0, 26.0, 23.0, 13.0, 8.0, 4.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1600937947805505e-06, -4.0243216972157825e-06, -3.888550054398365e-06, -3.7527779568335973e-06, -3.6170060866425047e-06, -3.481234216451412e-06, -3.345462118886644e-06, -3.2096902486955514e-06, -3.073918378504459e-06, -2.9381465083133662e-06, -2.8023746381222736e-06, -2.6666025405575056e-06, -2.530830670366413e-06, -2.3950588001753204e-06, -2.2592867026105523e-06, -2.1235148324194597e-06, -1.987742962228367e-06, -1.8519710920372745e-06, -1.7161991081593442e-06, -1.5804271242814139e-06, -1.4446552540903213e-06, -1.3088833838992286e-06, -1.1731114000212983e-06, -1.037339416143368e-06, -9.015675459522754e-07, -7.657956189177639e-07, -6.300236918832525e-07, -4.94251764848741e-07, -3.5847983781422954e-07, -2.2270791077971808e-07, -8.693598374520661e-08, 4.883594328930485e-08, 1.8460787032381631e-07, 3.203797973583278e-07, 4.5615172439283924e-07, 5.919236514273507e-07, 7.276955784618622e-07, 8.634675054963736e-07, 9.99239432530885e-07, 1.1350114164088154e-06, 1.270783286599908e-06, 1.4065551567910006e-06, 1.542327140668931e-06, 1.6780991245468613e-06, 1.8138709947379539e-06, 1.9496428649290465e-06, 2.0854149624938145e-06, 2.221186832684907e-06, 2.3569587028759997e-06, 2.4927305730670923e-06, 2.628502443258185e-06, 2.764274540822953e-06, 2.9000464110140456e-06, 3.035818281205138e-06, 3.1715903787699062e-06, 3.307362248960999e-06, 3.4431341191520914e-06, 3.578905989343184e-06, 3.7146778595342766e-06, 3.850449957099045e-06, 3.986221599916462e-06, 4.12199369748123e-06, 4.257765795045998e-06, 4.393537437863415e-06, 4.529309535428183e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 3.0, 7.0, 4.0, 7.0, 18.0, 20.0, 22.0, 25.0, 19.0, 23.0, 33.0, 31.0, 29.0, 42.0, 34.0, 47.0, 48.0, 38.0, 46.0, 39.0, 47.0, 38.0, 43.0, 35.0, 34.0, 28.0, 17.0, 23.0, 25.0, 27.0, 23.0, 21.0, 14.0, 15.0, 12.0, 12.0, 10.0, 9.0, 4.0, 1.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.5216900212399196e-06, -2.4381249659199966e-06, -2.354560137973749e-06, -2.270995082653826e-06, -2.1874302547075786e-06, -2.1038651993876556e-06, -2.0203001440677326e-06, -1.936735316121485e-06, -1.8531703744883998e-06, -1.7696054328553146e-06, -1.6860404912222293e-06, -1.602475549589144e-06, -1.518910494269221e-06, -1.4353456663229736e-06, -1.3517806110030506e-06, -1.2682156693699653e-06, -1.18465072773688e-06, -1.1010857861037948e-06, -1.0175208444707096e-06, -9.339558459942054e-07, -8.503909043611202e-07, -7.668259627280349e-07, -6.832609642515308e-07, -5.996960226184456e-07, -5.161310809853603e-07, -4.3256613935227506e-07, -3.490011692974804e-07, -2.654361992426857e-07, -1.8187125760960043e-07, -9.830631597651518e-08, -1.4741317500011064e-08, 6.882362413307419e-08, 1.523887931398349e-07, 2.3595374898377486e-07, 3.1951870482771483e-07, 4.030836748825095e-07, 4.866486165155948e-07, 5.7021355814868e-07, 6.537785566251841e-07, 7.373434982582694e-07, 8.209084398913546e-07, 9.044733815244399e-07, 9.880383231575252e-07, 1.0716032647906104e-06, 1.1551683201105334e-06, 1.238733148056781e-06, 1.322298203376704e-06, 1.4058631450097892e-06, 1.4894280866428744e-06, 1.5729930282759597e-06, 1.656557969909045e-06, 1.7401230252289679e-06, 1.8236878531752154e-06, 1.9072529084951384e-06, 1.9908179638150614e-06, 2.074382791761309e-06, 2.1579476197075564e-06, 2.2415126750274794e-06, 2.325077502973727e-06, 2.40864255829365e-06, 2.4922073862398975e-06, 2.5757724415598204e-06, 2.6593374968797434e-06, 2.742902324825991e-06, 2.826467380145914e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 13.0, 12.0, 11.0, 47.0, 50.0, 42.0, 124.0, 133.0, 133.0, 364.0, 385.0, 590.0, 1349.0, 1462.0, 2114.0, 5178.0, 5753.0, 8995.0, 24371.0, 29510.0, 49133.0, 146766.0, 187487.0, 224959.0, 193772.0, 63780.0, 38341.0, 31081.0, 11336.0, 7040.0, 6151.0, 2442.0, 1679.0, 1669.0, 653.0, 453.0, 471.0, 189.0, 144.0, 157.0, 68.0, 41.0, 41.0, 15.0, 17.0, 15.0, 14.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.0531158447265625e-06, -3.914348781108856e-06, -3.77558171749115e-06, -3.6368146538734436e-06, -3.4980475902557373e-06, -3.359280526638031e-06, -3.2205134630203247e-06, -3.0817463994026184e-06, -2.942979335784912e-06, -2.804212272167206e-06, -2.6654452085494995e-06, -2.5266781449317932e-06, -2.387911081314087e-06, -2.2491440176963806e-06, -2.1103769540786743e-06, -1.971609890460968e-06, -1.8328428268432617e-06, -1.6940757632255554e-06, -1.5553086996078491e-06, -1.4165416359901428e-06, -1.2777745723724365e-06, -1.1390075087547302e-06, -1.000240445137024e-06, -8.614733815193176e-07, -7.227063179016113e-07, -5.83939254283905e-07, -4.4517219066619873e-07, -3.0640512704849243e-07, -1.6763806343078613e-07, -2.8870999813079834e-08, 1.0989606380462646e-07, 2.4866312742233276e-07, 3.8743019104003906e-07, 5.261972546577454e-07, 6.649643182754517e-07, 8.03731381893158e-07, 9.424984455108643e-07, 1.0812655091285706e-06, 1.2200325727462769e-06, 1.3587996363639832e-06, 1.4975666999816895e-06, 1.6363337635993958e-06, 1.775100827217102e-06, 1.9138678908348083e-06, 2.0526349544525146e-06, 2.191402018070221e-06, 2.3301690816879272e-06, 2.4689361453056335e-06, 2.60770320892334e-06, 2.746470272541046e-06, 2.8852373361587524e-06, 3.0240043997764587e-06, 3.162771463394165e-06, 3.3015385270118713e-06, 3.4403055906295776e-06, 3.579072654247284e-06, 3.7178397178649902e-06, 3.8566067814826965e-06, 3.995373845100403e-06, 4.134140908718109e-06, 4.2729079723358154e-06, 4.411675035953522e-06, 4.550442099571228e-06, 4.689209163188934e-06, 4.827976226806641e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 8.0, 10.0, 8.0, 6.0, 16.0, 16.0, 13.0, 43.0, 20.0, 17.0, 32.0, 32.0, 21.0, 51.0, 29.0, 41.0, 72.0, 34.0, 35.0, 62.0, 29.0, 30.0, 53.0, 32.0, 37.0, 17.0, 21.0, 47.0, 15.0, 17.0, 30.0, 9.0, 10.0, 25.0, 13.0, 8.0, 12.0, 3.0, 1.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.3245811462402344e-06, -2.2444874048233032e-06, -2.164393663406372e-06, -2.084299921989441e-06, -2.0042061805725098e-06, -1.9241124391555786e-06, -1.8440186977386475e-06, -1.7639249563217163e-06, -1.6838312149047852e-06, -1.603737473487854e-06, -1.5236437320709229e-06, -1.4435499906539917e-06, -1.3634562492370605e-06, -1.2833625078201294e-06, -1.2032687664031982e-06, -1.123175024986267e-06, -1.043081283569336e-06, -9.629875421524048e-07, -8.828938007354736e-07, -8.028000593185425e-07, -7.227063179016113e-07, -6.426125764846802e-07, -5.62518835067749e-07, -4.824250936508179e-07, -4.023313522338867e-07, -3.2223761081695557e-07, -2.421438694000244e-07, -1.6205012798309326e-07, -8.195638656616211e-08, -1.862645149230957e-09, 7.82310962677002e-08, 1.5832483768463135e-07, 2.384185791015625e-07, 3.1851232051849365e-07, 3.986060619354248e-07, 4.78699803352356e-07, 5.587935447692871e-07, 6.388872861862183e-07, 7.189810276031494e-07, 7.990747690200806e-07, 8.791685104370117e-07, 9.592622518539429e-07, 1.039355993270874e-06, 1.1194497346878052e-06, 1.1995434761047363e-06, 1.2796372175216675e-06, 1.3597309589385986e-06, 1.4398247003555298e-06, 1.519918441772461e-06, 1.600012183189392e-06, 1.6801059246063232e-06, 1.7601996660232544e-06, 1.8402934074401855e-06, 1.9203871488571167e-06, 2.000480890274048e-06, 2.080574631690979e-06, 2.16066837310791e-06, 2.2407621145248413e-06, 2.3208558559417725e-06, 2.4009495973587036e-06, 2.4810433387756348e-06, 2.561137080192566e-06, 2.641230821609497e-06, 2.7213245630264282e-06, 2.8014183044433594e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 6.0, 14.0, 17.0, 26.0, 33.0, 56.0, 76.0, 96.0, 174.0, 325.0, 476.0, 981.0, 2122.0, 4811.0, 16449.0, 127898.0, 859147.0, 24149.0, 6382.0, 2552.0, 1206.0, 628.0, 341.0, 207.0, 111.0, 94.0, 46.0, 38.0, 25.0, 23.0, 13.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3909759521484375e-06, -7.152557373046875e-06, -6.9141387939453125e-06, -6.67572021484375e-06, -6.4373016357421875e-06, -6.198883056640625e-06, -5.9604644775390625e-06, -5.7220458984375e-06, -5.4836273193359375e-06, -5.245208740234375e-06, -5.0067901611328125e-06, -4.76837158203125e-06, -4.5299530029296875e-06, -4.291534423828125e-06, -4.0531158447265625e-06, -3.814697265625e-06, -3.5762786865234375e-06, -3.337860107421875e-06, -3.0994415283203125e-06, -2.86102294921875e-06, -2.6226043701171875e-06, -2.384185791015625e-06, -2.1457672119140625e-06, -1.9073486328125e-06, -1.6689300537109375e-06, -1.430511474609375e-06, -1.1920928955078125e-06, -9.5367431640625e-07, -7.152557373046875e-07, -4.76837158203125e-07, -2.384185791015625e-07, 0.0, 2.384185791015625e-07, 4.76837158203125e-07, 7.152557373046875e-07, 9.5367431640625e-07, 1.1920928955078125e-06, 1.430511474609375e-06, 1.6689300537109375e-06, 1.9073486328125e-06, 2.1457672119140625e-06, 2.384185791015625e-06, 2.6226043701171875e-06, 2.86102294921875e-06, 3.0994415283203125e-06, 3.337860107421875e-06, 3.5762786865234375e-06, 3.814697265625e-06, 4.0531158447265625e-06, 4.291534423828125e-06, 4.5299530029296875e-06, 4.76837158203125e-06, 5.0067901611328125e-06, 5.245208740234375e-06, 5.4836273193359375e-06, 5.7220458984375e-06, 5.9604644775390625e-06, 6.198883056640625e-06, 6.4373016357421875e-06, 6.67572021484375e-06, 6.9141387939453125e-06, 7.152557373046875e-06, 7.3909759521484375e-06, 7.62939453125e-06, 7.867813110351562e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 0.0, 5.0, 0.0, 13.0, 0.0, 17.0, 0.0, 29.0, 49.0, 0.0, 130.0, 0.0, 534.0, 0.0, 109.0, 0.0, 47.0, 0.0, 29.0, 0.0, 16.0, 0.0, 7.0, 0.0, 5.0, 0.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1324882507324219e-06, -1.101754605770111e-06, -1.0710209608078003e-06, -1.0402873158454895e-06, -1.0095536708831787e-06, -9.78820025920868e-07, -9.480863809585571e-07, -9.173527359962463e-07, -8.866190910339355e-07, -8.558854460716248e-07, -8.25151801109314e-07, -7.944181561470032e-07, -7.636845111846924e-07, -7.329508662223816e-07, -7.022172212600708e-07, -6.7148357629776e-07, -6.407499313354492e-07, -6.100162863731384e-07, -5.792826414108276e-07, -5.485489964485168e-07, -5.178153514862061e-07, -4.870817065238953e-07, -4.5634806156158447e-07, -4.256144165992737e-07, -3.948807716369629e-07, -3.641471266746521e-07, -3.334134817123413e-07, -3.026798367500305e-07, -2.7194619178771973e-07, -2.4121254682540894e-07, -2.1047890186309814e-07, -1.7974525690078735e-07, -1.4901161193847656e-07, -1.1827796697616577e-07, -8.754432201385498e-08, -5.681067705154419e-08, -2.60770320892334e-08, 4.6566128730773926e-09, 3.5390257835388184e-08, 6.612390279769897e-08, 9.685754776000977e-08, 1.2759119272232056e-07, 1.5832483768463135e-07, 1.8905848264694214e-07, 2.1979212760925293e-07, 2.505257725715637e-07, 2.812594175338745e-07, 3.119930624961853e-07, 3.427267074584961e-07, 3.734603524208069e-07, 4.041939973831177e-07, 4.3492764234542847e-07, 4.6566128730773926e-07, 4.9639493227005e-07, 5.271285772323608e-07, 5.578622221946716e-07, 5.885958671569824e-07, 6.193295121192932e-07, 6.50063157081604e-07, 6.807968020439148e-07, 7.115304470062256e-07, 7.422640919685364e-07, 7.729977369308472e-07, 8.03731381893158e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 2.0, 5.0, 7.0, 4.0, 34.0, 6.0, 23.0, 43.0, 175.0, 66.0, 103.0, 375.0, 261.0, 496.0, 641.0, 2526.0, 2538.0, 4524.0, 12931.0, 1011845.0, 4618.0, 2562.0, 2475.0, 667.0, 511.0, 271.0, 359.0, 114.0, 61.0, 180.0, 46.0, 18.0, 4.0, 37.0, 4.0, 7.0, 5.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4437904357910156e-06, -2.3674219846725464e-06, -2.291053533554077e-06, -2.214685082435608e-06, -2.1383166313171387e-06, -2.0619481801986694e-06, -1.9855797290802e-06, -1.909211277961731e-06, -1.8328428268432617e-06, -1.7564743757247925e-06, -1.6801059246063232e-06, -1.603737473487854e-06, -1.5273690223693848e-06, -1.4510005712509155e-06, -1.3746321201324463e-06, -1.298263669013977e-06, -1.2218952178955078e-06, -1.1455267667770386e-06, -1.0691583156585693e-06, -9.927898645401e-07, -9.164214134216309e-07, -8.400529623031616e-07, -7.636845111846924e-07, -6.873160600662231e-07, -6.109476089477539e-07, -5.345791578292847e-07, -4.5821070671081543e-07, -3.818422555923462e-07, -3.0547380447387695e-07, -2.2910535335540771e-07, -1.5273690223693848e-07, -7.636845111846924e-08, 0.0, 7.636845111846924e-08, 1.5273690223693848e-07, 2.2910535335540771e-07, 3.0547380447387695e-07, 3.818422555923462e-07, 4.5821070671081543e-07, 5.345791578292847e-07, 6.109476089477539e-07, 6.873160600662231e-07, 7.636845111846924e-07, 8.400529623031616e-07, 9.164214134216309e-07, 9.927898645401e-07, 1.0691583156585693e-06, 1.1455267667770386e-06, 1.2218952178955078e-06, 1.298263669013977e-06, 1.3746321201324463e-06, 1.4510005712509155e-06, 1.5273690223693848e-06, 1.603737473487854e-06, 1.6801059246063232e-06, 1.7564743757247925e-06, 1.8328428268432617e-06, 1.909211277961731e-06, 1.9855797290802e-06, 2.0619481801986694e-06, 2.1383166313171387e-06, 2.214685082435608e-06, 2.291053533554077e-06, 2.3674219846725464e-06, 2.4437904357910156e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 946.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0], "bins": [-1.7881393432617188e-07, -1.7415732145309448e-07, -1.695007085800171e-07, -1.648440957069397e-07, -1.601874828338623e-07, -1.555308699607849e-07, -1.5087425708770752e-07, -1.4621764421463013e-07, -1.4156103134155273e-07, -1.3690441846847534e-07, -1.3224780559539795e-07, -1.2759119272232056e-07, -1.2293457984924316e-07, -1.1827796697616577e-07, -1.1362135410308838e-07, -1.0896474123001099e-07, -1.043081283569336e-07, -9.96515154838562e-08, -9.499490261077881e-08, -9.033828973770142e-08, -8.568167686462402e-08, -8.102506399154663e-08, -7.636845111846924e-08, -7.171183824539185e-08, -6.705522537231445e-08, -6.239861249923706e-08, -5.774199962615967e-08, -5.3085386753082275e-08, -4.842877388000488e-08, -4.377216100692749e-08, -3.91155481338501e-08, -3.4458935260772705e-08, -2.9802322387695312e-08, -2.514570951461792e-08, -2.0489096641540527e-08, -1.5832483768463135e-08, -1.1175870895385742e-08, -6.51925802230835e-09, -1.862645149230957e-09, 2.7939677238464355e-09, 7.450580596923828e-09, 1.210719347000122e-08, 1.6763806343078613e-08, 2.1420419216156006e-08, 2.60770320892334e-08, 3.073364496231079e-08, 3.5390257835388184e-08, 4.0046870708465576e-08, 4.470348358154297e-08, 4.936009645462036e-08, 5.4016709327697754e-08, 5.8673322200775146e-08, 6.332993507385254e-08, 6.798654794692993e-08, 7.264316082000732e-08, 7.729977369308472e-08, 8.195638656616211e-08, 8.66129994392395e-08, 9.12696123123169e-08, 9.592622518539429e-08, 1.0058283805847168e-07, 1.0523945093154907e-07, 1.0989606380462646e-07, 1.1455267667770386e-07, 1.1920928955078125e-07]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 0.0, 0.0, 14.0, 0.0, 32.0, 0.0, 0.0, 117.0, 0.0, 221.0, 0.0, 0.0, 392.0, 0.0, 901.0, 0.0, 0.0, 1841.0, 0.0, 0.0, 3435.0, 0.0, 8347.0, 0.0, 0.0, 18786.0, 0.0, 980307.0, 0.0, 0.0, 18949.0, 0.0, 8220.0, 0.0, 0.0, 3440.0, 0.0, 1902.0, 0.0, 0.0, 874.0, 0.0, 0.0, 436.0, 0.0, 212.0, 0.0, 0.0, 95.0, 0.0, 25.0, 0.0, 0.0, 13.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-7.152557373046875e-07, -6.919726729393005e-07, -6.686896085739136e-07, -6.454065442085266e-07, -6.221234798431396e-07, -5.988404154777527e-07, -5.755573511123657e-07, -5.522742867469788e-07, -5.289912223815918e-07, -5.057081580162048e-07, -4.824250936508179e-07, -4.591420292854309e-07, -4.3585896492004395e-07, -4.12575900554657e-07, -3.8929283618927e-07, -3.6600977182388306e-07, -3.427267074584961e-07, -3.1944364309310913e-07, -2.9616057872772217e-07, -2.728775143623352e-07, -2.4959444999694824e-07, -2.2631138563156128e-07, -2.0302832126617432e-07, -1.7974525690078735e-07, -1.564621925354004e-07, -1.3317912817001343e-07, -1.0989606380462646e-07, -8.66129994392395e-08, -6.332993507385254e-08, -4.0046870708465576e-08, -1.6763806343078613e-08, 6.51925802230835e-09, 2.9802322387695312e-08, 5.3085386753082275e-08, 7.636845111846924e-08, 9.96515154838562e-08, 1.2293457984924316e-07, 1.4621764421463013e-07, 1.695007085800171e-07, 1.9278377294540405e-07, 2.1606683731079102e-07, 2.39349901676178e-07, 2.6263296604156494e-07, 2.859160304069519e-07, 3.0919909477233887e-07, 3.3248215913772583e-07, 3.557652235031128e-07, 3.7904828786849976e-07, 4.023313522338867e-07, 4.256144165992737e-07, 4.4889748096466064e-07, 4.721805453300476e-07, 4.954636096954346e-07, 5.187466740608215e-07, 5.420297384262085e-07, 5.653128027915955e-07, 5.885958671569824e-07, 6.118789315223694e-07, 6.351619958877563e-07, 6.584450602531433e-07, 6.817281246185303e-07, 7.050111889839172e-07, 7.282942533493042e-07, 7.515773177146912e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 938.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0], "bins": [-2.384185791015625e-07, -2.3189932107925415e-07, -2.253800630569458e-07, -2.1886080503463745e-07, -2.123415470123291e-07, -2.0582228899002075e-07, -1.993030309677124e-07, -1.9278377294540405e-07, -1.862645149230957e-07, -1.7974525690078735e-07, -1.73225998878479e-07, -1.6670674085617065e-07, -1.601874828338623e-07, -1.5366822481155396e-07, -1.471489667892456e-07, -1.4062970876693726e-07, -1.341104507446289e-07, -1.2759119272232056e-07, -1.210719347000122e-07, -1.1455267667770386e-07, -1.0803341865539551e-07, -1.0151416063308716e-07, -9.499490261077881e-08, -8.847564458847046e-08, -8.195638656616211e-08, -7.543712854385376e-08, -6.891787052154541e-08, -6.239861249923706e-08, -5.587935447692871e-08, -4.936009645462036e-08, -4.284083843231201e-08, -3.632158041000366e-08, -2.9802322387695312e-08, -2.3283064365386963e-08, -1.6763806343078613e-08, -1.0244548320770264e-08, -3.725290298461914e-09, 2.7939677238464355e-09, 9.313225746154785e-09, 1.5832483768463135e-08, 2.2351741790771484e-08, 2.8870999813079834e-08, 3.5390257835388184e-08, 4.190951585769653e-08, 4.842877388000488e-08, 5.494803190231323e-08, 6.146728992462158e-08, 6.798654794692993e-08, 7.450580596923828e-08, 8.102506399154663e-08, 8.754432201385498e-08, 9.406358003616333e-08, 1.0058283805847168e-07, 1.0710209608078003e-07, 1.1362135410308838e-07, 1.2014061212539673e-07, 1.2665987014770508e-07, 1.3317912817001343e-07, 1.3969838619232178e-07, 1.4621764421463013e-07, 1.5273690223693848e-07, 1.5925616025924683e-07, 1.6577541828155518e-07, 1.7229467630386353e-07, 1.7881393432617188e-07]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 9.0, 8.0, 10.0, 18.0, 12.0, 25.0, 34.0, 42.0, 62.0, 64.0, 90.0, 124.0, 118.0, 77.0, 55.0, 56.0, 33.0, 36.0, 20.0, 23.0, 18.0, 11.0, 12.0, 13.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.906332040060079e-06, -3.780031420319574e-06, -3.6537310279527446e-06, -3.5274306355859153e-06, -3.4011300158454105e-06, -3.2748293961049058e-06, -3.1485290037380764e-06, -3.022228611371247e-06, -2.8959279916307423e-06, -2.7696273718902376e-06, -2.6433269795234082e-06, -2.517026587156579e-06, -2.390725967416074e-06, -2.2644253476755694e-06, -2.13812495530874e-06, -2.0118245629419107e-06, -1.885523943201406e-06, -1.7592234371477389e-06, -1.6329229310940718e-06, -1.5066224250404048e-06, -1.3803219189867377e-06, -1.2540214129330707e-06, -1.1277209068794036e-06, -1.0014204008257366e-06, -8.751198947720695e-07, -7.488193887184025e-07, -6.225188826647354e-07, -4.962183766110684e-07, -3.6991787055740133e-07, -2.436173645037343e-07, -1.1731685845006723e-07, 8.98364760359982e-09, 1.3528415365726687e-07, 2.615846597109339e-07, 3.8788516576460097e-07, 5.14185671818268e-07, 6.404861778719351e-07, 7.667866839256021e-07, 8.930871899792692e-07, 1.0193876960329362e-06, 1.1456882020866033e-06, 1.2719887081402703e-06, 1.3982892141939374e-06, 1.5245897202476044e-06, 1.6508902263012715e-06, 1.7771907323549385e-06, 1.9034912384086056e-06, 2.029791630775435e-06, 2.1560922505159397e-06, 2.2823928702564444e-06, 2.4086932626232738e-06, 2.534993654990103e-06, 2.661294274730608e-06, 2.7875948944711126e-06, 2.913895286837942e-06, 3.0401956792047713e-06, 3.166496298945276e-06, 3.292796918685781e-06, 3.41909731105261e-06, 3.5453977034194395e-06, 3.6716983231599443e-06, 3.797998942900449e-06, 3.924299562640954e-06, 4.050599727634108e-06, 4.1769003473746125e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 6.0, 5.0, 7.0, 3.0, 6.0, 13.0, 22.0, 18.0, 23.0, 24.0, 21.0, 35.0, 29.0, 33.0, 31.0, 40.0, 48.0, 39.0, 43.0, 48.0, 41.0, 39.0, 44.0, 37.0, 42.0, 31.0, 31.0, 18.0, 26.0, 25.0, 22.0, 31.0, 16.0, 16.0, 16.0, 14.0, 12.0, 11.0, 6.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.3932695967232576e-06, -2.314866378583247e-06, -2.2364629330695607e-06, -2.15805971492955e-06, -2.079656269415864e-06, -2.001253051275853e-06, -1.922849605762167e-06, -1.8444463876221562e-06, -1.7660431694821455e-06, -1.687639837655297e-06, -1.6092365058284486e-06, -1.5308332876884378e-06, -1.4524299558615894e-06, -1.374026624034741e-06, -1.2956232922078925e-06, -1.217219960381044e-06, -1.1388166285541956e-06, -1.0604132967273472e-06, -9.820099649004987e-07, -9.036066899170692e-07, -8.252034149336396e-07, -7.468000831067911e-07, -6.683967512799427e-07, -5.899934762965131e-07, -5.115901444696647e-07, -4.3318684106452565e-07, -3.5478353765938664e-07, -2.763802058325382e-07, -1.9797690242739918e-07, -1.1957359902226017e-07, -4.1170267195411725e-08, 3.723300778801786e-08, 1.156363396148663e-07, 1.9403964302000531e-07, 2.7244294642514433e-07, 3.5084627825199277e-07, 4.292495816571318e-07, 5.076528850622708e-07, 5.860562168891192e-07, 6.644594918725488e-07, 7.428628236993973e-07, 8.212661555262457e-07, 8.996694305096753e-07, 9.780727623365237e-07, 1.0564760941633722e-06, 1.134879312303383e-06, 1.213282757817069e-06, 1.2916859759570798e-06, 1.3700893077839282e-06, 1.4484926396107767e-06, 1.5268959714376251e-06, 1.6052993032644736e-06, 1.6837025214044843e-06, 1.7621058532313327e-06, 1.8405091850581812e-06, 1.918912403198192e-06, 1.997315848711878e-06, 2.0757190668518888e-06, 2.154122512365575e-06, 2.2325257305055857e-06, 2.310929176019272e-06, 2.3893323941592826e-06, 2.4677356122992933e-06, 2.5461390578129794e-06, 2.62454227595299e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 8.0, 14.0, 15.0, 30.0, 47.0, 59.0, 136.0, 142.0, 189.0, 452.0, 446.0, 1046.0, 1086.0, 2458.0, 2461.0, 5652.0, 5763.0, 8701.0, 21124.0, 24530.0, 67791.0, 85061.0, 243854.0, 206094.0, 144229.0, 113471.0, 39477.0, 33170.0, 12561.0, 11620.0, 4837.0, 4678.0, 2085.0, 1542.0, 1423.0, 644.0, 701.0, 281.0, 276.0, 113.0, 86.0, 73.0, 35.0, 37.0, 21.0, 9.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.410743713378906e-06, -4.265457391738892e-06, -4.120171070098877e-06, -3.974884748458862e-06, -3.829598426818848e-06, -3.684312105178833e-06, -3.5390257835388184e-06, -3.3937394618988037e-06, -3.248453140258789e-06, -3.1031668186187744e-06, -2.9578804969787598e-06, -2.812594175338745e-06, -2.6673078536987305e-06, -2.522021532058716e-06, -2.376735210418701e-06, -2.2314488887786865e-06, -2.086162567138672e-06, -1.9408762454986572e-06, -1.7955899238586426e-06, -1.650303602218628e-06, -1.5050172805786133e-06, -1.3597309589385986e-06, -1.214444637298584e-06, -1.0691583156585693e-06, -9.238719940185547e-07, -7.7858567237854e-07, -6.332993507385254e-07, -4.880130290985107e-07, -3.427267074584961e-07, -1.9744038581848145e-07, -5.21540641784668e-08, 9.313225746154785e-08, 2.384185791015625e-07, 3.8370490074157715e-07, 5.289912223815918e-07, 6.742775440216064e-07, 8.195638656616211e-07, 9.648501873016357e-07, 1.1101365089416504e-06, 1.255422830581665e-06, 1.4007091522216797e-06, 1.5459954738616943e-06, 1.691281795501709e-06, 1.8365681171417236e-06, 1.9818544387817383e-06, 2.127140760421753e-06, 2.2724270820617676e-06, 2.4177134037017822e-06, 2.562999725341797e-06, 2.7082860469818115e-06, 2.853572368621826e-06, 2.998858690261841e-06, 3.1441450119018555e-06, 3.28943133354187e-06, 3.4347176551818848e-06, 3.5800039768218994e-06, 3.725290298461914e-06, 3.870576620101929e-06, 4.015862941741943e-06, 4.161149263381958e-06, 4.306435585021973e-06, 4.451721906661987e-06, 4.597008228302002e-06, 4.742294549942017e-06, 4.887580871582031e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 8.0, 3.0, 7.0, 8.0, 11.0, 10.0, 15.0, 17.0, 48.0, 19.0, 24.0, 19.0, 31.0, 36.0, 32.0, 42.0, 41.0, 40.0, 42.0, 32.0, 45.0, 45.0, 39.0, 35.0, 38.0, 24.0, 40.0, 25.0, 26.0, 50.0, 23.0, 12.0, 13.0, 19.0, 11.0, 13.0, 5.0, 9.0, 6.0, 5.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0], "bins": [-2.086162567138672e-06, -2.023763954639435e-06, -1.9613653421401978e-06, -1.8989667296409607e-06, -1.8365681171417236e-06, -1.7741695046424866e-06, -1.7117708921432495e-06, -1.6493722796440125e-06, -1.5869736671447754e-06, -1.5245750546455383e-06, -1.4621764421463013e-06, -1.3997778296470642e-06, -1.3373792171478271e-06, -1.27498060464859e-06, -1.212581992149353e-06, -1.150183379650116e-06, -1.087784767150879e-06, -1.0253861546516418e-06, -9.629875421524048e-07, -9.005889296531677e-07, -8.381903171539307e-07, -7.757917046546936e-07, -7.133930921554565e-07, -6.509944796562195e-07, -5.885958671569824e-07, -5.261972546577454e-07, -4.637986421585083e-07, -4.0140002965927124e-07, -3.390014171600342e-07, -2.766028046607971e-07, -2.1420419216156006e-07, -1.51805579662323e-07, -8.940696716308594e-08, -2.7008354663848877e-08, 3.5390257835388184e-08, 9.778887033462524e-08, 1.601874828338623e-07, 2.2258609533309937e-07, 2.849847078323364e-07, 3.473833203315735e-07, 4.0978193283081055e-07, 4.721805453300476e-07, 5.345791578292847e-07, 5.969777703285217e-07, 6.593763828277588e-07, 7.217749953269958e-07, 7.841736078262329e-07, 8.4657222032547e-07, 9.08970832824707e-07, 9.71369445323944e-07, 1.0337680578231812e-06, 1.0961666703224182e-06, 1.1585652828216553e-06, 1.2209638953208923e-06, 1.2833625078201294e-06, 1.3457611203193665e-06, 1.4081597328186035e-06, 1.4705583453178406e-06, 1.5329569578170776e-06, 1.5953555703163147e-06, 1.6577541828155518e-06, 1.7201527953147888e-06, 1.7825514078140259e-06, 1.844950020313263e-06, 1.9073486328125e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 12.0, 7.0, 17.0, 13.0, 34.0, 48.0, 75.0, 64.0, 151.0, 210.0, 321.0, 257.0, 603.0, 905.0, 664.0, 1847.0, 2782.0, 4368.0, 2944.0, 8737.0, 14198.0, 23755.0, 17267.0, 51646.0, 88900.0, 148465.0, 100668.0, 211268.0, 148369.0, 50379.0, 67936.0, 39805.0, 23741.0, 7962.0, 11129.0, 6801.0, 4358.0, 1526.0, 2219.0, 1357.0, 948.0, 362.0, 502.0, 318.0, 118.0, 178.0, 111.0, 88.0, 23.0, 49.0, 20.0, 18.0, 4.0, 8.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.2186508178710938e-06, -3.1152740120887756e-06, -3.0118972063064575e-06, -2.9085204005241394e-06, -2.8051435947418213e-06, -2.701766788959503e-06, -2.598389983177185e-06, -2.495013177394867e-06, -2.391636371612549e-06, -2.2882595658302307e-06, -2.1848827600479126e-06, -2.0815059542655945e-06, -1.9781291484832764e-06, -1.8747523427009583e-06, -1.7713755369186401e-06, -1.667998731136322e-06, -1.564621925354004e-06, -1.4612451195716858e-06, -1.3578683137893677e-06, -1.2544915080070496e-06, -1.1511147022247314e-06, -1.0477378964424133e-06, -9.443610906600952e-07, -8.409842848777771e-07, -7.37607479095459e-07, -6.342306733131409e-07, -5.308538675308228e-07, -4.2747706174850464e-07, -3.241002559661865e-07, -2.207234501838684e-07, -1.1734664440155029e-07, -1.3969838619232178e-08, 8.940696716308594e-08, 1.9278377294540405e-07, 2.9616057872772217e-07, 3.995373845100403e-07, 5.029141902923584e-07, 6.062909960746765e-07, 7.096678018569946e-07, 8.130446076393127e-07, 9.164214134216309e-07, 1.019798219203949e-06, 1.123175024986267e-06, 1.2265518307685852e-06, 1.3299286365509033e-06, 1.4333054423332214e-06, 1.5366822481155396e-06, 1.6400590538978577e-06, 1.7434358596801758e-06, 1.846812665462494e-06, 1.950189471244812e-06, 2.05356627702713e-06, 2.1569430828094482e-06, 2.2603198885917664e-06, 2.3636966943740845e-06, 2.4670735001564026e-06, 2.5704503059387207e-06, 2.673827111721039e-06, 2.777203917503357e-06, 2.880580723285675e-06, 2.983957529067993e-06, 3.0873343348503113e-06, 3.1907111406326294e-06, 3.2940879464149475e-06, 3.3974647521972656e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 0.0, 6.0, 11.0, 0.0, 9.0, 0.0, 14.0, 24.0, 0.0, 29.0, 28.0, 0.0, 34.0, 40.0, 0.0, 40.0, 46.0, 0.0, 58.0, 0.0, 46.0, 54.0, 0.0, 74.0, 60.0, 0.0, 56.0, 57.0, 0.0, 59.0, 0.0, 43.0, 40.0, 0.0, 39.0, 36.0, 0.0, 26.0, 17.0, 0.0, 17.0, 15.0, 0.0, 8.0, 0.0, 4.0, 4.0, 0.0, 6.0, 7.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1539086699485779e-06, -1.1157244443893433e-06, -1.0775402188301086e-06, -1.039355993270874e-06, -1.0011717677116394e-06, -9.629875421524048e-07, -9.248033165931702e-07, -8.866190910339355e-07, -8.484348654747009e-07, -8.102506399154663e-07, -7.720664143562317e-07, -7.338821887969971e-07, -6.956979632377625e-07, -6.575137376785278e-07, -6.193295121192932e-07, -5.811452865600586e-07, -5.42961061000824e-07, -5.047768354415894e-07, -4.6659260988235474e-07, -4.284083843231201e-07, -3.902241587638855e-07, -3.520399332046509e-07, -3.1385570764541626e-07, -2.7567148208618164e-07, -2.3748725652694702e-07, -1.993030309677124e-07, -1.6111880540847778e-07, -1.2293457984924316e-07, -8.475035429000854e-08, -4.6566128730773926e-08, -8.381903171539307e-09, 2.9802322387695312e-08, 6.798654794692993e-08, 1.0617077350616455e-07, 1.4435499906539917e-07, 1.825392246246338e-07, 2.207234501838684e-07, 2.5890767574310303e-07, 2.9709190130233765e-07, 3.3527612686157227e-07, 3.734603524208069e-07, 4.116445779800415e-07, 4.498288035392761e-07, 4.880130290985107e-07, 5.261972546577454e-07, 5.6438148021698e-07, 6.025657057762146e-07, 6.407499313354492e-07, 6.789341568946838e-07, 7.171183824539185e-07, 7.553026080131531e-07, 7.934868335723877e-07, 8.316710591316223e-07, 8.698552846908569e-07, 9.080395102500916e-07, 9.462237358093262e-07, 9.844079613685608e-07, 1.0225921869277954e-06, 1.06077641248703e-06, 1.0989606380462646e-06, 1.1371448636054993e-06, 1.1753290891647339e-06, 1.2135133147239685e-06, 1.2516975402832031e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 10.0, 5.0, 3.0, 2.0, 16.0, 8.0, 12.0, 18.0, 44.0, 36.0, 50.0, 64.0, 254.0, 223.0, 390.0, 473.0, 2443.0, 1845.0, 3254.0, 6932.0, 39792.0, 45628.0, 845471.0, 45878.0, 39612.0, 6938.0, 3203.0, 1892.0, 2415.0, 459.0, 403.0, 236.0, 266.0, 66.0, 48.0, 33.0, 40.0, 10.0, 21.0, 12.0, 11.0, 5.0, 4.0, 4.0, 15.0, 1.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.1904706954956055e-06, -2.115964889526367e-06, -2.041459083557129e-06, -1.9669532775878906e-06, -1.8924474716186523e-06, -1.817941665649414e-06, -1.7434358596801758e-06, -1.6689300537109375e-06, -1.5944242477416992e-06, -1.519918441772461e-06, -1.4454126358032227e-06, -1.3709068298339844e-06, -1.296401023864746e-06, -1.2218952178955078e-06, -1.1473894119262695e-06, -1.0728836059570312e-06, -9.98377799987793e-07, -9.238719940185547e-07, -8.493661880493164e-07, -7.748603820800781e-07, -7.003545761108398e-07, -6.258487701416016e-07, -5.513429641723633e-07, -4.76837158203125e-07, -4.023313522338867e-07, -3.2782554626464844e-07, -2.5331974029541016e-07, -1.7881393432617188e-07, -1.043081283569336e-07, -2.9802322387695312e-08, 4.470348358154297e-08, 1.1920928955078125e-07, 1.9371509552001953e-07, 2.682209014892578e-07, 3.427267074584961e-07, 4.172325134277344e-07, 4.917383193969727e-07, 5.662441253662109e-07, 6.407499313354492e-07, 7.152557373046875e-07, 7.897615432739258e-07, 8.642673492431641e-07, 9.387731552124023e-07, 1.0132789611816406e-06, 1.087784767150879e-06, 1.1622905731201172e-06, 1.2367963790893555e-06, 1.3113021850585938e-06, 1.385807991027832e-06, 1.4603137969970703e-06, 1.5348196029663086e-06, 1.6093254089355469e-06, 1.6838312149047852e-06, 1.7583370208740234e-06, 1.8328428268432617e-06, 1.9073486328125e-06, 1.9818544387817383e-06, 2.0563602447509766e-06, 2.130866050720215e-06, 2.205371856689453e-06, 2.2798776626586914e-06, 2.3543834686279297e-06, 2.428889274597168e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 0.0, 6.0, 14.0, 20.0, 25.0, 0.0, 42.0, 54.0, 95.0, 122.0, 0.0, 156.0, 246.0, 321.0, 459.0, 0.0, 710.0, 1004.0, 1633.0, 2501.0, 0.0, 4069.0, 6990.0, 11824.0, 28556.0, 0.0, 69955.0, 791042.0, 69877.0, 28612.0, 0.0, 11821.0, 6903.0, 4091.0, 2486.0, 0.0, 1639.0, 1011.0, 698.0, 464.0, 0.0, 309.0, 277.0, 152.0, 118.0, 0.0, 87.0, 62.0, 37.0, 33.0, 0.0, 16.0, 14.0, 9.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4426186680793762e-06, -1.3951212167739868e-06, -1.3476237654685974e-06, -1.300126314163208e-06, -1.2526288628578186e-06, -1.2051314115524292e-06, -1.1576339602470398e-06, -1.1101365089416504e-06, -1.062639057636261e-06, -1.0151416063308716e-06, -9.676441550254822e-07, -9.201467037200928e-07, -8.726492524147034e-07, -8.25151801109314e-07, -7.776543498039246e-07, -7.301568984985352e-07, -6.826594471931458e-07, -6.351619958877563e-07, -5.876645445823669e-07, -5.401670932769775e-07, -4.926696419715881e-07, -4.4517219066619873e-07, -3.976747393608093e-07, -3.501772880554199e-07, -3.026798367500305e-07, -2.551823854446411e-07, -2.076849341392517e-07, -1.601874828338623e-07, -1.126900315284729e-07, -6.51925802230835e-08, -1.7695128917694092e-08, 2.9802322387695312e-08, 7.729977369308472e-08, 1.2479722499847412e-07, 1.7229467630386353e-07, 2.1979212760925293e-07, 2.6728957891464233e-07, 3.1478703022003174e-07, 3.6228448152542114e-07, 4.0978193283081055e-07, 4.5727938413619995e-07, 5.047768354415894e-07, 5.522742867469788e-07, 5.997717380523682e-07, 6.472691893577576e-07, 6.94766640663147e-07, 7.422640919685364e-07, 7.897615432739258e-07, 8.372589945793152e-07, 8.847564458847046e-07, 9.32253897190094e-07, 9.797513484954834e-07, 1.0272487998008728e-06, 1.0747462511062622e-06, 1.1222437024116516e-06, 1.169741153717041e-06, 1.2172386050224304e-06, 1.2647360563278198e-06, 1.3122335076332092e-06, 1.3597309589385986e-06, 1.407228410243988e-06, 1.4547258615493774e-06, 1.5022233128547668e-06, 1.5497207641601562e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 84.0, 0.0, 0.0, 0.0, 694.0, 0.0, 0.0, 0.0, 95.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.6193599700927734e-07, -4.470348358154297e-07, -4.3213367462158203e-07, -4.172325134277344e-07, -4.023313522338867e-07, -3.8743019104003906e-07, -3.725290298461914e-07, -3.5762786865234375e-07, -3.427267074584961e-07, -3.2782554626464844e-07, -3.129243850708008e-07, -2.980232238769531e-07, -2.8312206268310547e-07, -2.682209014892578e-07, -2.5331974029541016e-07, -2.384185791015625e-07, -2.2351741790771484e-07, -2.086162567138672e-07, -1.9371509552001953e-07, -1.7881393432617188e-07, -1.6391277313232422e-07, -1.4901161193847656e-07, -1.341104507446289e-07, -1.1920928955078125e-07, -1.043081283569336e-07, -8.940696716308594e-08, -7.450580596923828e-08, -5.960464477539063e-08, -4.470348358154297e-08, -2.9802322387695312e-08, -1.4901161193847656e-08, 0.0, 1.4901161193847656e-08, 2.9802322387695312e-08, 4.470348358154297e-08, 5.960464477539063e-08, 7.450580596923828e-08, 8.940696716308594e-08, 1.043081283569336e-07, 1.1920928955078125e-07, 1.341104507446289e-07, 1.4901161193847656e-07, 1.6391277313232422e-07, 1.7881393432617188e-07, 1.9371509552001953e-07, 2.086162567138672e-07, 2.2351741790771484e-07, 2.384185791015625e-07, 2.5331974029541016e-07, 2.682209014892578e-07, 2.8312206268310547e-07, 2.980232238769531e-07, 3.129243850708008e-07, 3.2782554626464844e-07, 3.427267074584961e-07, 3.5762786865234375e-07, 3.725290298461914e-07, 3.8743019104003906e-07, 4.023313522338867e-07, 4.172325134277344e-07, 4.3213367462158203e-07, 4.470348358154297e-07, 4.6193599700927734e-07, 4.76837158203125e-07]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 3.0, 7.0, 15.0, 6.0, 11.0, 19.0, 20.0, 34.0, 39.0, 54.0, 54.0, 87.0, 77.0, 94.0, 102.0, 88.0, 63.0, 42.0, 42.0, 32.0, 20.0, 11.0, 22.0, 12.0, 5.0, 9.0, 5.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.177887720084982e-06, -3.070116235903697e-06, -2.962344751722412e-06, -2.8545732675411273e-06, -2.7468017833598424e-06, -2.6390302991785575e-06, -2.5312588149972726e-06, -2.4234873308159877e-06, -2.3157158466347028e-06, -2.207944362453418e-06, -2.100172878272133e-06, -1.992401394090848e-06, -1.8846299099095631e-06, -1.7768584257282782e-06, -1.6690869415469933e-06, -1.5613154573657084e-06, -1.4535439731844235e-06, -1.3457724890031386e-06, -1.2380010048218537e-06, -1.1302295206405688e-06, -1.022458036459284e-06, -9.14686552277999e-07, -8.069150680967141e-07, -6.991435839154292e-07, -5.913720997341443e-07, -4.836006155528594e-07, -3.758291313715745e-07, -2.6805764719028957e-07, -1.6028616300900467e-07, -5.251467882771976e-08, 5.525680535356514e-08, 1.6302828953485005e-07, 2.7079977371613495e-07, 3.7857125789741985e-07, 4.863427420787048e-07, 5.941142262599897e-07, 7.018857104412746e-07, 8.096571946225595e-07, 9.174286788038444e-07, 1.0252001629851293e-06, 1.1329716471664142e-06, 1.240743131347699e-06, 1.348514615528984e-06, 1.456286099710269e-06, 1.5640575838915538e-06, 1.6718290680728387e-06, 1.7796005522541236e-06, 1.8873720364354085e-06, 1.9951435206166934e-06, 2.1029150047979783e-06, 2.2106864889792632e-06, 2.318457973160548e-06, 2.426229457341833e-06, 2.534000941523118e-06, 2.641772425704403e-06, 2.7495439098856878e-06, 2.8573153940669727e-06, 2.9650868782482576e-06, 3.0728583624295425e-06, 3.1806298466108274e-06, 3.2884013307921123e-06, 3.396172814973397e-06, 3.503944299154682e-06, 3.611715783335967e-06, 3.719487267517252e-06]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 3.0, 2.0, 10.0, 7.0, 11.0, 9.0, 13.0, 22.0, 24.0, 21.0, 33.0, 26.0, 20.0, 34.0, 33.0, 31.0, 38.0, 49.0, 41.0, 45.0, 24.0, 43.0, 40.0, 32.0, 30.0, 44.0, 24.0, 28.0, 38.0, 28.0, 19.0, 27.0, 21.0, 21.0, 12.0, 17.0, 11.0, 13.0, 8.0, 10.0, 11.0, 4.0, 3.0, 4.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.0494856016739504e-06, -1.983276888495311e-06, -1.9170679479429964e-06, -1.850859234764357e-06, -1.7846505215857178e-06, -1.7184418084070785e-06, -1.6522329815416015e-06, -1.5860241546761245e-06, -1.5198154414974852e-06, -1.4536067283188459e-06, -1.3873979014533688e-06, -1.3211890745878918e-06, -1.2549803614092525e-06, -1.1887716482306132e-06, -1.1225628213651362e-06, -1.0563539944996592e-06, -9.901452813210199e-07, -9.239365112989617e-07, -8.577277412769035e-07, -7.915189712548454e-07, -7.253102012327872e-07, -6.591014312107291e-07, -5.928926611886709e-07, -5.266838911666127e-07, -4.604751211445546e-07, -3.942663511224964e-07, -3.2805758110043826e-07, -2.618488110783801e-07, -1.9564004105632193e-07, -1.2943127103426377e-07, -6.322250101220561e-08, 2.986269009852549e-09, 6.919503903191071e-08, 1.3540380905396887e-07, 2.0161257907602703e-07, 2.678213490980852e-07, 3.3403011912014335e-07, 4.002388891422015e-07, 4.664476591642597e-07, 5.326564291863178e-07, 5.98865199208376e-07, 6.650739692304342e-07, 7.312827392524923e-07, 7.974915092745505e-07, 8.637002792966086e-07, 9.299090493186668e-07, 9.96117819340725e-07, 1.062326646206202e-06, 1.1285353593848413e-06, 1.1947440725634806e-06, 1.2609528994289576e-06, 1.3271617262944346e-06, 1.393370439473074e-06, 1.4595791526517132e-06, 1.5257879795171903e-06, 1.5919968063826673e-06, 1.6582055195613066e-06, 1.7244142327399459e-06, 1.790623059605423e-06, 1.8568318864709e-06, 1.9230405996495392e-06, 1.9892493128281785e-06, 2.055458026006818e-06, 2.1216669665591326e-06, 2.187875679737772e-06]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 9.0, 5.0, 18.0, 20.0, 24.0, 66.0, 32.0, 134.0, 99.0, 325.0, 255.0, 295.0, 1059.0, 821.0, 2584.0, 2001.0, 2645.0, 8549.0, 6858.0, 22502.0, 18699.0, 66718.0, 60876.0, 94642.0, 480601.0, 745955.0, 1905095.0, 317220.0, 255812.0, 61665.0, 41270.0, 47428.0, 13563.0, 16826.0, 4957.0, 3719.0, 4749.0, 1530.0, 2008.0, 666.0, 885.0, 269.0, 207.0, 291.0, 88.0, 95.0, 44.0, 54.0, 11.0, 17.0, 15.0, 4.0, 6.0, 3.0, 3.0], "bins": [-2.9802322387695312e-06, -2.8954818844795227e-06, -2.810731530189514e-06, -2.7259811758995056e-06, -2.641230821609497e-06, -2.5564804673194885e-06, -2.47173011302948e-06, -2.3869797587394714e-06, -2.302229404449463e-06, -2.2174790501594543e-06, -2.132728695869446e-06, -2.0479783415794373e-06, -1.9632279872894287e-06, -1.8784776329994202e-06, -1.7937272787094116e-06, -1.708976924419403e-06, -1.6242265701293945e-06, -1.539476215839386e-06, -1.4547258615493774e-06, -1.369975507259369e-06, -1.2852251529693604e-06, -1.2004747986793518e-06, -1.1157244443893433e-06, -1.0309740900993347e-06, -9.462237358093262e-07, -8.614733815193176e-07, -7.767230272293091e-07, -6.919726729393005e-07, -6.07222318649292e-07, -5.224719643592834e-07, -4.377216100692749e-07, -3.5297125577926636e-07, -2.682209014892578e-07, -1.8347054719924927e-07, -9.872019290924072e-08, -1.3969838619232178e-08, 7.078051567077637e-08, 1.555308699607849e-07, 2.4028122425079346e-07, 3.25031578540802e-07, 4.0978193283081055e-07, 4.945322871208191e-07, 5.792826414108276e-07, 6.640329957008362e-07, 7.487833499908447e-07, 8.335337042808533e-07, 9.182840585708618e-07, 1.0030344128608704e-06, 1.087784767150879e-06, 1.1725351214408875e-06, 1.257285475730896e-06, 1.3420358300209045e-06, 1.426786184310913e-06, 1.5115365386009216e-06, 1.5962868928909302e-06, 1.6810372471809387e-06, 1.7657876014709473e-06, 1.8505379557609558e-06, 1.9352883100509644e-06, 2.020038664340973e-06, 2.1047890186309814e-06, 2.18953937292099e-06, 2.2742897272109985e-06, 2.359040081501007e-06, 2.4437904357910156e-06]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 0.0, 5.0, 0.0, 6.0, 17.0, 0.0, 18.0, 0.0, 17.0, 24.0, 0.0, 31.0, 0.0, 22.0, 41.0, 0.0, 54.0, 0.0, 46.0, 63.0, 0.0, 71.0, 0.0, 78.0, 0.0, 60.0, 54.0, 0.0, 41.0, 0.0, 51.0, 52.0, 0.0, 46.0, 0.0, 43.0, 35.0, 0.0, 17.0, 0.0, 35.0, 21.0, 0.0, 12.0, 0.0, 9.0, 16.0, 0.0, 7.0, 0.0, 6.0, 5.0, 0.0, 4.0, 0.0, 0.0, 3.0], "bins": [-1.1324882507324219e-06, -1.0970979928970337e-06, -1.0617077350616455e-06, -1.0263174772262573e-06, -9.909272193908691e-07, -9.55536961555481e-07, -9.201467037200928e-07, -8.847564458847046e-07, -8.493661880493164e-07, -8.139759302139282e-07, -7.7858567237854e-07, -7.431954145431519e-07, -7.078051567077637e-07, -6.724148988723755e-07, -6.370246410369873e-07, -6.016343832015991e-07, -5.662441253662109e-07, -5.308538675308228e-07, -4.954636096954346e-07, -4.600733518600464e-07, -4.246830940246582e-07, -3.8929283618927e-07, -3.5390257835388184e-07, -3.1851232051849365e-07, -2.8312206268310547e-07, -2.477318048477173e-07, -2.123415470123291e-07, -1.7695128917694092e-07, -1.4156103134155273e-07, -1.0617077350616455e-07, -7.078051567077637e-08, -3.5390257835388184e-08, 0.0, 3.5390257835388184e-08, 7.078051567077637e-08, 1.0617077350616455e-07, 1.4156103134155273e-07, 1.7695128917694092e-07, 2.123415470123291e-07, 2.477318048477173e-07, 2.8312206268310547e-07, 3.1851232051849365e-07, 3.5390257835388184e-07, 3.8929283618927e-07, 4.246830940246582e-07, 4.600733518600464e-07, 4.954636096954346e-07, 5.308538675308228e-07, 5.662441253662109e-07, 6.016343832015991e-07, 6.370246410369873e-07, 6.724148988723755e-07, 7.078051567077637e-07, 7.431954145431519e-07, 7.7858567237854e-07, 8.139759302139282e-07, 8.493661880493164e-07, 8.847564458847046e-07, 9.201467037200928e-07, 9.55536961555481e-07, 9.909272193908691e-07, 1.0263174772262573e-06, 1.0617077350616455e-06, 1.0970979928970337e-06, 1.1324882507324219e-06]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 6.0, 17.0, 8.0, 23.0, 26.0, 46.0, 69.0, 194.0, 177.0, 223.0, 323.0, 460.0, 639.0, 905.0, 3124.0, 2591.0, 3903.0, 5386.0, 8354.0, 12324.0, 47398.0, 44720.0, 71611.0, 118009.0, 199458.0, 358045.0, 640072.0, 1797289.0, 358428.0, 200084.0, 118338.0, 71643.0, 44796.0, 46836.0, 12324.0, 8255.0, 5528.0, 3791.0, 2665.0, 3118.0, 866.0, 664.0, 452.0, 340.0, 231.0, 150.0, 195.0, 60.0, 35.0, 27.0, 26.0, 11.0, 15.0, 8.0, 5.0, 0.0, 2.0, 0.0, 3.0], "bins": [-2.205371856689453e-06, -2.1364539861679077e-06, -2.0675361156463623e-06, -1.998618245124817e-06, -1.9297003746032715e-06, -1.860782504081726e-06, -1.7918646335601807e-06, -1.7229467630386353e-06, -1.6540288925170898e-06, -1.5851110219955444e-06, -1.516193151473999e-06, -1.4472752809524536e-06, -1.3783574104309082e-06, -1.3094395399093628e-06, -1.2405216693878174e-06, -1.171603798866272e-06, -1.1026859283447266e-06, -1.0337680578231812e-06, -9.648501873016357e-07, -8.959323167800903e-07, -8.270144462585449e-07, -7.580965757369995e-07, -6.891787052154541e-07, -6.202608346939087e-07, -5.513429641723633e-07, -4.824250936508179e-07, -4.1350722312927246e-07, -3.4458935260772705e-07, -2.7567148208618164e-07, -2.0675361156463623e-07, -1.3783574104309082e-07, -6.891787052154541e-08, 0.0, 6.891787052154541e-08, 1.3783574104309082e-07, 2.0675361156463623e-07, 2.7567148208618164e-07, 3.4458935260772705e-07, 4.1350722312927246e-07, 4.824250936508179e-07, 5.513429641723633e-07, 6.202608346939087e-07, 6.891787052154541e-07, 7.580965757369995e-07, 8.270144462585449e-07, 8.959323167800903e-07, 9.648501873016357e-07, 1.0337680578231812e-06, 1.1026859283447266e-06, 1.171603798866272e-06, 1.2405216693878174e-06, 1.3094395399093628e-06, 1.3783574104309082e-06, 1.4472752809524536e-06, 1.516193151473999e-06, 1.5851110219955444e-06, 1.6540288925170898e-06, 1.7229467630386353e-06, 1.7918646335601807e-06, 1.860782504081726e-06, 1.9297003746032715e-06, 1.998618245124817e-06, 2.0675361156463623e-06, 2.1364539861679077e-06, 2.205371856689453e-06]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 0.0, 12.0, 0.0, 0.0, 18.0, 0.0, 25.0, 0.0, 62.0, 0.0, 0.0, 82.0, 0.0, 166.0, 0.0, 0.0, 291.0, 0.0, 419.0, 0.0, 563.0, 0.0, 0.0, 774.0, 0.0, 589.0, 0.0, 426.0, 0.0, 0.0, 279.0, 0.0, 158.0, 0.0, 0.0, 97.0, 0.0, 53.0, 0.0, 31.0, 0.0, 0.0, 17.0, 0.0, 13.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.093193173408508e-07, -7.841736078262329e-07, -7.59027898311615e-07, -7.338821887969971e-07, -7.087364792823792e-07, -6.835907697677612e-07, -6.584450602531433e-07, -6.332993507385254e-07, -6.081536412239075e-07, -5.830079317092896e-07, -5.578622221946716e-07, -5.327165126800537e-07, -5.075708031654358e-07, -4.824250936508179e-07, -4.5727938413619995e-07, -4.3213367462158203e-07, -4.069879651069641e-07, -3.818422555923462e-07, -3.5669654607772827e-07, -3.3155083656311035e-07, -3.0640512704849243e-07, -2.812594175338745e-07, -2.561137080192566e-07, -2.3096799850463867e-07, -2.0582228899002075e-07, -1.8067657947540283e-07, -1.555308699607849e-07, -1.30385160446167e-07, -1.0523945093154907e-07, -8.009374141693115e-08, -5.494803190231323e-08, -2.9802322387695312e-08, -4.6566128730773926e-09, 2.0489096641540527e-08, 4.563480615615845e-08, 7.078051567077637e-08, 9.592622518539429e-08, 1.210719347000122e-07, 1.4621764421463013e-07, 1.7136335372924805e-07, 1.9650906324386597e-07, 2.2165477275848389e-07, 2.468004822731018e-07, 2.7194619178771973e-07, 2.9709190130233765e-07, 3.2223761081695557e-07, 3.473833203315735e-07, 3.725290298461914e-07, 3.976747393608093e-07, 4.2282044887542725e-07, 4.4796615839004517e-07, 4.731118679046631e-07, 4.98257577419281e-07, 5.234032869338989e-07, 5.485489964485168e-07, 5.736947059631348e-07, 5.988404154777527e-07, 6.239861249923706e-07, 6.491318345069885e-07, 6.742775440216064e-07, 6.994232535362244e-07, 7.245689630508423e-07, 7.497146725654602e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 5.0, 8.0, 5.0, 12.0, 10.0, 21.0, 30.0, 34.0, 44.0, 54.0, 87.0, 74.0, 94.0, 74.0, 84.0, 62.0, 62.0, 56.0, 28.0, 32.0, 27.0, 12.0, 14.0, 9.0, 8.0, 8.0, 3.0, 9.0, 5.0, 1.0, 0.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0859433789155446e-06, -2.0166885406069923e-06, -1.94743370229844e-06, -1.8781786366162123e-06, -1.80892379830766e-06, -1.7396689599991078e-06, -1.6704140080037178e-06, -1.6011590560083278e-06, -1.5319042176997755e-06, -1.4626493793912232e-06, -1.3933944273958332e-06, -1.3241394754004432e-06, -1.254884637091891e-06, -1.1856297987833386e-06, -1.1163748467879486e-06, -1.0471198947925586e-06, -9.778650564840063e-07, -9.086101613320352e-07, -8.393552661800641e-07, -7.701003710280929e-07, -7.008454758761218e-07, -6.315905807241506e-07, -5.623356855721795e-07, -4.930807904202084e-07, -4.238258952682372e-07, -3.545710001162661e-07, -2.8531610496429494e-07, -2.160612098123238e-07, -1.4680631466035265e-07, -7.755141950838151e-08, -8.296524356410373e-09, 6.095837079556077e-08, 1.3021349332120735e-07, 1.994683884731785e-07, 2.6872328362514963e-07, 3.379781787771208e-07, 4.072330739290919e-07, 4.7648796908106306e-07, 5.457428642330342e-07, 6.149977593850053e-07, 6.842526545369765e-07, 7.535075496889476e-07, 8.227624448409188e-07, 8.920173399928899e-07, 9.61272235144861e-07, 1.0305270734534133e-06, 1.0997820254488033e-06, 1.1690369774441933e-06, 1.2382918157527456e-06, 1.3075466540612979e-06, 1.3768016060566879e-06, 1.4460565580520779e-06, 1.5153113963606302e-06, 1.5845662346691824e-06, 1.6538211866645725e-06, 1.7230761386599625e-06, 1.7923309769685147e-06, 1.861585815277067e-06, 1.9308408809592947e-06, 2.000095719267847e-06, 2.0693505575763993e-06, 2.1386053958849516e-06, 2.207860234193504e-06, 2.2771152998757316e-06, 2.346370138184284e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 9.0, 11.0, 9.0, 13.0, 13.0, 11.0, 22.0, 19.0, 13.0, 28.0, 24.0, 37.0, 28.0, 26.0, 29.0, 51.0, 37.0, 45.0, 40.0, 39.0, 41.0, 46.0, 40.0, 36.0, 32.0, 29.0, 27.0, 27.0, 26.0, 24.0, 23.0, 25.0, 34.0, 15.0, 9.0, 11.0, 13.0, 8.0, 7.0, 2.0, 2.0, 3.0, 4.0, 5.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.291862758989737e-06, -1.2454805755623966e-06, -1.1990983921350562e-06, -1.1527162087077159e-06, -1.1063340252803755e-06, -1.0599518418530351e-06, -1.0135696584256948e-06, -9.671874749983544e-07, -9.208052915710141e-07, -8.744231081436737e-07, -8.280409247163334e-07, -7.81658741288993e-07, -7.352765578616527e-07, -6.888943744343123e-07, -6.42512191006972e-07, -5.961300075796316e-07, -5.497478241522913e-07, -5.033656407249509e-07, -4.569834572976106e-07, -4.1060127387027023e-07, -3.642190904429299e-07, -3.1783690701558953e-07, -2.714547235882492e-07, -2.2507254016090883e-07, -1.7869035673356848e-07, -1.3230817330622813e-07, -8.592598987888778e-08, -3.9543806451547425e-08, 6.838376975792926e-09, 5.322056040313328e-08, 9.960274383047363e-08, 1.4598492725781398e-07, 1.923669969983166e-07, 2.3874918042565696e-07, 2.851313638529973e-07, 3.3151354728033766e-07, 3.77895730707678e-07, 4.2427791413501836e-07, 4.706600975623587e-07, 5.170422809896991e-07, 5.634244644170394e-07, 6.098066478443798e-07, 6.561888312717201e-07, 7.025710146990605e-07, 7.489531981264008e-07, 7.953353815537412e-07, 8.417175649810815e-07, 8.880997484084219e-07, 9.344819318357622e-07, 9.808641152631026e-07, 1.027246298690443e-06, 1.0736284821177833e-06, 1.1200106655451236e-06, 1.166392848972464e-06, 1.2127750323998043e-06, 1.2591572158271447e-06, 1.305539399254485e-06, 1.3519215826818254e-06, 1.3983037661091657e-06, 1.444685949536506e-06, 1.4910681329638464e-06, 1.5374503163911868e-06, 1.5838324998185271e-06, 1.6302146832458675e-06, 1.6765968666732078e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 4.0, 12.0, 15.0, 29.0, 22.0, 52.0, 73.0, 133.0, 233.0, 163.0, 463.0, 811.0, 1631.0, 1236.0, 4251.0, 8694.0, 18336.0, 15988.0, 60514.0, 150899.0, 365545.0, 156320.0, 150557.0, 60190.0, 26817.0, 12680.0, 3565.0, 4327.0, 2238.0, 1212.0, 337.0, 492.0, 275.0, 162.0, 63.0, 76.0, 60.0, 22.0, 12.0, 17.0, 14.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.039836883544922e-06, -2.934597432613373e-06, -2.8293579816818237e-06, -2.7241185307502747e-06, -2.6188790798187256e-06, -2.5136396288871765e-06, -2.4084001779556274e-06, -2.3031607270240784e-06, -2.1979212760925293e-06, -2.0926818251609802e-06, -1.987442374229431e-06, -1.882202923297882e-06, -1.776963472366333e-06, -1.671724021434784e-06, -1.5664845705032349e-06, -1.4612451195716858e-06, -1.3560056686401367e-06, -1.2507662177085876e-06, -1.1455267667770386e-06, -1.0402873158454895e-06, -9.350478649139404e-07, -8.298084139823914e-07, -7.245689630508423e-07, -6.193295121192932e-07, -5.140900611877441e-07, -4.0885061025619507e-07, -3.03611159324646e-07, -1.9837170839309692e-07, -9.313225746154785e-08, 1.210719347000122e-08, 1.1734664440155029e-07, 2.2258609533309937e-07, 3.2782554626464844e-07, 4.330649971961975e-07, 5.383044481277466e-07, 6.435438990592957e-07, 7.487833499908447e-07, 8.540228009223938e-07, 9.592622518539429e-07, 1.064501702785492e-06, 1.169741153717041e-06, 1.27498060464859e-06, 1.3802200555801392e-06, 1.4854595065116882e-06, 1.5906989574432373e-06, 1.6959384083747864e-06, 1.8011778593063354e-06, 1.9064173102378845e-06, 2.0116567611694336e-06, 2.1168962121009827e-06, 2.2221356630325317e-06, 2.327375113964081e-06, 2.43261456489563e-06, 2.537854015827179e-06, 2.643093466758728e-06, 2.748332917690277e-06, 2.853572368621826e-06, 2.9588118195533752e-06, 3.0640512704849243e-06, 3.1692907214164734e-06, 3.2745301723480225e-06, 3.3797696232795715e-06, 3.4850090742111206e-06, 3.5902485251426697e-06, 3.6954879760742188e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 3.0, 0.0, 7.0, 10.0, 9.0, 17.0, 0.0, 22.0, 29.0, 25.0, 20.0, 24.0, 0.0, 35.0, 50.0, 36.0, 60.0, 0.0, 53.0, 53.0, 61.0, 63.0, 0.0, 66.0, 40.0, 43.0, 47.0, 44.0, 0.0, 36.0, 39.0, 21.0, 16.0, 0.0, 25.0, 12.0, 16.0, 3.0, 0.0, 4.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.430511474609375e-06, -1.3820827007293701e-06, -1.3336539268493652e-06, -1.2852251529693604e-06, -1.2367963790893555e-06, -1.1883676052093506e-06, -1.1399388313293457e-06, -1.0915100574493408e-06, -1.043081283569336e-06, -9.94652509689331e-07, -9.462237358093262e-07, -8.977949619293213e-07, -8.493661880493164e-07, -8.009374141693115e-07, -7.525086402893066e-07, -7.040798664093018e-07, -6.556510925292969e-07, -6.07222318649292e-07, -5.587935447692871e-07, -5.103647708892822e-07, -4.6193599700927734e-07, -4.1350722312927246e-07, -3.650784492492676e-07, -3.166496753692627e-07, -2.682209014892578e-07, -2.1979212760925293e-07, -1.7136335372924805e-07, -1.2293457984924316e-07, -7.450580596923828e-08, -2.60770320892334e-08, 2.2351741790771484e-08, 7.078051567077637e-08, 1.1920928955078125e-07, 1.6763806343078613e-07, 2.1606683731079102e-07, 2.644956111907959e-07, 3.129243850708008e-07, 3.6135315895080566e-07, 4.0978193283081055e-07, 4.5821070671081543e-07, 5.066394805908203e-07, 5.550682544708252e-07, 6.034970283508301e-07, 6.51925802230835e-07, 7.003545761108398e-07, 7.487833499908447e-07, 7.972121238708496e-07, 8.456408977508545e-07, 8.940696716308594e-07, 9.424984455108643e-07, 9.909272193908691e-07, 1.039355993270874e-06, 1.087784767150879e-06, 1.1362135410308838e-06, 1.1846423149108887e-06, 1.2330710887908936e-06, 1.2814998626708984e-06, 1.3299286365509033e-06, 1.3783574104309082e-06, 1.426786184310913e-06, 1.475214958190918e-06, 1.5236437320709229e-06, 1.5720725059509277e-06, 1.6205012798309326e-06, 1.6689300537109375e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 15.0, 1.0, 9.0, 11.0, 12.0, 28.0, 45.0, 45.0, 69.0, 131.0, 194.0, 341.0, 467.0, 725.0, 1526.0, 2884.0, 15110.0, 58617.0, 931916.0, 22699.0, 7314.0, 2860.0, 1850.0, 582.0, 395.0, 270.0, 154.0, 81.0, 81.0, 36.0, 27.0, 15.0, 11.0, 11.0, 9.0, 7.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.410743713378906e-06, -4.28222119808197e-06, -4.153698682785034e-06, -4.025176167488098e-06, -3.896653652191162e-06, -3.768131136894226e-06, -3.63960862159729e-06, -3.511086106300354e-06, -3.382563591003418e-06, -3.254041075706482e-06, -3.125518560409546e-06, -2.99699604511261e-06, -2.868473529815674e-06, -2.739951014518738e-06, -2.6114284992218018e-06, -2.4829059839248657e-06, -2.3543834686279297e-06, -2.2258609533309937e-06, -2.0973384380340576e-06, -1.9688159227371216e-06, -1.8402934074401855e-06, -1.7117708921432495e-06, -1.5832483768463135e-06, -1.4547258615493774e-06, -1.3262033462524414e-06, -1.1976808309555054e-06, -1.0691583156585693e-06, -9.406358003616333e-07, -8.121132850646973e-07, -6.835907697677612e-07, -5.550682544708252e-07, -4.2654573917388916e-07, -2.980232238769531e-07, -1.695007085800171e-07, -4.0978193283081055e-08, 8.754432201385498e-08, 2.1606683731079102e-07, 3.4458935260772705e-07, 4.731118679046631e-07, 6.016343832015991e-07, 7.301568984985352e-07, 8.586794137954712e-07, 9.872019290924072e-07, 1.1157244443893433e-06, 1.2442469596862793e-06, 1.3727694749832153e-06, 1.5012919902801514e-06, 1.6298145055770874e-06, 1.7583370208740234e-06, 1.8868595361709595e-06, 2.0153820514678955e-06, 2.1439045667648315e-06, 2.2724270820617676e-06, 2.4009495973587036e-06, 2.5294721126556396e-06, 2.6579946279525757e-06, 2.7865171432495117e-06, 2.9150396585464478e-06, 3.043562173843384e-06, 3.17208468914032e-06, 3.300607204437256e-06, 3.429129719734192e-06, 3.557652235031128e-06, 3.686174750328064e-06, 3.814697265625e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 108.0, 0.0, 0.0, 0.0, 0.0, 694.0, 0.0, 0.0, 0.0, 0.0, 128.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4552067518234253e-07, -3.334134817123413e-07, -3.213062882423401e-07, -3.0919909477233887e-07, -2.9709190130233765e-07, -2.849847078323364e-07, -2.728775143623352e-07, -2.60770320892334e-07, -2.4866312742233276e-07, -2.3655593395233154e-07, -2.2444874048233032e-07, -2.123415470123291e-07, -2.0023435354232788e-07, -1.8812716007232666e-07, -1.7601996660232544e-07, -1.6391277313232422e-07, -1.51805579662323e-07, -1.3969838619232178e-07, -1.2759119272232056e-07, -1.1548399925231934e-07, -1.0337680578231812e-07, -9.12696123123169e-08, -7.916241884231567e-08, -6.705522537231445e-08, -5.494803190231323e-08, -4.284083843231201e-08, -3.073364496231079e-08, -1.862645149230957e-08, -6.51925802230835e-09, 5.587935447692871e-09, 1.7695128917694092e-08, 2.9802322387695312e-08, 4.190951585769653e-08, 5.4016709327697754e-08, 6.612390279769897e-08, 7.82310962677002e-08, 9.033828973770142e-08, 1.0244548320770264e-07, 1.1455267667770386e-07, 1.2665987014770508e-07, 1.387670636177063e-07, 1.5087425708770752e-07, 1.6298145055770874e-07, 1.7508864402770996e-07, 1.8719583749771118e-07, 1.993030309677124e-07, 2.1141022443771362e-07, 2.2351741790771484e-07, 2.3562461137771606e-07, 2.477318048477173e-07, 2.598389983177185e-07, 2.7194619178771973e-07, 2.8405338525772095e-07, 2.9616057872772217e-07, 3.082677721977234e-07, 3.203749656677246e-07, 3.3248215913772583e-07, 3.4458935260772705e-07, 3.5669654607772827e-07, 3.688037395477295e-07, 3.809109330177307e-07, 3.9301812648773193e-07, 4.0512531995773315e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 4.0, 5.0, 3.0, 2.0, 3.0, 5.0, 7.0, 11.0, 9.0, 12.0, 19.0, 14.0, 23.0, 25.0, 40.0, 42.0, 57.0, 79.0, 89.0, 74.0, 72.0, 77.0, 62.0, 58.0, 40.0, 33.0, 35.0, 22.0, 13.0, 15.0, 10.0, 10.0, 4.0, 5.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6453153648399166e-06, -1.5859395716688596e-06, -1.5265636648109648e-06, -1.46718775795307e-06, -1.407811964782013e-06, -1.348436171610956e-06, -1.2890602647530613e-06, -1.2296843578951666e-06, -1.1703085647241096e-06, -1.1109327715530526e-06, -1.0515568646951579e-06, -9.921809578372631e-07, -9.328051646662061e-07, -8.734293146517302e-07, -8.140534646372544e-07, -7.546776146227785e-07, -6.953017646083026e-07, -6.359259145938267e-07, -5.765500645793509e-07, -5.17174214564875e-07, -4.5779836455039913e-07, -3.9842251453592326e-07, -3.390466645214474e-07, -2.796708145069715e-07, -2.2029496449249564e-07, -1.6091911447801976e-07, -1.0154326446354389e-07, -4.216741444906802e-08, 1.7208435565407854e-08, 7.658428557988373e-08, 1.359601355943596e-07, 1.9533598560883547e-07, 2.5471194931014907e-07, 3.1408779932462494e-07, 3.734636493391008e-07, 4.328394993535767e-07, 4.922153493680526e-07, 5.515911993825284e-07, 6.109670493970043e-07, 6.703428994114802e-07, 7.29718749425956e-07, 7.890945994404319e-07, 8.484704494549078e-07, 9.078462994693837e-07, 9.672221494838595e-07, 1.0265980563417543e-06, 1.0859738495128113e-06, 1.1453496426838683e-06, 1.204725549541763e-06, 1.2641014563996578e-06, 1.3234772495707148e-06, 1.3828530427417718e-06, 1.4422289495996665e-06, 1.5016048564575613e-06, 1.5609806496286183e-06, 1.6203564427996753e-06, 1.67973234965757e-06, 1.7391082565154647e-06, 1.7984840496865218e-06, 1.8578598428575788e-06, 1.9172357497154735e-06, 1.9766116565733682e-06, 2.035987563431263e-06, 2.0953632429154823e-06, 2.154739149773377e-06]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 7.0, 8.0, 11.0, 14.0, 8.0, 17.0, 20.0, 17.0, 12.0, 20.0, 27.0, 39.0, 29.0, 25.0, 30.0, 46.0, 40.0, 42.0, 40.0, 37.0, 53.0, 38.0, 36.0, 42.0, 33.0, 31.0, 27.0, 25.0, 32.0, 21.0, 26.0, 22.0, 29.0, 21.0, 10.0, 10.0, 11.0, 13.0, 8.0, 2.0, 2.0, 2.0, 4.0, 6.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.229081817655242e-06, -1.185095925393398e-06, -1.1411100331315538e-06, -1.0971241408697097e-06, -1.0531381349210278e-06, -1.0091522426591837e-06, -9.651663503973396e-07, -9.211804581354954e-07, -8.771945658736513e-07, -8.332086736118072e-07, -7.892227245065442e-07, -7.452368322447001e-07, -7.012509399828559e-07, -6.572649908775929e-07, -6.132790986157488e-07, -5.692932063539047e-07, -5.253072572486417e-07, -4.813213649867976e-07, -4.37335444303244e-07, -3.9334952361969044e-07, -3.493636313578463e-07, -3.0537771067429276e-07, -2.613917899907392e-07, -2.1740589772889507e-07, -1.734199770453415e-07, -1.2943407057264267e-07, -8.544815699451647e-08, -4.1462243416390265e-08, 2.5236630563085782e-09, 4.650956952900742e-08, 9.049549021256098e-08, 1.344813824744051e-07, 1.7846730315795867e-07, 2.224532096306575e-07, 2.6643911610335635e-07, 3.104250367869099e-07, 3.5441092904875404e-07, 3.983968497323076e-07, 4.4238277041586116e-07, 4.863686626777053e-07, 5.303545549395494e-07, 5.743404472013935e-07, 6.183263963066565e-07, 6.623122885685007e-07, 7.062981808303448e-07, 7.502841299356078e-07, 7.942700221974519e-07, 8.38255914459296e-07, 8.82241863564559e-07, 9.262277558264032e-07, 9.702137049316661e-07, 1.0141995971935103e-06, 1.0581854894553544e-06, 1.1021713817171985e-06, 1.1461572739790427e-06, 1.1901431662408868e-06, 1.2341291721895686e-06, 1.2781150644514128e-06, 1.3221009567132569e-06, 1.3660869626619387e-06, 1.4100728549237829e-06, 1.454058747185627e-06, 1.4980446394474711e-06, 1.5420305317093153e-06, 1.5860164239711594e-06]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 13.0, 9.0, 16.0, 36.0, 36.0, 27.0, 48.0, 133.0, 99.0, 154.0, 497.0, 444.0, 606.0, 797.0, 2857.0, 2364.0, 3552.0, 13051.0, 11841.0, 17594.0, 27322.0, 107119.0, 100984.0, 148014.0, 174078.0, 247615.0, 65597.0, 42047.0, 45224.0, 11846.0, 7717.0, 5059.0, 6073.0, 1601.0, 1170.0, 1334.0, 436.0, 292.0, 216.0, 296.0, 98.0, 61.0, 87.0, 25.0, 19.0, 13.0, 19.0, 3.0, 4.0, 11.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.384185791015625e-06, -2.3078173398971558e-06, -2.2314488887786865e-06, -2.1550804376602173e-06, -2.078711986541748e-06, -2.002343535423279e-06, -1.9259750843048096e-06, -1.8496066331863403e-06, -1.773238182067871e-06, -1.6968697309494019e-06, -1.6205012798309326e-06, -1.5441328287124634e-06, -1.4677643775939941e-06, -1.391395926475525e-06, -1.3150274753570557e-06, -1.2386590242385864e-06, -1.1622905731201172e-06, -1.085922122001648e-06, -1.0095536708831787e-06, -9.331852197647095e-07, -8.568167686462402e-07, -7.80448317527771e-07, -7.040798664093018e-07, -6.277114152908325e-07, -5.513429641723633e-07, -4.7497451305389404e-07, -3.986060619354248e-07, -3.2223761081695557e-07, -2.4586915969848633e-07, -1.695007085800171e-07, -9.313225746154785e-08, -1.6763806343078613e-08, 5.960464477539063e-08, 1.3597309589385986e-07, 2.123415470123291e-07, 2.8870999813079834e-07, 3.650784492492676e-07, 4.414469003677368e-07, 5.178153514862061e-07, 5.941838026046753e-07, 6.705522537231445e-07, 7.469207048416138e-07, 8.23289155960083e-07, 8.996576070785522e-07, 9.760260581970215e-07, 1.0523945093154907e-06, 1.12876296043396e-06, 1.2051314115524292e-06, 1.2814998626708984e-06, 1.3578683137893677e-06, 1.434236764907837e-06, 1.5106052160263062e-06, 1.5869736671447754e-06, 1.6633421182632446e-06, 1.7397105693817139e-06, 1.816079020500183e-06, 1.8924474716186523e-06, 1.9688159227371216e-06, 2.045184373855591e-06, 2.12155282497406e-06, 2.1979212760925293e-06, 2.2742897272109985e-06, 2.3506581783294678e-06, 2.427026629447937e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 6.0, 0.0, 0.0, 0.0, 4.0, 21.0, 0.0, 10.0, 0.0, 19.0, 30.0, 0.0, 31.0, 0.0, 34.0, 53.0, 0.0, 47.0, 63.0, 0.0, 61.0, 0.0, 84.0, 81.0, 0.0, 65.0, 0.0, 58.0, 56.0, 0.0, 63.0, 0.0, 60.0, 46.0, 0.0, 39.0, 0.0, 28.0, 18.0, 0.0, 11.0, 10.0, 0.0, 7.0, 0.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-06, -9.76957380771637e-07, -9.406358003616333e-07, -9.043142199516296e-07, -8.67992639541626e-07, -8.316710591316223e-07, -7.953494787216187e-07, -7.59027898311615e-07, -7.227063179016113e-07, -6.863847374916077e-07, -6.50063157081604e-07, -6.137415766716003e-07, -5.774199962615967e-07, -5.41098415851593e-07, -5.047768354415894e-07, -4.684552550315857e-07, -4.3213367462158203e-07, -3.9581209421157837e-07, -3.594905138015747e-07, -3.2316893339157104e-07, -2.868473529815674e-07, -2.505257725715637e-07, -2.1420419216156006e-07, -1.778826117515564e-07, -1.4156103134155273e-07, -1.0523945093154907e-07, -6.891787052154541e-08, -3.259629011154175e-08, 3.725290298461914e-09, 4.0046870708465576e-08, 7.636845111846924e-08, 1.126900315284729e-07, 1.4901161193847656e-07, 1.8533319234848022e-07, 2.2165477275848389e-07, 2.5797635316848755e-07, 2.942979335784912e-07, 3.3061951398849487e-07, 3.6694109439849854e-07, 4.032626748085022e-07, 4.3958425521850586e-07, 4.759058356285095e-07, 5.122274160385132e-07, 5.485489964485168e-07, 5.848705768585205e-07, 6.211921572685242e-07, 6.575137376785278e-07, 6.938353180885315e-07, 7.301568984985352e-07, 7.664784789085388e-07, 8.028000593185425e-07, 8.391216397285461e-07, 8.754432201385498e-07, 9.117648005485535e-07, 9.480863809585571e-07, 9.844079613685608e-07, 1.0207295417785645e-06, 1.0570511221885681e-06, 1.0933727025985718e-06, 1.1296942830085754e-06, 1.166015863418579e-06, 1.2023374438285828e-06, 1.2386590242385864e-06, 1.27498060464859e-06, 1.3113021850585938e-06]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 26.0, 21.0, 31.0, 50.0, 51.0, 97.0, 116.0, 200.0, 258.0, 1003.0, 858.0, 1253.0, 1869.0, 2652.0, 3841.0, 5801.0, 8516.0, 12660.0, 47203.0, 42959.0, 65183.0, 99547.0, 144072.0, 171660.0, 143936.0, 99740.0, 65706.0, 71038.0, 18849.0, 12770.0, 8574.0, 5674.0, 4001.0, 2640.0, 1793.0, 1204.0, 1411.0, 425.0, 263.0, 206.0, 138.0, 78.0, 50.0, 44.0, 34.0, 35.0, 13.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1457672119140625e-06, -2.0796433091163635e-06, -2.0135194063186646e-06, -1.9473955035209656e-06, -1.8812716007232666e-06, -1.8151476979255676e-06, -1.7490237951278687e-06, -1.6828998923301697e-06, -1.6167759895324707e-06, -1.5506520867347717e-06, -1.4845281839370728e-06, -1.4184042811393738e-06, -1.3522803783416748e-06, -1.2861564755439758e-06, -1.2200325727462769e-06, -1.1539086699485779e-06, -1.087784767150879e-06, -1.02166086435318e-06, -9.55536961555481e-07, -8.89413058757782e-07, -8.23289155960083e-07, -7.57165253162384e-07, -6.910413503646851e-07, -6.249174475669861e-07, -5.587935447692871e-07, -4.926696419715881e-07, -4.2654573917388916e-07, -3.604218363761902e-07, -2.942979335784912e-07, -2.2817403078079224e-07, -1.6205012798309326e-07, -9.592622518539429e-08, -2.9802322387695312e-08, 3.632158041000366e-08, 1.0244548320770264e-07, 1.685693860054016e-07, 2.3469328880310059e-07, 3.0081719160079956e-07, 3.6694109439849854e-07, 4.330649971961975e-07, 4.991888999938965e-07, 5.653128027915955e-07, 6.314367055892944e-07, 6.975606083869934e-07, 7.636845111846924e-07, 8.298084139823914e-07, 8.959323167800903e-07, 9.620562195777893e-07, 1.0281801223754883e-06, 1.0943040251731873e-06, 1.1604279279708862e-06, 1.2265518307685852e-06, 1.2926757335662842e-06, 1.3587996363639832e-06, 1.4249235391616821e-06, 1.491047441959381e-06, 1.55717134475708e-06, 1.623295247554779e-06, 1.689419150352478e-06, 1.755543053150177e-06, 1.821666955947876e-06, 1.887790858745575e-06, 1.953914761543274e-06, 2.020038664340973e-06, 2.086162567138672e-06]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 15.0, 0.0, 0.0, 13.0, 0.0, 33.0, 0.0, 34.0, 0.0, 67.0, 0.0, 0.0, 83.0, 0.0, 82.0, 0.0, 112.0, 0.0, 0.0, 119.0, 0.0, 108.0, 0.0, 76.0, 0.0, 85.0, 0.0, 0.0, 66.0, 0.0, 41.0, 0.0, 30.0, 0.0, 0.0, 11.0, 0.0, 15.0, 0.0, 13.0, 0.0, 8.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.083879947662354e-07, -7.82310962677002e-07, -7.562339305877686e-07, -7.301568984985352e-07, -7.040798664093018e-07, -6.780028343200684e-07, -6.51925802230835e-07, -6.258487701416016e-07, -5.997717380523682e-07, -5.736947059631348e-07, -5.476176738739014e-07, -5.21540641784668e-07, -4.954636096954346e-07, -4.6938657760620117e-07, -4.4330954551696777e-07, -4.172325134277344e-07, -3.91155481338501e-07, -3.650784492492676e-07, -3.390014171600342e-07, -3.129243850708008e-07, -2.868473529815674e-07, -2.60770320892334e-07, -2.3469328880310059e-07, -2.086162567138672e-07, -1.825392246246338e-07, -1.564621925354004e-07, -1.30385160446167e-07, -1.043081283569336e-07, -7.82310962677002e-08, -5.21540641784668e-08, -2.60770320892334e-08, 0.0, 2.60770320892334e-08, 5.21540641784668e-08, 7.82310962677002e-08, 1.043081283569336e-07, 1.30385160446167e-07, 1.564621925354004e-07, 1.825392246246338e-07, 2.086162567138672e-07, 2.3469328880310059e-07, 2.60770320892334e-07, 2.868473529815674e-07, 3.129243850708008e-07, 3.390014171600342e-07, 3.650784492492676e-07, 3.91155481338501e-07, 4.172325134277344e-07, 4.4330954551696777e-07, 4.6938657760620117e-07, 4.954636096954346e-07, 5.21540641784668e-07, 5.476176738739014e-07, 5.736947059631348e-07, 5.997717380523682e-07, 6.258487701416016e-07, 6.51925802230835e-07, 6.780028343200684e-07, 7.040798664093018e-07, 7.301568984985352e-07, 7.562339305877686e-07, 7.82310962677002e-07, 8.083879947662354e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 15.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 74.0, 0.0, 0.0, 143.0, 0.0, 0.0, 1294.0, 0.0, 0.0, 3939.0, 0.0, 0.0, 10962.0, 0.0, 0.0, 0.0, 22283.0, 0.0, 0.0, 971186.0, 0.0, 0.0, 22255.0, 0.0, 0.0, 10786.0, 0.0, 0.0, 4006.0, 0.0, 0.0, 0.0, 1291.0, 0.0, 0.0, 154.0, 0.0, 0.0, 95.0, 0.0, 0.0, 31.0, 0.0, 0.0, 27.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.370246410369873e-07, -6.183981895446777e-07, -5.997717380523682e-07, -5.811452865600586e-07, -5.62518835067749e-07, -5.438923835754395e-07, -5.252659320831299e-07, -5.066394805908203e-07, -4.880130290985107e-07, -4.6938657760620117e-07, -4.507601261138916e-07, -4.3213367462158203e-07, -4.1350722312927246e-07, -3.948807716369629e-07, -3.762543201446533e-07, -3.5762786865234375e-07, -3.390014171600342e-07, -3.203749656677246e-07, -3.0174851417541504e-07, -2.8312206268310547e-07, -2.644956111907959e-07, -2.4586915969848633e-07, -2.2724270820617676e-07, -2.086162567138672e-07, -1.8998980522155762e-07, -1.7136335372924805e-07, -1.5273690223693848e-07, -1.341104507446289e-07, -1.1548399925231934e-07, -9.685754776000977e-08, -7.82310962677002e-08, -5.960464477539063e-08, -4.0978193283081055e-08, -2.2351741790771484e-08, -3.725290298461914e-09, 1.4901161193847656e-08, 3.3527612686157227e-08, 5.21540641784668e-08, 7.078051567077637e-08, 8.940696716308594e-08, 1.0803341865539551e-07, 1.2665987014770508e-07, 1.4528632164001465e-07, 1.6391277313232422e-07, 1.825392246246338e-07, 2.0116567611694336e-07, 2.1979212760925293e-07, 2.384185791015625e-07, 2.5704503059387207e-07, 2.7567148208618164e-07, 2.942979335784912e-07, 3.129243850708008e-07, 3.3155083656311035e-07, 3.501772880554199e-07, 3.688037395477295e-07, 3.8743019104003906e-07, 4.0605664253234863e-07, 4.246830940246582e-07, 4.4330954551696777e-07, 4.6193599700927734e-07, 4.805624485015869e-07, 4.991888999938965e-07, 5.178153514862061e-07, 5.364418029785156e-07]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 24.0, 0.0, 0.0, 60.0, 0.0, 0.0, 0.0, 186.0, 0.0, 0.0, 363.0, 0.0, 0.0, 815.0, 0.0, 0.0, 0.0, 2363.0, 0.0, 0.0, 10727.0, 0.0, 0.0, 32616.0, 0.0, 0.0, 0.0, 954257.0, 0.0, 0.0, 32623.0, 0.0, 0.0, 0.0, 10705.0, 0.0, 0.0, 2392.0, 0.0, 0.0, 838.0, 0.0, 0.0, 0.0, 334.0, 0.0, 0.0, 175.0, 0.0, 0.0, 50.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 14.0, 0.0, 0.0, 6.0], "bins": [-5.364418029785156e-07, -5.187466740608215e-07, -5.010515451431274e-07, -4.833564162254333e-07, -4.6566128730773926e-07, -4.4796615839004517e-07, -4.302710294723511e-07, -4.12575900554657e-07, -3.948807716369629e-07, -3.771856427192688e-07, -3.594905138015747e-07, -3.417953848838806e-07, -3.241002559661865e-07, -3.0640512704849243e-07, -2.8870999813079834e-07, -2.7101486921310425e-07, -2.5331974029541016e-07, -2.3562461137771606e-07, -2.1792948246002197e-07, -2.0023435354232788e-07, -1.825392246246338e-07, -1.648440957069397e-07, -1.471489667892456e-07, -1.2945383787155151e-07, -1.1175870895385742e-07, -9.406358003616333e-08, -7.636845111846924e-08, -5.8673322200775146e-08, -4.0978193283081055e-08, -2.3283064365386963e-08, -5.587935447692871e-09, 1.210719347000122e-08, 2.9802322387695312e-08, 4.7497451305389404e-08, 6.51925802230835e-08, 8.288770914077759e-08, 1.0058283805847168e-07, 1.1827796697616577e-07, 1.3597309589385986e-07, 1.5366822481155396e-07, 1.7136335372924805e-07, 1.8905848264694214e-07, 2.0675361156463623e-07, 2.2444874048233032e-07, 2.421438694000244e-07, 2.598389983177185e-07, 2.775341272354126e-07, 2.952292561531067e-07, 3.129243850708008e-07, 3.3061951398849487e-07, 3.4831464290618896e-07, 3.6600977182388306e-07, 3.8370490074157715e-07, 4.0140002965927124e-07, 4.1909515857696533e-07, 4.367902874946594e-07, 4.544854164123535e-07, 4.721805453300476e-07, 4.898756742477417e-07, 5.075708031654358e-07, 5.252659320831299e-07, 5.42961061000824e-07, 5.606561899185181e-07, 5.783513188362122e-07, 5.960464477539062e-07]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 877.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 7.0, 3.0, 9.0, 12.0, 12.0, 24.0, 19.0, 21.0, 33.0, 44.0, 55.0, 64.0, 77.0, 85.0, 87.0, 65.0, 74.0, 67.0, 46.0, 44.0, 25.0, 22.0, 14.0, 18.0, 16.0, 11.0, 10.0, 6.0, 8.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5202499525912572e-06, -1.4648586557086674e-06, -1.4094673588260775e-06, -1.35407594825665e-06, -1.2986846513740602e-06, -1.2432933544914704e-06, -1.1879020576088806e-06, -1.1325107607262908e-06, -1.0771193501568632e-06, -1.0217280532742734e-06, -9.663367563916836e-07, -9.109454026656749e-07, -8.555540489396662e-07, -8.001627520570764e-07, -7.447714551744866e-07, -6.893801014484779e-07, -6.339888045658881e-07, -5.785975076832983e-07, -5.232061539572896e-07, -4.6781485707469983e-07, -4.1242350334869116e-07, -3.5703220646610134e-07, -3.016408811618021e-07, -2.4624955585750286e-07, -1.908582305532036e-07, -1.3546690524890437e-07, -8.007558705003248e-08, -2.4684268851160596e-08, 3.070705645313865e-08, 8.609836754658318e-08, 1.4148969285088242e-07, 1.9688101815518166e-07, 2.522723434594809e-07, 3.0766366876378015e-07, 3.630549940680794e-07, 4.184462909506692e-07, 4.738376446766779e-07, 5.292289415592677e-07, 5.846202384418575e-07, 6.400115921678662e-07, 6.954029458938749e-07, 7.507942427764647e-07, 8.061855965024733e-07, 8.615768933850632e-07, 9.169682471110718e-07, 9.723595439936616e-07, 1.0277508408762515e-06, 1.083142251445679e-06, 1.138533434641431e-06, 1.193924731524021e-06, 1.2493160284066107e-06, 1.3047074389760382e-06, 1.360098735858628e-06, 1.4154900327412179e-06, 1.4708813296238077e-06, 1.5262726265063975e-06, 1.581664037075825e-06, 1.6370553339584148e-06, 1.6924466308410047e-06, 1.7478380414104322e-06, 1.803229338293022e-06, 1.8586206351756118e-06, 1.9140120457450394e-06, 1.9694032289407915e-06, 2.024794639510219e-06]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 7.0, 6.0, 9.0, 13.0, 8.0, 12.0, 11.0, 18.0, 20.0, 20.0, 34.0, 36.0, 25.0, 35.0, 37.0, 35.0, 29.0, 47.0, 40.0, 45.0, 43.0, 39.0, 46.0, 44.0, 36.0, 49.0, 27.0, 29.0, 29.0, 21.0, 26.0, 18.0, 13.0, 23.0, 16.0, 13.0, 13.0, 11.0, 6.0, 5.0, 2.0, 3.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1083533308919868e-06, -1.067708694790781e-06, -1.0270640586895752e-06, -9.864193089015316e-07, -9.457746728003258e-07, -9.0513003669912e-07, -8.644854005979141e-07, -8.238407644967083e-07, -7.831960715520836e-07, -7.425514354508778e-07, -7.019067425062531e-07, -6.612621064050472e-07, -6.206174703038414e-07, -5.799727773592167e-07, -5.393281412580109e-07, -4.986834483133862e-07, -4.5803881221218035e-07, -4.173941476892651e-07, -3.767494831663498e-07, -3.36104847065144e-07, -2.954601825422287e-07, -2.5481551801931346e-07, -2.1417088191810763e-07, -1.7352621739519236e-07, -1.328815528722771e-07, -9.223689545478919e-08, -5.1592238037301286e-08, -1.0947587725240737e-08, 2.9697076797674526e-08, 7.034174132058979e-08, 1.1098637742179562e-07, 1.516310419447109e-07, 1.9227559278078843e-07, 2.329202573037037e-07, 2.7356492182661896e-07, 3.142095579278248e-07, 3.5485422245074005e-07, 3.954988869736553e-07, 4.3614352307486115e-07, 4.767881875977764e-07, 5.174328521206917e-07, 5.580774882218975e-07, 5.987221811665222e-07, 6.39366817267728e-07, 6.800114533689339e-07, 7.206561463135586e-07, 7.613007824147644e-07, 8.019454753593891e-07, 8.425901114605949e-07, 8.832347475618008e-07, 9.238794405064255e-07, 9.645241334510501e-07, 1.005168769552256e-06, 1.0458134056534618e-06, 1.0864580417546676e-06, 1.1271026778558735e-06, 1.1677473139570793e-06, 1.2083919500582851e-06, 1.249036586159491e-06, 1.2896812222606968e-06, 1.3303259720487404e-06, 1.3709706081499462e-06, 1.411615244251152e-06, 1.4522598803523579e-06, 1.4929046301404014e-06]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 4.0, 6.0, 9.0, 7.0, 16.0, 0.0, 22.0, 36.0, 53.0, 77.0, 102.0, 146.0, 225.0, 333.0, 0.0, 518.0, 772.0, 1296.0, 1999.0, 3328.0, 5507.0, 9482.0, 16227.0, 0.0, 28890.0, 52986.0, 103295.0, 228149.0, 747591.0, 1781447.0, 756827.0, 237505.0, 0.0, 103937.0, 51748.0, 27272.0, 14529.0, 8200.0, 4667.0, 2827.0, 1627.0, 0.0, 988.0, 631.0, 394.0, 247.0, 151.0, 81.0, 51.0, 37.0, 0.0, 25.0, 17.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-06, -1.7350539565086365e-06, -1.6819685697555542e-06, -1.628883183002472e-06, -1.5757977962493896e-06, -1.5227124094963074e-06, -1.469627022743225e-06, -1.4165416359901428e-06, -1.3634562492370605e-06, -1.3103708624839783e-06, -1.257285475730896e-06, -1.2042000889778137e-06, -1.1511147022247314e-06, -1.0980293154716492e-06, -1.044943928718567e-06, -9.918585419654846e-07, -9.387731552124023e-07, -8.856877684593201e-07, -8.326023817062378e-07, -7.795169949531555e-07, -7.264316082000732e-07, -6.73346221446991e-07, -6.202608346939087e-07, -5.671754479408264e-07, -5.140900611877441e-07, -4.6100467443466187e-07, -4.079192876815796e-07, -3.548339009284973e-07, -3.0174851417541504e-07, -2.4866312742233276e-07, -1.955777406692505e-07, -1.424923539161682e-07, -8.940696716308594e-08, -3.632158041000366e-08, 1.6763806343078613e-08, 6.984919309616089e-08, 1.2293457984924316e-07, 1.7601996660232544e-07, 2.2910535335540771e-07, 2.8219074010849e-07, 3.3527612686157227e-07, 3.8836151361465454e-07, 4.414469003677368e-07, 4.945322871208191e-07, 5.476176738739014e-07, 6.007030606269836e-07, 6.537884473800659e-07, 7.068738341331482e-07, 7.599592208862305e-07, 8.130446076393127e-07, 8.66129994392395e-07, 9.192153811454773e-07, 9.723007678985596e-07, 1.0253861546516418e-06, 1.0784715414047241e-06, 1.1315569281578064e-06, 1.1846423149108887e-06, 1.237727701663971e-06, 1.2908130884170532e-06, 1.3438984751701355e-06, 1.3969838619232178e-06, 1.4500692486763e-06, 1.5031546354293823e-06, 1.5562400221824646e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 6.0, 0.0, 0.0, 6.0, 0.0, 10.0, 0.0, 0.0, 14.0, 0.0, 19.0, 0.0, 0.0, 37.0, 0.0, 44.0, 0.0, 0.0, 67.0, 0.0, 0.0, 70.0, 0.0, 85.0, 0.0, 0.0, 103.0, 0.0, 106.0, 0.0, 0.0, 99.0, 0.0, 84.0, 0.0, 0.0, 67.0, 0.0, 63.0, 0.0, 0.0, 47.0, 0.0, 0.0, 32.0, 0.0, 26.0, 0.0, 0.0, 17.0, 0.0, 8.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.152557373046875e-07, -6.919726729393005e-07, -6.686896085739136e-07, -6.454065442085266e-07, -6.221234798431396e-07, -5.988404154777527e-07, -5.755573511123657e-07, -5.522742867469788e-07, -5.289912223815918e-07, -5.057081580162048e-07, -4.824250936508179e-07, -4.591420292854309e-07, -4.3585896492004395e-07, -4.12575900554657e-07, -3.8929283618927e-07, -3.6600977182388306e-07, -3.427267074584961e-07, -3.1944364309310913e-07, -2.9616057872772217e-07, -2.728775143623352e-07, -2.4959444999694824e-07, -2.2631138563156128e-07, -2.0302832126617432e-07, -1.7974525690078735e-07, -1.564621925354004e-07, -1.3317912817001343e-07, -1.0989606380462646e-07, -8.66129994392395e-08, -6.332993507385254e-08, -4.0046870708465576e-08, -1.6763806343078613e-08, 6.51925802230835e-09, 2.9802322387695312e-08, 5.3085386753082275e-08, 7.636845111846924e-08, 9.96515154838562e-08, 1.2293457984924316e-07, 1.4621764421463013e-07, 1.695007085800171e-07, 1.9278377294540405e-07, 2.1606683731079102e-07, 2.39349901676178e-07, 2.6263296604156494e-07, 2.859160304069519e-07, 3.0919909477233887e-07, 3.3248215913772583e-07, 3.557652235031128e-07, 3.7904828786849976e-07, 4.023313522338867e-07, 4.256144165992737e-07, 4.4889748096466064e-07, 4.721805453300476e-07, 4.954636096954346e-07, 5.187466740608215e-07, 5.420297384262085e-07, 5.653128027915955e-07, 5.885958671569824e-07, 6.118789315223694e-07, 6.351619958877563e-07, 6.584450602531433e-07, 6.817281246185303e-07, 7.050111889839172e-07, 7.282942533493042e-07, 7.515773177146912e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 8.0, 23.0, 0.0, 30.0, 55.0, 122.0, 0.0, 198.0, 376.0, 689.0, 0.0, 1242.0, 2347.0, 4282.0, 0.0, 8707.0, 16134.0, 32642.0, 0.0, 65685.0, 137400.0, 313343.0, 0.0, 662006.0, 1702481.0, 662917.0, 0.0, 312883.0, 137975.0, 66285.0, 0.0, 32613.0, 16263.0, 8485.0, 0.0, 4272.0, 2215.0, 1182.0, 0.0, 646.0, 341.0, 195.0, 0.0, 101.0, 67.0, 34.0, 0.0, 18.0, 8.0, 15.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4454126358032227e-06, -1.4007091522216797e-06, -1.3560056686401367e-06, -1.3113021850585938e-06, -1.2665987014770508e-06, -1.2218952178955078e-06, -1.1771917343139648e-06, -1.1324882507324219e-06, -1.087784767150879e-06, -1.043081283569336e-06, -9.98377799987793e-07, -9.5367431640625e-07, -9.08970832824707e-07, -8.642673492431641e-07, -8.195638656616211e-07, -7.748603820800781e-07, -7.301568984985352e-07, -6.854534149169922e-07, -6.407499313354492e-07, -5.960464477539062e-07, -5.513429641723633e-07, -5.066394805908203e-07, -4.6193599700927734e-07, -4.172325134277344e-07, -3.725290298461914e-07, -3.2782554626464844e-07, -2.8312206268310547e-07, -2.384185791015625e-07, -1.9371509552001953e-07, -1.4901161193847656e-07, -1.043081283569336e-07, -5.960464477539063e-08, -1.4901161193847656e-08, 2.9802322387695312e-08, 7.450580596923828e-08, 1.1920928955078125e-07, 1.6391277313232422e-07, 2.086162567138672e-07, 2.5331974029541016e-07, 2.980232238769531e-07, 3.427267074584961e-07, 3.8743019104003906e-07, 4.3213367462158203e-07, 4.76837158203125e-07, 5.21540641784668e-07, 5.662441253662109e-07, 6.109476089477539e-07, 6.556510925292969e-07, 7.003545761108398e-07, 7.450580596923828e-07, 7.897615432739258e-07, 8.344650268554688e-07, 8.791685104370117e-07, 9.238719940185547e-07, 9.685754776000977e-07, 1.0132789611816406e-06, 1.0579824447631836e-06, 1.1026859283447266e-06, 1.1473894119262695e-06, 1.1920928955078125e-06, 1.2367963790893555e-06, 1.2814998626708984e-06, 1.3262033462524414e-06, 1.3709068298339844e-06]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 38.0, 0.0, 0.0, 89.0, 0.0, 0.0, 0.0, 188.0, 0.0, 0.0, 0.0, 396.0, 0.0, 0.0, 0.0, 736.0, 0.0, 0.0, 1236.0, 0.0, 0.0, 0.0, 726.0, 0.0, 0.0, 0.0, 371.0, 0.0, 0.0, 0.0, 191.0, 0.0, 0.0, 70.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.364418029785156e-07, -5.206093192100525e-07, -5.047768354415894e-07, -4.889443516731262e-07, -4.731118679046631e-07, -4.5727938413619995e-07, -4.414469003677368e-07, -4.256144165992737e-07, -4.0978193283081055e-07, -3.939494490623474e-07, -3.781169652938843e-07, -3.6228448152542114e-07, -3.46451997756958e-07, -3.3061951398849487e-07, -3.1478703022003174e-07, -2.989545464515686e-07, -2.8312206268310547e-07, -2.6728957891464233e-07, -2.514570951461792e-07, -2.3562461137771606e-07, -2.1979212760925293e-07, -2.039596438407898e-07, -1.8812716007232666e-07, -1.7229467630386353e-07, -1.564621925354004e-07, -1.4062970876693726e-07, -1.2479722499847412e-07, -1.0896474123001099e-07, -9.313225746154785e-08, -7.729977369308472e-08, -6.146728992462158e-08, -4.563480615615845e-08, -2.9802322387695312e-08, -1.3969838619232178e-08, 1.862645149230957e-09, 1.7695128917694092e-08, 3.3527612686157227e-08, 4.936009645462036e-08, 6.51925802230835e-08, 8.102506399154663e-08, 9.685754776000977e-08, 1.126900315284729e-07, 1.2852251529693604e-07, 1.4435499906539917e-07, 1.601874828338623e-07, 1.7601996660232544e-07, 1.9185245037078857e-07, 2.076849341392517e-07, 2.2351741790771484e-07, 2.39349901676178e-07, 2.551823854446411e-07, 2.7101486921310425e-07, 2.868473529815674e-07, 3.026798367500305e-07, 3.1851232051849365e-07, 3.343448042869568e-07, 3.501772880554199e-07, 3.6600977182388306e-07, 3.818422555923462e-07, 3.976747393608093e-07, 4.1350722312927246e-07, 4.293397068977356e-07, 4.4517219066619873e-07, 4.6100467443466187e-07, 4.76837158203125e-07]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 6.0, 8.0, 6.0, 8.0, 14.0, 18.0, 9.0, 17.0, 25.0, 27.0, 33.0, 42.0, 51.0, 52.0, 60.0, 58.0, 70.0, 71.0, 57.0, 59.0, 56.0, 49.0, 41.0, 35.0, 23.0, 20.0, 13.0, 10.0, 14.0, 11.0, 3.0, 6.0, 5.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.1811547437901027e-06, -1.144191173807485e-06, -1.1072274901380297e-06, -1.070263920155412e-06, -1.0333003501727944e-06, -9.963367801901768e-07, -9.593732102075592e-07, -9.224095265381038e-07, -8.854459565554862e-07, -8.484823865728686e-07, -8.115187597468321e-07, -7.745551329207956e-07, -7.37591562938178e-07, -7.006279929555603e-07, -6.636643661295238e-07, -6.267007393034874e-07, -5.897371693208697e-07, -5.527735993382521e-07, -5.158099725122156e-07, -4.788463456861791e-07, -4.418827757035615e-07, -4.0491917729923443e-07, -3.679555788949074e-07, -3.309919804905803e-07, -2.9402838208625326e-07, -2.570647836819262e-07, -2.2010118527759914e-07, -1.8313758687327208e-07, -1.4617398846894503e-07, -1.0921039006461797e-07, -7.224679166029091e-08, -3.528319325596385e-08, 1.6804051483632065e-09, 3.8644003552690265e-08, 7.560760195701732e-08, 1.1257120036134438e-07, 1.4953479876567144e-07, 1.864983971699985e-07, 2.2346199557432556e-07, 2.604255939786526e-07, 2.9738919238297967e-07, 3.3435279078730673e-07, 3.713163891916338e-07, 4.0827998759596085e-07, 4.452435860002879e-07, 4.822071559829055e-07, 5.19170782808942e-07, 5.561344096349785e-07, 5.930979796175961e-07, 6.300615496002138e-07, 6.670251764262503e-07, 7.039888032522867e-07, 7.409523732349044e-07, 7.77915943217522e-07, 8.148795700435585e-07, 8.51843196869595e-07, 8.888067668522126e-07, 9.257703368348302e-07, 9.627340205042856e-07, 9.996975904869032e-07, 1.0366611604695208e-06, 1.0736247304521385e-06, 1.110588300434756e-06, 1.1475519841042114e-06, 1.184515554086829e-06]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 3.0, 6.0, 6.0, 7.0, 5.0, 14.0, 6.0, 12.0, 14.0, 18.0, 18.0, 22.0, 25.0, 22.0, 40.0, 30.0, 20.0, 32.0, 31.0, 33.0, 41.0, 31.0, 49.0, 38.0, 41.0, 41.0, 46.0, 40.0, 33.0, 40.0, 29.0, 25.0, 35.0, 21.0, 17.0, 17.0, 20.0, 13.0, 11.0, 12.0, 11.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.379156722388871e-07, -9.085390502150403e-07, -8.791624850346125e-07, -8.497858630107658e-07, -8.204092978303379e-07, -7.910326758064912e-07, -7.616561106260633e-07, -7.322794886022166e-07, -7.029028665783699e-07, -6.735262445545231e-07, -6.441496793740953e-07, -6.147730573502486e-07, -5.853964921698207e-07, -5.56019870145974e-07, -5.266432481221273e-07, -4.972666829416994e-07, -4.678900893395621e-07, -4.385134957374248e-07, -4.0913690213528753e-07, -3.7976030853315024e-07, -3.503836865093035e-07, -3.210070929071662e-07, -2.9163049930502893e-07, -2.622538772811822e-07, -2.3287729788989964e-07, -2.0350070428776235e-07, -1.7412409647477034e-07, -1.4474750287263305e-07, -1.153709021650684e-07, -8.599430145750375e-08, -5.661770785536646e-08, -2.7241100042374455e-08, 2.1354935597628355e-09, 3.1512094267327484e-08, 6.088869497489213e-08, 9.026528857702942e-08, 1.1964189639002143e-07, 1.4901848999215872e-07, 1.78395083594296e-07, 2.0777169140728802e-07, 2.371482850094253e-07, 2.665248928224173e-07, 2.959014864245546e-07, 3.252780800266919e-07, 3.546546736288292e-07, 3.840312956526759e-07, 4.1340786083310377e-07, 4.427844828569505e-07, 4.721610764590878e-07, 5.015376700612251e-07, 5.309142920850718e-07, 5.602908572654997e-07, 5.896674792893464e-07, 6.190440444697742e-07, 6.48420666493621e-07, 6.777972885174677e-07, 7.071738536978955e-07, 7.365504757217423e-07, 7.659270409021701e-07, 7.953036629260168e-07, 8.246802281064447e-07, 8.540568501302914e-07, 8.834334721541381e-07, 9.12810037334566e-07, 9.421866593584127e-07]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 15.0, 21.0, 20.0, 34.0, 45.0, 61.0, 70.0, 110.0, 171.0, 221.0, 351.0, 523.0, 763.0, 1273.0, 2086.0, 3318.0, 5917.0, 10261.0, 19407.0, 37878.0, 81893.0, 190250.0, 529339.0, 82081.0, 38377.0, 19147.0, 10229.0, 5702.0, 3318.0, 1944.0, 1196.0, 825.0, 520.0, 345.0, 247.0, 160.0, 126.0, 81.0, 63.0, 47.0, 28.0, 24.0, 15.0, 8.0, 9.0, 7.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.9669532775878906e-06, -1.905485987663269e-06, -1.8440186977386475e-06, -1.7825514078140259e-06, -1.7210841178894043e-06, -1.6596168279647827e-06, -1.5981495380401611e-06, -1.5366822481155396e-06, -1.475214958190918e-06, -1.4137476682662964e-06, -1.3522803783416748e-06, -1.2908130884170532e-06, -1.2293457984924316e-06, -1.16787850856781e-06, -1.1064112186431885e-06, -1.044943928718567e-06, -9.834766387939453e-07, -9.220093488693237e-07, -8.605420589447021e-07, -7.990747690200806e-07, -7.37607479095459e-07, -6.761401891708374e-07, -6.146728992462158e-07, -5.532056093215942e-07, -4.917383193969727e-07, -4.302710294723511e-07, -3.688037395477295e-07, -3.073364496231079e-07, -2.4586915969848633e-07, -1.8440186977386475e-07, -1.2293457984924316e-07, -6.146728992462158e-08, 0.0, 6.146728992462158e-08, 1.2293457984924316e-07, 1.8440186977386475e-07, 2.4586915969848633e-07, 3.073364496231079e-07, 3.688037395477295e-07, 4.302710294723511e-07, 4.917383193969727e-07, 5.532056093215942e-07, 6.146728992462158e-07, 6.761401891708374e-07, 7.37607479095459e-07, 7.990747690200806e-07, 8.605420589447021e-07, 9.220093488693237e-07, 9.834766387939453e-07, 1.044943928718567e-06, 1.1064112186431885e-06, 1.16787850856781e-06, 1.2293457984924316e-06, 1.2908130884170532e-06, 1.3522803783416748e-06, 1.4137476682662964e-06, 1.475214958190918e-06, 1.5366822481155396e-06, 1.5981495380401611e-06, 1.6596168279647827e-06, 1.7210841178894043e-06, 1.7825514078140259e-06, 1.8440186977386475e-06, 1.905485987663269e-06, 1.9669532775878906e-06]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 0.0, 7.0, 0.0, 13.0, 0.0, 16.0, 0.0, 20.0, 0.0, 25.0, 0.0, 37.0, 0.0, 43.0, 0.0, 51.0, 0.0, 59.0, 0.0, 87.0, 0.0, 88.0, 0.0, 89.0, 0.0, 80.0, 0.0, 91.0, 0.0, 89.0, 0.0, 50.0, 0.0, 58.0, 0.0, 37.0, 0.0, 25.0, 0.0, 12.0, 0.0, 18.0, 0.0, 8.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 8.0, 0.0, 9.0, 15.0, 10.0, 8.0, 27.0, 10.0, 38.0, 41.0, 160.0, 66.0, 269.0, 161.0, 678.0, 527.0, 704.0, 3379.0, 4181.0, 35898.0, 956113.0, 36059.0, 4119.0, 3378.0, 716.0, 896.0, 279.0, 327.0, 104.0, 144.0, 63.0, 62.0, 27.0, 22.0, 10.0, 20.0, 1.0, 10.0, 12.0, 4.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2186508178710938e-06, -3.1301751732826233e-06, -3.041699528694153e-06, -2.9532238841056824e-06, -2.864748239517212e-06, -2.7762725949287415e-06, -2.687796950340271e-06, -2.5993213057518005e-06, -2.51084566116333e-06, -2.4223700165748596e-06, -2.333894371986389e-06, -2.2454187273979187e-06, -2.1569430828094482e-06, -2.0684674382209778e-06, -1.9799917936325073e-06, -1.8915161490440369e-06, -1.8030405044555664e-06, -1.714564859867096e-06, -1.6260892152786255e-06, -1.537613570690155e-06, -1.4491379261016846e-06, -1.3606622815132141e-06, -1.2721866369247437e-06, -1.1837109923362732e-06, -1.0952353477478027e-06, -1.0067597031593323e-06, -9.182840585708618e-07, -8.298084139823914e-07, -7.413327693939209e-07, -6.528571248054504e-07, -5.6438148021698e-07, -4.759058356285095e-07, -3.8743019104003906e-07, -2.989545464515686e-07, -2.1047890186309814e-07, -1.2200325727462769e-07, -3.3527612686157227e-08, 5.494803190231323e-08, 1.434236764907837e-07, 2.3189932107925415e-07, 3.203749656677246e-07, 4.0885061025619507e-07, 4.973262548446655e-07, 5.85801899433136e-07, 6.742775440216064e-07, 7.627531886100769e-07, 8.512288331985474e-07, 9.397044777870178e-07, 1.0281801223754883e-06, 1.1166557669639587e-06, 1.2051314115524292e-06, 1.2936070561408997e-06, 1.3820827007293701e-06, 1.4705583453178406e-06, 1.559033989906311e-06, 1.6475096344947815e-06, 1.735985279083252e-06, 1.8244609236717224e-06, 1.912936568260193e-06, 2.0014122128486633e-06, 2.089887857437134e-06, 2.1783635020256042e-06, 2.2668391466140747e-06, 2.355314791202545e-06, 2.4437904357910156e-06]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 807.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.7881393432617188e-07, -1.7229467630386353e-07, -1.6577541828155518e-07, -1.5925616025924683e-07, -1.5273690223693848e-07, -1.4621764421463013e-07, -1.3969838619232178e-07, -1.3317912817001343e-07, -1.2665987014770508e-07, -1.2014061212539673e-07, -1.1362135410308838e-07, -1.0710209608078003e-07, -1.0058283805847168e-07, -9.406358003616333e-08, -8.754432201385498e-08, -8.102506399154663e-08, -7.450580596923828e-08, -6.798654794692993e-08, -6.146728992462158e-08, -5.494803190231323e-08, -4.842877388000488e-08, -4.190951585769653e-08, -3.5390257835388184e-08, -2.8870999813079834e-08, -2.2351741790771484e-08, -1.5832483768463135e-08, -9.313225746154785e-09, -2.7939677238464355e-09, 3.725290298461914e-09, 1.0244548320770264e-08, 1.6763806343078613e-08, 2.3283064365386963e-08, 2.9802322387695312e-08, 3.632158041000366e-08, 4.284083843231201e-08, 4.936009645462036e-08, 5.587935447692871e-08, 6.239861249923706e-08, 6.891787052154541e-08, 7.543712854385376e-08, 8.195638656616211e-08, 8.847564458847046e-08, 9.499490261077881e-08, 1.0151416063308716e-07, 1.0803341865539551e-07, 1.1455267667770386e-07, 1.210719347000122e-07, 1.2759119272232056e-07, 1.341104507446289e-07, 1.4062970876693726e-07, 1.471489667892456e-07, 1.5366822481155396e-07, 1.601874828338623e-07, 1.6670674085617065e-07, 1.73225998878479e-07, 1.7974525690078735e-07, 1.862645149230957e-07, 1.9278377294540405e-07, 1.993030309677124e-07, 2.0582228899002075e-07, 2.123415470123291e-07, 2.1886080503463745e-07, 2.253800630569458e-07, 2.3189932107925415e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 9.0, 5.0, 5.0, 9.0, 14.0, 15.0, 17.0, 23.0, 26.0, 35.0, 52.0, 64.0, 53.0, 89.0, 77.0, 85.0, 67.0, 67.0, 72.0, 41.0, 38.0, 30.0, 26.0, 18.0, 10.0, 11.0, 11.0, 6.0, 4.0, 4.0, 3.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0589745897959801e-06, -1.0167534583160887e-06, -9.745324405230349e-07, -9.323113090431434e-07, -8.900901775632519e-07, -8.478690460833604e-07, -8.056479714468878e-07, -7.634268968104152e-07, -7.212057653305237e-07, -6.789846338506322e-07, -6.367635592141596e-07, -5.94542484577687e-07, -5.523213530977955e-07, -5.10100221617904e-07, -4.678791469814314e-07, -4.2565804392324935e-07, -3.834369408650673e-07, -3.4121583780688525e-07, -2.989947347487032e-07, -2.5677363169052114e-07, -2.145525286323391e-07, -1.7233142557415704e-07, -1.3011032251597499e-07, -8.788921945779293e-08, -4.566811639961088e-08, -3.4470133414288284e-09, 3.8774089716753224e-08, 8.099519277493528e-08, 1.2321629583311733e-07, 1.6543739889129938e-07, 2.0765850194948143e-07, 2.498796050076635e-07, 2.9210070806584554e-07, 3.343218111240276e-07, 3.7654291418220964e-07, 4.187640172403917e-07, 4.6098512029857375e-07, 5.032062517784652e-07, 5.454273264149379e-07, 5.876484010514105e-07, 6.29869532531302e-07, 6.720906640111934e-07, 7.143117386476661e-07, 7.565328132841387e-07, 7.987539447640302e-07, 8.409750762439216e-07, 8.831961508803943e-07, 9.254172255168669e-07, 9.676383569967584e-07, 1.0098594884766499e-06, 1.0520805062697036e-06, 1.094301637749595e-06, 1.1365227692294866e-06, 1.178743900709378e-06, 1.2209650321892696e-06, 1.2631860499823233e-06, 1.3054071814622148e-06, 1.3476283129421063e-06, 1.38984933073516e-06, 1.4320704622150515e-06, 1.474291593694943e-06, 1.5165127251748345e-06, 1.558733856654726e-06, 1.6009548744477797e-06, 1.6431760059276712e-06]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 7.0, 2.0, 7.0, 4.0, 10.0, 3.0, 9.0, 12.0, 12.0, 9.0, 19.0, 19.0, 15.0, 24.0, 29.0, 32.0, 31.0, 24.0, 32.0, 28.0, 30.0, 43.0, 37.0, 35.0, 51.0, 33.0, 48.0, 38.0, 46.0, 31.0, 38.0, 37.0, 24.0, 34.0, 24.0, 21.0, 13.0, 21.0, 12.0, 16.0, 11.0, 8.0, 13.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.191335266223177e-07, -8.905509503165376e-07, -8.619684308541764e-07, -8.333858545483963e-07, -8.048033350860351e-07, -7.76220758780255e-07, -7.476381824744749e-07, -7.190556061686948e-07, -6.904730867063336e-07, -6.618905104005535e-07, -6.333079909381922e-07, -6.047254146324121e-07, -5.76142838326632e-07, -5.475603188642708e-07, -5.189777425584907e-07, -4.903952230961295e-07, -4.618126467903494e-07, -4.3323009890627873e-07, -4.0464755102220806e-07, -3.7606497471642797e-07, -3.474824268323573e-07, -3.1889987894828664e-07, -2.9031730264250655e-07, -2.617347547584359e-07, -2.3315220687436522e-07, -2.0456965899029456e-07, -1.7598709689536918e-07, -1.474045348004438e-07, -1.1882198691637313e-07, -9.023943903230247e-08, -6.165687693737709e-08, -3.307431484245171e-08, -4.4917101149621885e-09, 2.4090844874535833e-08, 5.2673399864033854e-08, 8.125595485353188e-08, 1.098385098430299e-07, 1.3842105772710056e-07, 1.6700361982202594e-07, 1.9558618191695132e-07, 2.2416872980102198e-07, 2.5275127768509265e-07, 2.813338255691633e-07, 3.099164018749434e-07, 3.3849894975901407e-07, 3.6708149764308473e-07, 3.956640739488648e-07, 4.242466218329355e-07, 4.5282916971700615e-07, 4.814117460227862e-07, 5.099942654851475e-07, 5.385768417909276e-07, 5.671594180967077e-07, 5.957419375590689e-07, 6.24324513864849e-07, 6.529070333272102e-07, 6.814896096329903e-07, 7.100721859387704e-07, 7.386547054011317e-07, 7.672372817069117e-07, 7.95819801169273e-07, 8.244023774750531e-07, 8.529849537808332e-07, 8.815675300866133e-07, 9.101500495489745e-07]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 0.0, 17.0, 11.0, 23.0, 38.0, 58.0, 84.0, 114.0, 0.0, 187.0, 306.0, 485.0, 725.0, 1203.0, 1957.0, 3213.0, 0.0, 5390.0, 9466.0, 16576.0, 30240.0, 55924.0, 103040.0, 178547.0, 0.0, 233615.0, 178373.0, 102579.0, 55885.0, 30282.0, 16839.0, 9463.0, 0.0, 5511.0, 3205.0, 1924.0, 1206.0, 767.0, 471.0, 300.0, 0.0, 197.0, 104.0, 73.0, 65.0, 37.0, 24.0, 10.0, 0.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.6689300537109375e-06, -1.6167759895324707e-06, -1.564621925354004e-06, -1.5124678611755371e-06, -1.4603137969970703e-06, -1.4081597328186035e-06, -1.3560056686401367e-06, -1.30385160446167e-06, -1.2516975402832031e-06, -1.1995434761047363e-06, -1.1473894119262695e-06, -1.0952353477478027e-06, -1.043081283569336e-06, -9.909272193908691e-07, -9.387731552124023e-07, -8.866190910339355e-07, -8.344650268554688e-07, -7.82310962677002e-07, -7.301568984985352e-07, -6.780028343200684e-07, -6.258487701416016e-07, -5.736947059631348e-07, -5.21540641784668e-07, -4.6938657760620117e-07, -4.172325134277344e-07, -3.650784492492676e-07, -3.129243850708008e-07, -2.60770320892334e-07, -2.086162567138672e-07, -1.564621925354004e-07, -1.043081283569336e-07, -5.21540641784668e-08, 0.0, 5.21540641784668e-08, 1.043081283569336e-07, 1.564621925354004e-07, 2.086162567138672e-07, 2.60770320892334e-07, 3.129243850708008e-07, 3.650784492492676e-07, 4.172325134277344e-07, 4.6938657760620117e-07, 5.21540641784668e-07, 5.736947059631348e-07, 6.258487701416016e-07, 6.780028343200684e-07, 7.301568984985352e-07, 7.82310962677002e-07, 8.344650268554688e-07, 8.866190910339355e-07, 9.387731552124023e-07, 9.909272193908691e-07, 1.043081283569336e-06, 1.0952353477478027e-06, 1.1473894119262695e-06, 1.1995434761047363e-06, 1.2516975402832031e-06, 1.30385160446167e-06, 1.3560056686401367e-06, 1.4081597328186035e-06, 1.4603137969970703e-06, 1.5124678611755371e-06, 1.564621925354004e-06, 1.6167759895324707e-06, 1.6689300537109375e-06]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 5.0, 0.0, 10.0, 0.0, 0.0, 14.0, 0.0, 17.0, 0.0, 32.0, 0.0, 0.0, 43.0, 0.0, 49.0, 0.0, 0.0, 81.0, 0.0, 79.0, 0.0, 99.0, 0.0, 0.0, 122.0, 0.0, 122.0, 0.0, 83.0, 0.0, 0.0, 84.0, 0.0, 66.0, 0.0, 0.0, 41.0, 0.0, 24.0, 0.0, 19.0, 0.0, 0.0, 12.0, 0.0, 3.0, 0.0, 5.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.093193173408508e-07, -7.841736078262329e-07, -7.59027898311615e-07, -7.338821887969971e-07, -7.087364792823792e-07, -6.835907697677612e-07, -6.584450602531433e-07, -6.332993507385254e-07, -6.081536412239075e-07, -5.830079317092896e-07, -5.578622221946716e-07, -5.327165126800537e-07, -5.075708031654358e-07, -4.824250936508179e-07, -4.5727938413619995e-07, -4.3213367462158203e-07, -4.069879651069641e-07, -3.818422555923462e-07, -3.5669654607772827e-07, -3.3155083656311035e-07, -3.0640512704849243e-07, -2.812594175338745e-07, -2.561137080192566e-07, -2.3096799850463867e-07, -2.0582228899002075e-07, -1.8067657947540283e-07, -1.555308699607849e-07, -1.30385160446167e-07, -1.0523945093154907e-07, -8.009374141693115e-08, -5.494803190231323e-08, -2.9802322387695312e-08, -4.6566128730773926e-09, 2.0489096641540527e-08, 4.563480615615845e-08, 7.078051567077637e-08, 9.592622518539429e-08, 1.210719347000122e-07, 1.4621764421463013e-07, 1.7136335372924805e-07, 1.9650906324386597e-07, 2.2165477275848389e-07, 2.468004822731018e-07, 2.7194619178771973e-07, 2.9709190130233765e-07, 3.2223761081695557e-07, 3.473833203315735e-07, 3.725290298461914e-07, 3.976747393608093e-07, 4.2282044887542725e-07, 4.4796615839004517e-07, 4.731118679046631e-07, 4.98257577419281e-07, 5.234032869338989e-07, 5.485489964485168e-07, 5.736947059631348e-07, 5.988404154777527e-07, 6.239861249923706e-07, 6.491318345069885e-07, 6.742775440216064e-07, 6.994232535362244e-07, 7.245689630508423e-07, 7.497146725654602e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 8.0, 2.0, 0.0, 6.0, 13.0, 18.0, 28.0, 38.0, 0.0, 63.0, 120.0, 228.0, 301.0, 521.0, 792.0, 0.0, 1320.0, 2234.0, 3692.0, 6688.0, 11250.0, 0.0, 19553.0, 33436.0, 59013.0, 102384.0, 165107.0, 0.0, 235100.0, 165469.0, 102189.0, 58385.0, 33958.0, 19395.0, 0.0, 11072.0, 6589.0, 3663.0, 2269.0, 1457.0, 0.0, 778.0, 547.0, 335.0, 215.0, 126.0, 68.0, 0.0, 54.0, 34.0, 13.0, 19.0, 7.0, 0.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.559033989906311e-06, -1.5087425708770752e-06, -1.4584511518478394e-06, -1.4081597328186035e-06, -1.3578683137893677e-06, -1.3075768947601318e-06, -1.257285475730896e-06, -1.2069940567016602e-06, -1.1567026376724243e-06, -1.1064112186431885e-06, -1.0561197996139526e-06, -1.0058283805847168e-06, -9.55536961555481e-07, -9.052455425262451e-07, -8.549541234970093e-07, -8.046627044677734e-07, -7.543712854385376e-07, -7.040798664093018e-07, -6.537884473800659e-07, -6.034970283508301e-07, -5.532056093215942e-07, -5.029141902923584e-07, -4.5262277126312256e-07, -4.023313522338867e-07, -3.520399332046509e-07, -3.0174851417541504e-07, -2.514570951461792e-07, -2.0116567611694336e-07, -1.5087425708770752e-07, -1.0058283805847168e-07, -5.029141902923584e-08, 0.0, 5.029141902923584e-08, 1.0058283805847168e-07, 1.5087425708770752e-07, 2.0116567611694336e-07, 2.514570951461792e-07, 3.0174851417541504e-07, 3.520399332046509e-07, 4.023313522338867e-07, 4.5262277126312256e-07, 5.029141902923584e-07, 5.532056093215942e-07, 6.034970283508301e-07, 6.537884473800659e-07, 7.040798664093018e-07, 7.543712854385376e-07, 8.046627044677734e-07, 8.549541234970093e-07, 9.052455425262451e-07, 9.55536961555481e-07, 1.0058283805847168e-06, 1.0561197996139526e-06, 1.1064112186431885e-06, 1.1567026376724243e-06, 1.2069940567016602e-06, 1.257285475730896e-06, 1.3075768947601318e-06, 1.3578683137893677e-06, 1.4081597328186035e-06, 1.4584511518478394e-06, 1.5087425708770752e-06, 1.559033989906311e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 8.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 51.0, 0.0, 0.0, 72.0, 0.0, 0.0, 124.0, 0.0, 0.0, 0.0, 134.0, 0.0, 0.0, 145.0, 0.0, 0.0, 0.0, 136.0, 0.0, 0.0, 130.0, 0.0, 0.0, 85.0, 0.0, 0.0, 0.0, 54.0, 0.0, 0.0, 26.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.783513188362122e-07, -5.606561899185181e-07, -5.42961061000824e-07, -5.252659320831299e-07, -5.075708031654358e-07, -4.898756742477417e-07, -4.721805453300476e-07, -4.544854164123535e-07, -4.367902874946594e-07, -4.1909515857696533e-07, -4.0140002965927124e-07, -3.8370490074157715e-07, -3.6600977182388306e-07, -3.4831464290618896e-07, -3.3061951398849487e-07, -3.129243850708008e-07, -2.952292561531067e-07, -2.775341272354126e-07, -2.598389983177185e-07, -2.421438694000244e-07, -2.2444874048233032e-07, -2.0675361156463623e-07, -1.8905848264694214e-07, -1.7136335372924805e-07, -1.5366822481155396e-07, -1.3597309589385986e-07, -1.1827796697616577e-07, -1.0058283805847168e-07, -8.288770914077759e-08, -6.51925802230835e-08, -4.7497451305389404e-08, -2.9802322387695312e-08, -1.210719347000122e-08, 5.587935447692871e-09, 2.3283064365386963e-08, 4.0978193283081055e-08, 5.8673322200775146e-08, 7.636845111846924e-08, 9.406358003616333e-08, 1.1175870895385742e-07, 1.2945383787155151e-07, 1.471489667892456e-07, 1.648440957069397e-07, 1.825392246246338e-07, 2.0023435354232788e-07, 2.1792948246002197e-07, 2.3562461137771606e-07, 2.5331974029541016e-07, 2.7101486921310425e-07, 2.8870999813079834e-07, 3.0640512704849243e-07, 3.241002559661865e-07, 3.417953848838806e-07, 3.594905138015747e-07, 3.771856427192688e-07, 3.948807716369629e-07, 4.12575900554657e-07, 4.302710294723511e-07, 4.4796615839004517e-07, 4.6566128730773926e-07, 4.833564162254333e-07, 5.010515451431274e-07, 5.187466740608215e-07, 5.364418029785156e-07]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 12.0, 12.0, 9.0, 17.0, 11.0, 21.0, 31.0, 41.0, 52.0, 60.0, 77.0, 104.0, 107.0, 98.0, 67.0, 60.0, 49.0, 34.0, 28.0, 31.0, 15.0, 14.0, 11.0, 7.0, 6.0, 10.0, 2.0, 6.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2852927966378047e-06, -1.2400645346133388e-06, -1.194836158902035e-06, -1.1496078968775691e-06, -1.1043796348531032e-06, -1.0591513728286372e-06, -1.0139229971173336e-06, -9.686947350928676e-07, -9.234664162249828e-07, -8.78238097357098e-07, -8.330098353326321e-07, -7.877815164647473e-07, -7.425531975968624e-07, -6.973249355723965e-07, -6.520966167045117e-07, -6.068682978366269e-07, -5.616400358121609e-07, -5.164117169442761e-07, -4.711834549198102e-07, -4.2595513605192536e-07, -3.8072684560575e-07, -3.354985551595746e-07, -2.902702362916898e-07, -2.450419458455144e-07, -1.9981365539933904e-07, -1.5458536495316366e-07, -1.0935706029613357e-07, -6.412875563910347e-08, -1.8900465192928095e-08, 2.6327825253247283e-08, 7.155614412113209e-08, 1.1678443456730747e-07, 1.6201272501348285e-07, 2.0724101545965823e-07, 2.524693059058336e-07, 2.976976247737184e-07, 3.429259152198938e-07, 3.881542056660692e-07, 4.33382524533954e-07, 4.786107865584199e-07, 5.238391054263047e-07, 5.690674242941895e-07, 6.142956863186555e-07, 6.595240051865403e-07, 7.047523240544251e-07, 7.499805860788911e-07, 7.952089049467759e-07, 8.404372238146607e-07, 8.856654858391266e-07, 9.308938047070114e-07, 9.761221235748962e-07, 1.0213503855993622e-06, 1.0665786476238281e-06, 1.1118070233351318e-06, 1.1570352853595978e-06, 1.2022635473840637e-06, 1.2474918094085297e-06, 1.2927200714329956e-06, 1.3379484471442993e-06, 1.3831767091687652e-06, 1.4284049711932312e-06, 1.4736333469045348e-06, 1.5188616089290008e-06, 1.5640898709534667e-06, 1.6093182466647704e-06]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 7.0, 6.0, 9.0, 16.0, 14.0, 23.0, 18.0, 22.0, 31.0, 30.0, 40.0, 23.0, 34.0, 43.0, 39.0, 32.0, 36.0, 63.0, 51.0, 48.0, 43.0, 44.0, 41.0, 46.0, 30.0, 23.0, 22.0, 27.0, 16.0, 37.0, 13.0, 11.0, 14.0, 7.0, 7.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.888183285511332e-07, -9.595192977940314e-07, -9.302203807237674e-07, -9.009213499666657e-07, -8.716223760529829e-07, -8.423234021393e-07, -8.130244282256172e-07, -7.837254543119343e-07, -7.544264803982514e-07, -7.251275064845686e-07, -6.958285325708857e-07, -6.665295586572029e-07, -6.372305279001012e-07, -6.079315539864183e-07, -5.786325800727354e-07, -5.493336061590526e-07, -5.200346322453697e-07, -4.907356583316869e-07, -4.614366559962946e-07, -4.321376820826117e-07, -4.0283870816892886e-07, -3.7353970583353657e-07, -3.442407319198537e-07, -3.1494175800617086e-07, -2.8564272724906914e-07, -2.563437533353863e-07, -2.270447652108487e-07, -1.9774577708631114e-07, -1.6844680317262828e-07, -1.391478150480907e-07, -1.0984882692355313e-07, -8.054985300987028e-08, -5.125087909618742e-08, -2.1951896300720364e-08, 7.347086494746691e-09, 3.6646071066570585e-08, 6.59450520856808e-08, 9.524403310479101e-08, 1.245430212293286e-07, 1.5384199514301145e-07, 1.8314098326754902e-07, 2.124399713920866e-07, 2.4173894530576945e-07, 2.7103794764116174e-07, 3.003369215548446e-07, 3.2963589546852745e-07, 3.589348693822103e-07, 3.8823384329589317e-07, 4.1753284563128545e-07, 4.468318195449683e-07, 4.761308218803606e-07, 5.054297957940435e-07, 5.347287697077263e-07, 5.640277436214092e-07, 5.93326717535092e-07, 6.226257482921937e-07, 6.519247222058766e-07, 6.812236961195595e-07, 7.105226700332423e-07, 7.398216439469252e-07, 7.691206747040269e-07, 7.984196486177098e-07, 8.277186225313926e-07, 8.570175964450755e-07, 8.863165703587583e-07]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 6.0, 6.0, 7.0, 19.0, 15.0, 23.0, 23.0, 35.0, 36.0, 54.0, 53.0, 67.0, 62.0, 83.0, 73.0, 102.0, 131.0, 244.0, 520729.0, 1498.0, 203.0, 110.0, 90.0, 94.0, 87.0, 89.0, 49.0, 55.0, 47.0, 29.0, 40.0, 22.0, 24.0, 14.0, 12.0, 9.0, 5.0, 6.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3836129912524484e-05, -2.3132000933401287e-05, -2.242787195427809e-05, -2.172374297515489e-05, -2.1019615815021098e-05, -2.03154868358979e-05, -1.9611357856774703e-05, -1.8907228877651505e-05, -1.8203099898528308e-05, -1.749897091940511e-05, -1.6794841940281913e-05, -1.6090712961158715e-05, -1.5386583982035518e-05, -1.4682455912407022e-05, -1.3978327842778526e-05, -1.3274198863655329e-05, -1.2570069884532131e-05, -1.1865940905408934e-05, -1.1161811926285736e-05, -1.045768385665724e-05, -9.753554877534043e-06, -9.049425898410846e-06, -8.34529782878235e-06, -7.641168849659152e-06, -6.937039870535955e-06, -6.232910891412757e-06, -5.528782367036911e-06, -4.824653842661064e-06, -4.120524863537867e-06, -3.4163961117883446e-06, -2.7122673600388225e-06, -2.008138835662976e-06, -1.304011675529182e-06, -5.998829237796599e-07, 1.0424582796986215e-07, 8.083745797193842e-07, 1.5125033314689063e-06, 2.2166320832184283e-06, 2.9207608349679504e-06, 3.624889359343797e-06, 4.3290183384669945e-06, 5.033147317590192e-06, 5.7372758419660386e-06, 6.441404366341885e-06, 7.145533345465083e-06, 7.84966232458828e-06, 8.553790394216776e-06, 9.257919373339973e-06, 9.962048352463171e-06, 1.0666177331586368e-05, 1.1370306310709566e-05, 1.2074434380338062e-05, 1.2778563359461259e-05, 1.3482692338584457e-05, 1.4186820408212952e-05, 1.489094938733615e-05, 1.5595078366459347e-05, 1.6299207345582545e-05, 1.7003336324705742e-05, 1.770746530382894e-05, 1.8411592463962734e-05, 1.911572144308593e-05, 1.981985042220913e-05, 2.0523979401332326e-05, 2.1228108380455524e-05]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 7.0, 6.0, 15.0, 13.0, 18.0, 22.0, 18.0, 31.0, 27.0, 44.0, 26.0, 31.0, 38.0, 46.0, 31.0, 33.0, 1077.0, 62.0, 42.0, 46.0, 45.0, 42.0, 39.0, 43.0, 15.0, 33.0, 23.0, 19.0, 29.0, 22.0, 10.0, 14.0, 11.0, 5.0, 7.0, 4.0, 1.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.9159618861740455e-05, -2.83007939287927e-05, -2.744197081483435e-05, -2.6583147700875998e-05, -2.5724322767928243e-05, -2.4865497834980488e-05, -2.4006674721022137e-05, -2.3147851607063785e-05, -2.228902667411603e-05, -2.1430201741168275e-05, -2.0571378627209924e-05, -1.9712555513251573e-05, -1.8853730580303818e-05, -1.7994905647356063e-05, -1.7136082533397712e-05, -1.627725941943936e-05, -1.5418434486491606e-05, -1.4559610463038553e-05, -1.37007864395855e-05, -1.2841962416132446e-05, -1.1983138392679393e-05, -1.112431436922634e-05, -1.0265490345773287e-05, -9.406666322320234e-06, -8.547842298867181e-06, -7.689018275414128e-06, -6.830194251961075e-06, -5.971370228508022e-06, -5.112546205054969e-06, -4.2537221816019155e-06, -3.3948981581488624e-06, -2.5360741346958093e-06, -1.6772519302321598e-06, -8.184279067791067e-07, 4.039611667394638e-08, 8.992201401269995e-07, 1.7580441635800526e-06, 2.6168681870331056e-06, 3.4756922104861587e-06, 4.334516233939212e-06, 5.193340257392265e-06, 6.052164280845318e-06, 6.910988304298371e-06, 7.769812327751424e-06, 8.628636351204477e-06, 9.48746037465753e-06, 1.0346284398110583e-05, 1.1205108421563637e-05, 1.206393244501669e-05, 1.2922756468469743e-05, 1.3781580491922796e-05, 1.4640404515375849e-05, 1.5499228538828902e-05, 1.6358051652787253e-05, 1.7216876585735008e-05, 1.8075701518682763e-05, 1.8934524632641114e-05, 1.9793347746599466e-05, 2.065217267954722e-05, 2.1510997612494975e-05, 2.2369820726453327e-05, 2.3228643840411678e-05, 2.4087468773359433e-05, 2.4946293706307188e-05, 2.580511682026554e-05]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 6.0, 8.0, 15.0, 4.0, 4.0, 18.0, 16.0, 26.0, 28.0, 32.0, 45.0, 54.0, 80.0, 103.0, 173.0, 237.0, 405.0, 653.0, 979.0, 1399.0, 2013.0, 2829.0, 3932.0, 5157.0, 6329.0, 8034.0, 10883.0, 19243.0, 29995964.0, 1087955.0, 39173.0, 56244.0, 5352.0, 4692.0, 1530.0, 366.0, 214.0, 207.0, 187.0, 32.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-377.75, -369.16015625, -360.5703125, -351.98046875, -343.390625, -334.80078125, -326.2109375, -317.62109375, -309.03125, -300.44140625, -291.8515625, -283.26171875, -274.671875, -266.08203125, -257.4921875, -248.90234375, -240.3125, -231.72265625, -223.1328125, -214.54296875, -205.953125, -197.36328125, -188.7734375, -180.18359375, -171.59375, -163.00390625, -154.4140625, -145.82421875, -137.234375, -128.64453125, -120.0546875, -111.46484375, -102.875, -94.28515625, -85.6953125, -77.10546875, -68.515625, -59.92578125, -51.3359375, -42.74609375, -34.15625, -25.56640625, -16.9765625, -8.38671875, 0.203125, 8.79296875, 17.3828125, 25.97265625, 34.5625, 43.15234375, 51.7421875, 60.33203125, 68.921875, 77.51171875, 86.1015625, 94.69140625, 103.28125, 111.87109375, 120.4609375, 129.05078125, 137.640625, 146.23046875, 154.8203125, 163.41015625, 172.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [6.0, 2.0, 4.0, 4.0, 18.0, 13.0, 24.0, 34.0, 23.0, 39.0, 57.0, 66.0, 85.0, 167.0, 203.0, 316.0, 452.0, 650.0, 1068.0, 1512.0, 2317.0, 3332.0, 5364.0, 8702.0, 14519.0, 25674.0, 48271.0, 101153.0, 245034.0, 753132.0, 2997798.0, 1405683.0, 382272.0, 145525.0, 65772.0, 33575.0, 18572.0, 10861.0, 6603.0, 4131.0, 2697.0, 1813.0, 1223.0, 797.0, 569.0, 377.0, 289.0, 168.0, 143.0, 108.0, 75.0, 50.0, 34.0, 20.0, 19.0, 15.0, 10.0, 1.0, 2.0, 4.0, 5.0, 0.0, 3.0, 1.0], "bins": [-46.03125, -44.53271484375, -43.0341796875, -41.53564453125, -40.037109375, -38.53857421875, -37.0400390625, -35.54150390625, -34.04296875, -32.54443359375, -31.0458984375, -29.54736328125, -28.048828125, -26.55029296875, -25.0517578125, -23.55322265625, -22.0546875, -20.55615234375, -19.0576171875, -17.55908203125, -16.060546875, -14.56201171875, -13.0634765625, -11.56494140625, -10.06640625, -8.56787109375, -7.0693359375, -5.57080078125, -4.072265625, -2.57373046875, -1.0751953125, 0.42333984375, 1.921875, 3.42041015625, 4.9189453125, 6.41748046875, 7.916015625, 9.41455078125, 10.9130859375, 12.41162109375, 13.91015625, 15.40869140625, 16.9072265625, 18.40576171875, 19.904296875, 21.40283203125, 22.9013671875, 24.39990234375, 25.8984375, 27.39697265625, 28.8955078125, 30.39404296875, 31.892578125, 33.39111328125, 34.8896484375, 36.38818359375, 37.88671875, 39.38525390625, 40.8837890625, 42.38232421875, 43.880859375, 45.37939453125, 46.8779296875, 48.37646484375, 49.875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 3.0, 2.0, 5.0, 4.0, 12.0, 14.0, 8.0, 15.0, 20.0, 24.0, 27.0, 45.0, 50.0, 72.0, 70.0, 110.0, 169.0, 223.0, 307.0, 239.0, 149.0, 74.0, 63.0, 63.0, 46.0, 32.0, 30.0, 24.0, 21.0, 13.0, 19.0, 18.0, 7.0, 14.0, 4.0, 3.0, 8.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-48.8125, -47.37158203125, -45.9306640625, -44.48974609375, -43.048828125, -41.60791015625, -40.1669921875, -38.72607421875, -37.28515625, -35.84423828125, -34.4033203125, -32.96240234375, -31.521484375, -30.08056640625, -28.6396484375, -27.19873046875, -25.7578125, -24.31689453125, -22.8759765625, -21.43505859375, -19.994140625, -18.55322265625, -17.1123046875, -15.67138671875, -14.23046875, -12.78955078125, -11.3486328125, -9.90771484375, -8.466796875, -7.02587890625, -5.5849609375, -4.14404296875, -2.703125, -1.26220703125, 0.1787109375, 1.61962890625, 3.060546875, 4.50146484375, 5.9423828125, 7.38330078125, 8.82421875, 10.26513671875, 11.7060546875, 13.14697265625, 14.587890625, 16.02880859375, 17.4697265625, 18.91064453125, 20.3515625, 21.79248046875, 23.2333984375, 24.67431640625, 26.115234375, 27.55615234375, 28.9970703125, 30.43798828125, 31.87890625, 33.31982421875, 34.7607421875, 36.20166015625, 37.642578125, 39.08349609375, 40.5244140625, 41.96533203125, 43.40625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 9.0, 16.0, 35.0, 35.0, 36.0, 64.0, 98.0, 153.0, 210.0, 311.0, 457.0, 616.0, 827.0, 1268.0, 1805.0, 2469.0, 3679.0, 5467.0, 8813.0, 14128.0, 22446.0, 37873.0, 66999.0, 122756.0, 243975.0, 517882.0, 1410112.0, 2377736.0, 745239.0, 331127.0, 164722.0, 85842.0, 48125.0, 28038.0, 16716.0, 10368.0, 6678.0, 4409.0, 3020.0, 1987.0, 1435.0, 987.0, 732.0, 523.0, 354.0, 250.0, 186.0, 132.0, 84.0, 57.0, 42.0, 32.0, 24.0, 11.0, 14.0, 12.0, 6.0, 6.0], "bins": [-25.34375, -24.5810546875, -23.818359375, -23.0556640625, -22.29296875, -21.5302734375, -20.767578125, -20.0048828125, -19.2421875, -18.4794921875, -17.716796875, -16.9541015625, -16.19140625, -15.4287109375, -14.666015625, -13.9033203125, -13.140625, -12.3779296875, -11.615234375, -10.8525390625, -10.08984375, -9.3271484375, -8.564453125, -7.8017578125, -7.0390625, -6.2763671875, -5.513671875, -4.7509765625, -3.98828125, -3.2255859375, -2.462890625, -1.7001953125, -0.9375, -0.1748046875, 0.587890625, 1.3505859375, 2.11328125, 2.8759765625, 3.638671875, 4.4013671875, 5.1640625, 5.9267578125, 6.689453125, 7.4521484375, 8.21484375, 8.9775390625, 9.740234375, 10.5029296875, 11.265625, 12.0283203125, 12.791015625, 13.5537109375, 14.31640625, 15.0791015625, 15.841796875, 16.6044921875, 17.3671875, 18.1298828125, 18.892578125, 19.6552734375, 20.41796875, 21.1806640625, 21.943359375, 22.7060546875, 23.46875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 9.0, 8.0, 10.0, 7.0, 9.0, 11.0, 14.0, 15.0, 24.0, 28.0, 27.0, 34.0, 55.0, 74.0, 109.0, 187.0, 395.0, 446.0, 146.0, 75.0, 62.0, 54.0, 44.0, 39.0, 25.0, 20.0, 20.0, 15.0, 9.0, 10.0, 7.0, 5.0, 5.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.5, -90.6103515625, -87.720703125, -84.8310546875, -81.94140625, -79.0517578125, -76.162109375, -73.2724609375, -70.3828125, -67.4931640625, -64.603515625, -61.7138671875, -58.82421875, -55.9345703125, -53.044921875, -50.1552734375, -47.265625, -44.3759765625, -41.486328125, -38.5966796875, -35.70703125, -32.8173828125, -29.927734375, -27.0380859375, -24.1484375, -21.2587890625, -18.369140625, -15.4794921875, -12.58984375, -9.7001953125, -6.810546875, -3.9208984375, -1.03125, 1.8583984375, 4.748046875, 7.6376953125, 10.52734375, 13.4169921875, 16.306640625, 19.1962890625, 22.0859375, 24.9755859375, 27.865234375, 30.7548828125, 33.64453125, 36.5341796875, 39.423828125, 42.3134765625, 45.203125, 48.0927734375, 50.982421875, 53.8720703125, 56.76171875, 59.6513671875, 62.541015625, 65.4306640625, 68.3203125, 71.2099609375, 74.099609375, 76.9892578125, 79.87890625, 82.7685546875, 85.658203125, 88.5478515625, 91.4375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 4.0, 5.0, 5.0, 6.0, 5.0, 12.0, 10.0, 15.0, 20.0, 28.0, 17.0, 28.0, 64.0, 64.0, 84.0, 114.0, 182.0, 258.0, 497.0, 1006.0, 2191.0, 4820.0, 13365.0, 48183.0, 283104.0, 5806576.0, 94266.0, 22691.0, 7617.0, 3013.0, 1326.0, 659.0, 403.0, 244.0, 161.0, 84.0, 55.0, 60.0, 46.0, 46.0, 27.0, 10.0, 10.0, 13.0, 12.0, 6.0, 1.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 6.0, 3.0], "bins": [-168.75, -163.513671875, -158.27734375, -153.041015625, -147.8046875, -142.568359375, -137.33203125, -132.095703125, -126.859375, -121.623046875, -116.38671875, -111.150390625, -105.9140625, -100.677734375, -95.44140625, -90.205078125, -84.96875, -79.732421875, -74.49609375, -69.259765625, -64.0234375, -58.787109375, -53.55078125, -48.314453125, -43.078125, -37.841796875, -32.60546875, -27.369140625, -22.1328125, -16.896484375, -11.66015625, -6.423828125, -1.1875, 4.048828125, 9.28515625, 14.521484375, 19.7578125, 24.994140625, 30.23046875, 35.466796875, 40.703125, 45.939453125, 51.17578125, 56.412109375, 61.6484375, 66.884765625, 72.12109375, 77.357421875, 82.59375, 87.830078125, 93.06640625, 98.302734375, 103.5390625, 108.775390625, 114.01171875, 119.248046875, 124.484375, 129.720703125, 134.95703125, 140.193359375, 145.4296875, 150.666015625, 155.90234375, 161.138671875, 166.375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 2.0, 7.0, 7.0, 18.0, 23.0, 22.0, 35.0, 25.0, 35.0, 37.0, 54.0, 64.0, 80.0, 304.0, 792.0, 118.0, 76.0, 52.0, 49.0, 31.0, 33.0, 17.0, 19.0, 17.0, 17.0, 17.0, 14.0, 14.0, 4.0, 3.0, 5.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-193.0, -186.654296875, -180.30859375, -173.962890625, -167.6171875, -161.271484375, -154.92578125, -148.580078125, -142.234375, -135.888671875, -129.54296875, -123.197265625, -116.8515625, -110.505859375, -104.16015625, -97.814453125, -91.46875, -85.123046875, -78.77734375, -72.431640625, -66.0859375, -59.740234375, -53.39453125, -47.048828125, -40.703125, -34.357421875, -28.01171875, -21.666015625, -15.3203125, -8.974609375, -2.62890625, 3.716796875, 10.0625, 16.408203125, 22.75390625, 29.099609375, 35.4453125, 41.791015625, 48.13671875, 54.482421875, 60.828125, 67.173828125, 73.51953125, 79.865234375, 86.2109375, 92.556640625, 98.90234375, 105.248046875, 111.59375, 117.939453125, 124.28515625, 130.630859375, 136.9765625, 143.322265625, 149.66796875, 156.013671875, 162.359375, 168.705078125, 175.05078125, 181.396484375, 187.7421875, 194.087890625, 200.43359375, 206.779296875, 213.125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 12.0, 379.0, 607.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14219.568359375, -13824.8173828125, -13430.06640625, -13035.3154296875, -12640.564453125, -12245.8134765625, -11851.0625, -11456.3125, -11061.560546875, -10666.8095703125, -10272.05859375, -9877.3076171875, -9482.556640625, -9087.8056640625, -8693.0546875, -8298.3046875, -7903.5537109375, -7508.802734375, -7114.0517578125, -6719.30078125, -6324.5498046875, -5929.798828125, -5535.04833984375, -5140.29736328125, -4745.54638671875, -4350.79541015625, -3956.04443359375, -3561.293701171875, -3166.542724609375, -2771.791748046875, -2377.041015625, -1982.2900390625, -1587.5390625, -1192.7880859375, -798.0372314453125, -403.286376953125, -8.535400390625, 386.215576171875, 780.96630859375, 1175.71728515625, 1570.46826171875, 1965.21923828125, 2359.97021484375, 2754.720947265625, 3149.471923828125, 3544.222900390625, 3938.9736328125, 4333.724609375, 4728.4755859375, 5123.2265625, 5517.9775390625, 5912.728515625, 6307.4794921875, 6702.23046875, 7096.98095703125, 7491.73193359375, 7886.48291015625, 8281.2333984375, 8675.984375, 9070.7353515625, 9465.486328125, 9860.2373046875, 10254.98828125, 10649.7392578125, 11044.490234375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 11.0, 25.0, 237.0, 654.0, 41.0, 10.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5052.6259765625, -4851.18408203125, -4649.7421875, -4448.30078125, -4246.85888671875, -4045.4169921875, -3843.975341796875, -3642.53369140625, -3441.091796875, -3239.64990234375, -3038.208251953125, -2836.7666015625, -2635.32470703125, -2433.8828125, -2232.441162109375, -2030.9993896484375, -1829.5576171875, -1628.1158447265625, -1426.674072265625, -1225.2322998046875, -1023.79052734375, -822.3487548828125, -620.906982421875, -419.4652099609375, -218.0234375, -16.5816650390625, 184.860107421875, 386.3018798828125, 587.74365234375, 789.1854248046875, 990.627197265625, 1192.0689697265625, 1393.5107421875, 1594.9525146484375, 1796.394287109375, 1997.8360595703125, 2199.27783203125, 2400.7197265625, 2602.161376953125, 2803.60302734375, 3005.044921875, 3206.48681640625, 3407.928466796875, 3609.3701171875, 3810.81201171875, 4012.25390625, 4213.6953125, 4415.13720703125, 4616.5791015625, 4818.02099609375, 5019.462890625, 5220.904296875, 5422.34619140625, 5623.7880859375, 5825.2294921875, 6026.67138671875, 6228.11328125, 6429.55517578125, 6630.9970703125, 6832.4384765625, 7033.88037109375, 7235.322265625, 7436.763671875, 7638.20556640625, 7839.6474609375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 3.0, 10.0, 5.0, 19.0, 25.0, 24.0, 46.0, 54.0, 114.0, 177.0, 246.0, 503.0, 962.0, 2061.0, 5322.0, 19313.0, 286503.0, 3837219.0, 29435.0, 7067.0, 2549.0, 1153.0, 520.0, 319.0, 201.0, 97.0, 70.0, 75.0, 44.0, 32.0, 21.0, 18.0, 20.0, 18.0, 6.0, 7.0, 8.0, 7.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.375, -15.723388671875, -15.07177734375, -14.420166015625, -13.7685546875, -13.116943359375, -12.46533203125, -11.813720703125, -11.162109375, -10.510498046875, -9.85888671875, -9.207275390625, -8.5556640625, -7.904052734375, -7.25244140625, -6.600830078125, -5.94921875, -5.297607421875, -4.64599609375, -3.994384765625, -3.3427734375, -2.691162109375, -2.03955078125, -1.387939453125, -0.736328125, -0.084716796875, 0.56689453125, 1.218505859375, 1.8701171875, 2.521728515625, 3.17333984375, 3.824951171875, 4.4765625, 5.128173828125, 5.77978515625, 6.431396484375, 7.0830078125, 7.734619140625, 8.38623046875, 9.037841796875, 9.689453125, 10.341064453125, 10.99267578125, 11.644287109375, 12.2958984375, 12.947509765625, 13.59912109375, 14.250732421875, 14.90234375, 15.553955078125, 16.20556640625, 16.857177734375, 17.5087890625, 18.160400390625, 18.81201171875, 19.463623046875, 20.115234375, 20.766845703125, 21.41845703125, 22.070068359375, 22.7216796875, 23.373291015625, 24.02490234375, 24.676513671875, 25.328125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 12.0, 9.0, 14.0, 21.0, 28.0, 68.0, 589.0, 135.0, 27.0, 16.0, 13.0, 11.0, 10.0, 7.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1171875, -3.9619140625, -3.806640625, -3.6513671875, -3.49609375, -3.3408203125, -3.185546875, -3.0302734375, -2.875, -2.7197265625, -2.564453125, -2.4091796875, -2.25390625, -2.0986328125, -1.943359375, -1.7880859375, -1.6328125, -1.4775390625, -1.322265625, -1.1669921875, -1.01171875, -0.8564453125, -0.701171875, -0.5458984375, -0.390625, -0.2353515625, -0.080078125, 0.0751953125, 0.23046875, 0.3857421875, 0.541015625, 0.6962890625, 0.8515625, 1.0068359375, 1.162109375, 1.3173828125, 1.47265625, 1.6279296875, 1.783203125, 1.9384765625, 2.09375, 2.2490234375, 2.404296875, 2.5595703125, 2.71484375, 2.8701171875, 3.025390625, 3.1806640625, 3.3359375, 3.4912109375, 3.646484375, 3.8017578125, 3.95703125, 4.1123046875, 4.267578125, 4.4228515625, 4.578125, 4.7333984375, 4.888671875, 5.0439453125, 5.19921875, 5.3544921875, 5.509765625, 5.6650390625, 5.8203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 15.0, 14.0, 14.0, 39.0, 69.0, 118.0, 261.0, 609.0, 1812.0, 7010.0, 40036.0, 810046.0, 3260219.0, 61721.0, 8998.0, 2087.0, 638.0, 271.0, 117.0, 66.0, 42.0, 22.0, 19.0, 14.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.1875, -23.535888671875, -22.88427734375, -22.232666015625, -21.5810546875, -20.929443359375, -20.27783203125, -19.626220703125, -18.974609375, -18.322998046875, -17.67138671875, -17.019775390625, -16.3681640625, -15.716552734375, -15.06494140625, -14.413330078125, -13.76171875, -13.110107421875, -12.45849609375, -11.806884765625, -11.1552734375, -10.503662109375, -9.85205078125, -9.200439453125, -8.548828125, -7.897216796875, -7.24560546875, -6.593994140625, -5.9423828125, -5.290771484375, -4.63916015625, -3.987548828125, -3.3359375, -2.684326171875, -2.03271484375, -1.381103515625, -0.7294921875, -0.077880859375, 0.57373046875, 1.225341796875, 1.876953125, 2.528564453125, 3.18017578125, 3.831787109375, 4.4833984375, 5.135009765625, 5.78662109375, 6.438232421875, 7.08984375, 7.741455078125, 8.39306640625, 9.044677734375, 9.6962890625, 10.347900390625, 10.99951171875, 11.651123046875, 12.302734375, 12.954345703125, 13.60595703125, 14.257568359375, 14.9091796875, 15.560791015625, 16.21240234375, 16.864013671875, 17.515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 6.0, 6.0, 4.0, 9.0, 21.0, 18.0, 15.0, 32.0, 36.0, 54.0, 72.0, 108.0, 154.0, 324.0, 822.0, 1428.0, 394.0, 218.0, 119.0, 68.0, 49.0, 26.0, 29.0, 14.0, 19.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.662109375, -3.522491455078125, -3.38287353515625, -3.243255615234375, -3.1036376953125, -2.964019775390625, -2.82440185546875, -2.684783935546875, -2.545166015625, -2.405548095703125, -2.26593017578125, -2.126312255859375, -1.9866943359375, -1.847076416015625, -1.70745849609375, -1.567840576171875, -1.42822265625, -1.288604736328125, -1.14898681640625, -1.009368896484375, -0.8697509765625, -0.730133056640625, -0.59051513671875, -0.450897216796875, -0.311279296875, -0.171661376953125, -0.03204345703125, 0.107574462890625, 0.2471923828125, 0.386810302734375, 0.52642822265625, 0.666046142578125, 0.8056640625, 0.945281982421875, 1.08489990234375, 1.224517822265625, 1.3641357421875, 1.503753662109375, 1.64337158203125, 1.782989501953125, 1.922607421875, 2.062225341796875, 2.20184326171875, 2.341461181640625, 2.4810791015625, 2.620697021484375, 2.76031494140625, 2.899932861328125, 3.03955078125, 3.179168701171875, 3.31878662109375, 3.458404541015625, 3.5980224609375, 3.737640380859375, 3.87725830078125, 4.016876220703125, 4.156494140625, 4.296112060546875, 4.43572998046875, 4.575347900390625, 4.7149658203125, 4.854583740234375, 4.99420166015625, 5.133819580078125, 5.2734375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 17.0, 78.0, 470.0, 374.0, 43.0, 11.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-87.3570556640625, -83.54649353027344, -79.73592376708984, -75.92535400390625, -72.11479187011719, -68.30422973632812, -64.49365997314453, -60.6830940246582, -56.872528076171875, -53.06196212768555, -49.25139617919922, -45.44083023071289, -41.63026428222656, -37.819698333740234, -34.009132385253906, -30.198566436767578, -26.38800048828125, -22.577434539794922, -18.766868591308594, -14.956302642822266, -11.145736694335938, -7.335170745849609, -3.5246047973632812, 0.2859611511230469, 4.096527099609375, 7.907093048095703, 11.717658996582031, 15.52822494506836, 19.338790893554688, 23.149356842041016, 26.959922790527344, 30.770488739013672, 34.5810546875, 38.39162063598633, 42.202186584472656, 46.012752532958984, 49.82331848144531, 53.63388442993164, 57.44445037841797, 61.2550163269043, 65.06558227539062, 68.87614440917969, 72.68671417236328, 76.49728393554688, 80.30784606933594, 84.118408203125, 87.9289779663086, 91.73954772949219, 95.55010986328125, 99.36067199707031, 103.1712417602539, 106.9818115234375, 110.79237365722656, 114.60293579101562, 118.41350555419922, 122.22407531738281, 126.03463745117188, 129.84519958496094, 133.65576171875, 137.46633911132812, 141.2769012451172, 145.08746337890625, 148.89804077148438, 152.70860290527344, 156.5191650390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 18.0, 22.0, 28.0, 53.0, 54.0, 76.0, 87.0, 119.0, 91.0, 122.0, 89.0, 67.0, 59.0, 31.0, 32.0, 21.0, 9.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.208810806274414, -24.011411666870117, -22.81401252746582, -21.616613388061523, -20.419214248657227, -19.22181510925293, -18.0244140625, -16.827014923095703, -15.629616737365723, -14.432217597961426, -13.234818458557129, -12.037418365478516, -10.840019226074219, -9.642620086669922, -8.445220947265625, -7.247821807861328, -6.050422668457031, -4.853023529052734, -3.6556241512298584, -2.4582247734069824, -1.2608256340026855, -0.06342649459838867, 1.1339731216430664, 2.3313722610473633, 3.52877140045166, 4.726170539855957, 5.923569679260254, 7.120969295501709, 8.318368911743164, 9.515768051147461, 10.713167190551758, 11.910566329956055, 13.107963562011719, 14.305362701416016, 15.502761840820312, 16.70016098022461, 17.897560119628906, 19.094959259033203, 20.2923583984375, 21.489757537841797, 22.687156677246094, 23.88455581665039, 25.081954956054688, 26.279354095458984, 27.47675323486328, 28.674152374267578, 29.871551513671875, 31.068950653076172, 32.26634979248047, 33.463748931884766, 34.66114807128906, 35.85854721069336, 37.055946350097656, 38.25334548950195, 39.45074462890625, 40.64814376831055, 41.84554672241211, 43.042945861816406, 44.2403450012207, 45.437744140625, 46.6351432800293, 47.832542419433594, 49.02994155883789, 50.22734069824219, 51.424739837646484]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 5.0, 12.0, 13.0, 18.0, 24.0, 25.0, 46.0, 61.0, 66.0, 105.0, 140.0, 200.0, 320.0, 500.0, 860.0, 1506.0, 2778.0, 6002.0, 15193.0, 51921.0, 857246.0, 77668.0, 18888.0, 7224.0, 3353.0, 1674.0, 957.0, 543.0, 357.0, 257.0, 166.0, 131.0, 77.0, 51.0, 46.0, 23.0, 30.0, 15.0, 12.0, 14.0, 3.0, 12.0, 3.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.5, -17.9326171875, -17.365234375, -16.7978515625, -16.23046875, -15.6630859375, -15.095703125, -14.5283203125, -13.9609375, -13.3935546875, -12.826171875, -12.2587890625, -11.69140625, -11.1240234375, -10.556640625, -9.9892578125, -9.421875, -8.8544921875, -8.287109375, -7.7197265625, -7.15234375, -6.5849609375, -6.017578125, -5.4501953125, -4.8828125, -4.3154296875, -3.748046875, -3.1806640625, -2.61328125, -2.0458984375, -1.478515625, -0.9111328125, -0.34375, 0.2236328125, 0.791015625, 1.3583984375, 1.92578125, 2.4931640625, 3.060546875, 3.6279296875, 4.1953125, 4.7626953125, 5.330078125, 5.8974609375, 6.46484375, 7.0322265625, 7.599609375, 8.1669921875, 8.734375, 9.3017578125, 9.869140625, 10.4365234375, 11.00390625, 11.5712890625, 12.138671875, 12.7060546875, 13.2734375, 13.8408203125, 14.408203125, 14.9755859375, 15.54296875, 16.1103515625, 16.677734375, 17.2451171875, 17.8125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 8.0, 8.0, 12.0, 11.0, 19.0, 23.0, 22.0, 105.0, 506.0, 178.0, 27.0, 15.0, 15.0, 13.0, 7.0, 9.0, 2.0, 1.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.9542236328125, -3.799072265625, -3.6439208984375, -3.48876953125, -3.3336181640625, -3.178466796875, -3.0233154296875, -2.8681640625, -2.7130126953125, -2.557861328125, -2.4027099609375, -2.24755859375, -2.0924072265625, -1.937255859375, -1.7821044921875, -1.626953125, -1.4718017578125, -1.316650390625, -1.1614990234375, -1.00634765625, -0.8511962890625, -0.696044921875, -0.5408935546875, -0.3857421875, -0.2305908203125, -0.075439453125, 0.0797119140625, 0.23486328125, 0.3900146484375, 0.545166015625, 0.7003173828125, 0.85546875, 1.0106201171875, 1.165771484375, 1.3209228515625, 1.47607421875, 1.6312255859375, 1.786376953125, 1.9415283203125, 2.0966796875, 2.2518310546875, 2.406982421875, 2.5621337890625, 2.71728515625, 2.8724365234375, 3.027587890625, 3.1827392578125, 3.337890625, 3.4930419921875, 3.648193359375, 3.8033447265625, 3.95849609375, 4.1136474609375, 4.268798828125, 4.4239501953125, 4.5791015625, 4.7342529296875, 4.889404296875, 5.0445556640625, 5.19970703125, 5.3548583984375, 5.510009765625, 5.6651611328125, 5.8203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 13.0, 18.0, 25.0, 26.0, 56.0, 90.0, 167.0, 347.0, 770.0, 2645.0, 17719.0, 225242.0, 741151.0, 51730.0, 6238.0, 1345.0, 452.0, 203.0, 106.0, 73.0, 41.0, 31.0, 18.0, 8.0, 15.0, 9.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.9375, -21.132080078125, -20.32666015625, -19.521240234375, -18.7158203125, -17.910400390625, -17.10498046875, -16.299560546875, -15.494140625, -14.688720703125, -13.88330078125, -13.077880859375, -12.2724609375, -11.467041015625, -10.66162109375, -9.856201171875, -9.05078125, -8.245361328125, -7.43994140625, -6.634521484375, -5.8291015625, -5.023681640625, -4.21826171875, -3.412841796875, -2.607421875, -1.802001953125, -0.99658203125, -0.191162109375, 0.6142578125, 1.419677734375, 2.22509765625, 3.030517578125, 3.8359375, 4.641357421875, 5.44677734375, 6.252197265625, 7.0576171875, 7.863037109375, 8.66845703125, 9.473876953125, 10.279296875, 11.084716796875, 11.89013671875, 12.695556640625, 13.5009765625, 14.306396484375, 15.11181640625, 15.917236328125, 16.72265625, 17.528076171875, 18.33349609375, 19.138916015625, 19.9443359375, 20.749755859375, 21.55517578125, 22.360595703125, 23.166015625, 23.971435546875, 24.77685546875, 25.582275390625, 26.3876953125, 27.193115234375, 27.99853515625, 28.803955078125, 29.609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 13.0, 12.0, 11.0, 11.0, 9.0, 16.0, 15.0, 19.0, 20.0, 29.0, 28.0, 19.0, 33.0, 32.0, 37.0, 36.0, 50.0, 42.0, 34.0, 51.0, 39.0, 39.0, 36.0, 40.0, 40.0, 38.0, 37.0, 29.0, 33.0, 20.0, 21.0, 14.0, 21.0, 12.0, 11.0, 10.0, 7.0, 5.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0], "bins": [-11.625, -11.309814453125, -10.99462890625, -10.679443359375, -10.3642578125, -10.049072265625, -9.73388671875, -9.418701171875, -9.103515625, -8.788330078125, -8.47314453125, -8.157958984375, -7.8427734375, -7.527587890625, -7.21240234375, -6.897216796875, -6.58203125, -6.266845703125, -5.95166015625, -5.636474609375, -5.3212890625, -5.006103515625, -4.69091796875, -4.375732421875, -4.060546875, -3.745361328125, -3.43017578125, -3.114990234375, -2.7998046875, -2.484619140625, -2.16943359375, -1.854248046875, -1.5390625, -1.223876953125, -0.90869140625, -0.593505859375, -0.2783203125, 0.036865234375, 0.35205078125, 0.667236328125, 0.982421875, 1.297607421875, 1.61279296875, 1.927978515625, 2.2431640625, 2.558349609375, 2.87353515625, 3.188720703125, 3.50390625, 3.819091796875, 4.13427734375, 4.449462890625, 4.7646484375, 5.079833984375, 5.39501953125, 5.710205078125, 6.025390625, 6.340576171875, 6.65576171875, 6.970947265625, 7.2861328125, 7.601318359375, 7.91650390625, 8.231689453125, 8.546875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 10.0, 10.0, 11.0, 17.0, 25.0, 44.0, 72.0, 139.0, 228.0, 409.0, 904.0, 1962.0, 5113.0, 16993.0, 94060.0, 735304.0, 158724.0, 23236.0, 6661.0, 2449.0, 1034.0, 490.0, 245.0, 143.0, 100.0, 51.0, 35.0, 27.0, 12.0, 16.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2421875, -11.7447509765625, -11.247314453125, -10.7498779296875, -10.25244140625, -9.7550048828125, -9.257568359375, -8.7601318359375, -8.2626953125, -7.7652587890625, -7.267822265625, -6.7703857421875, -6.27294921875, -5.7755126953125, -5.278076171875, -4.7806396484375, -4.283203125, -3.7857666015625, -3.288330078125, -2.7908935546875, -2.29345703125, -1.7960205078125, -1.298583984375, -0.8011474609375, -0.3037109375, 0.1937255859375, 0.691162109375, 1.1885986328125, 1.68603515625, 2.1834716796875, 2.680908203125, 3.1783447265625, 3.67578125, 4.1732177734375, 4.670654296875, 5.1680908203125, 5.66552734375, 6.1629638671875, 6.660400390625, 7.1578369140625, 7.6552734375, 8.1527099609375, 8.650146484375, 9.1475830078125, 9.64501953125, 10.1424560546875, 10.639892578125, 11.1373291015625, 11.634765625, 12.1322021484375, 12.629638671875, 13.1270751953125, 13.62451171875, 14.1219482421875, 14.619384765625, 15.1168212890625, 15.6142578125, 16.1116943359375, 16.609130859375, 17.1065673828125, 17.60400390625, 18.1014404296875, 18.598876953125, 19.0963134765625, 19.59375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 8.0, 12.0, 11.0, 14.0, 18.0, 16.0, 27.0, 27.0, 36.0, 62.0, 69.0, 95.0, 111.0, 109.0, 87.0, 75.0, 58.0, 40.0, 35.0, 18.0, 9.0, 17.0, 7.0, 10.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004410743713378906, -0.0004271268844604492, -0.0004131793975830078, -0.0003992319107055664, -0.000385284423828125, -0.0003713369369506836, -0.0003573894500732422, -0.0003434419631958008, -0.0003294944763183594, -0.00031554698944091797, -0.00030159950256347656, -0.00028765201568603516, -0.00027370452880859375, -0.00025975704193115234, -0.00024580955505371094, -0.00023186206817626953, -0.00021791458129882812, -0.00020396709442138672, -0.0001900196075439453, -0.0001760721206665039, -0.0001621246337890625, -0.0001481771469116211, -0.0001342296600341797, -0.00012028217315673828, -0.00010633468627929688, -9.238719940185547e-05, -7.843971252441406e-05, -6.449222564697266e-05, -5.054473876953125e-05, -3.6597251892089844e-05, -2.2649765014648438e-05, -8.702278137207031e-06, 5.245208740234375e-06, 1.919269561767578e-05, 3.314018249511719e-05, 4.7087669372558594e-05, 6.103515625e-05, 7.49826431274414e-05, 8.893013000488281e-05, 0.00010287761688232422, 0.00011682510375976562, 0.00013077259063720703, 0.00014472007751464844, 0.00015866756439208984, 0.00017261505126953125, 0.00018656253814697266, 0.00020051002502441406, 0.00021445751190185547, 0.00022840499877929688, 0.00024235248565673828, 0.0002562999725341797, 0.0002702474594116211, 0.0002841949462890625, 0.0002981424331665039, 0.0003120899200439453, 0.0003260374069213867, 0.0003399848937988281, 0.00035393238067626953, 0.00036787986755371094, 0.00038182735443115234, 0.00039577484130859375, 0.00040972232818603516, 0.00042366981506347656, 0.00043761730194091797, 0.0004515647888183594]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 8.0, 10.0, 16.0, 13.0, 12.0, 11.0, 29.0, 46.0, 65.0, 104.0, 120.0, 253.0, 355.0, 660.0, 1158.0, 2191.0, 4658.0, 10677.0, 29741.0, 102465.0, 411176.0, 353044.0, 87095.0, 25961.0, 9757.0, 4248.0, 2097.0, 999.0, 624.0, 318.0, 221.0, 119.0, 114.0, 45.0, 40.0, 21.0, 23.0, 21.0, 8.0, 12.0, 7.0, 10.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.0390625, -8.7646484375, -8.490234375, -8.2158203125, -7.94140625, -7.6669921875, -7.392578125, -7.1181640625, -6.84375, -6.5693359375, -6.294921875, -6.0205078125, -5.74609375, -5.4716796875, -5.197265625, -4.9228515625, -4.6484375, -4.3740234375, -4.099609375, -3.8251953125, -3.55078125, -3.2763671875, -3.001953125, -2.7275390625, -2.453125, -2.1787109375, -1.904296875, -1.6298828125, -1.35546875, -1.0810546875, -0.806640625, -0.5322265625, -0.2578125, 0.0166015625, 0.291015625, 0.5654296875, 0.83984375, 1.1142578125, 1.388671875, 1.6630859375, 1.9375, 2.2119140625, 2.486328125, 2.7607421875, 3.03515625, 3.3095703125, 3.583984375, 3.8583984375, 4.1328125, 4.4072265625, 4.681640625, 4.9560546875, 5.23046875, 5.5048828125, 5.779296875, 6.0537109375, 6.328125, 6.6025390625, 6.876953125, 7.1513671875, 7.42578125, 7.7001953125, 7.974609375, 8.2490234375, 8.5234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 9.0, 17.0, 19.0, 22.0, 29.0, 39.0, 26.0, 51.0, 38.0, 47.0, 48.0, 63.0, 66.0, 83.0, 60.0, 66.0, 48.0, 50.0, 33.0, 36.0, 25.0, 22.0, 13.0, 12.0, 12.0, 12.0, 6.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.8101806640625, -7.557861328125, -7.3055419921875, -7.05322265625, -6.8009033203125, -6.548583984375, -6.2962646484375, -6.0439453125, -5.7916259765625, -5.539306640625, -5.2869873046875, -5.03466796875, -4.7823486328125, -4.530029296875, -4.2777099609375, -4.025390625, -3.7730712890625, -3.520751953125, -3.2684326171875, -3.01611328125, -2.7637939453125, -2.511474609375, -2.2591552734375, -2.0068359375, -1.7545166015625, -1.502197265625, -1.2498779296875, -0.99755859375, -0.7452392578125, -0.492919921875, -0.2406005859375, 0.01171875, 0.2640380859375, 0.516357421875, 0.7686767578125, 1.02099609375, 1.2733154296875, 1.525634765625, 1.7779541015625, 2.0302734375, 2.2825927734375, 2.534912109375, 2.7872314453125, 3.03955078125, 3.2918701171875, 3.544189453125, 3.7965087890625, 4.048828125, 4.3011474609375, 4.553466796875, 4.8057861328125, 5.05810546875, 5.3104248046875, 5.562744140625, 5.8150634765625, 6.0673828125, 6.3197021484375, 6.572021484375, 6.8243408203125, 7.07666015625, 7.3289794921875, 7.581298828125, 7.8336181640625, 8.0859375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 11.0, 22.0, 256.0, 534.0, 137.0, 29.0, 7.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-425.1136169433594, -411.51708984375, -397.9205627441406, -384.32403564453125, -370.72747802734375, -357.1309509277344, -343.534423828125, -329.9378967285156, -316.34136962890625, -302.7448425292969, -289.1483154296875, -275.5517578125, -261.9552307128906, -248.35870361328125, -234.76217651367188, -221.1656494140625, -207.569091796875, -193.97256469726562, -180.3760223388672, -166.7794952392578, -153.18295288085938, -139.58642578125, -125.98989868164062, -112.39336395263672, -98.79682922363281, -85.2002944946289, -71.603759765625, -58.007232666015625, -44.41069793701172, -30.814163208007812, -17.217636108398438, -3.6211013793945312, 9.97540283203125, 23.571935653686523, 37.1684684753418, 50.76499938964844, 64.36153411865234, 77.95806884765625, 91.55459594726562, 105.15113067626953, 118.74766540527344, 132.3441925048828, 145.94073486328125, 159.53726196289062, 173.1337890625, 186.73033142089844, 200.3268585205078, 213.92340087890625, 227.51992797851562, 241.116455078125, 254.71299743652344, 268.30950927734375, 281.90606689453125, 295.5025939941406, 309.09912109375, 322.6956481933594, 336.29217529296875, 349.8887023925781, 363.4852294921875, 377.081787109375, 390.6783142089844, 404.27484130859375, 417.8713684082031, 431.4678955078125, 445.064453125]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 5.0, 12.0, 11.0, 11.0, 35.0, 56.0, 82.0, 134.0, 157.0, 140.0, 103.0, 100.0, 38.0, 22.0, 15.0, 9.0, 11.0, 2.0, 6.0, 6.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.03836059570312, -182.28524780273438, -175.5321502685547, -168.77903747558594, -162.0259246826172, -155.2728271484375, -148.51971435546875, -141.7666015625, -135.01348876953125, -128.2603759765625, -121.50727081298828, -114.75416564941406, -108.00105285644531, -101.2479476928711, -94.49484252929688, -87.74172973632812, -80.98863220214844, -74.23552703857422, -67.48241424560547, -60.72930908203125, -53.976200103759766, -47.22309112548828, -40.46998596191406, -33.71687698364258, -26.963768005371094, -20.21065902709961, -13.457551956176758, -6.704444885253906, 0.048664093017578125, 6.8017730712890625, 13.554878234863281, 20.307987213134766, 27.06109619140625, 33.814205169677734, 40.56731414794922, 47.32041931152344, 54.07352828979492, 60.826637268066406, 67.57974243164062, 74.33285522460938, 81.0859603881836, 87.83906555175781, 94.59217834472656, 101.34528350830078, 108.098388671875, 114.85150146484375, 121.60460662841797, 128.3577117919922, 135.11082458496094, 141.8639373779297, 148.61703491210938, 155.37014770507812, 162.12326049804688, 168.87637329101562, 175.6294708251953, 182.38258361816406, 189.13568115234375, 195.8887939453125, 202.6418914794922, 209.39500427246094, 216.1481170654297, 222.90121459960938, 229.65432739257812, 236.40744018554688, 243.16055297851562]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 6.0, 8.0, 29.0, 46.0, 40.0, 120.0, 215.0, 589.0, 2120.0, 14208.0, 4085049.0, 85028.0, 4783.0, 1146.0, 396.0, 215.0, 104.0, 54.0, 39.0, 25.0, 21.0, 11.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.5, -80.380859375, -77.26171875, -74.142578125, -71.0234375, -67.904296875, -64.78515625, -61.666015625, -58.546875, -55.427734375, -52.30859375, -49.189453125, -46.0703125, -42.951171875, -39.83203125, -36.712890625, -33.59375, -30.474609375, -27.35546875, -24.236328125, -21.1171875, -17.998046875, -14.87890625, -11.759765625, -8.640625, -5.521484375, -2.40234375, 0.716796875, 3.8359375, 6.955078125, 10.07421875, 13.193359375, 16.3125, 19.431640625, 22.55078125, 25.669921875, 28.7890625, 31.908203125, 35.02734375, 38.146484375, 41.265625, 44.384765625, 47.50390625, 50.623046875, 53.7421875, 56.861328125, 59.98046875, 63.099609375, 66.21875, 69.337890625, 72.45703125, 75.576171875, 78.6953125, 81.814453125, 84.93359375, 88.052734375, 91.171875, 94.291015625, 97.41015625, 100.529296875, 103.6484375, 106.767578125, 109.88671875, 113.005859375, 116.125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 3.0, 10.0, 14.0, 22.0, 21.0, 32.0, 125.0, 392.0, 250.0, 59.0, 20.0, 11.0, 16.0, 11.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.0718994140625, -3.913330078125, -3.7547607421875, -3.59619140625, -3.4376220703125, -3.279052734375, -3.1204833984375, -2.9619140625, -2.8033447265625, -2.644775390625, -2.4862060546875, -2.32763671875, -2.1690673828125, -2.010498046875, -1.8519287109375, -1.693359375, -1.5347900390625, -1.376220703125, -1.2176513671875, -1.05908203125, -0.9005126953125, -0.741943359375, -0.5833740234375, -0.4248046875, -0.2662353515625, -0.107666015625, 0.0509033203125, 0.20947265625, 0.3680419921875, 0.526611328125, 0.6851806640625, 0.84375, 1.0023193359375, 1.160888671875, 1.3194580078125, 1.47802734375, 1.6365966796875, 1.795166015625, 1.9537353515625, 2.1123046875, 2.2708740234375, 2.429443359375, 2.5880126953125, 2.74658203125, 2.9051513671875, 3.063720703125, 3.2222900390625, 3.380859375, 3.5394287109375, 3.697998046875, 3.8565673828125, 4.01513671875, 4.1737060546875, 4.332275390625, 4.4908447265625, 4.6494140625, 4.8079833984375, 4.966552734375, 5.1251220703125, 5.28369140625, 5.4422607421875, 5.600830078125, 5.7593994140625, 5.91796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 6.0, 12.0, 13.0, 21.0, 32.0, 41.0, 84.0, 108.0, 215.0, 400.0, 690.0, 1310.0, 2748.0, 6523.0, 16592.0, 50903.0, 241917.0, 3462712.0, 315570.0, 61143.0, 19220.0, 7453.0, 3194.0, 1518.0, 799.0, 423.0, 246.0, 120.0, 89.0, 58.0, 43.0, 33.0, 13.0, 8.0, 10.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-25.65625, -24.990966796875, -24.32568359375, -23.660400390625, -22.9951171875, -22.329833984375, -21.66455078125, -20.999267578125, -20.333984375, -19.668701171875, -19.00341796875, -18.338134765625, -17.6728515625, -17.007568359375, -16.34228515625, -15.677001953125, -15.01171875, -14.346435546875, -13.68115234375, -13.015869140625, -12.3505859375, -11.685302734375, -11.02001953125, -10.354736328125, -9.689453125, -9.024169921875, -8.35888671875, -7.693603515625, -7.0283203125, -6.363037109375, -5.69775390625, -5.032470703125, -4.3671875, -3.701904296875, -3.03662109375, -2.371337890625, -1.7060546875, -1.040771484375, -0.37548828125, 0.289794921875, 0.955078125, 1.620361328125, 2.28564453125, 2.950927734375, 3.6162109375, 4.281494140625, 4.94677734375, 5.612060546875, 6.27734375, 6.942626953125, 7.60791015625, 8.273193359375, 8.9384765625, 9.603759765625, 10.26904296875, 10.934326171875, 11.599609375, 12.264892578125, 12.93017578125, 13.595458984375, 14.2607421875, 14.926025390625, 15.59130859375, 16.256591796875, 16.921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 8.0, 12.0, 13.0, 14.0, 27.0, 47.0, 65.0, 79.0, 109.0, 193.0, 383.0, 1973.0, 465.0, 212.0, 135.0, 81.0, 62.0, 41.0, 34.0, 17.0, 13.0, 14.0, 9.0, 11.0, 7.0, 9.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.82421875, -2.72564697265625, -2.6270751953125, -2.52850341796875, -2.429931640625, -2.33135986328125, -2.2327880859375, -2.13421630859375, -2.03564453125, -1.93707275390625, -1.8385009765625, -1.73992919921875, -1.641357421875, -1.54278564453125, -1.4442138671875, -1.34564208984375, -1.2470703125, -1.14849853515625, -1.0499267578125, -0.95135498046875, -0.852783203125, -0.75421142578125, -0.6556396484375, -0.55706787109375, -0.45849609375, -0.35992431640625, -0.2613525390625, -0.16278076171875, -0.064208984375, 0.03436279296875, 0.1329345703125, 0.23150634765625, 0.330078125, 0.42864990234375, 0.5272216796875, 0.62579345703125, 0.724365234375, 0.82293701171875, 0.9215087890625, 1.02008056640625, 1.11865234375, 1.21722412109375, 1.3157958984375, 1.41436767578125, 1.512939453125, 1.61151123046875, 1.7100830078125, 1.80865478515625, 1.9072265625, 2.00579833984375, 2.1043701171875, 2.20294189453125, 2.301513671875, 2.40008544921875, 2.4986572265625, 2.59722900390625, 2.69580078125, 2.79437255859375, 2.8929443359375, 2.99151611328125, 3.090087890625, 3.18865966796875, 3.2872314453125, 3.38580322265625, 3.484375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 6.0, 30.0, 135.0, 324.0, 322.0, 130.0, 36.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.28564453125, -57.49095916748047, -55.69627380371094, -53.901588439941406, -52.106903076171875, -50.312217712402344, -48.51752853393555, -46.722843170166016, -44.928157806396484, -43.13347244262695, -41.33878707885742, -39.54410171508789, -37.749412536621094, -35.95472717285156, -34.16004180908203, -32.3653564453125, -30.57067108154297, -28.775985717773438, -26.981300354003906, -25.186613082885742, -23.39192771911621, -21.59724235534668, -19.802555084228516, -18.007869720458984, -16.213184356689453, -14.418498992919922, -12.623812675476074, -10.829126358032227, -9.034440994262695, -7.239755630493164, -5.445069313049316, -3.6503829956054688, -1.8556938171386719, -0.06100797653198242, 1.733677864074707, 3.5283637046813965, 5.323049545288086, 7.117734909057617, 8.912421226501465, 10.707107543945312, 12.501792907714844, 14.296478271484375, 16.091163635253906, 17.88585090637207, 19.6805362701416, 21.475221633911133, 23.269908905029297, 25.064594268798828, 26.85927963256836, 28.65396499633789, 30.448650360107422, 32.24333572387695, 34.03802490234375, 35.83271026611328, 37.62739562988281, 39.422080993652344, 41.216766357421875, 43.011451721191406, 44.80613708496094, 46.60082244873047, 48.3955078125, 50.19019317626953, 51.98488235473633, 53.77956771850586, 55.57425308227539]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 1.0, 5.0, 6.0, 6.0, 11.0, 20.0, 16.0, 27.0, 23.0, 41.0, 48.0, 56.0, 65.0, 59.0, 80.0, 70.0, 73.0, 58.0, 59.0, 62.0, 47.0, 37.0, 33.0, 25.0, 15.0, 19.0, 8.0, 9.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.208098411560059, -11.720442771911621, -11.232787132263184, -10.745131492614746, -10.257475852966309, -9.769820213317871, -9.282163619995117, -8.79450798034668, -8.306852340698242, -7.819196701049805, -7.331541061401367, -6.84388542175293, -6.356229782104492, -5.868574142456055, -5.380918025970459, -4.8932623863220215, -4.405607223510742, -3.9179515838623047, -3.430295944213867, -2.9426400661468506, -2.454984426498413, -1.9673287868499756, -1.479672908782959, -0.9920172691345215, -0.504361629486084, -0.01670593023300171, 0.47094976902008057, 0.9586055278778076, 1.4462611675262451, 1.9339168071746826, 2.421572685241699, 2.9092283248901367, 3.396883010864258, 3.8845386505126953, 4.372194290161133, 4.85984992980957, 5.347505569458008, 5.835161209106445, 6.322817325592041, 6.8104729652404785, 7.298128604888916, 7.7857842445373535, 8.27344036102295, 8.761096000671387, 9.248751640319824, 9.736407279968262, 10.2240629196167, 10.711718559265137, 11.199374198913574, 11.687029838562012, 12.17468547821045, 12.662341117858887, 13.149996757507324, 13.637652397155762, 14.125308990478516, 14.612964630126953, 15.10062026977539, 15.588275909423828, 16.075931549072266, 16.563587188720703, 17.05124282836914, 17.538898468017578, 18.026554107666016, 18.514209747314453, 19.00186538696289]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 3.0, 3.0, 7.0, 14.0, 10.0, 15.0, 23.0, 41.0, 66.0, 69.0, 186.0, 311.0, 613.0, 1666.0, 6354.0, 134108.0, 888768.0, 12203.0, 2379.0, 849.0, 375.0, 179.0, 106.0, 58.0, 36.0, 28.0, 24.0, 17.0, 11.0, 6.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.25, -65.826171875, -63.40234375, -60.978515625, -58.5546875, -56.130859375, -53.70703125, -51.283203125, -48.859375, -46.435546875, -44.01171875, -41.587890625, -39.1640625, -36.740234375, -34.31640625, -31.892578125, -29.46875, -27.044921875, -24.62109375, -22.197265625, -19.7734375, -17.349609375, -14.92578125, -12.501953125, -10.078125, -7.654296875, -5.23046875, -2.806640625, -0.3828125, 2.041015625, 4.46484375, 6.888671875, 9.3125, 11.736328125, 14.16015625, 16.583984375, 19.0078125, 21.431640625, 23.85546875, 26.279296875, 28.703125, 31.126953125, 33.55078125, 35.974609375, 38.3984375, 40.822265625, 43.24609375, 45.669921875, 48.09375, 50.517578125, 52.94140625, 55.365234375, 57.7890625, 60.212890625, 62.63671875, 65.060546875, 67.484375, 69.908203125, 72.33203125, 74.755859375, 77.1796875, 79.603515625, 82.02734375, 84.451171875, 86.875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 8.0, 16.0, 15.0, 26.0, 38.0, 123.0, 323.0, 264.0, 100.0, 35.0, 16.0, 12.0, 9.0, 6.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.06915283203125, -3.9117431640625, -3.75433349609375, -3.596923828125, -3.43951416015625, -3.2821044921875, -3.12469482421875, -2.96728515625, -2.80987548828125, -2.6524658203125, -2.49505615234375, -2.337646484375, -2.18023681640625, -2.0228271484375, -1.86541748046875, -1.7080078125, -1.55059814453125, -1.3931884765625, -1.23577880859375, -1.078369140625, -0.92095947265625, -0.7635498046875, -0.60614013671875, -0.44873046875, -0.29132080078125, -0.1339111328125, 0.02349853515625, 0.180908203125, 0.33831787109375, 0.4957275390625, 0.65313720703125, 0.810546875, 0.96795654296875, 1.1253662109375, 1.28277587890625, 1.440185546875, 1.59759521484375, 1.7550048828125, 1.91241455078125, 2.06982421875, 2.22723388671875, 2.3846435546875, 2.54205322265625, 2.699462890625, 2.85687255859375, 3.0142822265625, 3.17169189453125, 3.3291015625, 3.48651123046875, 3.6439208984375, 3.80133056640625, 3.958740234375, 4.11614990234375, 4.2735595703125, 4.43096923828125, 4.58837890625, 4.74578857421875, 4.9031982421875, 5.06060791015625, 5.218017578125, 5.37542724609375, 5.5328369140625, 5.69024658203125, 5.84765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 0.0, 5.0, 7.0, 24.0, 85.0, 496.0, 9135.0, 1019078.0, 18816.0, 694.0, 102.0, 29.0, 8.0, 6.0, 6.0, 6.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.875, -79.009765625, -76.14453125, -73.279296875, -70.4140625, -67.548828125, -64.68359375, -61.818359375, -58.953125, -56.087890625, -53.22265625, -50.357421875, -47.4921875, -44.626953125, -41.76171875, -38.896484375, -36.03125, -33.166015625, -30.30078125, -27.435546875, -24.5703125, -21.705078125, -18.83984375, -15.974609375, -13.109375, -10.244140625, -7.37890625, -4.513671875, -1.6484375, 1.216796875, 4.08203125, 6.947265625, 9.8125, 12.677734375, 15.54296875, 18.408203125, 21.2734375, 24.138671875, 27.00390625, 29.869140625, 32.734375, 35.599609375, 38.46484375, 41.330078125, 44.1953125, 47.060546875, 49.92578125, 52.791015625, 55.65625, 58.521484375, 61.38671875, 64.251953125, 67.1171875, 69.982421875, 72.84765625, 75.712890625, 78.578125, 81.443359375, 84.30859375, 87.173828125, 90.0390625, 92.904296875, 95.76953125, 98.634765625, 101.5]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 6.0, 8.0, 12.0, 15.0, 18.0, 14.0, 23.0, 23.0, 31.0, 26.0, 39.0, 41.0, 36.0, 52.0, 72.0, 52.0, 59.0, 60.0, 53.0, 53.0, 44.0, 36.0, 39.0, 35.0, 29.0, 30.0, 28.0, 17.0, 8.0, 13.0, 11.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8125, -8.5572509765625, -8.302001953125, -8.0467529296875, -7.79150390625, -7.5362548828125, -7.281005859375, -7.0257568359375, -6.7705078125, -6.5152587890625, -6.260009765625, -6.0047607421875, -5.74951171875, -5.4942626953125, -5.239013671875, -4.9837646484375, -4.728515625, -4.4732666015625, -4.218017578125, -3.9627685546875, -3.70751953125, -3.4522705078125, -3.197021484375, -2.9417724609375, -2.6865234375, -2.4312744140625, -2.176025390625, -1.9207763671875, -1.66552734375, -1.4102783203125, -1.155029296875, -0.8997802734375, -0.64453125, -0.3892822265625, -0.134033203125, 0.1212158203125, 0.37646484375, 0.6317138671875, 0.886962890625, 1.1422119140625, 1.3974609375, 1.6527099609375, 1.907958984375, 2.1632080078125, 2.41845703125, 2.6737060546875, 2.928955078125, 3.1842041015625, 3.439453125, 3.6947021484375, 3.949951171875, 4.2052001953125, 4.46044921875, 4.7156982421875, 4.970947265625, 5.2261962890625, 5.4814453125, 5.7366943359375, 5.991943359375, 6.2471923828125, 6.50244140625, 6.7576904296875, 7.012939453125, 7.2681884765625, 7.5234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 11.0, 8.0, 10.0, 16.0, 22.0, 34.0, 48.0, 78.0, 148.0, 326.0, 746.0, 2460.0, 10743.0, 95585.0, 819905.0, 103147.0, 11199.0, 2492.0, 860.0, 323.0, 130.0, 107.0, 46.0, 28.0, 22.0, 11.0, 13.0, 7.0, 2.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.296875, -23.4736328125, -22.650390625, -21.8271484375, -21.00390625, -20.1806640625, -19.357421875, -18.5341796875, -17.7109375, -16.8876953125, -16.064453125, -15.2412109375, -14.41796875, -13.5947265625, -12.771484375, -11.9482421875, -11.125, -10.3017578125, -9.478515625, -8.6552734375, -7.83203125, -7.0087890625, -6.185546875, -5.3623046875, -4.5390625, -3.7158203125, -2.892578125, -2.0693359375, -1.24609375, -0.4228515625, 0.400390625, 1.2236328125, 2.046875, 2.8701171875, 3.693359375, 4.5166015625, 5.33984375, 6.1630859375, 6.986328125, 7.8095703125, 8.6328125, 9.4560546875, 10.279296875, 11.1025390625, 11.92578125, 12.7490234375, 13.572265625, 14.3955078125, 15.21875, 16.0419921875, 16.865234375, 17.6884765625, 18.51171875, 19.3349609375, 20.158203125, 20.9814453125, 21.8046875, 22.6279296875, 23.451171875, 24.2744140625, 25.09765625, 25.9208984375, 26.744140625, 27.5673828125, 28.390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 6.0, 9.0, 11.0, 21.0, 37.0, 66.0, 109.0, 162.0, 194.0, 151.0, 92.0, 49.0, 32.0, 25.0, 11.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010471343994140625, -0.001012563705444336, -0.0009779930114746094, -0.0009434223175048828, -0.0009088516235351562, -0.0008742809295654297, -0.0008397102355957031, -0.0008051395416259766, -0.00077056884765625, -0.0007359981536865234, -0.0007014274597167969, -0.0006668567657470703, -0.0006322860717773438, -0.0005977153778076172, -0.0005631446838378906, -0.0005285739898681641, -0.0004940032958984375, -0.00045943260192871094, -0.0004248619079589844, -0.0003902912139892578, -0.00035572052001953125, -0.0003211498260498047, -0.0002865791320800781, -0.00025200843811035156, -0.000217437744140625, -0.00018286705017089844, -0.00014829635620117188, -0.00011372566223144531, -7.915496826171875e-05, -4.458427429199219e-05, -1.0013580322265625e-05, 2.4557113647460938e-05, 5.91278076171875e-05, 9.369850158691406e-05, 0.00012826919555664062, 0.0001628398895263672, 0.00019741058349609375, 0.0002319812774658203, 0.0002665519714355469, 0.00030112266540527344, 0.000335693359375, 0.00037026405334472656, 0.0004048347473144531, 0.0004394054412841797, 0.00047397613525390625, 0.0005085468292236328, 0.0005431175231933594, 0.0005776882171630859, 0.0006122589111328125, 0.0006468296051025391, 0.0006814002990722656, 0.0007159709930419922, 0.0007505416870117188, 0.0007851123809814453, 0.0008196830749511719, 0.0008542537689208984, 0.000888824462890625, 0.0009233951568603516, 0.0009579658508300781, 0.0009925365447998047, 0.0010271072387695312, 0.0010616779327392578, 0.0010962486267089844, 0.001130819320678711, 0.0011653900146484375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 8.0, 5.0, 14.0, 26.0, 43.0, 63.0, 86.0, 198.0, 376.0, 768.0, 1933.0, 5302.0, 17103.0, 78648.0, 546174.0, 330137.0, 49410.0, 11613.0, 3846.0, 1438.0, 648.0, 304.0, 182.0, 94.0, 46.0, 28.0, 11.0, 15.0, 16.0, 3.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.09375, -16.57373046875, -16.0537109375, -15.53369140625, -15.013671875, -14.49365234375, -13.9736328125, -13.45361328125, -12.93359375, -12.41357421875, -11.8935546875, -11.37353515625, -10.853515625, -10.33349609375, -9.8134765625, -9.29345703125, -8.7734375, -8.25341796875, -7.7333984375, -7.21337890625, -6.693359375, -6.17333984375, -5.6533203125, -5.13330078125, -4.61328125, -4.09326171875, -3.5732421875, -3.05322265625, -2.533203125, -2.01318359375, -1.4931640625, -0.97314453125, -0.453125, 0.06689453125, 0.5869140625, 1.10693359375, 1.626953125, 2.14697265625, 2.6669921875, 3.18701171875, 3.70703125, 4.22705078125, 4.7470703125, 5.26708984375, 5.787109375, 6.30712890625, 6.8271484375, 7.34716796875, 7.8671875, 8.38720703125, 8.9072265625, 9.42724609375, 9.947265625, 10.46728515625, 10.9873046875, 11.50732421875, 12.02734375, 12.54736328125, 13.0673828125, 13.58740234375, 14.107421875, 14.62744140625, 15.1474609375, 15.66748046875, 16.1875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 6.0, 9.0, 8.0, 12.0, 9.0, 21.0, 11.0, 20.0, 29.0, 35.0, 54.0, 46.0, 49.0, 74.0, 90.0, 128.0, 60.0, 59.0, 53.0, 44.0, 38.0, 36.0, 20.0, 15.0, 16.0, 6.0, 10.0, 6.0, 5.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.3203125, -8.084228515625, -7.84814453125, -7.612060546875, -7.3759765625, -7.139892578125, -6.90380859375, -6.667724609375, -6.431640625, -6.195556640625, -5.95947265625, -5.723388671875, -5.4873046875, -5.251220703125, -5.01513671875, -4.779052734375, -4.54296875, -4.306884765625, -4.07080078125, -3.834716796875, -3.5986328125, -3.362548828125, -3.12646484375, -2.890380859375, -2.654296875, -2.418212890625, -2.18212890625, -1.946044921875, -1.7099609375, -1.473876953125, -1.23779296875, -1.001708984375, -0.765625, -0.529541015625, -0.29345703125, -0.057373046875, 0.1787109375, 0.414794921875, 0.65087890625, 0.886962890625, 1.123046875, 1.359130859375, 1.59521484375, 1.831298828125, 2.0673828125, 2.303466796875, 2.53955078125, 2.775634765625, 3.01171875, 3.247802734375, 3.48388671875, 3.719970703125, 3.9560546875, 4.192138671875, 4.42822265625, 4.664306640625, 4.900390625, 5.136474609375, 5.37255859375, 5.608642578125, 5.8447265625, 6.080810546875, 6.31689453125, 6.552978515625, 6.7890625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 22.0, 32.0, 92.0, 215.0, 298.0, 191.0, 88.0, 31.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.6951904296875, -123.1673583984375, -117.6395263671875, -112.1116943359375, -106.5838623046875, -101.0560302734375, -95.5281982421875, -90.0003662109375, -84.4725341796875, -78.9447021484375, -73.4168701171875, -67.8890380859375, -62.3612060546875, -56.8333740234375, -51.305538177490234, -45.777706146240234, -40.24987030029297, -34.72203826904297, -29.19420623779297, -23.666372299194336, -18.138540267944336, -12.610708236694336, -7.082874298095703, -1.5550422668457031, 3.972789764404297, 9.500621795654297, 15.028454780578613, 20.55628776550293, 26.08411979675293, 31.61195182800293, 37.13978576660156, 42.66761779785156, 48.19544982910156, 53.72328186035156, 59.25111389160156, 64.77894592285156, 70.30677795410156, 75.83460998535156, 81.36244201660156, 86.89027404785156, 92.41810607910156, 97.94593811035156, 103.47377014160156, 109.00160217285156, 114.52943420410156, 120.05726623535156, 125.58509826660156, 131.11293029785156, 136.64077758789062, 142.16860961914062, 147.69644165039062, 153.22427368164062, 158.75210571289062, 164.27993774414062, 169.80776977539062, 175.33560180664062, 180.86343383789062, 186.39126586914062, 191.91909790039062, 197.44692993164062, 202.97476196289062, 208.50259399414062, 214.03042602539062, 219.55825805664062, 225.08609008789062]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 7.0, 6.0, 9.0, 13.0, 21.0, 28.0, 24.0, 39.0, 50.0, 64.0, 89.0, 80.0, 70.0, 80.0, 72.0, 68.0, 77.0, 48.0, 38.0, 31.0, 29.0, 20.0, 10.0, 10.0, 3.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.92555236816406, -89.06329345703125, -86.20104217529297, -83.33878326416016, -80.47653198242188, -77.61427307128906, -74.75201416015625, -71.88976287841797, -69.02750396728516, -66.16524505615234, -63.30299377441406, -60.44073486328125, -57.5784797668457, -54.716224670410156, -51.85396957397461, -48.99171447753906, -46.129459381103516, -43.26720428466797, -40.40494918823242, -37.542694091796875, -34.68043518066406, -31.818180084228516, -28.95592498779297, -26.09366798400879, -23.231412887573242, -20.369157791137695, -17.506900787353516, -14.644645690917969, -11.782389640808105, -8.920133590698242, -6.057878494262695, -3.1956214904785156, -0.33336639404296875, 2.5288894176483154, 5.3911452293396, 8.253400802612305, 11.115656852722168, 13.977912902832031, 16.840167999267578, 19.702425003051758, 22.564680099487305, 25.42693519592285, 28.28919219970703, 31.151447296142578, 34.013702392578125, 36.87596130371094, 39.73821258544922, 42.60047149658203, 45.46272659301758, 48.324981689453125, 51.18723678588867, 54.04949188232422, 56.91175079345703, 59.77400588989258, 62.636260986328125, 65.49851989746094, 68.36077117919922, 71.22303009033203, 74.08528137207031, 76.94754028320312, 79.8097915649414, 82.67205047607422, 85.5343017578125, 88.39656066894531, 91.25881958007812]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 7.0, 8.0, 11.0, 9.0, 15.0, 23.0, 23.0, 39.0, 46.0, 66.0, 96.0, 176.0, 343.0, 715.0, 1685.0, 6142.0, 151563.0, 4020478.0, 8944.0, 1994.0, 820.0, 393.0, 215.0, 136.0, 88.0, 59.0, 37.0, 39.0, 24.0, 7.0, 19.0, 9.0, 9.0, 5.0, 9.0, 5.0, 4.0, 5.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.125, -108.79296875, -104.4609375, -100.12890625, -95.796875, -91.46484375, -87.1328125, -82.80078125, -78.46875, -74.13671875, -69.8046875, -65.47265625, -61.140625, -56.80859375, -52.4765625, -48.14453125, -43.8125, -39.48046875, -35.1484375, -30.81640625, -26.484375, -22.15234375, -17.8203125, -13.48828125, -9.15625, -4.82421875, -0.4921875, 3.83984375, 8.171875, 12.50390625, 16.8359375, 21.16796875, 25.5, 29.83203125, 34.1640625, 38.49609375, 42.828125, 47.16015625, 51.4921875, 55.82421875, 60.15625, 64.48828125, 68.8203125, 73.15234375, 77.484375, 81.81640625, 86.1484375, 90.48046875, 94.8125, 99.14453125, 103.4765625, 107.80859375, 112.140625, 116.47265625, 120.8046875, 125.13671875, 129.46875, 133.80078125, 138.1328125, 142.46484375, 146.796875, 151.12890625, 155.4609375, 159.79296875, 164.125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 10.0, 19.0, 19.0, 41.0, 98.0, 238.0, 291.0, 160.0, 58.0, 24.0, 13.0, 8.0, 7.0, 7.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34765625, -4.187744140625, -4.02783203125, -3.867919921875, -3.7080078125, -3.548095703125, -3.38818359375, -3.228271484375, -3.068359375, -2.908447265625, -2.74853515625, -2.588623046875, -2.4287109375, -2.268798828125, -2.10888671875, -1.948974609375, -1.7890625, -1.629150390625, -1.46923828125, -1.309326171875, -1.1494140625, -0.989501953125, -0.82958984375, -0.669677734375, -0.509765625, -0.349853515625, -0.18994140625, -0.030029296875, 0.1298828125, 0.289794921875, 0.44970703125, 0.609619140625, 0.76953125, 0.929443359375, 1.08935546875, 1.249267578125, 1.4091796875, 1.569091796875, 1.72900390625, 1.888916015625, 2.048828125, 2.208740234375, 2.36865234375, 2.528564453125, 2.6884765625, 2.848388671875, 3.00830078125, 3.168212890625, 3.328125, 3.488037109375, 3.64794921875, 3.807861328125, 3.9677734375, 4.127685546875, 4.28759765625, 4.447509765625, 4.607421875, 4.767333984375, 4.92724609375, 5.087158203125, 5.2470703125, 5.406982421875, 5.56689453125, 5.726806640625, 5.88671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 8.0, 7.0, 7.0, 9.0, 8.0, 12.0, 18.0, 23.0, 31.0, 40.0, 89.0, 231.0, 1614.0, 74456.0, 4108538.0, 8102.0, 699.0, 162.0, 63.0, 48.0, 33.0, 26.0, 19.0, 11.0, 8.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.125, -136.75, -132.375, -128.0, -123.625, -119.25, -114.875, -110.5, -106.125, -101.75, -97.375, -93.0, -88.625, -84.25, -79.875, -75.5, -71.125, -66.75, -62.375, -58.0, -53.625, -49.25, -44.875, -40.5, -36.125, -31.75, -27.375, -23.0, -18.625, -14.25, -9.875, -5.5, -1.125, 3.25, 7.625, 12.0, 16.375, 20.75, 25.125, 29.5, 33.875, 38.25, 42.625, 47.0, 51.375, 55.75, 60.125, 64.5, 68.875, 73.25, 77.625, 82.0, 86.375, 90.75, 95.125, 99.5, 103.875, 108.25, 112.625, 117.0, 121.375, 125.75, 130.125, 134.5, 138.875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 11.0, 15.0, 29.0, 30.0, 28.0, 44.0, 81.0, 128.0, 262.0, 794.0, 1963.0, 274.0, 136.0, 86.0, 43.0, 28.0, 20.0, 22.0, 12.0, 8.0, 9.0, 6.0, 11.0, 7.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.14453125, -4.0155029296875, -3.886474609375, -3.7574462890625, -3.62841796875, -3.4993896484375, -3.370361328125, -3.2413330078125, -3.1123046875, -2.9832763671875, -2.854248046875, -2.7252197265625, -2.59619140625, -2.4671630859375, -2.338134765625, -2.2091064453125, -2.080078125, -1.9510498046875, -1.822021484375, -1.6929931640625, -1.56396484375, -1.4349365234375, -1.305908203125, -1.1768798828125, -1.0478515625, -0.9188232421875, -0.789794921875, -0.6607666015625, -0.53173828125, -0.4027099609375, -0.273681640625, -0.1446533203125, -0.015625, 0.1134033203125, 0.242431640625, 0.3714599609375, 0.50048828125, 0.6295166015625, 0.758544921875, 0.8875732421875, 1.0166015625, 1.1456298828125, 1.274658203125, 1.4036865234375, 1.53271484375, 1.6617431640625, 1.790771484375, 1.9197998046875, 2.048828125, 2.1778564453125, 2.306884765625, 2.4359130859375, 2.56494140625, 2.6939697265625, 2.822998046875, 2.9520263671875, 3.0810546875, 3.2100830078125, 3.339111328125, 3.4681396484375, 3.59716796875, 3.7261962890625, 3.855224609375, 3.9842529296875, 4.11328125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 21.0, 29.0, 42.0, 117.0, 239.0, 248.0, 161.0, 67.0, 35.0, 17.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.626405715942383, -21.111913681030273, -19.59741973876953, -18.082927703857422, -16.568435668945312, -15.05394172668457, -13.539449691772461, -12.024956703186035, -10.51046371459961, -8.995970726013184, -7.481478214263916, -5.966985702514648, -4.452492713928223, -2.937999725341797, -1.4235076904296875, 0.09098529815673828, 1.605478286743164, 3.1199710369110107, 4.634463787078857, 6.148956298828125, 7.663449287414551, 9.177942276000977, 10.692434310913086, 12.206927299499512, 13.721420288085938, 15.235913276672363, 16.75040626525879, 18.2648983001709, 19.77939224243164, 21.29388427734375, 22.80837631225586, 24.32286834716797, 25.837364196777344, 27.351856231689453, 28.866350173950195, 30.380842208862305, 31.895336151123047, 33.409828186035156, 34.924320220947266, 36.438812255859375, 37.95330810546875, 39.46780014038086, 40.98229217529297, 42.496788024902344, 44.01128005981445, 45.52577209472656, 47.04026412963867, 48.55475616455078, 50.06924819946289, 51.583740234375, 53.09823226928711, 54.61272430419922, 56.127220153808594, 57.6417121887207, 59.15620422363281, 60.67069625854492, 62.18518829345703, 63.69968032836914, 65.21417236328125, 66.72866821289062, 68.24315643310547, 69.75765228271484, 71.27214050292969, 72.78663635253906, 74.30113220214844]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 5.0, 9.0, 8.0, 17.0, 24.0, 20.0, 34.0, 28.0, 39.0, 40.0, 47.0, 35.0, 73.0, 56.0, 59.0, 62.0, 61.0, 54.0, 52.0, 36.0, 36.0, 29.0, 38.0, 39.0, 28.0, 20.0, 12.0, 7.0, 6.0, 8.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.083532333374023, -14.552916526794434, -14.02230167388916, -13.49168586730957, -12.961071014404297, -12.430455207824707, -11.899839401245117, -11.369224548339844, -10.838608741760254, -10.307992935180664, -9.77737808227539, -9.2467622756958, -8.716146469116211, -8.185531616210938, -7.654915809631348, -7.124300479888916, -6.593685150146484, -6.063069820404053, -5.532454490661621, -5.001838684082031, -4.4712233543396, -3.940608024597168, -3.4099924564361572, -2.8793768882751465, -2.348761558532715, -1.8181461095809937, -1.2875306606292725, -0.7569152116775513, -0.22629976272583008, 0.30431556701660156, 0.8349311351776123, 1.365546703338623, 1.8961601257324219, 2.4267754554748535, 2.9573910236358643, 3.488006591796875, 4.018621921539307, 4.549237251281738, 5.079853057861328, 5.61046838760376, 6.141083717346191, 6.671699047088623, 7.202314376831055, 7.7329301834106445, 8.263545989990234, 8.794160842895508, 9.324776649475098, 9.855392456054688, 10.386007308959961, 10.91662311553955, 11.447237968444824, 11.977853775024414, 12.508468627929688, 13.039084434509277, 13.569700241088867, 14.10031509399414, 14.63093090057373, 15.16154670715332, 15.692161560058594, 16.222776412963867, 16.753393173217773, 17.284008026123047, 17.81462287902832, 18.345239639282227, 18.8758544921875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 7.0, 11.0, 9.0, 10.0, 18.0, 21.0, 35.0, 49.0, 73.0, 109.0, 173.0, 263.0, 420.0, 921.0, 2206.0, 9065.0, 122990.0, 860651.0, 42795.0, 5305.0, 1625.0, 724.0, 421.0, 227.0, 141.0, 79.0, 65.0, 51.0, 24.0, 12.0, 25.0, 8.0, 4.0, 7.0, 3.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.71875, -54.9091796875, -53.099609375, -51.2900390625, -49.48046875, -47.6708984375, -45.861328125, -44.0517578125, -42.2421875, -40.4326171875, -38.623046875, -36.8134765625, -35.00390625, -33.1943359375, -31.384765625, -29.5751953125, -27.765625, -25.9560546875, -24.146484375, -22.3369140625, -20.52734375, -18.7177734375, -16.908203125, -15.0986328125, -13.2890625, -11.4794921875, -9.669921875, -7.8603515625, -6.05078125, -4.2412109375, -2.431640625, -0.6220703125, 1.1875, 2.9970703125, 4.806640625, 6.6162109375, 8.42578125, 10.2353515625, 12.044921875, 13.8544921875, 15.6640625, 17.4736328125, 19.283203125, 21.0927734375, 22.90234375, 24.7119140625, 26.521484375, 28.3310546875, 30.140625, 31.9501953125, 33.759765625, 35.5693359375, 37.37890625, 39.1884765625, 40.998046875, 42.8076171875, 44.6171875, 46.4267578125, 48.236328125, 50.0458984375, 51.85546875, 53.6650390625, 55.474609375, 57.2841796875, 59.09375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 9.0, 18.0, 39.0, 79.0, 162.0, 259.0, 226.0, 104.0, 54.0, 18.0, 7.0, 4.0, 6.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5078125, -4.34478759765625, -4.1817626953125, -4.01873779296875, -3.855712890625, -3.69268798828125, -3.5296630859375, -3.36663818359375, -3.20361328125, -3.04058837890625, -2.8775634765625, -2.71453857421875, -2.551513671875, -2.38848876953125, -2.2254638671875, -2.06243896484375, -1.8994140625, -1.73638916015625, -1.5733642578125, -1.41033935546875, -1.247314453125, -1.08428955078125, -0.9212646484375, -0.75823974609375, -0.59521484375, -0.43218994140625, -0.2691650390625, -0.10614013671875, 0.056884765625, 0.21990966796875, 0.3829345703125, 0.54595947265625, 0.708984375, 0.87200927734375, 1.0350341796875, 1.19805908203125, 1.361083984375, 1.52410888671875, 1.6871337890625, 1.85015869140625, 2.01318359375, 2.17620849609375, 2.3392333984375, 2.50225830078125, 2.665283203125, 2.82830810546875, 2.9913330078125, 3.15435791015625, 3.3173828125, 3.48040771484375, 3.6434326171875, 3.80645751953125, 3.969482421875, 4.13250732421875, 4.2955322265625, 4.45855712890625, 4.62158203125, 4.78460693359375, 4.9476318359375, 5.11065673828125, 5.273681640625, 5.43670654296875, 5.5997314453125, 5.76275634765625, 5.92578125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 10.0, 18.0, 19.0, 25.0, 31.0, 59.0, 56.0, 102.0, 148.0, 180.0, 239.0, 366.0, 525.0, 892.0, 1685.0, 3534.0, 8712.0, 28329.0, 120477.0, 473943.0, 313099.0, 66348.0, 17475.0, 5960.0, 2660.0, 1310.0, 775.0, 496.0, 294.0, 214.0, 145.0, 108.0, 90.0, 47.0, 31.0, 36.0, 27.0, 27.0, 12.0, 5.0, 4.0, 8.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-26.828125, -26.03466796875, -25.2412109375, -24.44775390625, -23.654296875, -22.86083984375, -22.0673828125, -21.27392578125, -20.48046875, -19.68701171875, -18.8935546875, -18.10009765625, -17.306640625, -16.51318359375, -15.7197265625, -14.92626953125, -14.1328125, -13.33935546875, -12.5458984375, -11.75244140625, -10.958984375, -10.16552734375, -9.3720703125, -8.57861328125, -7.78515625, -6.99169921875, -6.1982421875, -5.40478515625, -4.611328125, -3.81787109375, -3.0244140625, -2.23095703125, -1.4375, -0.64404296875, 0.1494140625, 0.94287109375, 1.736328125, 2.52978515625, 3.3232421875, 4.11669921875, 4.91015625, 5.70361328125, 6.4970703125, 7.29052734375, 8.083984375, 8.87744140625, 9.6708984375, 10.46435546875, 11.2578125, 12.05126953125, 12.8447265625, 13.63818359375, 14.431640625, 15.22509765625, 16.0185546875, 16.81201171875, 17.60546875, 18.39892578125, 19.1923828125, 19.98583984375, 20.779296875, 21.57275390625, 22.3662109375, 23.15966796875, 23.953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 6.0, 8.0, 7.0, 4.0, 7.0, 9.0, 13.0, 13.0, 18.0, 18.0, 22.0, 36.0, 39.0, 35.0, 38.0, 34.0, 30.0, 38.0, 55.0, 48.0, 44.0, 49.0, 46.0, 42.0, 39.0, 36.0, 38.0, 40.0, 24.0, 25.0, 21.0, 18.0, 15.0, 18.0, 16.0, 4.0, 7.0, 4.0, 3.0, 8.0, 4.0, 2.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.953125, -9.62744140625, -9.3017578125, -8.97607421875, -8.650390625, -8.32470703125, -7.9990234375, -7.67333984375, -7.34765625, -7.02197265625, -6.6962890625, -6.37060546875, -6.044921875, -5.71923828125, -5.3935546875, -5.06787109375, -4.7421875, -4.41650390625, -4.0908203125, -3.76513671875, -3.439453125, -3.11376953125, -2.7880859375, -2.46240234375, -2.13671875, -1.81103515625, -1.4853515625, -1.15966796875, -0.833984375, -0.50830078125, -0.1826171875, 0.14306640625, 0.46875, 0.79443359375, 1.1201171875, 1.44580078125, 1.771484375, 2.09716796875, 2.4228515625, 2.74853515625, 3.07421875, 3.39990234375, 3.7255859375, 4.05126953125, 4.376953125, 4.70263671875, 5.0283203125, 5.35400390625, 5.6796875, 6.00537109375, 6.3310546875, 6.65673828125, 6.982421875, 7.30810546875, 7.6337890625, 7.95947265625, 8.28515625, 8.61083984375, 8.9365234375, 9.26220703125, 9.587890625, 9.91357421875, 10.2392578125, 10.56494140625, 10.890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 4.0, 7.0, 7.0, 11.0, 12.0, 18.0, 33.0, 39.0, 97.0, 140.0, 271.0, 528.0, 1483.0, 5554.0, 34603.0, 533011.0, 436162.0, 29089.0, 4995.0, 1388.0, 528.0, 230.0, 145.0, 72.0, 40.0, 28.0, 18.0, 11.0, 9.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-46.1875, -45.001953125, -43.81640625, -42.630859375, -41.4453125, -40.259765625, -39.07421875, -37.888671875, -36.703125, -35.517578125, -34.33203125, -33.146484375, -31.9609375, -30.775390625, -29.58984375, -28.404296875, -27.21875, -26.033203125, -24.84765625, -23.662109375, -22.4765625, -21.291015625, -20.10546875, -18.919921875, -17.734375, -16.548828125, -15.36328125, -14.177734375, -12.9921875, -11.806640625, -10.62109375, -9.435546875, -8.25, -7.064453125, -5.87890625, -4.693359375, -3.5078125, -2.322265625, -1.13671875, 0.048828125, 1.234375, 2.419921875, 3.60546875, 4.791015625, 5.9765625, 7.162109375, 8.34765625, 9.533203125, 10.71875, 11.904296875, 13.08984375, 14.275390625, 15.4609375, 16.646484375, 17.83203125, 19.017578125, 20.203125, 21.388671875, 22.57421875, 23.759765625, 24.9453125, 26.130859375, 27.31640625, 28.501953125, 29.6875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 13.0, 12.0, 18.0, 19.0, 25.0, 31.0, 72.0, 66.0, 79.0, 104.0, 104.0, 91.0, 81.0, 63.0, 48.0, 41.0, 35.0, 28.0, 17.0, 12.0, 5.0, 10.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001438140869140625, -0.0013911277055740356, -0.0013441145420074463, -0.001297101378440857, -0.0012500882148742676, -0.0012030750513076782, -0.0011560618877410889, -0.0011090487241744995, -0.0010620355606079102, -0.0010150223970413208, -0.0009680092334747314, -0.0009209960699081421, -0.0008739829063415527, -0.0008269697427749634, -0.000779956579208374, -0.0007329434156417847, -0.0006859302520751953, -0.000638917088508606, -0.0005919039249420166, -0.0005448907613754272, -0.0004978775978088379, -0.00045086443424224854, -0.0004038512706756592, -0.0003568381071090698, -0.00030982494354248047, -0.0002628117799758911, -0.00021579861640930176, -0.0001687854528427124, -0.00012177228927612305, -7.475912570953369e-05, -2.7745962142944336e-05, 1.926720142364502e-05, 6.628036499023438e-05, 0.00011329352855682373, 0.00016030669212341309, 0.00020731985569000244, 0.0002543330192565918, 0.00030134618282318115, 0.0003483593463897705, 0.00039537250995635986, 0.0004423856735229492, 0.0004893988370895386, 0.0005364120006561279, 0.0005834251642227173, 0.0006304383277893066, 0.000677451491355896, 0.0007244646549224854, 0.0007714778184890747, 0.0008184909820556641, 0.0008655041456222534, 0.0009125173091888428, 0.0009595304727554321, 0.0010065436363220215, 0.0010535567998886108, 0.0011005699634552002, 0.0011475831270217896, 0.001194596290588379, 0.0012416094541549683, 0.0012886226177215576, 0.001335635781288147, 0.0013826489448547363, 0.0014296621084213257, 0.001476675271987915, 0.0015236884355545044, 0.0015707015991210938]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 10.0, 11.0, 11.0, 25.0, 38.0, 70.0, 101.0, 148.0, 243.0, 536.0, 1151.0, 3475.0, 15037.0, 143416.0, 786444.0, 82500.0, 10656.0, 2676.0, 945.0, 470.0, 254.0, 118.0, 69.0, 38.0, 39.0, 16.0, 18.0, 12.0, 4.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.09375, -31.96826171875, -30.8427734375, -29.71728515625, -28.591796875, -27.46630859375, -26.3408203125, -25.21533203125, -24.08984375, -22.96435546875, -21.8388671875, -20.71337890625, -19.587890625, -18.46240234375, -17.3369140625, -16.21142578125, -15.0859375, -13.96044921875, -12.8349609375, -11.70947265625, -10.583984375, -9.45849609375, -8.3330078125, -7.20751953125, -6.08203125, -4.95654296875, -3.8310546875, -2.70556640625, -1.580078125, -0.45458984375, 0.6708984375, 1.79638671875, 2.921875, 4.04736328125, 5.1728515625, 6.29833984375, 7.423828125, 8.54931640625, 9.6748046875, 10.80029296875, 11.92578125, 13.05126953125, 14.1767578125, 15.30224609375, 16.427734375, 17.55322265625, 18.6787109375, 19.80419921875, 20.9296875, 22.05517578125, 23.1806640625, 24.30615234375, 25.431640625, 26.55712890625, 27.6826171875, 28.80810546875, 29.93359375, 31.05908203125, 32.1845703125, 33.31005859375, 34.435546875, 35.56103515625, 36.6865234375, 37.81201171875, 38.9375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 7.0, 3.0, 7.0, 9.0, 20.0, 25.0, 42.0, 55.0, 75.0, 105.0, 123.0, 138.0, 105.0, 83.0, 60.0, 45.0, 25.0, 14.0, 15.0, 13.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-21.078125, -20.578369140625, -20.07861328125, -19.578857421875, -19.0791015625, -18.579345703125, -18.07958984375, -17.579833984375, -17.080078125, -16.580322265625, -16.08056640625, -15.580810546875, -15.0810546875, -14.581298828125, -14.08154296875, -13.581787109375, -13.08203125, -12.582275390625, -12.08251953125, -11.582763671875, -11.0830078125, -10.583251953125, -10.08349609375, -9.583740234375, -9.083984375, -8.584228515625, -8.08447265625, -7.584716796875, -7.0849609375, -6.585205078125, -6.08544921875, -5.585693359375, -5.0859375, -4.586181640625, -4.08642578125, -3.586669921875, -3.0869140625, -2.587158203125, -2.08740234375, -1.587646484375, -1.087890625, -0.588134765625, -0.08837890625, 0.411376953125, 0.9111328125, 1.410888671875, 1.91064453125, 2.410400390625, 2.91015625, 3.409912109375, 3.90966796875, 4.409423828125, 4.9091796875, 5.408935546875, 5.90869140625, 6.408447265625, 6.908203125, 7.407958984375, 7.90771484375, 8.407470703125, 8.9072265625, 9.406982421875, 9.90673828125, 10.406494140625, 10.90625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 13.0, 24.0, 80.0, 210.0, 313.0, 220.0, 68.0, 34.0, 18.0, 8.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-366.717529296875, -357.88861083984375, -349.0596923828125, -340.23077392578125, -331.40185546875, -322.57293701171875, -313.7440185546875, -304.91510009765625, -296.086181640625, -287.25726318359375, -278.4283447265625, -269.59942626953125, -260.7705078125, -251.94158935546875, -243.11265563964844, -234.2837371826172, -225.45480346679688, -216.62588500976562, -207.79696655273438, -198.96804809570312, -190.13912963867188, -181.31021118164062, -172.4812774658203, -163.65235900878906, -154.8234405517578, -145.99452209472656, -137.1656036376953, -128.33668518066406, -119.50775909423828, -110.67884063720703, -101.84991455078125, -93.02099609375, -84.19204711914062, -75.36312866210938, -66.53421020507812, -57.705284118652344, -48.876365661621094, -40.047447204589844, -31.218524932861328, -22.389602661132812, -13.560684204101562, -4.73176383972168, 4.097156524658203, 12.926076889038086, 21.75499725341797, 30.58391571044922, 39.412837982177734, 48.24176025390625, 57.0706787109375, 65.89959716796875, 74.728515625, 83.55744171142578, 92.38636016845703, 101.21527862548828, 110.04420471191406, 118.87312316894531, 127.70204162597656, 136.5309600830078, 145.35987854003906, 154.1887969970703, 163.01773071289062, 171.84664916992188, 180.67556762695312, 189.50448608398438, 198.33340454101562]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 5.0, 3.0, 12.0, 25.0, 36.0, 26.0, 31.0, 32.0, 50.0, 53.0, 66.0, 77.0, 54.0, 85.0, 60.0, 73.0, 57.0, 54.0, 37.0, 34.0, 36.0, 18.0, 26.0, 22.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-97.95089721679688, -94.25940704345703, -90.56790924072266, -86.87641906738281, -83.18492126464844, -79.4934310913086, -75.80193328857422, -72.11044311523438, -68.4189453125, -64.72745513916016, -61.03595733642578, -57.34446334838867, -53.65296936035156, -49.96147918701172, -46.269981384277344, -42.5784912109375, -38.88699722290039, -35.19550323486328, -31.504009246826172, -27.812515258789062, -24.121021270751953, -20.429529190063477, -16.738035202026367, -13.046541213989258, -9.355047225952148, -5.663553237915039, -1.972059726715088, 1.7194337844848633, 5.410927772521973, 9.102420806884766, 12.793914794921875, 16.485408782958984, 20.176902770996094, 23.868396759033203, 27.559890747070312, 31.251384735107422, 34.94287872314453, 38.634368896484375, 42.32586669921875, 46.017356872558594, 49.70885467529297, 53.40034866333008, 57.09184265136719, 60.7833366394043, 64.4748306274414, 68.16632080078125, 71.85781860351562, 75.54930877685547, 79.24079895019531, 82.93228912353516, 86.62378692626953, 90.31527709960938, 94.00677490234375, 97.6982650756836, 101.38976287841797, 105.08125305175781, 108.77275085449219, 112.46424102783203, 116.1557388305664, 119.84722900390625, 123.53872680664062, 127.23021697998047, 130.9217071533203, 134.6132049560547, 138.30470275878906]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 9.0, 16.0, 26.0, 52.0, 161.0, 458.0, 2363.0, 4105409.0, 83843.0, 1330.0, 348.0, 145.0, 55.0, 25.0, 17.0, 10.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-215.75, -207.71875, -199.6875, -191.65625, -183.625, -175.59375, -167.5625, -159.53125, -151.5, -143.46875, -135.4375, -127.40625, -119.375, -111.34375, -103.3125, -95.28125, -87.25, -79.21875, -71.1875, -63.15625, -55.125, -47.09375, -39.0625, -31.03125, -23.0, -14.96875, -6.9375, 1.09375, 9.125, 17.15625, 25.1875, 33.21875, 41.25, 49.28125, 57.3125, 65.34375, 73.375, 81.40625, 89.4375, 97.46875, 105.5, 113.53125, 121.5625, 129.59375, 137.625, 145.65625, 153.6875, 161.71875, 169.75, 177.78125, 185.8125, 193.84375, 201.875, 209.90625, 217.9375, 225.96875, 234.0, 242.03125, 250.0625, 258.09375, 266.125, 274.15625, 282.1875, 290.21875, 298.25]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 12.0, 19.0, 44.0, 83.0, 121.0, 158.0, 197.0, 145.0, 101.0, 55.0, 23.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.75189208984375, -4.5701904296875, -4.38848876953125, -4.206787109375, -4.02508544921875, -3.8433837890625, -3.66168212890625, -3.47998046875, -3.29827880859375, -3.1165771484375, -2.93487548828125, -2.753173828125, -2.57147216796875, -2.3897705078125, -2.20806884765625, -2.0263671875, -1.84466552734375, -1.6629638671875, -1.48126220703125, -1.299560546875, -1.11785888671875, -0.9361572265625, -0.75445556640625, -0.57275390625, -0.39105224609375, -0.2093505859375, -0.02764892578125, 0.154052734375, 0.33575439453125, 0.5174560546875, 0.69915771484375, 0.880859375, 1.06256103515625, 1.2442626953125, 1.42596435546875, 1.607666015625, 1.78936767578125, 1.9710693359375, 2.15277099609375, 2.33447265625, 2.51617431640625, 2.6978759765625, 2.87957763671875, 3.061279296875, 3.24298095703125, 3.4246826171875, 3.60638427734375, 3.7880859375, 3.96978759765625, 4.1514892578125, 4.33319091796875, 4.514892578125, 4.69659423828125, 4.8782958984375, 5.05999755859375, 5.24169921875, 5.42340087890625, 5.6051025390625, 5.78680419921875, 5.968505859375, 6.15020751953125, 6.3319091796875, 6.51361083984375, 6.6953125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 15.0, 12.0, 11.0, 24.0, 41.0, 66.0, 114.0, 220.0, 525.0, 1688.0, 6724.0, 37243.0, 722622.0, 3349474.0, 61896.0, 9717.0, 2402.0, 747.0, 311.0, 121.0, 86.0, 40.0, 28.0, 38.0, 22.0, 22.0, 8.0, 9.0, 6.0, 7.0, 8.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.28125, -38.89794921875, -37.5146484375, -36.13134765625, -34.748046875, -33.36474609375, -31.9814453125, -30.59814453125, -29.21484375, -27.83154296875, -26.4482421875, -25.06494140625, -23.681640625, -22.29833984375, -20.9150390625, -19.53173828125, -18.1484375, -16.76513671875, -15.3818359375, -13.99853515625, -12.615234375, -11.23193359375, -9.8486328125, -8.46533203125, -7.08203125, -5.69873046875, -4.3154296875, -2.93212890625, -1.548828125, -0.16552734375, 1.2177734375, 2.60107421875, 3.984375, 5.36767578125, 6.7509765625, 8.13427734375, 9.517578125, 10.90087890625, 12.2841796875, 13.66748046875, 15.05078125, 16.43408203125, 17.8173828125, 19.20068359375, 20.583984375, 21.96728515625, 23.3505859375, 24.73388671875, 26.1171875, 27.50048828125, 28.8837890625, 30.26708984375, 31.650390625, 33.03369140625, 34.4169921875, 35.80029296875, 37.18359375, 38.56689453125, 39.9501953125, 41.33349609375, 42.716796875, 44.10009765625, 45.4833984375, 46.86669921875, 48.25]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 1.0, 4.0, 11.0, 6.0, 15.0, 22.0, 21.0, 20.0, 56.0, 73.0, 107.0, 193.0, 477.0, 1848.0, 598.0, 252.0, 134.0, 67.0, 40.0, 39.0, 27.0, 15.0, 10.0, 5.0, 9.0, 1.0, 6.0, 7.0, 7.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8671875, -4.69110107421875, -4.5150146484375, -4.33892822265625, -4.162841796875, -3.98675537109375, -3.8106689453125, -3.63458251953125, -3.45849609375, -3.28240966796875, -3.1063232421875, -2.93023681640625, -2.754150390625, -2.57806396484375, -2.4019775390625, -2.22589111328125, -2.0498046875, -1.87371826171875, -1.6976318359375, -1.52154541015625, -1.345458984375, -1.16937255859375, -0.9932861328125, -0.81719970703125, -0.64111328125, -0.46502685546875, -0.2889404296875, -0.11285400390625, 0.063232421875, 0.23931884765625, 0.4154052734375, 0.59149169921875, 0.767578125, 0.94366455078125, 1.1197509765625, 1.29583740234375, 1.471923828125, 1.64801025390625, 1.8240966796875, 2.00018310546875, 2.17626953125, 2.35235595703125, 2.5284423828125, 2.70452880859375, 2.880615234375, 3.05670166015625, 3.2327880859375, 3.40887451171875, 3.5849609375, 3.76104736328125, 3.9371337890625, 4.11322021484375, 4.289306640625, 4.46539306640625, 4.6414794921875, 4.81756591796875, 4.99365234375, 5.16973876953125, 5.3458251953125, 5.52191162109375, 5.697998046875, 5.87408447265625, 6.0501708984375, 6.22625732421875, 6.40234375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 7.0, 32.0, 81.0, 204.0, 300.0, 193.0, 109.0, 37.0, 16.0, 9.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.83592987060547, -79.59486389160156, -77.35379028320312, -75.11272430419922, -72.87165069580078, -70.63058471679688, -68.38951110839844, -66.14844512939453, -63.907379150390625, -61.66630935668945, -59.42523956298828, -57.184173583984375, -54.9431037902832, -52.70203399658203, -50.46096420288086, -48.21989440917969, -45.978824615478516, -43.737754821777344, -41.49668502807617, -39.255615234375, -37.014549255371094, -34.77347946166992, -32.53240966796875, -30.291339874267578, -28.05027198791504, -25.809202194213867, -23.568134307861328, -21.327064514160156, -19.085994720458984, -16.844926834106445, -14.603857040405273, -12.362788200378418, -10.121723175048828, -7.880654335021973, -5.639585018157959, -3.3985157012939453, -1.1574468612670898, 1.0836219787597656, 3.3246917724609375, 5.565760612487793, 7.806829452514648, 10.047898292541504, 12.28896713256836, 14.530036926269531, 16.771106719970703, 19.012174606323242, 21.253244400024414, 23.494312286376953, 25.735382080078125, 27.976451873779297, 30.217519760131836, 32.458587646484375, 34.69965744018555, 36.94072723388672, 39.18179702758789, 41.42286682128906, 43.66393280029297, 45.90500259399414, 48.14607238769531, 50.38713836669922, 52.62820816040039, 54.86927795410156, 57.110347747802734, 59.351417541503906, 61.59248733520508]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 5.0, 9.0, 16.0, 12.0, 14.0, 18.0, 20.0, 24.0, 37.0, 36.0, 31.0, 40.0, 36.0, 39.0, 51.0, 39.0, 52.0, 44.0, 48.0, 44.0, 48.0, 44.0, 34.0, 33.0, 28.0, 37.0, 27.0, 31.0, 21.0, 17.0, 11.0, 10.0, 7.0, 3.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-18.93552017211914, -18.376623153686523, -17.817724227905273, -17.258827209472656, -16.69993019104004, -16.141033172607422, -15.582134246826172, -15.023237228393555, -14.464340209960938, -13.905442237854004, -13.346545219421387, -12.787647247314453, -12.228750228881836, -11.669852256774902, -11.110954284667969, -10.552057266235352, -9.993159294128418, -9.434261322021484, -8.875364303588867, -8.316466331481934, -7.757569313049316, -7.198671340942383, -6.639773845672607, -6.080876350402832, -5.521978855133057, -4.963081359863281, -4.404183864593506, -3.8452861309051514, -3.286388635635376, -2.7274911403656006, -2.168593406677246, -1.6096959114074707, -1.0507984161376953, -0.49190086126327515, 0.06699669361114502, 0.62589430809021, 1.1847918033599854, 1.7436892986297607, 2.3025870323181152, 2.8614845275878906, 3.420382022857666, 3.9792795181274414, 4.538177013397217, 5.097074508666992, 5.655972480773926, 6.214869499206543, 6.773767471313477, 7.332664966583252, 7.891562461853027, 8.450460433959961, 9.009357452392578, 9.568255424499512, 10.127152442932129, 10.686050415039062, 11.24494743347168, 11.803845405578613, 12.362743377685547, 12.92164134979248, 13.480538368225098, 14.039436340332031, 14.598333358764648, 15.157231330871582, 15.716129302978516, 16.275026321411133, 16.83392333984375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 0.0, 7.0, 4.0, 9.0, 9.0, 9.0, 12.0, 16.0, 24.0, 42.0, 52.0, 75.0, 100.0, 129.0, 204.0, 305.0, 519.0, 948.0, 2078.0, 5963.0, 32558.0, 379213.0, 561602.0, 51276.0, 8138.0, 2495.0, 1076.0, 587.0, 354.0, 222.0, 151.0, 104.0, 72.0, 52.0, 41.0, 27.0, 24.0, 13.0, 11.0, 11.0, 5.0, 4.0, 8.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-42.78125, -41.52685546875, -40.2724609375, -39.01806640625, -37.763671875, -36.50927734375, -35.2548828125, -34.00048828125, -32.74609375, -31.49169921875, -30.2373046875, -28.98291015625, -27.728515625, -26.47412109375, -25.2197265625, -23.96533203125, -22.7109375, -21.45654296875, -20.2021484375, -18.94775390625, -17.693359375, -16.43896484375, -15.1845703125, -13.93017578125, -12.67578125, -11.42138671875, -10.1669921875, -8.91259765625, -7.658203125, -6.40380859375, -5.1494140625, -3.89501953125, -2.640625, -1.38623046875, -0.1318359375, 1.12255859375, 2.376953125, 3.63134765625, 4.8857421875, 6.14013671875, 7.39453125, 8.64892578125, 9.9033203125, 11.15771484375, 12.412109375, 13.66650390625, 14.9208984375, 16.17529296875, 17.4296875, 18.68408203125, 19.9384765625, 21.19287109375, 22.447265625, 23.70166015625, 24.9560546875, 26.21044921875, 27.46484375, 28.71923828125, 29.9736328125, 31.22802734375, 32.482421875, 33.73681640625, 34.9912109375, 36.24560546875, 37.5]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 4.0, 11.0, 22.0, 39.0, 67.0, 113.0, 123.0, 188.0, 169.0, 123.0, 73.0, 31.0, 15.0, 12.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.90875244140625, -4.7237548828125, -4.53875732421875, -4.353759765625, -4.16876220703125, -3.9837646484375, -3.79876708984375, -3.61376953125, -3.42877197265625, -3.2437744140625, -3.05877685546875, -2.873779296875, -2.68878173828125, -2.5037841796875, -2.31878662109375, -2.1337890625, -1.94879150390625, -1.7637939453125, -1.57879638671875, -1.393798828125, -1.20880126953125, -1.0238037109375, -0.83880615234375, -0.65380859375, -0.46881103515625, -0.2838134765625, -0.09881591796875, 0.086181640625, 0.27117919921875, 0.4561767578125, 0.64117431640625, 0.826171875, 1.01116943359375, 1.1961669921875, 1.38116455078125, 1.566162109375, 1.75115966796875, 1.9361572265625, 2.12115478515625, 2.30615234375, 2.49114990234375, 2.6761474609375, 2.86114501953125, 3.046142578125, 3.23114013671875, 3.4161376953125, 3.60113525390625, 3.7861328125, 3.97113037109375, 4.1561279296875, 4.34112548828125, 4.526123046875, 4.71112060546875, 4.8961181640625, 5.08111572265625, 5.26611328125, 5.45111083984375, 5.6361083984375, 5.82110595703125, 6.006103515625, 6.19110107421875, 6.3760986328125, 6.56109619140625, 6.74609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 4.0, 3.0, 13.0, 8.0, 10.0, 16.0, 34.0, 33.0, 49.0, 73.0, 92.0, 125.0, 166.0, 256.0, 409.0, 700.0, 1155.0, 2421.0, 6074.0, 20643.0, 99771.0, 501075.0, 335236.0, 57906.0, 13482.0, 4366.0, 1847.0, 945.0, 541.0, 369.0, 208.0, 155.0, 107.0, 63.0, 59.0, 39.0, 34.0, 23.0, 7.0, 6.0, 13.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-34.8125, -33.892578125, -32.97265625, -32.052734375, -31.1328125, -30.212890625, -29.29296875, -28.373046875, -27.453125, -26.533203125, -25.61328125, -24.693359375, -23.7734375, -22.853515625, -21.93359375, -21.013671875, -20.09375, -19.173828125, -18.25390625, -17.333984375, -16.4140625, -15.494140625, -14.57421875, -13.654296875, -12.734375, -11.814453125, -10.89453125, -9.974609375, -9.0546875, -8.134765625, -7.21484375, -6.294921875, -5.375, -4.455078125, -3.53515625, -2.615234375, -1.6953125, -0.775390625, 0.14453125, 1.064453125, 1.984375, 2.904296875, 3.82421875, 4.744140625, 5.6640625, 6.583984375, 7.50390625, 8.423828125, 9.34375, 10.263671875, 11.18359375, 12.103515625, 13.0234375, 13.943359375, 14.86328125, 15.783203125, 16.703125, 17.623046875, 18.54296875, 19.462890625, 20.3828125, 21.302734375, 22.22265625, 23.142578125, 24.0625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 9.0, 5.0, 3.0, 6.0, 11.0, 8.0, 15.0, 26.0, 30.0, 27.0, 34.0, 47.0, 48.0, 62.0, 59.0, 61.0, 53.0, 57.0, 60.0, 43.0, 44.0, 47.0, 42.0, 30.0, 32.0, 34.0, 22.0, 25.0, 18.0, 15.0, 11.0, 8.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.700927734375, -17.16748046875, -16.634033203125, -16.1005859375, -15.567138671875, -15.03369140625, -14.500244140625, -13.966796875, -13.433349609375, -12.89990234375, -12.366455078125, -11.8330078125, -11.299560546875, -10.76611328125, -10.232666015625, -9.69921875, -9.165771484375, -8.63232421875, -8.098876953125, -7.5654296875, -7.031982421875, -6.49853515625, -5.965087890625, -5.431640625, -4.898193359375, -4.36474609375, -3.831298828125, -3.2978515625, -2.764404296875, -2.23095703125, -1.697509765625, -1.1640625, -0.630615234375, -0.09716796875, 0.436279296875, 0.9697265625, 1.503173828125, 2.03662109375, 2.570068359375, 3.103515625, 3.636962890625, 4.17041015625, 4.703857421875, 5.2373046875, 5.770751953125, 6.30419921875, 6.837646484375, 7.37109375, 7.904541015625, 8.43798828125, 8.971435546875, 9.5048828125, 10.038330078125, 10.57177734375, 11.105224609375, 11.638671875, 12.172119140625, 12.70556640625, 13.239013671875, 13.7724609375, 14.305908203125, 14.83935546875, 15.372802734375, 15.90625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 7.0, 15.0, 10.0, 14.0, 20.0, 33.0, 32.0, 50.0, 65.0, 122.0, 181.0, 352.0, 730.0, 2070.0, 6783.0, 38530.0, 681622.0, 290337.0, 20339.0, 4429.0, 1456.0, 616.0, 286.0, 150.0, 82.0, 48.0, 42.0, 28.0, 27.0, 20.0, 12.0, 13.0, 9.0, 4.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0], "bins": [-51.0, -49.61572265625, -48.2314453125, -46.84716796875, -45.462890625, -44.07861328125, -42.6943359375, -41.31005859375, -39.92578125, -38.54150390625, -37.1572265625, -35.77294921875, -34.388671875, -33.00439453125, -31.6201171875, -30.23583984375, -28.8515625, -27.46728515625, -26.0830078125, -24.69873046875, -23.314453125, -21.93017578125, -20.5458984375, -19.16162109375, -17.77734375, -16.39306640625, -15.0087890625, -13.62451171875, -12.240234375, -10.85595703125, -9.4716796875, -8.08740234375, -6.703125, -5.31884765625, -3.9345703125, -2.55029296875, -1.166015625, 0.21826171875, 1.6025390625, 2.98681640625, 4.37109375, 5.75537109375, 7.1396484375, 8.52392578125, 9.908203125, 11.29248046875, 12.6767578125, 14.06103515625, 15.4453125, 16.82958984375, 18.2138671875, 19.59814453125, 20.982421875, 22.36669921875, 23.7509765625, 25.13525390625, 26.51953125, 27.90380859375, 29.2880859375, 30.67236328125, 32.056640625, 33.44091796875, 34.8251953125, 36.20947265625, 37.59375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 12.0, 11.0, 9.0, 29.0, 27.0, 46.0, 59.0, 90.0, 103.0, 142.0, 124.0, 96.0, 76.0, 54.0, 33.0, 25.0, 18.0, 15.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002017974853515625, -0.0019543468952178955, -0.001890718936920166, -0.0018270909786224365, -0.001763463020324707, -0.0016998350620269775, -0.001636207103729248, -0.0015725791454315186, -0.001508951187133789, -0.0014453232288360596, -0.00138169527053833, -0.0013180673122406006, -0.001254439353942871, -0.0011908113956451416, -0.0011271834373474121, -0.0010635554790496826, -0.0009999275207519531, -0.0009362995624542236, -0.0008726716041564941, -0.0008090436458587646, -0.0007454156875610352, -0.0006817877292633057, -0.0006181597709655762, -0.0005545318126678467, -0.0004909038543701172, -0.0004272758960723877, -0.0003636479377746582, -0.0003000199794769287, -0.00023639202117919922, -0.00017276406288146973, -0.00010913610458374023, -4.550814628601074e-05, 1.811981201171875e-05, 8.174777030944824e-05, 0.00014537572860717773, 0.00020900368690490723, 0.0002726316452026367, 0.0003362596035003662, 0.0003998875617980957, 0.0004635155200958252, 0.0005271434783935547, 0.0005907714366912842, 0.0006543993949890137, 0.0007180273532867432, 0.0007816553115844727, 0.0008452832698822021, 0.0009089112281799316, 0.0009725391864776611, 0.0010361671447753906, 0.0010997951030731201, 0.0011634230613708496, 0.001227051019668579, 0.0012906789779663086, 0.001354306936264038, 0.0014179348945617676, 0.001481562852859497, 0.0015451908111572266, 0.001608818769454956, 0.0016724467277526855, 0.001736074686050415, 0.0017997026443481445, 0.001863330602645874, 0.0019269585609436035, 0.001990586519241333, 0.0020542144775390625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 3.0, 12.0, 14.0, 16.0, 27.0, 24.0, 38.0, 45.0, 63.0, 111.0, 168.0, 290.0, 520.0, 1198.0, 3234.0, 11302.0, 62890.0, 664073.0, 265835.0, 28238.0, 6435.0, 2027.0, 864.0, 405.0, 237.0, 130.0, 91.0, 61.0, 49.0, 43.0, 20.0, 19.0, 10.0, 13.0, 9.0, 10.0, 6.0, 4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-35.0625, -33.9931640625, -32.923828125, -31.8544921875, -30.78515625, -29.7158203125, -28.646484375, -27.5771484375, -26.5078125, -25.4384765625, -24.369140625, -23.2998046875, -22.23046875, -21.1611328125, -20.091796875, -19.0224609375, -17.953125, -16.8837890625, -15.814453125, -14.7451171875, -13.67578125, -12.6064453125, -11.537109375, -10.4677734375, -9.3984375, -8.3291015625, -7.259765625, -6.1904296875, -5.12109375, -4.0517578125, -2.982421875, -1.9130859375, -0.84375, 0.2255859375, 1.294921875, 2.3642578125, 3.43359375, 4.5029296875, 5.572265625, 6.6416015625, 7.7109375, 8.7802734375, 9.849609375, 10.9189453125, 11.98828125, 13.0576171875, 14.126953125, 15.1962890625, 16.265625, 17.3349609375, 18.404296875, 19.4736328125, 20.54296875, 21.6123046875, 22.681640625, 23.7509765625, 24.8203125, 25.8896484375, 26.958984375, 28.0283203125, 29.09765625, 30.1669921875, 31.236328125, 32.3056640625, 33.375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 4.0, 4.0, 7.0, 8.0, 10.0, 11.0, 18.0, 17.0, 37.0, 34.0, 62.0, 66.0, 81.0, 129.0, 119.0, 92.0, 70.0, 43.0, 41.0, 28.0, 28.0, 23.0, 15.0, 10.0, 2.0, 7.0, 9.0, 6.0, 3.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.265625, -14.756103515625, -14.24658203125, -13.737060546875, -13.2275390625, -12.718017578125, -12.20849609375, -11.698974609375, -11.189453125, -10.679931640625, -10.17041015625, -9.660888671875, -9.1513671875, -8.641845703125, -8.13232421875, -7.622802734375, -7.11328125, -6.603759765625, -6.09423828125, -5.584716796875, -5.0751953125, -4.565673828125, -4.05615234375, -3.546630859375, -3.037109375, -2.527587890625, -2.01806640625, -1.508544921875, -0.9990234375, -0.489501953125, 0.02001953125, 0.529541015625, 1.0390625, 1.548583984375, 2.05810546875, 2.567626953125, 3.0771484375, 3.586669921875, 4.09619140625, 4.605712890625, 5.115234375, 5.624755859375, 6.13427734375, 6.643798828125, 7.1533203125, 7.662841796875, 8.17236328125, 8.681884765625, 9.19140625, 9.700927734375, 10.21044921875, 10.719970703125, 11.2294921875, 11.739013671875, 12.24853515625, 12.758056640625, 13.267578125, 13.777099609375, 14.28662109375, 14.796142578125, 15.3056640625, 15.815185546875, 16.32470703125, 16.834228515625, 17.34375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 14.0, 25.0, 63.0, 109.0, 186.0, 236.0, 162.0, 92.0, 49.0, 25.0, 16.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-268.768310546875, -260.9114074707031, -253.05450439453125, -245.1975860595703, -237.34068298339844, -229.48377990722656, -221.6268768310547, -213.76995849609375, -205.91305541992188, -198.05615234375, -190.19924926757812, -182.3423309326172, -174.4854278564453, -166.62852478027344, -158.77162170410156, -150.91470336914062, -143.05780029296875, -135.20089721679688, -127.34398651123047, -119.4870834350586, -111.63017272949219, -103.77326965332031, -95.91636657714844, -88.05945587158203, -80.20256042480469, -72.34565734863281, -64.4887466430664, -56.63184356689453, -48.774932861328125, -40.91802978515625, -33.06112289428711, -25.20421600341797, -17.347305297851562, -9.490398406982422, -1.6334924697875977, 6.223413467407227, 14.080320358276367, 21.937225341796875, 29.794132232666016, 37.651039123535156, 45.5079460144043, 53.36485290527344, 61.22175979614258, 69.07866668701172, 76.9355697631836, 84.79248046875, 92.64938354492188, 100.50628662109375, 108.36319732666016, 116.22010040283203, 124.07701110839844, 131.9339141845703, 139.7908172607422, 147.64773559570312, 155.504638671875, 163.36154174804688, 171.21844482421875, 179.07534790039062, 186.9322509765625, 194.78916931152344, 202.6460723876953, 210.5029754638672, 218.35987854003906, 226.216796875, 234.07369995117188]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 12.0, 19.0, 23.0, 29.0, 33.0, 41.0, 52.0, 44.0, 49.0, 54.0, 67.0, 68.0, 66.0, 50.0, 60.0, 60.0, 50.0, 48.0, 44.0, 27.0, 19.0, 24.0, 14.0, 9.0, 10.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.94523620605469, -98.15853118896484, -93.37183380126953, -88.58512878417969, -83.79843139648438, -79.01172637939453, -74.22502136230469, -69.43832397460938, -64.65161895751953, -59.86491775512695, -55.078216552734375, -50.29151153564453, -45.50481033325195, -40.718109130859375, -35.93140411376953, -31.144702911376953, -26.358001708984375, -21.571300506591797, -16.784597396850586, -11.997895240783691, -7.211193084716797, -2.4244918823242188, 2.362211227416992, 7.148914337158203, 11.935615539550781, 16.72231674194336, 21.50901985168457, 26.29572296142578, 31.08242416381836, 35.86912536621094, 40.65583038330078, 45.44253158569336, 50.229248046875, 55.01594924926758, 59.802650451660156, 64.58935546875, 69.37605285644531, 74.16275787353516, 78.949462890625, 83.73616027832031, 88.52286529541016, 93.3095703125, 98.09626770019531, 102.88297271728516, 107.669677734375, 112.45637512207031, 117.24308013916016, 122.02978515625, 126.81648254394531, 131.60317993164062, 136.389892578125, 141.1765899658203, 145.96328735351562, 150.75, 155.5366973876953, 160.32339477539062, 165.110107421875, 169.8968048095703, 174.6835174560547, 179.47021484375, 184.2569122314453, 189.04360961914062, 193.830322265625, 198.6170196533203, 203.40371704101562]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 5.0, 9.0, 19.0, 23.0, 44.0, 90.0, 132.0, 279.0, 665.0, 2764.0, 22931.0, 3994752.0, 162072.0, 7597.0, 1596.0, 622.0, 284.0, 163.0, 75.0, 56.0, 24.0, 26.0, 18.0, 11.0, 5.0, 3.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.1875, -68.712890625, -66.23828125, -63.763671875, -61.2890625, -58.814453125, -56.33984375, -53.865234375, -51.390625, -48.916015625, -46.44140625, -43.966796875, -41.4921875, -39.017578125, -36.54296875, -34.068359375, -31.59375, -29.119140625, -26.64453125, -24.169921875, -21.6953125, -19.220703125, -16.74609375, -14.271484375, -11.796875, -9.322265625, -6.84765625, -4.373046875, -1.8984375, 0.576171875, 3.05078125, 5.525390625, 8.0, 10.474609375, 12.94921875, 15.423828125, 17.8984375, 20.373046875, 22.84765625, 25.322265625, 27.796875, 30.271484375, 32.74609375, 35.220703125, 37.6953125, 40.169921875, 42.64453125, 45.119140625, 47.59375, 50.068359375, 52.54296875, 55.017578125, 57.4921875, 59.966796875, 62.44140625, 64.916015625, 67.390625, 69.865234375, 72.33984375, 74.814453125, 77.2890625, 79.763671875, 82.23828125, 84.712890625, 87.1875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 12.0, 19.0, 19.0, 21.0, 60.0, 74.0, 101.0, 128.0, 119.0, 119.0, 119.0, 77.0, 54.0, 23.0, 16.0, 14.0, 7.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.73046875, -5.52947998046875, -5.3284912109375, -5.12750244140625, -4.926513671875, -4.72552490234375, -4.5245361328125, -4.32354736328125, -4.12255859375, -3.92156982421875, -3.7205810546875, -3.51959228515625, -3.318603515625, -3.11761474609375, -2.9166259765625, -2.71563720703125, -2.5146484375, -2.31365966796875, -2.1126708984375, -1.91168212890625, -1.710693359375, -1.50970458984375, -1.3087158203125, -1.10772705078125, -0.90673828125, -0.70574951171875, -0.5047607421875, -0.30377197265625, -0.102783203125, 0.09820556640625, 0.2991943359375, 0.50018310546875, 0.701171875, 0.90216064453125, 1.1031494140625, 1.30413818359375, 1.505126953125, 1.70611572265625, 1.9071044921875, 2.10809326171875, 2.30908203125, 2.51007080078125, 2.7110595703125, 2.91204833984375, 3.113037109375, 3.31402587890625, 3.5150146484375, 3.71600341796875, 3.9169921875, 4.11798095703125, 4.3189697265625, 4.51995849609375, 4.720947265625, 4.92193603515625, 5.1229248046875, 5.32391357421875, 5.52490234375, 5.72589111328125, 5.9268798828125, 6.12786865234375, 6.328857421875, 6.52984619140625, 6.7308349609375, 6.93182373046875, 7.1328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 12.0, 9.0, 13.0, 23.0, 41.0, 63.0, 90.0, 180.0, 346.0, 642.0, 1374.0, 2893.0, 7876.0, 24333.0, 116753.0, 3111965.0, 829220.0, 70230.0, 16967.0, 5919.0, 2527.0, 1244.0, 619.0, 329.0, 225.0, 122.0, 85.0, 66.0, 38.0, 27.0, 20.0, 11.0, 6.0, 2.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.3125, -32.432861328125, -31.55322265625, -30.673583984375, -29.7939453125, -28.914306640625, -28.03466796875, -27.155029296875, -26.275390625, -25.395751953125, -24.51611328125, -23.636474609375, -22.7568359375, -21.877197265625, -20.99755859375, -20.117919921875, -19.23828125, -18.358642578125, -17.47900390625, -16.599365234375, -15.7197265625, -14.840087890625, -13.96044921875, -13.080810546875, -12.201171875, -11.321533203125, -10.44189453125, -9.562255859375, -8.6826171875, -7.802978515625, -6.92333984375, -6.043701171875, -5.1640625, -4.284423828125, -3.40478515625, -2.525146484375, -1.6455078125, -0.765869140625, 0.11376953125, 0.993408203125, 1.873046875, 2.752685546875, 3.63232421875, 4.511962890625, 5.3916015625, 6.271240234375, 7.15087890625, 8.030517578125, 8.91015625, 9.789794921875, 10.66943359375, 11.549072265625, 12.4287109375, 13.308349609375, 14.18798828125, 15.067626953125, 15.947265625, 16.826904296875, 17.70654296875, 18.586181640625, 19.4658203125, 20.345458984375, 21.22509765625, 22.104736328125, 22.984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 3.0, 6.0, 10.0, 21.0, 21.0, 16.0, 31.0, 50.0, 90.0, 144.0, 321.0, 1510.0, 1208.0, 289.0, 132.0, 76.0, 48.0, 25.0, 11.0, 13.0, 14.0, 6.0, 8.0, 4.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.843505859375, -5.57763671875, -5.311767578125, -5.0458984375, -4.780029296875, -4.51416015625, -4.248291015625, -3.982421875, -3.716552734375, -3.45068359375, -3.184814453125, -2.9189453125, -2.653076171875, -2.38720703125, -2.121337890625, -1.85546875, -1.589599609375, -1.32373046875, -1.057861328125, -0.7919921875, -0.526123046875, -0.26025390625, 0.005615234375, 0.271484375, 0.537353515625, 0.80322265625, 1.069091796875, 1.3349609375, 1.600830078125, 1.86669921875, 2.132568359375, 2.3984375, 2.664306640625, 2.93017578125, 3.196044921875, 3.4619140625, 3.727783203125, 3.99365234375, 4.259521484375, 4.525390625, 4.791259765625, 5.05712890625, 5.322998046875, 5.5888671875, 5.854736328125, 6.12060546875, 6.386474609375, 6.65234375, 6.918212890625, 7.18408203125, 7.449951171875, 7.7158203125, 7.981689453125, 8.24755859375, 8.513427734375, 8.779296875, 9.045166015625, 9.31103515625, 9.576904296875, 9.8427734375, 10.108642578125, 10.37451171875, 10.640380859375, 10.90625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 13.0, 22.0, 54.0, 81.0, 138.0, 207.0, 161.0, 132.0, 74.0, 35.0, 23.0, 21.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.4171142578125, -45.73039245605469, -44.04367446899414, -42.356956481933594, -40.67023468017578, -38.98351287841797, -37.29679489135742, -35.610076904296875, -33.92335510253906, -32.23663330078125, -30.549915313720703, -28.863195419311523, -27.176475524902344, -25.489755630493164, -23.803035736083984, -22.116315841674805, -20.429595947265625, -18.742876052856445, -17.056156158447266, -15.369436264038086, -13.682716369628906, -11.995996475219727, -10.309276580810547, -8.622556686401367, -6.9358367919921875, -5.249116897583008, -3.562397003173828, -1.8756771087646484, -0.18895721435546875, 1.497762680053711, 3.1844825744628906, 4.87120246887207, 6.557918548583984, 8.244638442993164, 9.931358337402344, 11.618078231811523, 13.304798126220703, 14.991518020629883, 16.678237915039062, 18.364957809448242, 20.051677703857422, 21.7383975982666, 23.42511749267578, 25.11183738708496, 26.79855728149414, 28.48527717590332, 30.1719970703125, 31.85871696472168, 33.54543685913086, 35.232154846191406, 36.91887664794922, 38.60559844970703, 40.29231643676758, 41.979034423828125, 43.66575622558594, 45.35247802734375, 47.0391960144043, 48.725914001464844, 50.412635803222656, 52.09935760498047, 53.786075592041016, 55.47279357910156, 57.159515380859375, 58.84623718261719, 60.532955169677734]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 10.0, 11.0, 14.0, 13.0, 21.0, 32.0, 32.0, 47.0, 53.0, 56.0, 56.0, 71.0, 69.0, 57.0, 52.0, 65.0, 50.0, 63.0, 48.0, 31.0, 34.0, 26.0, 20.0, 17.0, 15.0, 11.0, 8.0, 9.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.90068435668945, -40.81103515625, -39.72138214111328, -38.63173294067383, -37.54207992553711, -36.452430725097656, -35.36277770996094, -34.273128509521484, -33.18347930908203, -32.09383010864258, -31.00417709350586, -29.914527893066406, -28.82487678527832, -27.735225677490234, -26.64557456970215, -25.555923461914062, -24.466272354125977, -23.37662124633789, -22.286970138549805, -21.19731903076172, -20.107669830322266, -19.01801872253418, -17.928367614746094, -16.838716506958008, -15.749066352844238, -14.659415245056152, -13.569765090942383, -12.480113983154297, -11.390462875366211, -10.300812721252441, -9.211161613464355, -8.121511459350586, -7.0318603515625, -5.942209720611572, -4.8525590896606445, -3.7629079818725586, -2.673257350921631, -1.5836067199707031, -0.4939556121826172, 0.5956950187683105, 1.6853456497192383, 2.774996280670166, 3.864647150039673, 4.95429801940918, 6.043948650360107, 7.133599281311035, 8.223250389099121, 9.31290054321289, 10.402551651000977, 11.492202758789062, 12.581852912902832, 13.671504020690918, 14.761154174804688, 15.850805282592773, 16.94045639038086, 18.030107498168945, 19.11975860595703, 20.209409713745117, 21.299060821533203, 22.388710021972656, 23.478361129760742, 24.568012237548828, 25.657663345336914, 26.747314453125, 27.836963653564453]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 1.0, 6.0, 8.0, 10.0, 16.0, 18.0, 23.0, 27.0, 37.0, 64.0, 95.0, 129.0, 176.0, 286.0, 422.0, 764.0, 1527.0, 3770.0, 11339.0, 43551.0, 199256.0, 512889.0, 209065.0, 45507.0, 11901.0, 3979.0, 1609.0, 721.0, 455.0, 295.0, 190.0, 112.0, 68.0, 77.0, 44.0, 28.0, 27.0, 11.0, 15.0, 8.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.9375, -23.153076171875, -22.36865234375, -21.584228515625, -20.7998046875, -20.015380859375, -19.23095703125, -18.446533203125, -17.662109375, -16.877685546875, -16.09326171875, -15.308837890625, -14.5244140625, -13.739990234375, -12.95556640625, -12.171142578125, -11.38671875, -10.602294921875, -9.81787109375, -9.033447265625, -8.2490234375, -7.464599609375, -6.68017578125, -5.895751953125, -5.111328125, -4.326904296875, -3.54248046875, -2.758056640625, -1.9736328125, -1.189208984375, -0.40478515625, 0.379638671875, 1.1640625, 1.948486328125, 2.73291015625, 3.517333984375, 4.3017578125, 5.086181640625, 5.87060546875, 6.655029296875, 7.439453125, 8.223876953125, 9.00830078125, 9.792724609375, 10.5771484375, 11.361572265625, 12.14599609375, 12.930419921875, 13.71484375, 14.499267578125, 15.28369140625, 16.068115234375, 16.8525390625, 17.636962890625, 18.42138671875, 19.205810546875, 19.990234375, 20.774658203125, 21.55908203125, 22.343505859375, 23.1279296875, 23.912353515625, 24.69677734375, 25.481201171875, 26.265625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 7.0, 13.0, 18.0, 21.0, 55.0, 56.0, 86.0, 112.0, 84.0, 120.0, 117.0, 99.0, 82.0, 57.0, 29.0, 14.0, 18.0, 4.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69921875, -5.49774169921875, -5.2962646484375, -5.09478759765625, -4.893310546875, -4.69183349609375, -4.4903564453125, -4.28887939453125, -4.08740234375, -3.88592529296875, -3.6844482421875, -3.48297119140625, -3.281494140625, -3.08001708984375, -2.8785400390625, -2.67706298828125, -2.4755859375, -2.27410888671875, -2.0726318359375, -1.87115478515625, -1.669677734375, -1.46820068359375, -1.2667236328125, -1.06524658203125, -0.86376953125, -0.66229248046875, -0.4608154296875, -0.25933837890625, -0.057861328125, 0.14361572265625, 0.3450927734375, 0.54656982421875, 0.748046875, 0.94952392578125, 1.1510009765625, 1.35247802734375, 1.553955078125, 1.75543212890625, 1.9569091796875, 2.15838623046875, 2.35986328125, 2.56134033203125, 2.7628173828125, 2.96429443359375, 3.165771484375, 3.36724853515625, 3.5687255859375, 3.77020263671875, 3.9716796875, 4.17315673828125, 4.3746337890625, 4.57611083984375, 4.777587890625, 4.97906494140625, 5.1805419921875, 5.38201904296875, 5.58349609375, 5.78497314453125, 5.9864501953125, 6.18792724609375, 6.389404296875, 6.59088134765625, 6.7923583984375, 6.99383544921875, 7.1953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 7.0, 4.0, 7.0, 14.0, 25.0, 44.0, 76.0, 128.0, 223.0, 386.0, 967.0, 2780.0, 14881.0, 203210.0, 755891.0, 60224.0, 6833.0, 1583.0, 616.0, 279.0, 173.0, 91.0, 53.0, 26.0, 19.0, 9.0, 8.0, 1.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.21875, -61.60986328125, -60.0009765625, -58.39208984375, -56.783203125, -55.17431640625, -53.5654296875, -51.95654296875, -50.34765625, -48.73876953125, -47.1298828125, -45.52099609375, -43.912109375, -42.30322265625, -40.6943359375, -39.08544921875, -37.4765625, -35.86767578125, -34.2587890625, -32.64990234375, -31.041015625, -29.43212890625, -27.8232421875, -26.21435546875, -24.60546875, -22.99658203125, -21.3876953125, -19.77880859375, -18.169921875, -16.56103515625, -14.9521484375, -13.34326171875, -11.734375, -10.12548828125, -8.5166015625, -6.90771484375, -5.298828125, -3.68994140625, -2.0810546875, -0.47216796875, 1.13671875, 2.74560546875, 4.3544921875, 5.96337890625, 7.572265625, 9.18115234375, 10.7900390625, 12.39892578125, 14.0078125, 15.61669921875, 17.2255859375, 18.83447265625, 20.443359375, 22.05224609375, 23.6611328125, 25.27001953125, 26.87890625, 28.48779296875, 30.0966796875, 31.70556640625, 33.314453125, 34.92333984375, 36.5322265625, 38.14111328125, 39.75]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 8.0, 5.0, 9.0, 16.0, 11.0, 17.0, 19.0, 17.0, 31.0, 30.0, 44.0, 53.0, 60.0, 60.0, 78.0, 58.0, 64.0, 74.0, 56.0, 43.0, 49.0, 45.0, 42.0, 27.0, 23.0, 17.0, 13.0, 12.0, 12.0, 9.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.28125, -22.5087890625, -21.736328125, -20.9638671875, -20.19140625, -19.4189453125, -18.646484375, -17.8740234375, -17.1015625, -16.3291015625, -15.556640625, -14.7841796875, -14.01171875, -13.2392578125, -12.466796875, -11.6943359375, -10.921875, -10.1494140625, -9.376953125, -8.6044921875, -7.83203125, -7.0595703125, -6.287109375, -5.5146484375, -4.7421875, -3.9697265625, -3.197265625, -2.4248046875, -1.65234375, -0.8798828125, -0.107421875, 0.6650390625, 1.4375, 2.2099609375, 2.982421875, 3.7548828125, 4.52734375, 5.2998046875, 6.072265625, 6.8447265625, 7.6171875, 8.3896484375, 9.162109375, 9.9345703125, 10.70703125, 11.4794921875, 12.251953125, 13.0244140625, 13.796875, 14.5693359375, 15.341796875, 16.1142578125, 16.88671875, 17.6591796875, 18.431640625, 19.2041015625, 19.9765625, 20.7490234375, 21.521484375, 22.2939453125, 23.06640625, 23.8388671875, 24.611328125, 25.3837890625, 26.15625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 5.0, 4.0, 9.0, 5.0, 10.0, 15.0, 21.0, 30.0, 55.0, 82.0, 103.0, 227.0, 426.0, 882.0, 2554.0, 9904.0, 63066.0, 620494.0, 311818.0, 29709.0, 5889.0, 1776.0, 669.0, 336.0, 158.0, 108.0, 64.0, 40.0, 35.0, 16.0, 8.0, 8.0, 10.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.5, -21.834716796875, -21.16943359375, -20.504150390625, -19.8388671875, -19.173583984375, -18.50830078125, -17.843017578125, -17.177734375, -16.512451171875, -15.84716796875, -15.181884765625, -14.5166015625, -13.851318359375, -13.18603515625, -12.520751953125, -11.85546875, -11.190185546875, -10.52490234375, -9.859619140625, -9.1943359375, -8.529052734375, -7.86376953125, -7.198486328125, -6.533203125, -5.867919921875, -5.20263671875, -4.537353515625, -3.8720703125, -3.206787109375, -2.54150390625, -1.876220703125, -1.2109375, -0.545654296875, 0.11962890625, 0.784912109375, 1.4501953125, 2.115478515625, 2.78076171875, 3.446044921875, 4.111328125, 4.776611328125, 5.44189453125, 6.107177734375, 6.7724609375, 7.437744140625, 8.10302734375, 8.768310546875, 9.43359375, 10.098876953125, 10.76416015625, 11.429443359375, 12.0947265625, 12.760009765625, 13.42529296875, 14.090576171875, 14.755859375, 15.421142578125, 16.08642578125, 16.751708984375, 17.4169921875, 18.082275390625, 18.74755859375, 19.412841796875, 20.078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 3.0, 10.0, 13.0, 11.0, 14.0, 24.0, 42.0, 48.0, 62.0, 79.0, 82.0, 139.0, 115.0, 83.0, 62.0, 46.0, 46.0, 32.0, 16.0, 8.0, 10.0, 14.0, 5.0, 4.0, 3.0, 2.0, 1.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001529693603515625, -0.0014866441488265991, -0.0014435946941375732, -0.0014005452394485474, -0.0013574957847595215, -0.0013144463300704956, -0.0012713968753814697, -0.0012283474206924438, -0.001185297966003418, -0.001142248511314392, -0.0010991990566253662, -0.0010561496019363403, -0.0010131001472473145, -0.0009700506925582886, -0.0009270012378692627, -0.0008839517831802368, -0.0008409023284912109, -0.0007978528738021851, -0.0007548034191131592, -0.0007117539644241333, -0.0006687045097351074, -0.0006256550550460815, -0.0005826056003570557, -0.0005395561456680298, -0.0004965066909790039, -0.00045345723628997803, -0.00041040778160095215, -0.00036735832691192627, -0.0003243088722229004, -0.0002812594175338745, -0.00023820996284484863, -0.00019516050815582275, -0.00015211105346679688, -0.000109061598777771, -6.601214408874512e-05, -2.2962689399719238e-05, 2.008676528930664e-05, 6.313621997833252e-05, 0.0001061856746673584, 0.00014923512935638428, 0.00019228458404541016, 0.00023533403873443604, 0.0002783834934234619, 0.0003214329481124878, 0.00036448240280151367, 0.00040753185749053955, 0.00045058131217956543, 0.0004936307668685913, 0.0005366802215576172, 0.0005797296762466431, 0.0006227791309356689, 0.0006658285856246948, 0.0007088780403137207, 0.0007519274950027466, 0.0007949769496917725, 0.0008380264043807983, 0.0008810758590698242, 0.0009241253137588501, 0.000967174768447876, 0.0010102242231369019, 0.0010532736778259277, 0.0010963231325149536, 0.0011393725872039795, 0.0011824220418930054, 0.0012254714965820312]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 11.0, 3.0, 10.0, 10.0, 10.0, 13.0, 21.0, 34.0, 48.0, 79.0, 126.0, 214.0, 417.0, 943.0, 2889.0, 12798.0, 127806.0, 809348.0, 79756.0, 9776.0, 2478.0, 831.0, 363.0, 201.0, 119.0, 66.0, 40.0, 36.0, 23.0, 21.0, 8.0, 11.0, 11.0, 9.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.859375, -23.984619140625, -23.10986328125, -22.235107421875, -21.3603515625, -20.485595703125, -19.61083984375, -18.736083984375, -17.861328125, -16.986572265625, -16.11181640625, -15.237060546875, -14.3623046875, -13.487548828125, -12.61279296875, -11.738037109375, -10.86328125, -9.988525390625, -9.11376953125, -8.239013671875, -7.3642578125, -6.489501953125, -5.61474609375, -4.739990234375, -3.865234375, -2.990478515625, -2.11572265625, -1.240966796875, -0.3662109375, 0.508544921875, 1.38330078125, 2.258056640625, 3.1328125, 4.007568359375, 4.88232421875, 5.757080078125, 6.6318359375, 7.506591796875, 8.38134765625, 9.256103515625, 10.130859375, 11.005615234375, 11.88037109375, 12.755126953125, 13.6298828125, 14.504638671875, 15.37939453125, 16.254150390625, 17.12890625, 18.003662109375, 18.87841796875, 19.753173828125, 20.6279296875, 21.502685546875, 22.37744140625, 23.252197265625, 24.126953125, 25.001708984375, 25.87646484375, 26.751220703125, 27.6259765625, 28.500732421875, 29.37548828125, 30.250244140625, 31.125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 6.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 7.0, 10.0, 15.0, 7.0, 25.0, 17.0, 30.0, 34.0, 35.0, 52.0, 80.0, 73.0, 72.0, 93.0, 75.0, 63.0, 71.0, 44.0, 34.0, 36.0, 25.0, 13.0, 12.0, 16.0, 11.0, 10.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.0703125, -8.7457275390625, -8.421142578125, -8.0965576171875, -7.77197265625, -7.4473876953125, -7.122802734375, -6.7982177734375, -6.4736328125, -6.1490478515625, -5.824462890625, -5.4998779296875, -5.17529296875, -4.8507080078125, -4.526123046875, -4.2015380859375, -3.876953125, -3.5523681640625, -3.227783203125, -2.9031982421875, -2.57861328125, -2.2540283203125, -1.929443359375, -1.6048583984375, -1.2802734375, -0.9556884765625, -0.631103515625, -0.3065185546875, 0.01806640625, 0.3426513671875, 0.667236328125, 0.9918212890625, 1.31640625, 1.6409912109375, 1.965576171875, 2.2901611328125, 2.61474609375, 2.9393310546875, 3.263916015625, 3.5885009765625, 3.9130859375, 4.2376708984375, 4.562255859375, 4.8868408203125, 5.21142578125, 5.5360107421875, 5.860595703125, 6.1851806640625, 6.509765625, 6.8343505859375, 7.158935546875, 7.4835205078125, 7.80810546875, 8.1326904296875, 8.457275390625, 8.7818603515625, 9.1064453125, 9.4310302734375, 9.755615234375, 10.0802001953125, 10.40478515625, 10.7293701171875, 11.053955078125, 11.3785400390625, 11.703125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 15.0, 27.0, 44.0, 103.0, 228.0, 234.0, 169.0, 76.0, 38.0, 24.0, 12.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-277.29296875, -270.2442321777344, -263.19549560546875, -256.146728515625, -249.09799194335938, -242.04925537109375, -235.00050354003906, -227.95176696777344, -220.90301513671875, -213.85427856445312, -206.80552673339844, -199.7567901611328, -192.70803833007812, -185.6593017578125, -178.6105499267578, -171.5618133544922, -164.5130615234375, -157.46432495117188, -150.4155731201172, -143.36683654785156, -136.31808471679688, -129.26934814453125, -122.22059631347656, -115.17185974121094, -108.12312316894531, -101.07437896728516, -94.025634765625, -86.97689056396484, -79.92814636230469, -72.87940979003906, -65.83065795898438, -58.781917572021484, -51.73316955566406, -44.684425354003906, -37.63568115234375, -30.586938858032227, -23.53819465637207, -16.489452362060547, -9.44070816040039, -2.3919639587402344, 4.656780242919922, 11.705524444580078, 18.754268646240234, 25.803010940551758, 32.85175323486328, 39.90049743652344, 46.949241638183594, 53.99798583984375, 61.046730041503906, 68.09547424316406, 75.14421844482422, 82.19296264648438, 89.24170684814453, 96.29045104980469, 103.33918762207031, 110.387939453125, 117.43667602539062, 124.48542022705078, 131.53416442871094, 138.58290100097656, 145.63165283203125, 152.68038940429688, 159.72914123535156, 166.7778778076172, 173.82662963867188]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 12.0, 20.0, 15.0, 10.0, 29.0, 26.0, 31.0, 26.0, 55.0, 30.0, 48.0, 56.0, 46.0, 47.0, 53.0, 55.0, 42.0, 42.0, 68.0, 41.0, 38.0, 41.0, 30.0, 19.0, 27.0, 13.0, 20.0, 13.0, 11.0, 6.0, 8.0, 8.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.71200561523438, -111.81444549560547, -107.91688537597656, -104.01932525634766, -100.12176513671875, -96.22421264648438, -92.32665252685547, -88.42909240722656, -84.53153228759766, -80.63397216796875, -76.73641204833984, -72.83885192871094, -68.94129943847656, -65.04373168945312, -61.14617919921875, -57.248619079589844, -53.35105895996094, -49.45349884033203, -45.555938720703125, -41.658382415771484, -37.76082229614258, -33.86326217651367, -29.9657039642334, -26.068145751953125, -22.17058563232422, -18.273025512695312, -14.375467300415039, -10.47790813446045, -6.580348968505859, -2.682788848876953, 1.2147693634033203, 5.112327575683594, 9.0098876953125, 12.90744686126709, 16.80500602722168, 20.702564239501953, 24.60012435913086, 28.497684478759766, 32.395240783691406, 36.29280090332031, 40.19036102294922, 44.087921142578125, 47.98548126220703, 51.88303756713867, 55.78059768676758, 59.678157806396484, 63.575714111328125, 67.47327423095703, 71.37083435058594, 75.26839447021484, 79.16595458984375, 83.06351470947266, 86.96107482910156, 90.85862731933594, 94.75618743896484, 98.65374755859375, 102.55130767822266, 106.44886779785156, 110.34642791748047, 114.24398803710938, 118.14154052734375, 122.03910827636719, 125.93666076660156, 129.834228515625, 133.73178100585938]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 5.0, 10.0, 10.0, 18.0, 26.0, 52.0, 62.0, 120.0, 229.0, 782.0, 5573.0, 160520.0, 4006259.0, 17639.0, 1960.0, 490.0, 210.0, 101.0, 74.0, 51.0, 29.0, 25.0, 12.0, 11.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.5625, -35.6083984375, -33.654296875, -31.7001953125, -29.74609375, -27.7919921875, -25.837890625, -23.8837890625, -21.9296875, -19.9755859375, -18.021484375, -16.0673828125, -14.11328125, -12.1591796875, -10.205078125, -8.2509765625, -6.296875, -4.3427734375, -2.388671875, -0.4345703125, 1.51953125, 3.4736328125, 5.427734375, 7.3818359375, 9.3359375, 11.2900390625, 13.244140625, 15.1982421875, 17.15234375, 19.1064453125, 21.060546875, 23.0146484375, 24.96875, 26.9228515625, 28.876953125, 30.8310546875, 32.78515625, 34.7392578125, 36.693359375, 38.6474609375, 40.6015625, 42.5556640625, 44.509765625, 46.4638671875, 48.41796875, 50.3720703125, 52.326171875, 54.2802734375, 56.234375, 58.1884765625, 60.142578125, 62.0966796875, 64.05078125, 66.0048828125, 67.958984375, 69.9130859375, 71.8671875, 73.8212890625, 75.775390625, 77.7294921875, 79.68359375, 81.6376953125, 83.591796875, 85.5458984375, 87.5]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 10.0, 25.0, 28.0, 36.0, 42.0, 65.0, 88.0, 94.0, 118.0, 113.0, 106.0, 66.0, 56.0, 57.0, 37.0, 23.0, 10.0, 7.0, 6.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1015625, -5.88287353515625, -5.6641845703125, -5.44549560546875, -5.226806640625, -5.00811767578125, -4.7894287109375, -4.57073974609375, -4.35205078125, -4.13336181640625, -3.9146728515625, -3.69598388671875, -3.477294921875, -3.25860595703125, -3.0399169921875, -2.82122802734375, -2.6025390625, -2.38385009765625, -2.1651611328125, -1.94647216796875, -1.727783203125, -1.50909423828125, -1.2904052734375, -1.07171630859375, -0.85302734375, -0.63433837890625, -0.4156494140625, -0.19696044921875, 0.021728515625, 0.24041748046875, 0.4591064453125, 0.67779541015625, 0.896484375, 1.11517333984375, 1.3338623046875, 1.55255126953125, 1.771240234375, 1.98992919921875, 2.2086181640625, 2.42730712890625, 2.64599609375, 2.86468505859375, 3.0833740234375, 3.30206298828125, 3.520751953125, 3.73944091796875, 3.9581298828125, 4.17681884765625, 4.3955078125, 4.61419677734375, 4.8328857421875, 5.05157470703125, 5.270263671875, 5.48895263671875, 5.7076416015625, 5.92633056640625, 6.14501953125, 6.36370849609375, 6.5823974609375, 6.80108642578125, 7.019775390625, 7.23846435546875, 7.4571533203125, 7.67584228515625, 7.89453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 4.0, 7.0, 7.0, 19.0, 14.0, 21.0, 31.0, 54.0, 79.0, 106.0, 172.0, 255.0, 424.0, 725.0, 1303.0, 2668.0, 6337.0, 17518.0, 63931.0, 465822.0, 3379299.0, 195296.0, 39080.0, 11906.0, 4528.0, 2005.0, 1080.0, 595.0, 338.0, 182.0, 149.0, 96.0, 68.0, 50.0, 33.0, 32.0, 10.0, 12.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-20.484375, -19.887451171875, -19.29052734375, -18.693603515625, -18.0966796875, -17.499755859375, -16.90283203125, -16.305908203125, -15.708984375, -15.112060546875, -14.51513671875, -13.918212890625, -13.3212890625, -12.724365234375, -12.12744140625, -11.530517578125, -10.93359375, -10.336669921875, -9.73974609375, -9.142822265625, -8.5458984375, -7.948974609375, -7.35205078125, -6.755126953125, -6.158203125, -5.561279296875, -4.96435546875, -4.367431640625, -3.7705078125, -3.173583984375, -2.57666015625, -1.979736328125, -1.3828125, -0.785888671875, -0.18896484375, 0.407958984375, 1.0048828125, 1.601806640625, 2.19873046875, 2.795654296875, 3.392578125, 3.989501953125, 4.58642578125, 5.183349609375, 5.7802734375, 6.377197265625, 6.97412109375, 7.571044921875, 8.16796875, 8.764892578125, 9.36181640625, 9.958740234375, 10.5556640625, 11.152587890625, 11.74951171875, 12.346435546875, 12.943359375, 13.540283203125, 14.13720703125, 14.734130859375, 15.3310546875, 15.927978515625, 16.52490234375, 17.121826171875, 17.71875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 9.0, 9.0, 12.0, 21.0, 22.0, 36.0, 77.0, 116.0, 214.0, 729.0, 1956.0, 404.0, 165.0, 107.0, 66.0, 34.0, 31.0, 18.0, 11.0, 8.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3046875, -7.07867431640625, -6.8526611328125, -6.62664794921875, -6.400634765625, -6.17462158203125, -5.9486083984375, -5.72259521484375, -5.49658203125, -5.27056884765625, -5.0445556640625, -4.81854248046875, -4.592529296875, -4.36651611328125, -4.1405029296875, -3.91448974609375, -3.6884765625, -3.46246337890625, -3.2364501953125, -3.01043701171875, -2.784423828125, -2.55841064453125, -2.3323974609375, -2.10638427734375, -1.88037109375, -1.65435791015625, -1.4283447265625, -1.20233154296875, -0.976318359375, -0.75030517578125, -0.5242919921875, -0.29827880859375, -0.072265625, 0.15374755859375, 0.3797607421875, 0.60577392578125, 0.831787109375, 1.05780029296875, 1.2838134765625, 1.50982666015625, 1.73583984375, 1.96185302734375, 2.1878662109375, 2.41387939453125, 2.639892578125, 2.86590576171875, 3.0919189453125, 3.31793212890625, 3.5439453125, 3.76995849609375, 3.9959716796875, 4.22198486328125, 4.447998046875, 4.67401123046875, 4.9000244140625, 5.12603759765625, 5.35205078125, 5.57806396484375, 5.8040771484375, 6.03009033203125, 6.256103515625, 6.48211669921875, 6.7081298828125, 6.93414306640625, 7.16015625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 11.0, 16.0, 20.0, 43.0, 63.0, 118.0, 156.0, 164.0, 143.0, 106.0, 69.0, 31.0, 34.0, 6.0, 7.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.224361419677734, -27.91451644897461, -26.60466957092285, -25.294824600219727, -23.98497772216797, -22.675132751464844, -21.36528778076172, -20.05544090270996, -18.745594024658203, -17.435749053955078, -16.12590217590332, -14.816057205200195, -13.506210327148438, -12.196365356445312, -10.886519432067871, -9.57667350769043, -8.266828536987305, -6.956982612609863, -5.647136688232422, -4.337291240692139, -3.0274453163146973, -1.7175993919372559, -0.40775394439697266, 0.9020919799804688, 2.21193790435791, 3.5217838287353516, 4.831629753112793, 6.141475200653076, 7.451321125030518, 8.761167526245117, 10.071012496948242, 11.380858421325684, 12.690704345703125, 14.000550270080566, 15.310396194458008, 16.620241165161133, 17.93008804321289, 19.239933013916016, 20.54977798461914, 21.8596248626709, 23.169471740722656, 24.47931671142578, 25.78916358947754, 27.099008560180664, 28.408855438232422, 29.718700408935547, 31.028545379638672, 32.33839416503906, 33.64823913574219, 34.95808410644531, 36.26792907714844, 37.57777786254883, 38.88762283325195, 40.19746780395508, 41.5073127746582, 42.817161560058594, 44.12700271606445, 45.43684768676758, 46.7466926574707, 48.056541442871094, 49.36638641357422, 50.676231384277344, 51.98607635498047, 53.295921325683594, 54.605770111083984]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 8.0, 6.0, 6.0, 15.0, 15.0, 18.0, 35.0, 48.0, 55.0, 61.0, 60.0, 66.0, 68.0, 70.0, 81.0, 59.0, 54.0, 60.0, 51.0, 36.0, 28.0, 32.0, 20.0, 16.0, 15.0, 7.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.04438781738281, -33.10906982421875, -32.17375183105469, -31.238433837890625, -30.303115844726562, -29.3677978515625, -28.432479858398438, -27.497161865234375, -26.561843872070312, -25.62652587890625, -24.691207885742188, -23.755889892578125, -22.820571899414062, -21.88525390625, -20.949935913085938, -20.014617919921875, -19.07929801940918, -18.143980026245117, -17.208662033081055, -16.273344039916992, -15.33802604675293, -14.402708053588867, -13.467389106750488, -12.532071113586426, -11.596753120422363, -10.6614351272583, -9.726117134094238, -8.79079818725586, -7.855480670928955, -6.920162677764893, -5.984844207763672, -5.049526214599609, -4.114208221435547, -3.1788902282714844, -2.2435719966888428, -1.3082537651062012, -0.37293577194213867, 0.5623822212219238, 1.4977006912231445, 2.433018684387207, 3.3683366775512695, 4.303654670715332, 5.2389726638793945, 6.174291133880615, 7.109609127044678, 8.044927597045898, 8.980245590209961, 9.915563583374023, 10.850881576538086, 11.786199569702148, 12.721517562866211, 13.656835556030273, 14.592153549194336, 15.527471542358398, 16.462791442871094, 17.398109436035156, 18.33342742919922, 19.26874542236328, 20.204063415527344, 21.139381408691406, 22.07469940185547, 23.01001739501953, 23.945335388183594, 24.880653381347656, 25.81597137451172]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 10.0, 14.0, 23.0, 45.0, 52.0, 103.0, 128.0, 237.0, 462.0, 991.0, 2671.0, 8942.0, 41487.0, 283203.0, 575759.0, 107698.0, 18858.0, 4796.0, 1553.0, 647.0, 336.0, 203.0, 116.0, 77.0, 45.0, 28.0, 24.0, 5.0, 11.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.46142578125, -31.4853515625, -30.50927734375, -29.533203125, -28.55712890625, -27.5810546875, -26.60498046875, -25.62890625, -24.65283203125, -23.6767578125, -22.70068359375, -21.724609375, -20.74853515625, -19.7724609375, -18.79638671875, -17.8203125, -16.84423828125, -15.8681640625, -14.89208984375, -13.916015625, -12.93994140625, -11.9638671875, -10.98779296875, -10.01171875, -9.03564453125, -8.0595703125, -7.08349609375, -6.107421875, -5.13134765625, -4.1552734375, -3.17919921875, -2.203125, -1.22705078125, -0.2509765625, 0.72509765625, 1.701171875, 2.67724609375, 3.6533203125, 4.62939453125, 5.60546875, 6.58154296875, 7.5576171875, 8.53369140625, 9.509765625, 10.48583984375, 11.4619140625, 12.43798828125, 13.4140625, 14.39013671875, 15.3662109375, 16.34228515625, 17.318359375, 18.29443359375, 19.2705078125, 20.24658203125, 21.22265625, 22.19873046875, 23.1748046875, 24.15087890625, 25.126953125, 26.10302734375, 27.0791015625, 28.05517578125, 29.03125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 11.0, 18.0, 27.0, 45.0, 52.0, 64.0, 68.0, 113.0, 117.0, 102.0, 88.0, 87.0, 61.0, 46.0, 39.0, 27.0, 12.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.18359375, -5.96209716796875, -5.7406005859375, -5.51910400390625, -5.297607421875, -5.07611083984375, -4.8546142578125, -4.63311767578125, -4.41162109375, -4.19012451171875, -3.9686279296875, -3.74713134765625, -3.525634765625, -3.30413818359375, -3.0826416015625, -2.86114501953125, -2.6396484375, -2.41815185546875, -2.1966552734375, -1.97515869140625, -1.753662109375, -1.53216552734375, -1.3106689453125, -1.08917236328125, -0.86767578125, -0.64617919921875, -0.4246826171875, -0.20318603515625, 0.018310546875, 0.23980712890625, 0.4613037109375, 0.68280029296875, 0.904296875, 1.12579345703125, 1.3472900390625, 1.56878662109375, 1.790283203125, 2.01177978515625, 2.2332763671875, 2.45477294921875, 2.67626953125, 2.89776611328125, 3.1192626953125, 3.34075927734375, 3.562255859375, 3.78375244140625, 4.0052490234375, 4.22674560546875, 4.4482421875, 4.66973876953125, 4.8912353515625, 5.11273193359375, 5.334228515625, 5.55572509765625, 5.7772216796875, 5.99871826171875, 6.22021484375, 6.44171142578125, 6.6632080078125, 6.88470458984375, 7.106201171875, 7.32769775390625, 7.5491943359375, 7.77069091796875, 7.9921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 8.0, 5.0, 7.0, 13.0, 21.0, 25.0, 40.0, 34.0, 45.0, 78.0, 134.0, 189.0, 308.0, 497.0, 998.0, 2128.0, 5816.0, 23468.0, 168368.0, 680734.0, 135720.0, 20195.0, 5418.0, 2047.0, 866.0, 476.0, 301.0, 169.0, 116.0, 92.0, 57.0, 39.0, 38.0, 23.0, 22.0, 17.0, 7.0, 13.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.1875, -29.087890625, -27.98828125, -26.888671875, -25.7890625, -24.689453125, -23.58984375, -22.490234375, -21.390625, -20.291015625, -19.19140625, -18.091796875, -16.9921875, -15.892578125, -14.79296875, -13.693359375, -12.59375, -11.494140625, -10.39453125, -9.294921875, -8.1953125, -7.095703125, -5.99609375, -4.896484375, -3.796875, -2.697265625, -1.59765625, -0.498046875, 0.6015625, 1.701171875, 2.80078125, 3.900390625, 5.0, 6.099609375, 7.19921875, 8.298828125, 9.3984375, 10.498046875, 11.59765625, 12.697265625, 13.796875, 14.896484375, 15.99609375, 17.095703125, 18.1953125, 19.294921875, 20.39453125, 21.494140625, 22.59375, 23.693359375, 24.79296875, 25.892578125, 26.9921875, 28.091796875, 29.19140625, 30.291015625, 31.390625, 32.490234375, 33.58984375, 34.689453125, 35.7890625, 36.888671875, 37.98828125, 39.087890625, 40.1875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 13.0, 13.0, 13.0, 13.0, 15.0, 20.0, 29.0, 31.0, 39.0, 60.0, 53.0, 65.0, 83.0, 65.0, 62.0, 58.0, 59.0, 42.0, 49.0, 40.0, 39.0, 30.0, 24.0, 18.0, 15.0, 7.0, 4.0, 3.0, 6.0, 3.0, 4.0, 1.0, 4.0, 2.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.796875, -21.96533203125, -21.1337890625, -20.30224609375, -19.470703125, -18.63916015625, -17.8076171875, -16.97607421875, -16.14453125, -15.31298828125, -14.4814453125, -13.64990234375, -12.818359375, -11.98681640625, -11.1552734375, -10.32373046875, -9.4921875, -8.66064453125, -7.8291015625, -6.99755859375, -6.166015625, -5.33447265625, -4.5029296875, -3.67138671875, -2.83984375, -2.00830078125, -1.1767578125, -0.34521484375, 0.486328125, 1.31787109375, 2.1494140625, 2.98095703125, 3.8125, 4.64404296875, 5.4755859375, 6.30712890625, 7.138671875, 7.97021484375, 8.8017578125, 9.63330078125, 10.46484375, 11.29638671875, 12.1279296875, 12.95947265625, 13.791015625, 14.62255859375, 15.4541015625, 16.28564453125, 17.1171875, 17.94873046875, 18.7802734375, 19.61181640625, 20.443359375, 21.27490234375, 22.1064453125, 22.93798828125, 23.76953125, 24.60107421875, 25.4326171875, 26.26416015625, 27.095703125, 27.92724609375, 28.7587890625, 29.59033203125, 30.421875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 17.0, 9.0, 21.0, 25.0, 42.0, 64.0, 97.0, 166.0, 315.0, 812.0, 2278.0, 9726.0, 126767.0, 878165.0, 23392.0, 4309.0, 1226.0, 552.0, 237.0, 118.0, 61.0, 48.0, 22.0, 23.0, 19.0, 15.0, 7.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.78125, -37.49853515625, -36.2158203125, -34.93310546875, -33.650390625, -32.36767578125, -31.0849609375, -29.80224609375, -28.51953125, -27.23681640625, -25.9541015625, -24.67138671875, -23.388671875, -22.10595703125, -20.8232421875, -19.54052734375, -18.2578125, -16.97509765625, -15.6923828125, -14.40966796875, -13.126953125, -11.84423828125, -10.5615234375, -9.27880859375, -7.99609375, -6.71337890625, -5.4306640625, -4.14794921875, -2.865234375, -1.58251953125, -0.2998046875, 0.98291015625, 2.265625, 3.54833984375, 4.8310546875, 6.11376953125, 7.396484375, 8.67919921875, 9.9619140625, 11.24462890625, 12.52734375, 13.81005859375, 15.0927734375, 16.37548828125, 17.658203125, 18.94091796875, 20.2236328125, 21.50634765625, 22.7890625, 24.07177734375, 25.3544921875, 26.63720703125, 27.919921875, 29.20263671875, 30.4853515625, 31.76806640625, 33.05078125, 34.33349609375, 35.6162109375, 36.89892578125, 38.181640625, 39.46435546875, 40.7470703125, 42.02978515625, 43.3125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 8.0, 12.0, 18.0, 24.0, 53.0, 109.0, 195.0, 245.0, 161.0, 67.0, 32.0, 27.0, 19.0, 12.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00312042236328125, -0.0030317306518554688, -0.0029430389404296875, -0.0028543472290039062, -0.002765655517578125, -0.0026769638061523438, -0.0025882720947265625, -0.0024995803833007812, -0.002410888671875, -0.0023221969604492188, -0.0022335052490234375, -0.0021448135375976562, -0.002056121826171875, -0.0019674301147460938, -0.0018787384033203125, -0.0017900466918945312, -0.00170135498046875, -0.0016126632690429688, -0.0015239715576171875, -0.0014352798461914062, -0.001346588134765625, -0.0012578964233398438, -0.0011692047119140625, -0.0010805130004882812, -0.0009918212890625, -0.0009031295776367188, -0.0008144378662109375, -0.0007257461547851562, -0.000637054443359375, -0.0005483627319335938, -0.0004596710205078125, -0.00037097930908203125, -0.00028228759765625, -0.00019359588623046875, -0.0001049041748046875, -1.621246337890625e-05, 7.2479248046875e-05, 0.00016117095947265625, 0.0002498626708984375, 0.00033855438232421875, 0.00042724609375, 0.0005159378051757812, 0.0006046295166015625, 0.0006933212280273438, 0.000782012939453125, 0.0008707046508789062, 0.0009593963623046875, 0.0010480880737304688, 0.00113677978515625, 0.0012254714965820312, 0.0013141632080078125, 0.0014028549194335938, 0.001491546630859375, 0.0015802383422851562, 0.0016689300537109375, 0.0017576217651367188, 0.0018463134765625, 0.0019350051879882812, 0.0020236968994140625, 0.0021123886108398438, 0.002201080322265625, 0.0022897720336914062, 0.0023784637451171875, 0.0024671554565429688, 0.00255584716796875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 2.0, 3.0, 3.0, 10.0, 8.0, 14.0, 12.0, 14.0, 24.0, 40.0, 60.0, 99.0, 204.0, 514.0, 1778.0, 9148.0, 486397.0, 538022.0, 9298.0, 1864.0, 525.0, 208.0, 119.0, 63.0, 30.0, 27.0, 17.0, 8.0, 14.0, 7.0, 6.0, 3.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.4375, -53.4580078125, -51.478515625, -49.4990234375, -47.51953125, -45.5400390625, -43.560546875, -41.5810546875, -39.6015625, -37.6220703125, -35.642578125, -33.6630859375, -31.68359375, -29.7041015625, -27.724609375, -25.7451171875, -23.765625, -21.7861328125, -19.806640625, -17.8271484375, -15.84765625, -13.8681640625, -11.888671875, -9.9091796875, -7.9296875, -5.9501953125, -3.970703125, -1.9912109375, -0.01171875, 1.9677734375, 3.947265625, 5.9267578125, 7.90625, 9.8857421875, 11.865234375, 13.8447265625, 15.82421875, 17.8037109375, 19.783203125, 21.7626953125, 23.7421875, 25.7216796875, 27.701171875, 29.6806640625, 31.66015625, 33.6396484375, 35.619140625, 37.5986328125, 39.578125, 41.5576171875, 43.537109375, 45.5166015625, 47.49609375, 49.4755859375, 51.455078125, 53.4345703125, 55.4140625, 57.3935546875, 59.373046875, 61.3525390625, 63.33203125, 65.3115234375, 67.291015625, 69.2705078125, 71.25]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 6.0, 22.0, 21.0, 54.0, 164.0, 327.0, 219.0, 54.0, 20.0, 23.0, 12.0, 13.0, 10.0, 6.0, 6.0, 5.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.28125, -34.317138671875, -33.35302734375, -32.388916015625, -31.4248046875, -30.460693359375, -29.49658203125, -28.532470703125, -27.568359375, -26.604248046875, -25.64013671875, -24.676025390625, -23.7119140625, -22.747802734375, -21.78369140625, -20.819580078125, -19.85546875, -18.891357421875, -17.92724609375, -16.963134765625, -15.9990234375, -15.034912109375, -14.07080078125, -13.106689453125, -12.142578125, -11.178466796875, -10.21435546875, -9.250244140625, -8.2861328125, -7.322021484375, -6.35791015625, -5.393798828125, -4.4296875, -3.465576171875, -2.50146484375, -1.537353515625, -0.5732421875, 0.390869140625, 1.35498046875, 2.319091796875, 3.283203125, 4.247314453125, 5.21142578125, 6.175537109375, 7.1396484375, 8.103759765625, 9.06787109375, 10.031982421875, 10.99609375, 11.960205078125, 12.92431640625, 13.888427734375, 14.8525390625, 15.816650390625, 16.78076171875, 17.744873046875, 18.708984375, 19.673095703125, 20.63720703125, 21.601318359375, 22.5654296875, 23.529541015625, 24.49365234375, 25.457763671875, 26.421875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 17.0, 60.0, 156.0, 301.0, 273.0, 107.0, 38.0, 20.0, 13.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-460.02301025390625, -448.4735107421875, -436.92401123046875, -425.37451171875, -413.82501220703125, -402.2755126953125, -390.72601318359375, -379.176513671875, -367.62701416015625, -356.0775146484375, -344.52801513671875, -332.978515625, -321.42901611328125, -309.8795166015625, -298.33001708984375, -286.780517578125, -275.23101806640625, -263.6815185546875, -252.13201904296875, -240.58251953125, -229.03302001953125, -217.4835205078125, -205.93402099609375, -194.384521484375, -182.83502197265625, -171.2855224609375, -159.73602294921875, -148.1865234375, -136.63702392578125, -125.0875244140625, -113.53802490234375, -101.988525390625, -90.43902587890625, -78.8895263671875, -67.34002685546875, -55.79052734375, -44.24102783203125, -32.6915283203125, -21.14202880859375, -9.592529296875, 1.95697021484375, 13.5064697265625, 25.05596923828125, 36.60546875, 48.15496826171875, 59.7044677734375, 71.25396728515625, 82.803466796875, 94.35296630859375, 105.9024658203125, 117.45196533203125, 129.00146484375, 140.55096435546875, 152.1004638671875, 163.64996337890625, 175.199462890625, 186.74896240234375, 198.2984619140625, 209.84796142578125, 221.3974609375, 232.94696044921875, 244.4964599609375, 256.04595947265625, 267.595458984375, 279.14495849609375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 4.0, 6.0, 8.0, 11.0, 11.0, 19.0, 26.0, 22.0, 29.0, 32.0, 30.0, 39.0, 43.0, 43.0, 39.0, 45.0, 49.0, 58.0, 49.0, 45.0, 44.0, 34.0, 63.0, 35.0, 31.0, 22.0, 32.0, 19.0, 22.0, 16.0, 14.0, 8.0, 3.0, 7.0, 10.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-150.17935180664062, -145.4374237060547, -140.69549560546875, -135.9535675048828, -131.21163940429688, -126.46971130371094, -121.727783203125, -116.98585510253906, -112.24392700195312, -107.50199890136719, -102.76007080078125, -98.01814270019531, -93.27621459960938, -88.53428649902344, -83.7923583984375, -79.05043029785156, -74.30850219726562, -69.56657409667969, -64.82464599609375, -60.08271789550781, -55.340789794921875, -50.59886169433594, -45.85693359375, -41.11500549316406, -36.373077392578125, -31.631149291992188, -26.88922119140625, -22.147293090820312, -17.405364990234375, -12.663436889648438, -7.9215087890625, -3.1795806884765625, 1.562347412109375, 6.3042755126953125, 11.04620361328125, 15.788131713867188, 20.530059814453125, 25.271987915039062, 30.013916015625, 34.75584411621094, 39.497772216796875, 44.23970031738281, 48.98162841796875, 53.72355651855469, 58.465484619140625, 63.20741271972656, 67.9493408203125, 72.69126892089844, 77.43319702148438, 82.17512512207031, 86.91705322265625, 91.65898132324219, 96.40090942382812, 101.14283752441406, 105.884765625, 110.62669372558594, 115.36862182617188, 120.11054992675781, 124.85247802734375, 129.5944061279297, 134.33633422851562, 139.07826232910156, 143.8201904296875, 148.56211853027344, 153.30404663085938]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 8.0, 4.0, 6.0, 5.0, 28.0, 35.0, 46.0, 112.0, 175.0, 336.0, 776.0, 1989.0, 6340.0, 37522.0, 3137232.0, 970703.0, 29636.0, 5724.0, 1881.0, 759.0, 404.0, 233.0, 122.0, 61.0, 43.0, 16.0, 24.0, 18.0, 7.0, 14.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.46875, -35.16357421875, -33.8583984375, -32.55322265625, -31.248046875, -29.94287109375, -28.6376953125, -27.33251953125, -26.02734375, -24.72216796875, -23.4169921875, -22.11181640625, -20.806640625, -19.50146484375, -18.1962890625, -16.89111328125, -15.5859375, -14.28076171875, -12.9755859375, -11.67041015625, -10.365234375, -9.06005859375, -7.7548828125, -6.44970703125, -5.14453125, -3.83935546875, -2.5341796875, -1.22900390625, 0.076171875, 1.38134765625, 2.6865234375, 3.99169921875, 5.296875, 6.60205078125, 7.9072265625, 9.21240234375, 10.517578125, 11.82275390625, 13.1279296875, 14.43310546875, 15.73828125, 17.04345703125, 18.3486328125, 19.65380859375, 20.958984375, 22.26416015625, 23.5693359375, 24.87451171875, 26.1796875, 27.48486328125, 28.7900390625, 30.09521484375, 31.400390625, 32.70556640625, 34.0107421875, 35.31591796875, 36.62109375, 37.92626953125, 39.2314453125, 40.53662109375, 41.841796875, 43.14697265625, 44.4521484375, 45.75732421875, 47.0625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 20.0, 29.0, 48.0, 56.0, 73.0, 96.0, 104.0, 100.0, 104.0, 110.0, 76.0, 53.0, 33.0, 31.0, 16.0, 11.0, 15.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.795166015625, -7.51220703125, -7.229248046875, -6.9462890625, -6.663330078125, -6.38037109375, -6.097412109375, -5.814453125, -5.531494140625, -5.24853515625, -4.965576171875, -4.6826171875, -4.399658203125, -4.11669921875, -3.833740234375, -3.55078125, -3.267822265625, -2.98486328125, -2.701904296875, -2.4189453125, -2.135986328125, -1.85302734375, -1.570068359375, -1.287109375, -1.004150390625, -0.72119140625, -0.438232421875, -0.1552734375, 0.127685546875, 0.41064453125, 0.693603515625, 0.9765625, 1.259521484375, 1.54248046875, 1.825439453125, 2.1083984375, 2.391357421875, 2.67431640625, 2.957275390625, 3.240234375, 3.523193359375, 3.80615234375, 4.089111328125, 4.3720703125, 4.655029296875, 4.93798828125, 5.220947265625, 5.50390625, 5.786865234375, 6.06982421875, 6.352783203125, 6.6357421875, 6.918701171875, 7.20166015625, 7.484619140625, 7.767578125, 8.050537109375, 8.33349609375, 8.616455078125, 8.8994140625, 9.182373046875, 9.46533203125, 9.748291015625, 10.03125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 10.0, 13.0, 21.0, 23.0, 42.0, 65.0, 84.0, 118.0, 176.0, 285.0, 487.0, 824.0, 1504.0, 3056.0, 7385.0, 21967.0, 94584.0, 1193931.0, 2695823.0, 131302.0, 26412.0, 8535.0, 3485.0, 1703.0, 932.0, 500.0, 304.0, 194.0, 134.0, 102.0, 76.0, 42.0, 34.0, 34.0, 22.0, 20.0, 8.0, 10.0, 3.0, 11.0, 5.0, 9.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.765625, -18.12060546875, -17.4755859375, -16.83056640625, -16.185546875, -15.54052734375, -14.8955078125, -14.25048828125, -13.60546875, -12.96044921875, -12.3154296875, -11.67041015625, -11.025390625, -10.38037109375, -9.7353515625, -9.09033203125, -8.4453125, -7.80029296875, -7.1552734375, -6.51025390625, -5.865234375, -5.22021484375, -4.5751953125, -3.93017578125, -3.28515625, -2.64013671875, -1.9951171875, -1.35009765625, -0.705078125, -0.06005859375, 0.5849609375, 1.22998046875, 1.875, 2.52001953125, 3.1650390625, 3.81005859375, 4.455078125, 5.10009765625, 5.7451171875, 6.39013671875, 7.03515625, 7.68017578125, 8.3251953125, 8.97021484375, 9.615234375, 10.26025390625, 10.9052734375, 11.55029296875, 12.1953125, 12.84033203125, 13.4853515625, 14.13037109375, 14.775390625, 15.42041015625, 16.0654296875, 16.71044921875, 17.35546875, 18.00048828125, 18.6455078125, 19.29052734375, 19.935546875, 20.58056640625, 21.2255859375, 21.87060546875, 22.515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 13.0, 15.0, 11.0, 25.0, 47.0, 95.0, 152.0, 345.0, 1523.0, 1186.0, 369.0, 134.0, 50.0, 30.0, 21.0, 14.0, 19.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.265625, -9.81787109375, -9.3701171875, -8.92236328125, -8.474609375, -8.02685546875, -7.5791015625, -7.13134765625, -6.68359375, -6.23583984375, -5.7880859375, -5.34033203125, -4.892578125, -4.44482421875, -3.9970703125, -3.54931640625, -3.1015625, -2.65380859375, -2.2060546875, -1.75830078125, -1.310546875, -0.86279296875, -0.4150390625, 0.03271484375, 0.48046875, 0.92822265625, 1.3759765625, 1.82373046875, 2.271484375, 2.71923828125, 3.1669921875, 3.61474609375, 4.0625, 4.51025390625, 4.9580078125, 5.40576171875, 5.853515625, 6.30126953125, 6.7490234375, 7.19677734375, 7.64453125, 8.09228515625, 8.5400390625, 8.98779296875, 9.435546875, 9.88330078125, 10.3310546875, 10.77880859375, 11.2265625, 11.67431640625, 12.1220703125, 12.56982421875, 13.017578125, 13.46533203125, 13.9130859375, 14.36083984375, 14.80859375, 15.25634765625, 15.7041015625, 16.15185546875, 16.599609375, 17.04736328125, 17.4951171875, 17.94287109375, 18.390625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 9.0, 14.0, 24.0, 87.0, 129.0, 175.0, 177.0, 169.0, 112.0, 59.0, 26.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.53042602539062, -75.12693786621094, -72.72344970703125, -70.31996154785156, -67.91646575927734, -65.51297760009766, -63.10948944091797, -60.70600128173828, -58.302513122558594, -55.899024963378906, -53.49553298950195, -51.092044830322266, -48.68855667114258, -46.285064697265625, -43.88157653808594, -41.47808837890625, -39.0745964050293, -36.67110824584961, -34.267616271972656, -31.86412811279297, -29.46063995361328, -27.05714988708496, -24.65365982055664, -22.250171661376953, -19.846681594848633, -17.443191528320312, -15.039703369140625, -12.636213302612305, -10.2327241897583, -7.829235076904297, -5.425745010375977, -3.022256851196289, -0.6187667846679688, 1.7847225666046143, 4.188211917877197, 6.591701507568359, 8.995190620422363, 11.398679733276367, 13.802169799804688, 16.205657958984375, 18.609148025512695, 21.012638092041016, 23.416126251220703, 25.819616317749023, 28.223106384277344, 30.62659454345703, 33.03008270263672, 35.433570861816406, 37.83706283569336, 40.24055099487305, 42.64404296875, 45.04753112792969, 47.451019287109375, 49.85450744628906, 52.257999420166016, 54.6614875793457, 57.064979553222656, 59.468467712402344, 61.8719596862793, 64.27545166015625, 66.67893981933594, 69.08242797851562, 71.48591613769531, 73.889404296875, 76.29289245605469]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 9.0, 13.0, 29.0, 37.0, 45.0, 59.0, 74.0, 80.0, 91.0, 103.0, 94.0, 78.0, 77.0, 69.0, 43.0, 25.0, 29.0, 22.0, 11.0, 9.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.79353332519531, -72.56404876708984, -70.33456420898438, -68.1050796508789, -65.87559509277344, -63.64611053466797, -61.4166259765625, -59.18714141845703, -56.95765686035156, -54.728172302246094, -52.498687744140625, -50.269203186035156, -48.03971862792969, -45.81023406982422, -43.58074951171875, -41.35126495361328, -39.12178039550781, -36.892295837402344, -34.662811279296875, -32.433326721191406, -30.203842163085938, -27.97435760498047, -25.744873046875, -23.51538848876953, -21.285903930664062, -19.056419372558594, -16.826934814453125, -14.597450256347656, -12.367965698242188, -10.138481140136719, -7.90899658203125, -5.679512023925781, -3.4500274658203125, -1.2205429077148438, 1.008941650390625, 3.2384262084960938, 5.4679107666015625, 7.697395324707031, 9.9268798828125, 12.156364440917969, 14.385848999023438, 16.615333557128906, 18.844818115234375, 21.074302673339844, 23.303787231445312, 25.53327178955078, 27.76275634765625, 29.99224090576172, 32.22172546386719, 34.451210021972656, 36.680694580078125, 38.910179138183594, 41.13966369628906, 43.36914825439453, 45.5986328125, 47.82811737060547, 50.05760192871094, 52.287086486816406, 54.516571044921875, 56.746055603027344, 58.97554016113281, 61.20502471923828, 63.43450927734375, 65.66399383544922, 67.89347839355469]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 9.0, 7.0, 18.0, 9.0, 25.0, 39.0, 74.0, 94.0, 196.0, 425.0, 985.0, 2936.0, 11622.0, 74096.0, 600378.0, 311633.0, 35817.0, 6870.0, 1890.0, 679.0, 329.0, 170.0, 101.0, 56.0, 32.0, 26.0, 12.0, 15.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.78125, -49.47314453125, -48.1650390625, -46.85693359375, -45.548828125, -44.24072265625, -42.9326171875, -41.62451171875, -40.31640625, -39.00830078125, -37.7001953125, -36.39208984375, -35.083984375, -33.77587890625, -32.4677734375, -31.15966796875, -29.8515625, -28.54345703125, -27.2353515625, -25.92724609375, -24.619140625, -23.31103515625, -22.0029296875, -20.69482421875, -19.38671875, -18.07861328125, -16.7705078125, -15.46240234375, -14.154296875, -12.84619140625, -11.5380859375, -10.22998046875, -8.921875, -7.61376953125, -6.3056640625, -4.99755859375, -3.689453125, -2.38134765625, -1.0732421875, 0.23486328125, 1.54296875, 2.85107421875, 4.1591796875, 5.46728515625, 6.775390625, 8.08349609375, 9.3916015625, 10.69970703125, 12.0078125, 13.31591796875, 14.6240234375, 15.93212890625, 17.240234375, 18.54833984375, 19.8564453125, 21.16455078125, 22.47265625, 23.78076171875, 25.0888671875, 26.39697265625, 27.705078125, 29.01318359375, 30.3212890625, 31.62939453125, 32.9375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 11.0, 15.0, 36.0, 37.0, 56.0, 72.0, 88.0, 106.0, 102.0, 90.0, 91.0, 87.0, 66.0, 37.0, 22.0, 28.0, 15.0, 13.0, 5.0, 8.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.525634765625, -6.26220703125, -5.998779296875, -5.7353515625, -5.471923828125, -5.20849609375, -4.945068359375, -4.681640625, -4.418212890625, -4.15478515625, -3.891357421875, -3.6279296875, -3.364501953125, -3.10107421875, -2.837646484375, -2.57421875, -2.310791015625, -2.04736328125, -1.783935546875, -1.5205078125, -1.257080078125, -0.99365234375, -0.730224609375, -0.466796875, -0.203369140625, 0.06005859375, 0.323486328125, 0.5869140625, 0.850341796875, 1.11376953125, 1.377197265625, 1.640625, 1.904052734375, 2.16748046875, 2.430908203125, 2.6943359375, 2.957763671875, 3.22119140625, 3.484619140625, 3.748046875, 4.011474609375, 4.27490234375, 4.538330078125, 4.8017578125, 5.065185546875, 5.32861328125, 5.592041015625, 5.85546875, 6.118896484375, 6.38232421875, 6.645751953125, 6.9091796875, 7.172607421875, 7.43603515625, 7.699462890625, 7.962890625, 8.226318359375, 8.48974609375, 8.753173828125, 9.0166015625, 9.280029296875, 9.54345703125, 9.806884765625, 10.0703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 4.0, 4.0, 15.0, 14.0, 35.0, 39.0, 69.0, 146.0, 243.0, 658.0, 1662.0, 5292.0, 28839.0, 432855.0, 534760.0, 34626.0, 6155.0, 1783.0, 703.0, 277.0, 165.0, 75.0, 45.0, 29.0, 13.0, 10.0, 9.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.625, -46.138671875, -44.65234375, -43.166015625, -41.6796875, -40.193359375, -38.70703125, -37.220703125, -35.734375, -34.248046875, -32.76171875, -31.275390625, -29.7890625, -28.302734375, -26.81640625, -25.330078125, -23.84375, -22.357421875, -20.87109375, -19.384765625, -17.8984375, -16.412109375, -14.92578125, -13.439453125, -11.953125, -10.466796875, -8.98046875, -7.494140625, -6.0078125, -4.521484375, -3.03515625, -1.548828125, -0.0625, 1.423828125, 2.91015625, 4.396484375, 5.8828125, 7.369140625, 8.85546875, 10.341796875, 11.828125, 13.314453125, 14.80078125, 16.287109375, 17.7734375, 19.259765625, 20.74609375, 22.232421875, 23.71875, 25.205078125, 26.69140625, 28.177734375, 29.6640625, 31.150390625, 32.63671875, 34.123046875, 35.609375, 37.095703125, 38.58203125, 40.068359375, 41.5546875, 43.041015625, 44.52734375, 46.013671875, 47.5]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 5.0, 3.0, 8.0, 5.0, 7.0, 11.0, 17.0, 27.0, 22.0, 36.0, 53.0, 57.0, 82.0, 85.0, 101.0, 86.0, 67.0, 67.0, 63.0, 63.0, 29.0, 30.0, 19.0, 14.0, 13.0, 10.0, 4.0, 5.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.46875, -40.28125, -39.09375, -37.90625, -36.71875, -35.53125, -34.34375, -33.15625, -31.96875, -30.78125, -29.59375, -28.40625, -27.21875, -26.03125, -24.84375, -23.65625, -22.46875, -21.28125, -20.09375, -18.90625, -17.71875, -16.53125, -15.34375, -14.15625, -12.96875, -11.78125, -10.59375, -9.40625, -8.21875, -7.03125, -5.84375, -4.65625, -3.46875, -2.28125, -1.09375, 0.09375, 1.28125, 2.46875, 3.65625, 4.84375, 6.03125, 7.21875, 8.40625, 9.59375, 10.78125, 11.96875, 13.15625, 14.34375, 15.53125, 16.71875, 17.90625, 19.09375, 20.28125, 21.46875, 22.65625, 23.84375, 25.03125, 26.21875, 27.40625, 28.59375, 29.78125, 30.96875, 32.15625, 33.34375, 34.53125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 5.0, 9.0, 5.0, 12.0, 28.0, 26.0, 47.0, 74.0, 124.0, 268.0, 710.0, 2536.0, 16842.0, 979988.0, 42420.0, 3758.0, 936.0, 343.0, 162.0, 95.0, 60.0, 30.0, 15.0, 15.0, 12.0, 9.0, 4.0, 5.0, 7.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-88.0625, -85.72265625, -83.3828125, -81.04296875, -78.703125, -76.36328125, -74.0234375, -71.68359375, -69.34375, -67.00390625, -64.6640625, -62.32421875, -59.984375, -57.64453125, -55.3046875, -52.96484375, -50.625, -48.28515625, -45.9453125, -43.60546875, -41.265625, -38.92578125, -36.5859375, -34.24609375, -31.90625, -29.56640625, -27.2265625, -24.88671875, -22.546875, -20.20703125, -17.8671875, -15.52734375, -13.1875, -10.84765625, -8.5078125, -6.16796875, -3.828125, -1.48828125, 0.8515625, 3.19140625, 5.53125, 7.87109375, 10.2109375, 12.55078125, 14.890625, 17.23046875, 19.5703125, 21.91015625, 24.25, 26.58984375, 28.9296875, 31.26953125, 33.609375, 35.94921875, 38.2890625, 40.62890625, 42.96875, 45.30859375, 47.6484375, 49.98828125, 52.328125, 54.66796875, 57.0078125, 59.34765625, 61.6875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 9.0, 9.0, 10.0, 10.0, 24.0, 26.0, 42.0, 48.0, 105.0, 135.0, 170.0, 164.0, 62.0, 49.0, 43.0, 23.0, 19.0, 19.0, 10.0, 6.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0023288726806640625, -0.002271205186843872, -0.0022135376930236816, -0.002155870199203491, -0.0020982027053833008, -0.0020405352115631104, -0.00198286771774292, -0.0019252002239227295, -0.001867532730102539, -0.0018098652362823486, -0.0017521977424621582, -0.0016945302486419678, -0.0016368627548217773, -0.001579195261001587, -0.0015215277671813965, -0.001463860273361206, -0.0014061927795410156, -0.0013485252857208252, -0.0012908577919006348, -0.0012331902980804443, -0.001175522804260254, -0.0011178553104400635, -0.001060187816619873, -0.0010025203227996826, -0.0009448528289794922, -0.0008871853351593018, -0.0008295178413391113, -0.0007718503475189209, -0.0007141828536987305, -0.00065651535987854, -0.0005988478660583496, -0.0005411803722381592, -0.00048351287841796875, -0.0004258453845977783, -0.0003681778907775879, -0.00031051039695739746, -0.00025284290313720703, -0.0001951754093170166, -0.00013750791549682617, -7.984042167663574e-05, -2.2172927856445312e-05, 3.549456596374512e-05, 9.316205978393555e-05, 0.00015082955360412598, 0.0002084970474243164, 0.00026616454124450684, 0.00032383203506469727, 0.0003814995288848877, 0.0004391670227050781, 0.0004968345165252686, 0.000554502010345459, 0.0006121695041656494, 0.0006698369979858398, 0.0007275044918060303, 0.0007851719856262207, 0.0008428394794464111, 0.0009005069732666016, 0.000958174467086792, 0.0010158419609069824, 0.0010735094547271729, 0.0011311769485473633, 0.0011888444423675537, 0.0012465119361877441, 0.0013041794300079346, 0.001361846923828125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 7.0, 5.0, 7.0, 13.0, 12.0, 31.0, 41.0, 50.0, 119.0, 252.0, 584.0, 1446.0, 4082.0, 23184.0, 968432.0, 41932.0, 5189.0, 1716.0, 804.0, 270.0, 162.0, 64.0, 44.0, 25.0, 10.0, 12.0, 6.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-60.59375, -58.67578125, -56.7578125, -54.83984375, -52.921875, -51.00390625, -49.0859375, -47.16796875, -45.25, -43.33203125, -41.4140625, -39.49609375, -37.578125, -35.66015625, -33.7421875, -31.82421875, -29.90625, -27.98828125, -26.0703125, -24.15234375, -22.234375, -20.31640625, -18.3984375, -16.48046875, -14.5625, -12.64453125, -10.7265625, -8.80859375, -6.890625, -4.97265625, -3.0546875, -1.13671875, 0.78125, 2.69921875, 4.6171875, 6.53515625, 8.453125, 10.37109375, 12.2890625, 14.20703125, 16.125, 18.04296875, 19.9609375, 21.87890625, 23.796875, 25.71484375, 27.6328125, 29.55078125, 31.46875, 33.38671875, 35.3046875, 37.22265625, 39.140625, 41.05859375, 42.9765625, 44.89453125, 46.8125, 48.73046875, 50.6484375, 52.56640625, 54.484375, 56.40234375, 58.3203125, 60.23828125, 62.15625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 10.0, 20.0, 39.0, 158.0, 326.0, 289.0, 79.0, 31.0, 14.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.5625, -54.939453125, -53.31640625, -51.693359375, -50.0703125, -48.447265625, -46.82421875, -45.201171875, -43.578125, -41.955078125, -40.33203125, -38.708984375, -37.0859375, -35.462890625, -33.83984375, -32.216796875, -30.59375, -28.970703125, -27.34765625, -25.724609375, -24.1015625, -22.478515625, -20.85546875, -19.232421875, -17.609375, -15.986328125, -14.36328125, -12.740234375, -11.1171875, -9.494140625, -7.87109375, -6.248046875, -4.625, -3.001953125, -1.37890625, 0.244140625, 1.8671875, 3.490234375, 5.11328125, 6.736328125, 8.359375, 9.982421875, 11.60546875, 13.228515625, 14.8515625, 16.474609375, 18.09765625, 19.720703125, 21.34375, 22.966796875, 24.58984375, 26.212890625, 27.8359375, 29.458984375, 31.08203125, 32.705078125, 34.328125, 35.951171875, 37.57421875, 39.197265625, 40.8203125, 42.443359375, 44.06640625, 45.689453125, 47.3125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 13.0, 19.0, 36.0, 64.0, 191.0, 252.0, 203.0, 109.0, 56.0, 34.0, 12.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.50088500976562, -188.31272888183594, -178.12457275390625, -167.9364013671875, -157.7482452392578, -147.56008911132812, -137.37191772460938, -127.18376159667969, -116.99560546875, -106.80744934082031, -96.6192855834961, -86.43112182617188, -76.24296569824219, -66.0548095703125, -55.86664581298828, -45.67848205566406, -35.490325927734375, -25.302165985107422, -15.114006042480469, -4.925846099853516, 5.2623138427734375, 15.45047378540039, 25.638633728027344, 35.82679748535156, 46.01495361328125, 56.2031135559082, 66.39127349853516, 76.57943725585938, 86.76759338378906, 96.95574951171875, 107.14391326904297, 117.33207702636719, 127.52023315429688, 137.70838928222656, 147.89654541015625, 158.084716796875, 168.2728729248047, 178.46102905273438, 188.64920043945312, 198.8373565673828, 209.0255126953125, 219.2136688232422, 229.40182495117188, 239.58999633789062, 249.7781524658203, 259.96630859375, 270.15447998046875, 280.3426513671875, 290.5307922363281, 300.7189636230469, 310.9071044921875, 321.09527587890625, 331.283447265625, 341.4715881347656, 351.6597595214844, 361.847900390625, 372.03607177734375, 382.2242431640625, 392.4123840332031, 402.6005554199219, 412.7886962890625, 422.97686767578125, 433.1650390625, 443.35321044921875, 453.5413513183594]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 9.0, 21.0, 15.0, 27.0, 40.0, 36.0, 45.0, 50.0, 52.0, 63.0, 51.0, 63.0, 75.0, 59.0, 59.0, 52.0, 57.0, 41.0, 46.0, 27.0, 26.0, 20.0, 20.0, 11.0, 11.0, 11.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-234.2310791015625, -226.9092254638672, -219.5873565673828, -212.2655029296875, -204.9436492919922, -197.62179565429688, -190.2999267578125, -182.9780731201172, -175.65621948242188, -168.33436584472656, -161.0124969482422, -153.69064331054688, -146.36878967285156, -139.04693603515625, -131.72506713867188, -124.40321350097656, -117.08134460449219, -109.75948333740234, -102.43762969970703, -95.11576843261719, -87.79391479492188, -80.47205352783203, -73.15019226074219, -65.82833862304688, -58.50647735595703, -51.18461990356445, -43.862762451171875, -36.54090118408203, -29.219043731689453, -21.897186279296875, -14.575325012207031, -7.253467559814453, 0.068389892578125, 7.3902482986450195, 14.712106704711914, 22.033966064453125, 29.355823516845703, 36.67768096923828, 43.999542236328125, 51.3213996887207, 58.64325714111328, 65.96511840820312, 73.28697204589844, 80.60883331298828, 87.93069458007812, 95.25254821777344, 102.57440948486328, 109.89627075195312, 117.21812438964844, 124.53998565673828, 131.86184692382812, 139.18370056152344, 146.50555419921875, 153.82742309570312, 161.14927673339844, 168.47113037109375, 175.79299926757812, 183.11485290527344, 190.4367218017578, 197.75857543945312, 205.08042907714844, 212.40228271484375, 219.72415161132812, 227.04600524902344, 234.36785888671875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 3.0, 7.0, 11.0, 31.0, 34.0, 71.0, 140.0, 277.0, 634.0, 2362.0, 22997.0, 4010357.0, 148918.0, 6440.0, 1168.0, 386.0, 185.0, 110.0, 67.0, 25.0, 18.0, 13.0, 8.0, 3.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.6875, -68.86279296875, -67.0380859375, -65.21337890625, -63.388671875, -61.56396484375, -59.7392578125, -57.91455078125, -56.08984375, -54.26513671875, -52.4404296875, -50.61572265625, -48.791015625, -46.96630859375, -45.1416015625, -43.31689453125, -41.4921875, -39.66748046875, -37.8427734375, -36.01806640625, -34.193359375, -32.36865234375, -30.5439453125, -28.71923828125, -26.89453125, -25.06982421875, -23.2451171875, -21.42041015625, -19.595703125, -17.77099609375, -15.9462890625, -14.12158203125, -12.296875, -10.47216796875, -8.6474609375, -6.82275390625, -4.998046875, -3.17333984375, -1.3486328125, 0.47607421875, 2.30078125, 4.12548828125, 5.9501953125, 7.77490234375, 9.599609375, 11.42431640625, 13.2490234375, 15.07373046875, 16.8984375, 18.72314453125, 20.5478515625, 22.37255859375, 24.197265625, 26.02197265625, 27.8466796875, 29.67138671875, 31.49609375, 33.32080078125, 35.1455078125, 36.97021484375, 38.794921875, 40.61962890625, 42.4443359375, 44.26904296875, 46.09375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 12.0, 11.0, 23.0, 36.0, 64.0, 100.0, 101.0, 129.0, 139.0, 108.0, 97.0, 80.0, 46.0, 17.0, 16.0, 10.0, 9.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4140625, -13.043212890625, -12.67236328125, -12.301513671875, -11.9306640625, -11.559814453125, -11.18896484375, -10.818115234375, -10.447265625, -10.076416015625, -9.70556640625, -9.334716796875, -8.9638671875, -8.593017578125, -8.22216796875, -7.851318359375, -7.48046875, -7.109619140625, -6.73876953125, -6.367919921875, -5.9970703125, -5.626220703125, -5.25537109375, -4.884521484375, -4.513671875, -4.142822265625, -3.77197265625, -3.401123046875, -3.0302734375, -2.659423828125, -2.28857421875, -1.917724609375, -1.546875, -1.176025390625, -0.80517578125, -0.434326171875, -0.0634765625, 0.307373046875, 0.67822265625, 1.049072265625, 1.419921875, 1.790771484375, 2.16162109375, 2.532470703125, 2.9033203125, 3.274169921875, 3.64501953125, 4.015869140625, 4.38671875, 4.757568359375, 5.12841796875, 5.499267578125, 5.8701171875, 6.240966796875, 6.61181640625, 6.982666015625, 7.353515625, 7.724365234375, 8.09521484375, 8.466064453125, 8.8369140625, 9.207763671875, 9.57861328125, 9.949462890625, 10.3203125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 8.0, 10.0, 18.0, 20.0, 23.0, 38.0, 57.0, 94.0, 135.0, 206.0, 356.0, 526.0, 865.0, 1395.0, 2375.0, 4226.0, 8353.0, 20228.0, 63935.0, 424350.0, 3384045.0, 209973.0, 43681.0, 14849.0, 6550.0, 3334.0, 1791.0, 1040.0, 660.0, 404.0, 249.0, 159.0, 102.0, 84.0, 49.0, 31.0, 25.0, 12.0, 8.0, 5.0, 9.0, 0.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.34375, -16.7529296875, -16.162109375, -15.5712890625, -14.98046875, -14.3896484375, -13.798828125, -13.2080078125, -12.6171875, -12.0263671875, -11.435546875, -10.8447265625, -10.25390625, -9.6630859375, -9.072265625, -8.4814453125, -7.890625, -7.2998046875, -6.708984375, -6.1181640625, -5.52734375, -4.9365234375, -4.345703125, -3.7548828125, -3.1640625, -2.5732421875, -1.982421875, -1.3916015625, -0.80078125, -0.2099609375, 0.380859375, 0.9716796875, 1.5625, 2.1533203125, 2.744140625, 3.3349609375, 3.92578125, 4.5166015625, 5.107421875, 5.6982421875, 6.2890625, 6.8798828125, 7.470703125, 8.0615234375, 8.65234375, 9.2431640625, 9.833984375, 10.4248046875, 11.015625, 11.6064453125, 12.197265625, 12.7880859375, 13.37890625, 13.9697265625, 14.560546875, 15.1513671875, 15.7421875, 16.3330078125, 16.923828125, 17.5146484375, 18.10546875, 18.6962890625, 19.287109375, 19.8779296875, 20.46875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 2.0, 2.0, 10.0, 9.0, 8.0, 17.0, 23.0, 27.0, 40.0, 66.0, 115.0, 329.0, 1552.0, 1245.0, 301.0, 125.0, 70.0, 38.0, 22.0, 19.0, 11.0, 4.0, 6.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4453125, -10.084716796875, -9.72412109375, -9.363525390625, -9.0029296875, -8.642333984375, -8.28173828125, -7.921142578125, -7.560546875, -7.199951171875, -6.83935546875, -6.478759765625, -6.1181640625, -5.757568359375, -5.39697265625, -5.036376953125, -4.67578125, -4.315185546875, -3.95458984375, -3.593994140625, -3.2333984375, -2.872802734375, -2.51220703125, -2.151611328125, -1.791015625, -1.430419921875, -1.06982421875, -0.709228515625, -0.3486328125, 0.011962890625, 0.37255859375, 0.733154296875, 1.09375, 1.454345703125, 1.81494140625, 2.175537109375, 2.5361328125, 2.896728515625, 3.25732421875, 3.617919921875, 3.978515625, 4.339111328125, 4.69970703125, 5.060302734375, 5.4208984375, 5.781494140625, 6.14208984375, 6.502685546875, 6.86328125, 7.223876953125, 7.58447265625, 7.945068359375, 8.3056640625, 8.666259765625, 9.02685546875, 9.387451171875, 9.748046875, 10.108642578125, 10.46923828125, 10.829833984375, 11.1904296875, 11.551025390625, 11.91162109375, 12.272216796875, 12.6328125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 9.0, 21.0, 34.0, 103.0, 167.0, 213.0, 216.0, 118.0, 63.0, 27.0, 8.0, 9.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.47527313232422, -110.83724212646484, -108.19921112060547, -105.56117248535156, -102.92314147949219, -100.28511047363281, -97.64707946777344, -95.00904846191406, -92.37100982666016, -89.73297882080078, -87.0949478149414, -84.4569091796875, -81.81887817382812, -79.18084716796875, -76.54281616210938, -73.90478515625, -71.26675415039062, -68.62872314453125, -65.99069213867188, -63.352657318115234, -60.714622497558594, -58.07659149169922, -55.438560485839844, -52.8005256652832, -50.16249084472656, -47.52445983886719, -44.88642501831055, -42.24839401245117, -39.61035919189453, -36.972328186035156, -34.33429718017578, -31.69626235961914, -29.058223724365234, -26.420190811157227, -23.78215789794922, -21.144126892089844, -18.506092071533203, -15.868060111999512, -13.23002815246582, -10.591995239257812, -7.953962326049805, -5.315929412841797, -2.6778969764709473, -0.039864540100097656, 2.59816837310791, 5.236201286315918, 7.874233245849609, 10.512266159057617, 13.150299072265625, 15.788331985473633, 18.42636489868164, 21.064395904541016, 23.702430725097656, 26.34046173095703, 28.97849464416504, 31.616527557373047, 34.25456237792969, 36.89259338378906, 39.5306282043457, 42.16865921020508, 44.80669403076172, 47.444725036621094, 50.08275604248047, 52.72079086303711, 55.358821868896484]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 11.0, 8.0, 16.0, 27.0, 29.0, 43.0, 56.0, 50.0, 57.0, 86.0, 84.0, 71.0, 84.0, 85.0, 49.0, 51.0, 53.0, 39.0, 32.0, 24.0, 20.0, 5.0, 6.0, 10.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.36634063720703, -43.465248107910156, -41.564151763916016, -39.66305923461914, -37.761966705322266, -35.860870361328125, -33.95977783203125, -32.058685302734375, -30.1575927734375, -28.256498336791992, -26.355405807495117, -24.45431137084961, -22.553218841552734, -20.652124404907227, -18.75102996826172, -16.849937438964844, -14.948843002319336, -13.047749519348145, -11.146656036376953, -9.245561599731445, -7.344468593597412, -5.4433746337890625, -3.542281150817871, -1.6411876678466797, 0.2599058151245117, 2.160999298095703, 4.0620927810668945, 5.963186740875244, 7.8642802238464355, 9.765374183654785, 11.666467666625977, 13.567561149597168, 15.46865463256836, 17.369749069213867, 19.270841598510742, 21.17193603515625, 23.073028564453125, 24.974123001098633, 26.87521743774414, 28.776309967041016, 30.67740249633789, 32.578495025634766, 34.479591369628906, 36.38068389892578, 38.281776428222656, 40.18286895751953, 42.08396530151367, 43.98505783081055, 45.88615417480469, 47.78724670410156, 49.6883430480957, 51.58943557739258, 53.49052810668945, 55.391624450683594, 57.29271697998047, 59.193809509277344, 61.09490203857422, 62.995994567871094, 64.89708709716797, 66.79817962646484, 68.69927978515625, 70.60037231445312, 72.50146484375, 74.40255737304688, 76.30364990234375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 5.0, 16.0, 21.0, 41.0, 40.0, 48.0, 106.0, 156.0, 278.0, 477.0, 904.0, 2042.0, 5413.0, 17244.0, 69043.0, 323204.0, 470384.0, 118967.0, 26853.0, 7821.0, 2853.0, 1180.0, 567.0, 299.0, 184.0, 121.0, 81.0, 59.0, 38.0, 25.0, 25.0, 13.0, 15.0, 6.0, 2.0, 2.0, 7.0, 1.0, 4.0, 1.0], "bins": [-36.40625, -35.5, -34.59375, -33.6875, -32.78125, -31.875, -30.96875, -30.0625, -29.15625, -28.25, -27.34375, -26.4375, -25.53125, -24.625, -23.71875, -22.8125, -21.90625, -21.0, -20.09375, -19.1875, -18.28125, -17.375, -16.46875, -15.5625, -14.65625, -13.75, -12.84375, -11.9375, -11.03125, -10.125, -9.21875, -8.3125, -7.40625, -6.5, -5.59375, -4.6875, -3.78125, -2.875, -1.96875, -1.0625, -0.15625, 0.75, 1.65625, 2.5625, 3.46875, 4.375, 5.28125, 6.1875, 7.09375, 8.0, 8.90625, 9.8125, 10.71875, 11.625, 12.53125, 13.4375, 14.34375, 15.25, 16.15625, 17.0625, 17.96875, 18.875, 19.78125, 20.6875, 21.59375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 9.0, 10.0, 15.0, 30.0, 35.0, 55.0, 72.0, 92.0, 120.0, 114.0, 93.0, 84.0, 79.0, 54.0, 49.0, 33.0, 21.0, 13.0, 6.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.46875, -8.1734619140625, -7.878173828125, -7.5828857421875, -7.28759765625, -6.9923095703125, -6.697021484375, -6.4017333984375, -6.1064453125, -5.8111572265625, -5.515869140625, -5.2205810546875, -4.92529296875, -4.6300048828125, -4.334716796875, -4.0394287109375, -3.744140625, -3.4488525390625, -3.153564453125, -2.8582763671875, -2.56298828125, -2.2677001953125, -1.972412109375, -1.6771240234375, -1.3818359375, -1.0865478515625, -0.791259765625, -0.4959716796875, -0.20068359375, 0.0946044921875, 0.389892578125, 0.6851806640625, 0.98046875, 1.2757568359375, 1.571044921875, 1.8663330078125, 2.16162109375, 2.4569091796875, 2.752197265625, 3.0474853515625, 3.3427734375, 3.6380615234375, 3.933349609375, 4.2286376953125, 4.52392578125, 4.8192138671875, 5.114501953125, 5.4097900390625, 5.705078125, 6.0003662109375, 6.295654296875, 6.5909423828125, 6.88623046875, 7.1815185546875, 7.476806640625, 7.7720947265625, 8.0673828125, 8.3626708984375, 8.657958984375, 8.9532470703125, 9.24853515625, 9.5438232421875, 9.839111328125, 10.1343994140625, 10.4296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 0.0, 4.0, 3.0, 2.0, 9.0, 11.0, 8.0, 19.0, 22.0, 60.0, 75.0, 91.0, 149.0, 211.0, 469.0, 892.0, 2459.0, 13534.0, 249439.0, 735675.0, 38351.0, 4458.0, 1231.0, 603.0, 299.0, 189.0, 84.0, 70.0, 40.0, 31.0, 33.0, 13.0, 9.0, 6.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.125, -49.3125, -47.5, -45.6875, -43.875, -42.0625, -40.25, -38.4375, -36.625, -34.8125, -33.0, -31.1875, -29.375, -27.5625, -25.75, -23.9375, -22.125, -20.3125, -18.5, -16.6875, -14.875, -13.0625, -11.25, -9.4375, -7.625, -5.8125, -4.0, -2.1875, -0.375, 1.4375, 3.25, 5.0625, 6.875, 8.6875, 10.5, 12.3125, 14.125, 15.9375, 17.75, 19.5625, 21.375, 23.1875, 25.0, 26.8125, 28.625, 30.4375, 32.25, 34.0625, 35.875, 37.6875, 39.5, 41.3125, 43.125, 44.9375, 46.75, 48.5625, 50.375, 52.1875, 54.0, 55.8125, 57.625, 59.4375, 61.25, 63.0625, 64.875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 12.0, 16.0, 13.0, 18.0, 20.0, 28.0, 38.0, 31.0, 52.0, 66.0, 65.0, 71.0, 72.0, 78.0, 70.0, 60.0, 60.0, 45.0, 40.0, 26.0, 38.0, 18.0, 11.0, 12.0, 9.0, 9.0, 3.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.796875, -28.646240234375, -27.49560546875, -26.344970703125, -25.1943359375, -24.043701171875, -22.89306640625, -21.742431640625, -20.591796875, -19.441162109375, -18.29052734375, -17.139892578125, -15.9892578125, -14.838623046875, -13.68798828125, -12.537353515625, -11.38671875, -10.236083984375, -9.08544921875, -7.934814453125, -6.7841796875, -5.633544921875, -4.48291015625, -3.332275390625, -2.181640625, -1.031005859375, 0.11962890625, 1.270263671875, 2.4208984375, 3.571533203125, 4.72216796875, 5.872802734375, 7.0234375, 8.174072265625, 9.32470703125, 10.475341796875, 11.6259765625, 12.776611328125, 13.92724609375, 15.077880859375, 16.228515625, 17.379150390625, 18.52978515625, 19.680419921875, 20.8310546875, 21.981689453125, 23.13232421875, 24.282958984375, 25.43359375, 26.584228515625, 27.73486328125, 28.885498046875, 30.0361328125, 31.186767578125, 32.33740234375, 33.488037109375, 34.638671875, 35.789306640625, 36.93994140625, 38.090576171875, 39.2412109375, 40.391845703125, 41.54248046875, 42.693115234375, 43.84375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 7.0, 11.0, 14.0, 17.0, 15.0, 38.0, 47.0, 69.0, 110.0, 165.0, 352.0, 685.0, 1622.0, 4716.0, 18614.0, 129128.0, 736618.0, 129749.0, 18679.0, 4649.0, 1668.0, 702.0, 336.0, 168.0, 112.0, 73.0, 43.0, 30.0, 20.0, 19.0, 12.0, 8.0, 11.0, 8.0, 6.0, 3.0, 3.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.703125, -17.10302734375, -16.5029296875, -15.90283203125, -15.302734375, -14.70263671875, -14.1025390625, -13.50244140625, -12.90234375, -12.30224609375, -11.7021484375, -11.10205078125, -10.501953125, -9.90185546875, -9.3017578125, -8.70166015625, -8.1015625, -7.50146484375, -6.9013671875, -6.30126953125, -5.701171875, -5.10107421875, -4.5009765625, -3.90087890625, -3.30078125, -2.70068359375, -2.1005859375, -1.50048828125, -0.900390625, -0.30029296875, 0.2998046875, 0.89990234375, 1.5, 2.10009765625, 2.7001953125, 3.30029296875, 3.900390625, 4.50048828125, 5.1005859375, 5.70068359375, 6.30078125, 6.90087890625, 7.5009765625, 8.10107421875, 8.701171875, 9.30126953125, 9.9013671875, 10.50146484375, 11.1015625, 11.70166015625, 12.3017578125, 12.90185546875, 13.501953125, 14.10205078125, 14.7021484375, 15.30224609375, 15.90234375, 16.50244140625, 17.1025390625, 17.70263671875, 18.302734375, 18.90283203125, 19.5029296875, 20.10302734375, 20.703125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 7.0, 20.0, 27.0, 27.0, 50.0, 90.0, 144.0, 221.0, 165.0, 108.0, 58.0, 28.0, 17.0, 18.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003009796142578125, -0.002931833267211914, -0.002853870391845703, -0.002775907516479492, -0.0026979446411132812, -0.0026199817657470703, -0.0025420188903808594, -0.0024640560150146484, -0.0023860931396484375, -0.0023081302642822266, -0.0022301673889160156, -0.0021522045135498047, -0.0020742416381835938, -0.001996278762817383, -0.0019183158874511719, -0.001840353012084961, -0.00176239013671875, -0.001684427261352539, -0.0016064643859863281, -0.0015285015106201172, -0.0014505386352539062, -0.0013725757598876953, -0.0012946128845214844, -0.0012166500091552734, -0.0011386871337890625, -0.0010607242584228516, -0.0009827613830566406, -0.0009047985076904297, -0.0008268356323242188, -0.0007488727569580078, -0.0006709098815917969, -0.0005929470062255859, -0.000514984130859375, -0.00043702125549316406, -0.0003590583801269531, -0.0002810955047607422, -0.00020313262939453125, -0.0001251697540283203, -4.7206878662109375e-05, 3.075599670410156e-05, 0.0001087188720703125, 0.00018668174743652344, 0.0002646446228027344, 0.0003426074981689453, 0.00042057037353515625, 0.0004985332489013672, 0.0005764961242675781, 0.0006544589996337891, 0.000732421875, 0.0008103847503662109, 0.0008883476257324219, 0.0009663105010986328, 0.0010442733764648438, 0.0011222362518310547, 0.0012001991271972656, 0.0012781620025634766, 0.0013561248779296875, 0.0014340877532958984, 0.0015120506286621094, 0.0015900135040283203, 0.0016679763793945312, 0.0017459392547607422, 0.0018239021301269531, 0.001901865005493164, 0.001979827880859375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 9.0, 8.0, 4.0, 9.0, 16.0, 34.0, 43.0, 56.0, 110.0, 270.0, 587.0, 1826.0, 10776.0, 374528.0, 643117.0, 13671.0, 2212.0, 709.0, 263.0, 128.0, 63.0, 38.0, 23.0, 17.0, 8.0, 12.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-44.84375, -43.564453125, -42.28515625, -41.005859375, -39.7265625, -38.447265625, -37.16796875, -35.888671875, -34.609375, -33.330078125, -32.05078125, -30.771484375, -29.4921875, -28.212890625, -26.93359375, -25.654296875, -24.375, -23.095703125, -21.81640625, -20.537109375, -19.2578125, -17.978515625, -16.69921875, -15.419921875, -14.140625, -12.861328125, -11.58203125, -10.302734375, -9.0234375, -7.744140625, -6.46484375, -5.185546875, -3.90625, -2.626953125, -1.34765625, -0.068359375, 1.2109375, 2.490234375, 3.76953125, 5.048828125, 6.328125, 7.607421875, 8.88671875, 10.166015625, 11.4453125, 12.724609375, 14.00390625, 15.283203125, 16.5625, 17.841796875, 19.12109375, 20.400390625, 21.6796875, 22.958984375, 24.23828125, 25.517578125, 26.796875, 28.076171875, 29.35546875, 30.634765625, 31.9140625, 33.193359375, 34.47265625, 35.751953125, 37.03125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 8.0, 17.0, 21.0, 42.0, 55.0, 108.0, 198.0, 215.0, 128.0, 72.0, 43.0, 25.0, 16.0, 9.0, 9.0, 11.0, 5.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.96875, -23.2001953125, -22.431640625, -21.6630859375, -20.89453125, -20.1259765625, -19.357421875, -18.5888671875, -17.8203125, -17.0517578125, -16.283203125, -15.5146484375, -14.74609375, -13.9775390625, -13.208984375, -12.4404296875, -11.671875, -10.9033203125, -10.134765625, -9.3662109375, -8.59765625, -7.8291015625, -7.060546875, -6.2919921875, -5.5234375, -4.7548828125, -3.986328125, -3.2177734375, -2.44921875, -1.6806640625, -0.912109375, -0.1435546875, 0.625, 1.3935546875, 2.162109375, 2.9306640625, 3.69921875, 4.4677734375, 5.236328125, 6.0048828125, 6.7734375, 7.5419921875, 8.310546875, 9.0791015625, 9.84765625, 10.6162109375, 11.384765625, 12.1533203125, 12.921875, 13.6904296875, 14.458984375, 15.2275390625, 15.99609375, 16.7646484375, 17.533203125, 18.3017578125, 19.0703125, 19.8388671875, 20.607421875, 21.3759765625, 22.14453125, 22.9130859375, 23.681640625, 24.4501953125, 25.21875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 11.0, 30.0, 153.0, 394.0, 295.0, 92.0, 18.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-475.1171569824219, -459.5964050292969, -444.07568359375, -428.554931640625, -413.0341796875, -397.513427734375, -381.99267578125, -366.4719543457031, -350.9512023925781, -335.4304504394531, -319.90972900390625, -304.38897705078125, -288.86822509765625, -273.34747314453125, -257.82672119140625, -242.30599975585938, -226.78524780273438, -211.26449584960938, -195.74375915527344, -180.2230224609375, -164.7022705078125, -149.1815185546875, -133.66078186035156, -118.1400375366211, -102.61929321289062, -87.09854888916016, -71.57780456542969, -56.05706024169922, -40.53631591796875, -25.01557159423828, -9.494827270507812, 6.025917053222656, 21.546630859375, 37.06737518310547, 52.58811950683594, 68.1088638305664, 83.62960815429688, 99.15035247802734, 114.67109680175781, 130.19183349609375, 145.71258544921875, 161.23333740234375, 176.7540740966797, 192.27481079101562, 207.79556274414062, 223.31631469726562, 238.83705139160156, 254.3577880859375, 269.8785400390625, 285.3992919921875, 300.9200439453125, 316.4407653808594, 331.9615173339844, 347.4822692871094, 363.00299072265625, 378.52374267578125, 394.04449462890625, 409.56524658203125, 425.08599853515625, 440.6067199707031, 456.1274719238281, 471.6482238769531, 487.1689453125, 502.689697265625, 518.21044921875]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 8.0, 12.0, 8.0, 7.0, 8.0, 11.0, 12.0, 15.0, 18.0, 14.0, 25.0, 32.0, 28.0, 36.0, 44.0, 39.0, 43.0, 58.0, 50.0, 51.0, 40.0, 29.0, 35.0, 43.0, 29.0, 48.0, 34.0, 30.0, 30.0, 17.0, 21.0, 19.0, 17.0, 19.0, 14.0, 6.0, 8.0, 12.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.11732482910156, -114.18535614013672, -110.25337982177734, -106.3214111328125, -102.38943481445312, -98.45746612548828, -94.5254898071289, -90.59352111816406, -86.66154479980469, -82.72957611083984, -78.79759979248047, -74.86563110351562, -70.93365478515625, -67.0016860961914, -63.06970977783203, -59.13774108886719, -55.20576858520508, -51.27379608154297, -47.34182357788086, -43.40985107421875, -39.47787857055664, -35.54590606689453, -31.613935470581055, -27.681962966918945, -23.749990463256836, -19.818017959594727, -15.886045455932617, -11.954073905944824, -8.022101402282715, -4.090129852294922, -0.1581573486328125, 3.773815155029297, 7.705787658691406, 11.637760162353516, 15.569732666015625, 19.501705169677734, 23.433677673339844, 27.36564826965332, 31.29762077331543, 35.229591369628906, 39.16156768798828, 43.09354019165039, 47.0255126953125, 50.95748519897461, 54.88945770263672, 58.82142639160156, 62.75340270996094, 66.68537139892578, 70.61734008789062, 74.54930877685547, 78.48128509521484, 82.41325378417969, 86.34523010253906, 90.2771987915039, 94.20917510986328, 98.14114379882812, 102.0731201171875, 106.00508880615234, 109.93706512451172, 113.86903381347656, 117.80101013183594, 121.73297882080078, 125.66495513916016, 129.596923828125, 133.52890014648438]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 2.0, 7.0, 3.0, 7.0, 9.0, 5.0, 10.0, 19.0, 24.0, 51.0, 102.0, 135.0, 354.0, 811.0, 2256.0, 8637.0, 78753.0, 3945293.0, 140226.0, 12526.0, 3034.0, 1058.0, 443.0, 215.0, 114.0, 78.0, 36.0, 27.0, 14.0, 9.0, 11.0, 4.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.0625, -34.53369140625, -33.0048828125, -31.47607421875, -29.947265625, -28.41845703125, -26.8896484375, -25.36083984375, -23.83203125, -22.30322265625, -20.7744140625, -19.24560546875, -17.716796875, -16.18798828125, -14.6591796875, -13.13037109375, -11.6015625, -10.07275390625, -8.5439453125, -7.01513671875, -5.486328125, -3.95751953125, -2.4287109375, -0.89990234375, 0.62890625, 2.15771484375, 3.6865234375, 5.21533203125, 6.744140625, 8.27294921875, 9.8017578125, 11.33056640625, 12.859375, 14.38818359375, 15.9169921875, 17.44580078125, 18.974609375, 20.50341796875, 22.0322265625, 23.56103515625, 25.08984375, 26.61865234375, 28.1474609375, 29.67626953125, 31.205078125, 32.73388671875, 34.2626953125, 35.79150390625, 37.3203125, 38.84912109375, 40.3779296875, 41.90673828125, 43.435546875, 44.96435546875, 46.4931640625, 48.02197265625, 49.55078125, 51.07958984375, 52.6083984375, 54.13720703125, 55.666015625, 57.19482421875, 58.7236328125, 60.25244140625, 61.78125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 5.0, 17.0, 19.0, 34.0, 56.0, 67.0, 92.0, 89.0, 125.0, 109.0, 91.0, 72.0, 64.0, 59.0, 37.0, 22.0, 16.0, 10.0, 4.0, 2.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.359375, -10.01513671875, -9.6708984375, -9.32666015625, -8.982421875, -8.63818359375, -8.2939453125, -7.94970703125, -7.60546875, -7.26123046875, -6.9169921875, -6.57275390625, -6.228515625, -5.88427734375, -5.5400390625, -5.19580078125, -4.8515625, -4.50732421875, -4.1630859375, -3.81884765625, -3.474609375, -3.13037109375, -2.7861328125, -2.44189453125, -2.09765625, -1.75341796875, -1.4091796875, -1.06494140625, -0.720703125, -0.37646484375, -0.0322265625, 0.31201171875, 0.65625, 1.00048828125, 1.3447265625, 1.68896484375, 2.033203125, 2.37744140625, 2.7216796875, 3.06591796875, 3.41015625, 3.75439453125, 4.0986328125, 4.44287109375, 4.787109375, 5.13134765625, 5.4755859375, 5.81982421875, 6.1640625, 6.50830078125, 6.8525390625, 7.19677734375, 7.541015625, 7.88525390625, 8.2294921875, 8.57373046875, 8.91796875, 9.26220703125, 9.6064453125, 9.95068359375, 10.294921875, 10.63916015625, 10.9833984375, 11.32763671875, 11.671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 6.0, 4.0, 12.0, 19.0, 25.0, 36.0, 55.0, 73.0, 142.0, 180.0, 330.0, 543.0, 1132.0, 2349.0, 5603.0, 15407.0, 55795.0, 425033.0, 3368872.0, 256490.0, 41344.0, 12145.0, 4451.0, 1991.0, 928.0, 516.0, 251.0, 176.0, 93.0, 83.0, 55.0, 46.0, 39.0, 15.0, 11.0, 9.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.015625, -22.3466796875, -21.677734375, -21.0087890625, -20.33984375, -19.6708984375, -19.001953125, -18.3330078125, -17.6640625, -16.9951171875, -16.326171875, -15.6572265625, -14.98828125, -14.3193359375, -13.650390625, -12.9814453125, -12.3125, -11.6435546875, -10.974609375, -10.3056640625, -9.63671875, -8.9677734375, -8.298828125, -7.6298828125, -6.9609375, -6.2919921875, -5.623046875, -4.9541015625, -4.28515625, -3.6162109375, -2.947265625, -2.2783203125, -1.609375, -0.9404296875, -0.271484375, 0.3974609375, 1.06640625, 1.7353515625, 2.404296875, 3.0732421875, 3.7421875, 4.4111328125, 5.080078125, 5.7490234375, 6.41796875, 7.0869140625, 7.755859375, 8.4248046875, 9.09375, 9.7626953125, 10.431640625, 11.1005859375, 11.76953125, 12.4384765625, 13.107421875, 13.7763671875, 14.4453125, 15.1142578125, 15.783203125, 16.4521484375, 17.12109375, 17.7900390625, 18.458984375, 19.1279296875, 19.796875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 8.0, 8.0, 13.0, 23.0, 26.0, 37.0, 55.0, 104.0, 227.0, 465.0, 1524.0, 940.0, 322.0, 135.0, 56.0, 30.0, 22.0, 17.0, 12.0, 9.0, 5.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8828125, -9.4493408203125, -9.015869140625, -8.5823974609375, -8.14892578125, -7.7154541015625, -7.281982421875, -6.8485107421875, -6.4150390625, -5.9815673828125, -5.548095703125, -5.1146240234375, -4.68115234375, -4.2476806640625, -3.814208984375, -3.3807373046875, -2.947265625, -2.5137939453125, -2.080322265625, -1.6468505859375, -1.21337890625, -0.7799072265625, -0.346435546875, 0.0870361328125, 0.5205078125, 0.9539794921875, 1.387451171875, 1.8209228515625, 2.25439453125, 2.6878662109375, 3.121337890625, 3.5548095703125, 3.98828125, 4.4217529296875, 4.855224609375, 5.2886962890625, 5.72216796875, 6.1556396484375, 6.589111328125, 7.0225830078125, 7.4560546875, 7.8895263671875, 8.322998046875, 8.7564697265625, 9.18994140625, 9.6234130859375, 10.056884765625, 10.4903564453125, 10.923828125, 11.3572998046875, 11.790771484375, 12.2242431640625, 12.65771484375, 13.0911865234375, 13.524658203125, 13.9581298828125, 14.3916015625, 14.8250732421875, 15.258544921875, 15.6920166015625, 16.12548828125, 16.5589599609375, 16.992431640625, 17.4259033203125, 17.859375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 40.0, 267.0, 555.0, 133.0, 9.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-496.1182556152344, -487.1654357910156, -478.212646484375, -469.25982666015625, -460.3070068359375, -451.3542175292969, -442.4013977050781, -433.4486083984375, -424.49578857421875, -415.54296875, -406.5901794433594, -397.6373596191406, -388.6845703125, -379.73175048828125, -370.7789306640625, -361.8261413574219, -352.8733215332031, -343.9205017089844, -334.96771240234375, -326.014892578125, -317.06207275390625, -308.1092834472656, -299.1564636230469, -290.20367431640625, -281.2508544921875, -272.29803466796875, -263.3452453613281, -254.39242553710938, -245.4396209716797, -236.48681640625, -227.53399658203125, -218.58119201660156, -209.62835693359375, -200.67555236816406, -191.72274780273438, -182.76992797851562, -173.81712341308594, -164.86431884765625, -155.9114990234375, -146.9586944580078, -138.00588989257812, -129.05308532714844, -120.10027313232422, -111.1474609375, -102.19465637207031, -93.24185180664062, -84.2890396118164, -75.33622741699219, -66.3834228515625, -57.43061447143555, -48.477806091308594, -39.52499771118164, -30.572189331054688, -21.619380950927734, -12.666572570800781, -3.713764190673828, 5.239044189453125, 14.191852569580078, 23.14466094970703, 32.097469329833984, 41.05027770996094, 50.00308609008789, 58.955894470214844, 67.90870666503906, 76.86151123046875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 10.0, 11.0, 25.0, 25.0, 32.0, 39.0, 63.0, 62.0, 78.0, 63.0, 80.0, 84.0, 88.0, 73.0, 56.0, 42.0, 43.0, 41.0, 31.0, 15.0, 12.0, 11.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.04608154296875, -69.70710754394531, -67.3681411743164, -65.02916717529297, -62.69019317626953, -60.35122299194336, -58.01225280761719, -55.67327880859375, -53.33430862426758, -50.995338439941406, -48.65636444091797, -46.3173942565918, -43.978424072265625, -41.63945007324219, -39.300479888916016, -36.961509704589844, -34.622535705566406, -32.283565521240234, -29.944591522216797, -27.605621337890625, -25.26664924621582, -22.927677154541016, -20.588706970214844, -18.24973487854004, -15.910762786865234, -13.57179069519043, -11.232819557189941, -8.893848419189453, -6.554876327514648, -4.215904235839844, -1.8769330978393555, 0.4620380401611328, 2.8010101318359375, 5.139981746673584, 7.4789533615112305, 9.817924499511719, 12.156896591186523, 14.495868682861328, 16.8348388671875, 19.173810958862305, 21.51278305053711, 23.851755142211914, 26.19072723388672, 28.52969741821289, 30.868669509887695, 33.2076416015625, 35.54661178588867, 37.885581970214844, 40.22455596923828, 42.56352615356445, 44.90250015258789, 47.24147033691406, 49.5804443359375, 51.91941452026367, 54.258384704589844, 56.59735870361328, 58.93632888793945, 61.275299072265625, 63.61427307128906, 65.9532470703125, 68.2922134399414, 70.63118743896484, 72.97016143798828, 75.30912780761719, 77.64810180664062]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 5.0, 5.0, 6.0, 18.0, 14.0, 29.0, 29.0, 46.0, 89.0, 153.0, 245.0, 541.0, 1081.0, 2689.0, 7718.0, 29562.0, 158703.0, 676857.0, 133172.0, 26135.0, 6964.0, 2385.0, 991.0, 470.0, 260.0, 143.0, 84.0, 50.0, 27.0, 33.0, 12.0, 12.0, 10.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.84375, -35.7744140625, -34.705078125, -33.6357421875, -32.56640625, -31.4970703125, -30.427734375, -29.3583984375, -28.2890625, -27.2197265625, -26.150390625, -25.0810546875, -24.01171875, -22.9423828125, -21.873046875, -20.8037109375, -19.734375, -18.6650390625, -17.595703125, -16.5263671875, -15.45703125, -14.3876953125, -13.318359375, -12.2490234375, -11.1796875, -10.1103515625, -9.041015625, -7.9716796875, -6.90234375, -5.8330078125, -4.763671875, -3.6943359375, -2.625, -1.5556640625, -0.486328125, 0.5830078125, 1.65234375, 2.7216796875, 3.791015625, 4.8603515625, 5.9296875, 6.9990234375, 8.068359375, 9.1376953125, 10.20703125, 11.2763671875, 12.345703125, 13.4150390625, 14.484375, 15.5537109375, 16.623046875, 17.6923828125, 18.76171875, 19.8310546875, 20.900390625, 21.9697265625, 23.0390625, 24.1083984375, 25.177734375, 26.2470703125, 27.31640625, 28.3857421875, 29.455078125, 30.5244140625, 31.59375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 12.0, 14.0, 26.0, 34.0, 49.0, 71.0, 85.0, 92.0, 114.0, 93.0, 78.0, 67.0, 59.0, 53.0, 52.0, 29.0, 23.0, 13.0, 10.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66015625, -7.35711669921875, -7.0540771484375, -6.75103759765625, -6.447998046875, -6.14495849609375, -5.8419189453125, -5.53887939453125, -5.23583984375, -4.93280029296875, -4.6297607421875, -4.32672119140625, -4.023681640625, -3.72064208984375, -3.4176025390625, -3.11456298828125, -2.8115234375, -2.50848388671875, -2.2054443359375, -1.90240478515625, -1.599365234375, -1.29632568359375, -0.9932861328125, -0.69024658203125, -0.38720703125, -0.08416748046875, 0.2188720703125, 0.52191162109375, 0.824951171875, 1.12799072265625, 1.4310302734375, 1.73406982421875, 2.037109375, 2.34014892578125, 2.6431884765625, 2.94622802734375, 3.249267578125, 3.55230712890625, 3.8553466796875, 4.15838623046875, 4.46142578125, 4.76446533203125, 5.0675048828125, 5.37054443359375, 5.673583984375, 5.97662353515625, 6.2796630859375, 6.58270263671875, 6.8857421875, 7.18878173828125, 7.4918212890625, 7.79486083984375, 8.097900390625, 8.40093994140625, 8.7039794921875, 9.00701904296875, 9.31005859375, 9.61309814453125, 9.9161376953125, 10.21917724609375, 10.522216796875, 10.82525634765625, 11.1282958984375, 11.43133544921875, 11.734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 14.0, 5.0, 13.0, 12.0, 19.0, 32.0, 37.0, 62.0, 97.0, 178.0, 252.0, 486.0, 1081.0, 3408.0, 22455.0, 804491.0, 202134.0, 9835.0, 2158.0, 817.0, 368.0, 183.0, 118.0, 90.0, 56.0, 38.0, 26.0, 24.0, 16.0, 11.0, 13.0, 4.0, 6.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-89.3125, -86.951171875, -84.58984375, -82.228515625, -79.8671875, -77.505859375, -75.14453125, -72.783203125, -70.421875, -68.060546875, -65.69921875, -63.337890625, -60.9765625, -58.615234375, -56.25390625, -53.892578125, -51.53125, -49.169921875, -46.80859375, -44.447265625, -42.0859375, -39.724609375, -37.36328125, -35.001953125, -32.640625, -30.279296875, -27.91796875, -25.556640625, -23.1953125, -20.833984375, -18.47265625, -16.111328125, -13.75, -11.388671875, -9.02734375, -6.666015625, -4.3046875, -1.943359375, 0.41796875, 2.779296875, 5.140625, 7.501953125, 9.86328125, 12.224609375, 14.5859375, 16.947265625, 19.30859375, 21.669921875, 24.03125, 26.392578125, 28.75390625, 31.115234375, 33.4765625, 35.837890625, 38.19921875, 40.560546875, 42.921875, 45.283203125, 47.64453125, 50.005859375, 52.3671875, 54.728515625, 57.08984375, 59.451171875, 61.8125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 15.0, 7.0, 14.0, 26.0, 37.0, 61.0, 52.0, 80.0, 99.0, 97.0, 108.0, 73.0, 77.0, 70.0, 52.0, 44.0, 26.0, 16.0, 8.0, 7.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.28125, -61.57421875, -59.8671875, -58.16015625, -56.453125, -54.74609375, -53.0390625, -51.33203125, -49.625, -47.91796875, -46.2109375, -44.50390625, -42.796875, -41.08984375, -39.3828125, -37.67578125, -35.96875, -34.26171875, -32.5546875, -30.84765625, -29.140625, -27.43359375, -25.7265625, -24.01953125, -22.3125, -20.60546875, -18.8984375, -17.19140625, -15.484375, -13.77734375, -12.0703125, -10.36328125, -8.65625, -6.94921875, -5.2421875, -3.53515625, -1.828125, -0.12109375, 1.5859375, 3.29296875, 5.0, 6.70703125, 8.4140625, 10.12109375, 11.828125, 13.53515625, 15.2421875, 16.94921875, 18.65625, 20.36328125, 22.0703125, 23.77734375, 25.484375, 27.19140625, 28.8984375, 30.60546875, 32.3125, 34.01953125, 35.7265625, 37.43359375, 39.140625, 40.84765625, 42.5546875, 44.26171875, 45.96875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 10.0, 10.0, 9.0, 6.0, 16.0, 12.0, 21.0, 24.0, 51.0, 58.0, 108.0, 197.0, 522.0, 1707.0, 11522.0, 602631.0, 418914.0, 10108.0, 1619.0, 498.0, 206.0, 111.0, 47.0, 32.0, 22.0, 19.0, 18.0, 17.0, 8.0, 7.0, 6.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.90625, -35.5869140625, -34.267578125, -32.9482421875, -31.62890625, -30.3095703125, -28.990234375, -27.6708984375, -26.3515625, -25.0322265625, -23.712890625, -22.3935546875, -21.07421875, -19.7548828125, -18.435546875, -17.1162109375, -15.796875, -14.4775390625, -13.158203125, -11.8388671875, -10.51953125, -9.2001953125, -7.880859375, -6.5615234375, -5.2421875, -3.9228515625, -2.603515625, -1.2841796875, 0.03515625, 1.3544921875, 2.673828125, 3.9931640625, 5.3125, 6.6318359375, 7.951171875, 9.2705078125, 10.58984375, 11.9091796875, 13.228515625, 14.5478515625, 15.8671875, 17.1865234375, 18.505859375, 19.8251953125, 21.14453125, 22.4638671875, 23.783203125, 25.1025390625, 26.421875, 27.7412109375, 29.060546875, 30.3798828125, 31.69921875, 33.0185546875, 34.337890625, 35.6572265625, 36.9765625, 38.2958984375, 39.615234375, 40.9345703125, 42.25390625, 43.5732421875, 44.892578125, 46.2119140625, 47.53125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 10.0, 9.0, 18.0, 24.0, 27.0, 36.0, 70.0, 207.0, 276.0, 112.0, 48.0, 32.0, 29.0, 22.0, 19.0, 11.0, 14.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.002384185791015625, -0.002318471670150757, -0.0022527575492858887, -0.0021870434284210205, -0.0021213293075561523, -0.002055615186691284, -0.001989901065826416, -0.0019241869449615479, -0.0018584728240966797, -0.0017927587032318115, -0.0017270445823669434, -0.0016613304615020752, -0.001595616340637207, -0.0015299022197723389, -0.0014641880989074707, -0.0013984739780426025, -0.0013327598571777344, -0.0012670457363128662, -0.001201331615447998, -0.0011356174945831299, -0.0010699033737182617, -0.0010041892528533936, -0.0009384751319885254, -0.0008727610111236572, -0.0008070468902587891, -0.0007413327693939209, -0.0006756186485290527, -0.0006099045276641846, -0.0005441904067993164, -0.00047847628593444824, -0.0004127621650695801, -0.0003470480442047119, -0.00028133392333984375, -0.00021561980247497559, -0.00014990568161010742, -8.419156074523926e-05, -1.8477439880371094e-05, 4.723668098449707e-05, 0.00011295080184936523, 0.0001786649227142334, 0.00024437904357910156, 0.0003100931644439697, 0.0003758072853088379, 0.00044152140617370605, 0.0005072355270385742, 0.0005729496479034424, 0.0006386637687683105, 0.0007043778896331787, 0.0007700920104980469, 0.000835806131362915, 0.0009015202522277832, 0.0009672343730926514, 0.0010329484939575195, 0.0010986626148223877, 0.0011643767356872559, 0.001230090856552124, 0.0012958049774169922, 0.0013615190982818604, 0.0014272332191467285, 0.0014929473400115967, 0.0015586614608764648, 0.001624375581741333, 0.0016900897026062012, 0.0017558038234710693, 0.0018215179443359375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 5.0, 3.0, 4.0, 13.0, 12.0, 15.0, 30.0, 34.0, 58.0, 81.0, 224.0, 544.0, 2543.0, 30045.0, 995003.0, 17199.0, 1883.0, 432.0, 176.0, 73.0, 57.0, 36.0, 20.0, 14.0, 14.0, 5.0, 11.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.5, -56.44140625, -54.3828125, -52.32421875, -50.265625, -48.20703125, -46.1484375, -44.08984375, -42.03125, -39.97265625, -37.9140625, -35.85546875, -33.796875, -31.73828125, -29.6796875, -27.62109375, -25.5625, -23.50390625, -21.4453125, -19.38671875, -17.328125, -15.26953125, -13.2109375, -11.15234375, -9.09375, -7.03515625, -4.9765625, -2.91796875, -0.859375, 1.19921875, 3.2578125, 5.31640625, 7.375, 9.43359375, 11.4921875, 13.55078125, 15.609375, 17.66796875, 19.7265625, 21.78515625, 23.84375, 25.90234375, 27.9609375, 30.01953125, 32.078125, 34.13671875, 36.1953125, 38.25390625, 40.3125, 42.37109375, 44.4296875, 46.48828125, 48.546875, 50.60546875, 52.6640625, 54.72265625, 56.78125, 58.83984375, 60.8984375, 62.95703125, 65.015625, 67.07421875, 69.1328125, 71.19140625, 73.25]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 11.0, 21.0, 34.0, 134.0, 390.0, 261.0, 65.0, 23.0, 14.0, 8.0, 5.0, 3.0, 2.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.21875, -47.916015625, -46.61328125, -45.310546875, -44.0078125, -42.705078125, -41.40234375, -40.099609375, -38.796875, -37.494140625, -36.19140625, -34.888671875, -33.5859375, -32.283203125, -30.98046875, -29.677734375, -28.375, -27.072265625, -25.76953125, -24.466796875, -23.1640625, -21.861328125, -20.55859375, -19.255859375, -17.953125, -16.650390625, -15.34765625, -14.044921875, -12.7421875, -11.439453125, -10.13671875, -8.833984375, -7.53125, -6.228515625, -4.92578125, -3.623046875, -2.3203125, -1.017578125, 0.28515625, 1.587890625, 2.890625, 4.193359375, 5.49609375, 6.798828125, 8.1015625, 9.404296875, 10.70703125, 12.009765625, 13.3125, 14.615234375, 15.91796875, 17.220703125, 18.5234375, 19.826171875, 21.12890625, 22.431640625, 23.734375, 25.037109375, 26.33984375, 27.642578125, 28.9453125, 30.248046875, 31.55078125, 32.853515625, 34.15625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 11.0, 21.0, 110.0, 341.0, 352.0, 119.0, 27.0, 13.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-666.03369140625, -650.8236083984375, -635.6135864257812, -620.4035034179688, -605.1934204101562, -589.9833374023438, -574.7733154296875, -559.563232421875, -544.3531494140625, -529.14306640625, -513.9330444335938, -498.72296142578125, -483.51287841796875, -468.3028259277344, -453.0927429199219, -437.8826904296875, -422.672607421875, -407.4625549316406, -392.2524719238281, -377.04241943359375, -361.83233642578125, -346.6222839355469, -331.4122009277344, -316.2021484375, -300.9920959472656, -285.78204345703125, -270.57196044921875, -255.3618927001953, -240.15182495117188, -224.9417724609375, -209.731689453125, -194.52163696289062, -179.31155395507812, -164.1014862060547, -148.89141845703125, -133.6813507080078, -118.47128295898438, -103.26122283935547, -88.05115509033203, -72.8410873413086, -57.631019592285156, -42.42095184326172, -27.210886001586914, -12.00082015991211, 3.209247589111328, 18.4193115234375, 33.62937927246094, 48.839447021484375, 64.04951477050781, 79.25958251953125, 94.46965026855469, 109.67971801757812, 124.88978576660156, 140.099853515625, 155.30990600585938, 170.51998901367188, 185.73004150390625, 200.9401092529297, 216.15017700195312, 231.36024475097656, 246.5703125, 261.7803649902344, 276.9904479980469, 292.20050048828125, 307.41058349609375]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 6.0, 14.0, 23.0, 21.0, 25.0, 37.0, 48.0, 54.0, 69.0, 73.0, 79.0, 73.0, 79.0, 76.0, 65.0, 60.0, 61.0, 33.0, 33.0, 20.0, 20.0, 16.0, 10.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-277.38763427734375, -269.22467041015625, -261.06170654296875, -252.8987274169922, -244.73574829101562, -236.57278442382812, -228.40982055664062, -220.24685668945312, -212.08387756347656, -203.92091369628906, -195.7579345703125, -187.594970703125, -179.4320068359375, -171.26902770996094, -163.10606384277344, -154.94308471679688, -146.78012084960938, -138.61715698242188, -130.4541778564453, -122.29121398925781, -114.12824249267578, -105.96527099609375, -97.80230712890625, -89.63933563232422, -81.47636413574219, -73.31339263916016, -65.15042114257812, -56.987457275390625, -48.824485778808594, -40.66151428222656, -32.4985466003418, -24.33557891845703, -16.172637939453125, -8.009668350219727, 0.15330123901367188, 8.31627082824707, 16.47924041748047, 24.6422119140625, 32.805179595947266, 40.96814727783203, 49.13111877441406, 57.294090270996094, 65.45706176757812, 73.62002563476562, 81.78299713134766, 89.94596862792969, 98.10893249511719, 106.27190399169922, 114.43487548828125, 122.59784698486328, 130.7608184814453, 138.9237823486328, 147.08676147460938, 155.24972534179688, 163.41268920898438, 171.57565307617188, 179.73863220214844, 187.90159606933594, 196.0645751953125, 204.2275390625, 212.3905029296875, 220.55348205566406, 228.71644592285156, 236.87942504882812, 245.04238891601562]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 21.0, 20.0, 32.0, 60.0, 117.0, 215.0, 546.0, 1700.0, 7023.0, 55037.0, 3926251.0, 185501.0, 13085.0, 2992.0, 911.0, 355.0, 166.0, 76.0, 47.0, 35.0, 26.0, 8.0, 18.0, 9.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.09375, -52.27099609375, -50.4482421875, -48.62548828125, -46.802734375, -44.97998046875, -43.1572265625, -41.33447265625, -39.51171875, -37.68896484375, -35.8662109375, -34.04345703125, -32.220703125, -30.39794921875, -28.5751953125, -26.75244140625, -24.9296875, -23.10693359375, -21.2841796875, -19.46142578125, -17.638671875, -15.81591796875, -13.9931640625, -12.17041015625, -10.34765625, -8.52490234375, -6.7021484375, -4.87939453125, -3.056640625, -1.23388671875, 0.5888671875, 2.41162109375, 4.234375, 6.05712890625, 7.8798828125, 9.70263671875, 11.525390625, 13.34814453125, 15.1708984375, 16.99365234375, 18.81640625, 20.63916015625, 22.4619140625, 24.28466796875, 26.107421875, 27.93017578125, 29.7529296875, 31.57568359375, 33.3984375, 35.22119140625, 37.0439453125, 38.86669921875, 40.689453125, 42.51220703125, 44.3349609375, 46.15771484375, 47.98046875, 49.80322265625, 51.6259765625, 53.44873046875, 55.271484375, 57.09423828125, 58.9169921875, 60.73974609375, 62.5625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 13.0, 19.0, 31.0, 49.0, 78.0, 95.0, 119.0, 113.0, 119.0, 97.0, 67.0, 69.0, 54.0, 28.0, 16.0, 14.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.703125, -11.2666015625, -10.830078125, -10.3935546875, -9.95703125, -9.5205078125, -9.083984375, -8.6474609375, -8.2109375, -7.7744140625, -7.337890625, -6.9013671875, -6.46484375, -6.0283203125, -5.591796875, -5.1552734375, -4.71875, -4.2822265625, -3.845703125, -3.4091796875, -2.97265625, -2.5361328125, -2.099609375, -1.6630859375, -1.2265625, -0.7900390625, -0.353515625, 0.0830078125, 0.51953125, 0.9560546875, 1.392578125, 1.8291015625, 2.265625, 2.7021484375, 3.138671875, 3.5751953125, 4.01171875, 4.4482421875, 4.884765625, 5.3212890625, 5.7578125, 6.1943359375, 6.630859375, 7.0673828125, 7.50390625, 7.9404296875, 8.376953125, 8.8134765625, 9.25, 9.6865234375, 10.123046875, 10.5595703125, 10.99609375, 11.4326171875, 11.869140625, 12.3056640625, 12.7421875, 13.1787109375, 13.615234375, 14.0517578125, 14.48828125, 14.9248046875, 15.361328125, 15.7978515625, 16.234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 9.0, 18.0, 21.0, 25.0, 43.0, 51.0, 80.0, 122.0, 193.0, 374.0, 756.0, 1632.0, 4269.0, 13420.0, 67380.0, 3025597.0, 1018817.0, 45613.0, 9958.0, 3266.0, 1320.0, 586.0, 253.0, 165.0, 131.0, 62.0, 44.0, 20.0, 16.0, 13.0, 10.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.890625, -29.822021484375, -28.75341796875, -27.684814453125, -26.6162109375, -25.547607421875, -24.47900390625, -23.410400390625, -22.341796875, -21.273193359375, -20.20458984375, -19.135986328125, -18.0673828125, -16.998779296875, -15.93017578125, -14.861572265625, -13.79296875, -12.724365234375, -11.65576171875, -10.587158203125, -9.5185546875, -8.449951171875, -7.38134765625, -6.312744140625, -5.244140625, -4.175537109375, -3.10693359375, -2.038330078125, -0.9697265625, 0.098876953125, 1.16748046875, 2.236083984375, 3.3046875, 4.373291015625, 5.44189453125, 6.510498046875, 7.5791015625, 8.647705078125, 9.71630859375, 10.784912109375, 11.853515625, 12.922119140625, 13.99072265625, 15.059326171875, 16.1279296875, 17.196533203125, 18.26513671875, 19.333740234375, 20.40234375, 21.470947265625, 22.53955078125, 23.608154296875, 24.6767578125, 25.745361328125, 26.81396484375, 27.882568359375, 28.951171875, 30.019775390625, 31.08837890625, 32.156982421875, 33.2255859375, 34.294189453125, 35.36279296875, 36.431396484375, 37.5]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 5.0, 7.0, 12.0, 13.0, 11.0, 25.0, 30.0, 54.0, 160.0, 365.0, 1961.0, 1036.0, 210.0, 91.0, 39.0, 18.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.296875, -21.7073974609375, -21.117919921875, -20.5284423828125, -19.93896484375, -19.3494873046875, -18.760009765625, -18.1705322265625, -17.5810546875, -16.9915771484375, -16.402099609375, -15.8126220703125, -15.22314453125, -14.6336669921875, -14.044189453125, -13.4547119140625, -12.865234375, -12.2757568359375, -11.686279296875, -11.0968017578125, -10.50732421875, -9.9178466796875, -9.328369140625, -8.7388916015625, -8.1494140625, -7.5599365234375, -6.970458984375, -6.3809814453125, -5.79150390625, -5.2020263671875, -4.612548828125, -4.0230712890625, -3.43359375, -2.8441162109375, -2.254638671875, -1.6651611328125, -1.07568359375, -0.4862060546875, 0.103271484375, 0.6927490234375, 1.2822265625, 1.8717041015625, 2.461181640625, 3.0506591796875, 3.64013671875, 4.2296142578125, 4.819091796875, 5.4085693359375, 5.998046875, 6.5875244140625, 7.177001953125, 7.7664794921875, 8.35595703125, 8.9454345703125, 9.534912109375, 10.1243896484375, 10.7138671875, 11.3033447265625, 11.892822265625, 12.4822998046875, 13.07177734375, 13.6612548828125, 14.250732421875, 14.8402099609375, 15.4296875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 8.0, 20.0, 69.0, 468.0, 406.0, 34.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-537.8612060546875, -527.7481079101562, -517.635009765625, -507.5219421386719, -497.4088439941406, -487.2957458496094, -477.1826477050781, -467.069580078125, -456.95648193359375, -446.8433837890625, -436.73028564453125, -426.6172180175781, -416.5041198730469, -406.3910217285156, -396.2779235839844, -386.16485595703125, -376.0517578125, -365.93865966796875, -355.8255615234375, -345.7124938964844, -335.5993957519531, -325.4862976074219, -315.3731994628906, -305.2601318359375, -295.1470031738281, -285.0339050292969, -274.9208068847656, -264.8077392578125, -254.69464111328125, -244.58154296875, -234.46844482421875, -224.35536193847656, -214.24227905273438, -204.12918090820312, -194.01609802246094, -183.9029998779297, -173.7899169921875, -163.67681884765625, -153.563720703125, -143.4506378173828, -133.33755493164062, -123.2244644165039, -113.11137390136719, -102.99827575683594, -92.88519287109375, -82.7720947265625, -72.65900421142578, -62.54591369628906, -52.43281555175781, -42.319725036621094, -32.206634521484375, -22.09354019165039, -11.980449676513672, -1.8673591613769531, 8.245735168457031, 18.35882568359375, 28.47191619873047, 38.58500671386719, 48.698097229003906, 58.81119155883789, 68.92428588867188, 79.03736877441406, 89.15046691894531, 99.26355743408203, 109.37664794921875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 15.0, 14.0, 13.0, 26.0, 27.0, 49.0, 53.0, 54.0, 70.0, 70.0, 48.0, 71.0, 61.0, 70.0, 59.0, 70.0, 50.0, 40.0, 30.0, 20.0, 21.0, 21.0, 15.0, 12.0, 3.0, 4.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.38117218017578, -48.9798583984375, -46.57854461669922, -44.17722702026367, -41.77591323852539, -39.37459945678711, -36.97328186035156, -34.57196807861328, -32.170654296875, -29.76934051513672, -27.368024826049805, -24.96670913696289, -22.56539535522461, -20.164081573486328, -17.762765884399414, -15.3614501953125, -12.960136413574219, -10.558821678161621, -8.157506942749023, -5.756192207336426, -3.354877471923828, -0.9535627365112305, 1.4477519989013672, 3.8490676879882812, 6.2503814697265625, 8.65169620513916, 11.053010940551758, 13.454325675964355, 15.855640411376953, 18.256954193115234, 20.65826988220215, 23.059585571289062, 25.460899353027344, 27.862213134765625, 30.26352882385254, 32.66484451293945, 35.066158294677734, 37.467472076416016, 39.86878967285156, 42.270103454589844, 44.671417236328125, 47.072731018066406, 49.47404479980469, 51.875362396240234, 54.276676177978516, 56.6779899597168, 59.079307556152344, 61.480621337890625, 63.881935119628906, 66.28324890136719, 68.68456268310547, 71.08587646484375, 73.48719787597656, 75.88851165771484, 78.28982543945312, 80.6911392211914, 83.09245300292969, 85.49376678466797, 87.89508056640625, 90.29639434814453, 92.69770812988281, 95.09902954101562, 97.5003433227539, 99.90165710449219, 102.30297088623047]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 11.0, 10.0, 21.0, 34.0, 83.0, 119.0, 236.0, 536.0, 1394.0, 7985.0, 89819.0, 834715.0, 102340.0, 8645.0, 1551.0, 490.0, 253.0, 124.0, 90.0, 29.0, 23.0, 20.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-49.71875, -48.03466796875, -46.3505859375, -44.66650390625, -42.982421875, -41.29833984375, -39.6142578125, -37.93017578125, -36.24609375, -34.56201171875, -32.8779296875, -31.19384765625, -29.509765625, -27.82568359375, -26.1416015625, -24.45751953125, -22.7734375, -21.08935546875, -19.4052734375, -17.72119140625, -16.037109375, -14.35302734375, -12.6689453125, -10.98486328125, -9.30078125, -7.61669921875, -5.9326171875, -4.24853515625, -2.564453125, -0.88037109375, 0.8037109375, 2.48779296875, 4.171875, 5.85595703125, 7.5400390625, 9.22412109375, 10.908203125, 12.59228515625, 14.2763671875, 15.96044921875, 17.64453125, 19.32861328125, 21.0126953125, 22.69677734375, 24.380859375, 26.06494140625, 27.7490234375, 29.43310546875, 31.1171875, 32.80126953125, 34.4853515625, 36.16943359375, 37.853515625, 39.53759765625, 41.2216796875, 42.90576171875, 44.58984375, 46.27392578125, 47.9580078125, 49.64208984375, 51.326171875, 53.01025390625, 54.6943359375, 56.37841796875, 58.0625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 11.0, 23.0, 50.0, 63.0, 77.0, 93.0, 106.0, 127.0, 113.0, 87.0, 75.0, 63.0, 46.0, 25.0, 14.0, 10.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6796875, -11.2398681640625, -10.800048828125, -10.3602294921875, -9.92041015625, -9.4805908203125, -9.040771484375, -8.6009521484375, -8.1611328125, -7.7213134765625, -7.281494140625, -6.8416748046875, -6.40185546875, -5.9620361328125, -5.522216796875, -5.0823974609375, -4.642578125, -4.2027587890625, -3.762939453125, -3.3231201171875, -2.88330078125, -2.4434814453125, -2.003662109375, -1.5638427734375, -1.1240234375, -0.6842041015625, -0.244384765625, 0.1954345703125, 0.63525390625, 1.0750732421875, 1.514892578125, 1.9547119140625, 2.39453125, 2.8343505859375, 3.274169921875, 3.7139892578125, 4.15380859375, 4.5936279296875, 5.033447265625, 5.4732666015625, 5.9130859375, 6.3529052734375, 6.792724609375, 7.2325439453125, 7.67236328125, 8.1121826171875, 8.552001953125, 8.9918212890625, 9.431640625, 9.8714599609375, 10.311279296875, 10.7510986328125, 11.19091796875, 11.6307373046875, 12.070556640625, 12.5103759765625, 12.9501953125, 13.3900146484375, 13.829833984375, 14.2696533203125, 14.70947265625, 15.1492919921875, 15.589111328125, 16.0289306640625, 16.46875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 1.0, 4.0, 9.0, 10.0, 7.0, 19.0, 29.0, 44.0, 51.0, 107.0, 114.0, 200.0, 379.0, 750.0, 1722.0, 5243.0, 20166.0, 115303.0, 688017.0, 177085.0, 28364.0, 6713.0, 2166.0, 930.0, 406.0, 242.0, 152.0, 101.0, 62.0, 47.0, 24.0, 28.0, 21.0, 10.0, 7.0, 5.0, 9.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.90625, -24.9677734375, -24.029296875, -23.0908203125, -22.15234375, -21.2138671875, -20.275390625, -19.3369140625, -18.3984375, -17.4599609375, -16.521484375, -15.5830078125, -14.64453125, -13.7060546875, -12.767578125, -11.8291015625, -10.890625, -9.9521484375, -9.013671875, -8.0751953125, -7.13671875, -6.1982421875, -5.259765625, -4.3212890625, -3.3828125, -2.4443359375, -1.505859375, -0.5673828125, 0.37109375, 1.3095703125, 2.248046875, 3.1865234375, 4.125, 5.0634765625, 6.001953125, 6.9404296875, 7.87890625, 8.8173828125, 9.755859375, 10.6943359375, 11.6328125, 12.5712890625, 13.509765625, 14.4482421875, 15.38671875, 16.3251953125, 17.263671875, 18.2021484375, 19.140625, 20.0791015625, 21.017578125, 21.9560546875, 22.89453125, 23.8330078125, 24.771484375, 25.7099609375, 26.6484375, 27.5869140625, 28.525390625, 29.4638671875, 30.40234375, 31.3408203125, 32.279296875, 33.2177734375, 34.15625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 7.0, 15.0, 10.0, 8.0, 20.0, 20.0, 26.0, 27.0, 41.0, 33.0, 42.0, 57.0, 36.0, 59.0, 60.0, 46.0, 52.0, 50.0, 50.0, 57.0, 54.0, 31.0, 38.0, 25.0, 35.0, 14.0, 18.0, 17.0, 12.0, 5.0, 10.0, 5.0, 6.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.859375, -23.845947265625, -22.83251953125, -21.819091796875, -20.8056640625, -19.792236328125, -18.77880859375, -17.765380859375, -16.751953125, -15.738525390625, -14.72509765625, -13.711669921875, -12.6982421875, -11.684814453125, -10.67138671875, -9.657958984375, -8.64453125, -7.631103515625, -6.61767578125, -5.604248046875, -4.5908203125, -3.577392578125, -2.56396484375, -1.550537109375, -0.537109375, 0.476318359375, 1.48974609375, 2.503173828125, 3.5166015625, 4.530029296875, 5.54345703125, 6.556884765625, 7.5703125, 8.583740234375, 9.59716796875, 10.610595703125, 11.6240234375, 12.637451171875, 13.65087890625, 14.664306640625, 15.677734375, 16.691162109375, 17.70458984375, 18.718017578125, 19.7314453125, 20.744873046875, 21.75830078125, 22.771728515625, 23.78515625, 24.798583984375, 25.81201171875, 26.825439453125, 27.8388671875, 28.852294921875, 29.86572265625, 30.879150390625, 31.892578125, 32.906005859375, 33.91943359375, 34.932861328125, 35.9462890625, 36.959716796875, 37.97314453125, 38.986572265625, 40.0]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 12.0, 11.0, 12.0, 12.0, 28.0, 33.0, 36.0, 78.0, 138.0, 265.0, 696.0, 2009.0, 7006.0, 42690.0, 729287.0, 240968.0, 18826.0, 4173.0, 1300.0, 479.0, 193.0, 125.0, 60.0, 37.0, 18.0, 18.0, 13.0, 10.0, 8.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.25, -17.7796630859375, -17.309326171875, -16.8389892578125, -16.36865234375, -15.8983154296875, -15.427978515625, -14.9576416015625, -14.4873046875, -14.0169677734375, -13.546630859375, -13.0762939453125, -12.60595703125, -12.1356201171875, -11.665283203125, -11.1949462890625, -10.724609375, -10.2542724609375, -9.783935546875, -9.3135986328125, -8.84326171875, -8.3729248046875, -7.902587890625, -7.4322509765625, -6.9619140625, -6.4915771484375, -6.021240234375, -5.5509033203125, -5.08056640625, -4.6102294921875, -4.139892578125, -3.6695556640625, -3.19921875, -2.7288818359375, -2.258544921875, -1.7882080078125, -1.31787109375, -0.8475341796875, -0.377197265625, 0.0931396484375, 0.5634765625, 1.0338134765625, 1.504150390625, 1.9744873046875, 2.44482421875, 2.9151611328125, 3.385498046875, 3.8558349609375, 4.326171875, 4.7965087890625, 5.266845703125, 5.7371826171875, 6.20751953125, 6.6778564453125, 7.148193359375, 7.6185302734375, 8.0888671875, 8.5592041015625, 9.029541015625, 9.4998779296875, 9.97021484375, 10.4405517578125, 10.910888671875, 11.3812255859375, 11.8515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 5.0, 5.0, 11.0, 5.0, 10.0, 12.0, 8.0, 12.0, 29.0, 28.0, 34.0, 56.0, 116.0, 230.0, 180.0, 97.0, 46.0, 27.0, 18.0, 16.0, 6.0, 8.0, 5.0, 8.0, 7.0, 4.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010776519775390625, -0.0010389834642410278, -0.0010003149509429932, -0.0009616464376449585, -0.0009229779243469238, -0.0008843094110488892, -0.0008456408977508545, -0.0008069723844528198, -0.0007683038711547852, -0.0007296353578567505, -0.0006909668445587158, -0.0006522983312606812, -0.0006136298179626465, -0.0005749613046646118, -0.0005362927913665771, -0.0004976242780685425, -0.0004589557647705078, -0.00042028725147247314, -0.0003816187381744385, -0.0003429502248764038, -0.00030428171157836914, -0.00026561319828033447, -0.0002269446849822998, -0.00018827617168426514, -0.00014960765838623047, -0.0001109391450881958, -7.227063179016113e-05, -3.3602118492126465e-05, 5.066394805908203e-06, 4.373490810394287e-05, 8.240342140197754e-05, 0.00012107193470001221, 0.00015974044799804688, 0.00019840896129608154, 0.0002370774745941162, 0.0002757459878921509, 0.00031441450119018555, 0.0003530830144882202, 0.0003917515277862549, 0.00043042004108428955, 0.0004690885543823242, 0.0005077570676803589, 0.0005464255809783936, 0.0005850940942764282, 0.0006237626075744629, 0.0006624311208724976, 0.0007010996341705322, 0.0007397681474685669, 0.0007784366607666016, 0.0008171051740646362, 0.0008557736873626709, 0.0008944422006607056, 0.0009331107139587402, 0.0009717792272567749, 0.0010104477405548096, 0.0010491162538528442, 0.001087784767150879, 0.0011264532804489136, 0.0011651217937469482, 0.001203790307044983, 0.0012424588203430176, 0.0012811273336410522, 0.001319795846939087, 0.0013584643602371216, 0.0013971328735351562]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 10.0, 8.0, 14.0, 16.0, 23.0, 30.0, 45.0, 80.0, 101.0, 199.0, 402.0, 1063.0, 4192.0, 29390.0, 698476.0, 293617.0, 16540.0, 2745.0, 803.0, 302.0, 162.0, 113.0, 70.0, 46.0, 24.0, 24.0, 16.0, 12.0, 16.0, 10.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.796875, -10.30322265625, -9.8095703125, -9.31591796875, -8.822265625, -8.32861328125, -7.8349609375, -7.34130859375, -6.84765625, -6.35400390625, -5.8603515625, -5.36669921875, -4.873046875, -4.37939453125, -3.8857421875, -3.39208984375, -2.8984375, -2.40478515625, -1.9111328125, -1.41748046875, -0.923828125, -0.43017578125, 0.0634765625, 0.55712890625, 1.05078125, 1.54443359375, 2.0380859375, 2.53173828125, 3.025390625, 3.51904296875, 4.0126953125, 4.50634765625, 5.0, 5.49365234375, 5.9873046875, 6.48095703125, 6.974609375, 7.46826171875, 7.9619140625, 8.45556640625, 8.94921875, 9.44287109375, 9.9365234375, 10.43017578125, 10.923828125, 11.41748046875, 11.9111328125, 12.40478515625, 12.8984375, 13.39208984375, 13.8857421875, 14.37939453125, 14.873046875, 15.36669921875, 15.8603515625, 16.35400390625, 16.84765625, 17.34130859375, 17.8349609375, 18.32861328125, 18.822265625, 19.31591796875, 19.8095703125, 20.30322265625, 20.796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 11.0, 23.0, 29.0, 48.0, 62.0, 115.0, 155.0, 169.0, 131.0, 103.0, 54.0, 30.0, 25.0, 10.0, 15.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.375, -8.916015625, -8.45703125, -7.998046875, -7.5390625, -7.080078125, -6.62109375, -6.162109375, -5.703125, -5.244140625, -4.78515625, -4.326171875, -3.8671875, -3.408203125, -2.94921875, -2.490234375, -2.03125, -1.572265625, -1.11328125, -0.654296875, -0.1953125, 0.263671875, 0.72265625, 1.181640625, 1.640625, 2.099609375, 2.55859375, 3.017578125, 3.4765625, 3.935546875, 4.39453125, 4.853515625, 5.3125, 5.771484375, 6.23046875, 6.689453125, 7.1484375, 7.607421875, 8.06640625, 8.525390625, 8.984375, 9.443359375, 9.90234375, 10.361328125, 10.8203125, 11.279296875, 11.73828125, 12.197265625, 12.65625, 13.115234375, 13.57421875, 14.033203125, 14.4921875, 14.951171875, 15.41015625, 15.869140625, 16.328125, 16.787109375, 17.24609375, 17.705078125, 18.1640625, 18.623046875, 19.08203125, 19.541015625, 20.0]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 23.0, 47.0, 200.0, 411.0, 238.0, 67.0, 17.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-601.9779663085938, -588.9923706054688, -576.0067138671875, -563.0211181640625, -550.0355224609375, -537.0498657226562, -524.0642700195312, -511.0786437988281, -498.093017578125, -485.1073913574219, -472.1217956542969, -459.13616943359375, -446.1505432128906, -433.1649169921875, -420.1793212890625, -407.1936950683594, -394.20806884765625, -381.2224426269531, -368.2368469238281, -355.251220703125, -342.2655944824219, -329.27996826171875, -316.29437255859375, -303.3087463378906, -290.3231506347656, -277.3375244140625, -264.3519287109375, -251.36630249023438, -238.38067626953125, -225.3950653076172, -212.40945434570312, -199.423828125, -186.4381866455078, -173.45257568359375, -160.46694946289062, -147.48133850097656, -134.49571228027344, -121.51010131835938, -108.52448272705078, -95.53886413574219, -82.5532455444336, -69.567626953125, -56.582008361816406, -43.59639358520508, -30.610774993896484, -17.625160217285156, -4.6395416259765625, 8.346076965332031, 21.331695556640625, 34.31731414794922, 47.30293273925781, 60.28854751586914, 73.274169921875, 86.25978088378906, 99.24539947509766, 112.23101806640625, 125.21663665771484, 138.20225524902344, 151.1878662109375, 164.17349243164062, 177.1591033935547, 190.14471435546875, 203.13034057617188, 216.115966796875, 229.10157775878906]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 5.0, 8.0, 7.0, 11.0, 11.0, 21.0, 18.0, 33.0, 28.0, 36.0, 39.0, 50.0, 37.0, 51.0, 49.0, 49.0, 51.0, 66.0, 47.0, 43.0, 37.0, 48.0, 32.0, 43.0, 40.0, 27.0, 20.0, 17.0, 20.0, 18.0, 11.0, 8.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-174.9173126220703, -170.01104736328125, -165.10476684570312, -160.198486328125, -155.29222106933594, -150.38595581054688, -145.47967529296875, -140.57339477539062, -135.66712951660156, -130.7608642578125, -125.85458374023438, -120.94831085205078, -116.04203796386719, -111.1357650756836, -106.2294921875, -101.3232192993164, -96.41694641113281, -91.51067352294922, -86.60440063476562, -81.69812774658203, -76.79185485839844, -71.88558197021484, -66.97930908203125, -62.073036193847656, -57.16676330566406, -52.26049041748047, -47.354217529296875, -42.44794464111328, -37.54167175292969, -32.635398864746094, -27.7291259765625, -22.822853088378906, -17.916595458984375, -13.010322570800781, -8.104049682617188, -3.1977767944335938, 1.70849609375, 6.614768981933594, 11.521041870117188, 16.42731475830078, 21.333587646484375, 26.23986053466797, 31.146133422851562, 36.052406311035156, 40.95867919921875, 45.864952087402344, 50.77122497558594, 55.67749786376953, 60.583770751953125, 65.49004364013672, 70.39631652832031, 75.3025894165039, 80.2088623046875, 85.1151351928711, 90.02140808105469, 94.92768096923828, 99.83395385742188, 104.74022674560547, 109.64649963378906, 114.55277252197266, 119.45904541015625, 124.36531829833984, 129.27159118652344, 134.1778564453125, 139.08413696289062]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 18.0, 16.0, 22.0, 31.0, 44.0, 65.0, 86.0, 159.0, 282.0, 513.0, 1039.0, 2306.0, 6307.0, 20628.0, 96680.0, 3283128.0, 700244.0, 58945.0, 14618.0, 4999.0, 1974.0, 889.0, 448.0, 268.0, 166.0, 107.0, 69.0, 41.0, 45.0, 27.0, 22.0, 16.0, 13.0, 10.0, 7.0, 5.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-33.125, -32.0517578125, -30.978515625, -29.9052734375, -28.83203125, -27.7587890625, -26.685546875, -25.6123046875, -24.5390625, -23.4658203125, -22.392578125, -21.3193359375, -20.24609375, -19.1728515625, -18.099609375, -17.0263671875, -15.953125, -14.8798828125, -13.806640625, -12.7333984375, -11.66015625, -10.5869140625, -9.513671875, -8.4404296875, -7.3671875, -6.2939453125, -5.220703125, -4.1474609375, -3.07421875, -2.0009765625, -0.927734375, 0.1455078125, 1.21875, 2.2919921875, 3.365234375, 4.4384765625, 5.51171875, 6.5849609375, 7.658203125, 8.7314453125, 9.8046875, 10.8779296875, 11.951171875, 13.0244140625, 14.09765625, 15.1708984375, 16.244140625, 17.3173828125, 18.390625, 19.4638671875, 20.537109375, 21.6103515625, 22.68359375, 23.7568359375, 24.830078125, 25.9033203125, 26.9765625, 28.0498046875, 29.123046875, 30.1962890625, 31.26953125, 32.3427734375, 33.416015625, 34.4892578125, 35.5625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 10.0, 11.0, 17.0, 46.0, 39.0, 75.0, 84.0, 100.0, 115.0, 102.0, 88.0, 93.0, 56.0, 47.0, 43.0, 25.0, 20.0, 12.0, 6.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7109375, -11.279052734375, -10.84716796875, -10.415283203125, -9.9833984375, -9.551513671875, -9.11962890625, -8.687744140625, -8.255859375, -7.823974609375, -7.39208984375, -6.960205078125, -6.5283203125, -6.096435546875, -5.66455078125, -5.232666015625, -4.80078125, -4.368896484375, -3.93701171875, -3.505126953125, -3.0732421875, -2.641357421875, -2.20947265625, -1.777587890625, -1.345703125, -0.913818359375, -0.48193359375, -0.050048828125, 0.3818359375, 0.813720703125, 1.24560546875, 1.677490234375, 2.109375, 2.541259765625, 2.97314453125, 3.405029296875, 3.8369140625, 4.268798828125, 4.70068359375, 5.132568359375, 5.564453125, 5.996337890625, 6.42822265625, 6.860107421875, 7.2919921875, 7.723876953125, 8.15576171875, 8.587646484375, 9.01953125, 9.451416015625, 9.88330078125, 10.315185546875, 10.7470703125, 11.178955078125, 11.61083984375, 12.042724609375, 12.474609375, 12.906494140625, 13.33837890625, 13.770263671875, 14.2021484375, 14.634033203125, 15.06591796875, 15.497802734375, 15.9296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 11.0, 8.0, 15.0, 18.0, 25.0, 30.0, 41.0, 47.0, 69.0, 94.0, 109.0, 185.0, 345.0, 619.0, 1258.0, 2795.0, 7422.0, 23142.0, 102035.0, 2566635.0, 1368054.0, 88858.0, 20545.0, 6732.0, 2560.0, 1136.0, 554.0, 327.0, 153.0, 119.0, 85.0, 57.0, 36.0, 34.0, 30.0, 25.0, 24.0, 11.0, 9.0, 11.0, 3.0, 5.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-29.90625, -29.025634765625, -28.14501953125, -27.264404296875, -26.3837890625, -25.503173828125, -24.62255859375, -23.741943359375, -22.861328125, -21.980712890625, -21.10009765625, -20.219482421875, -19.3388671875, -18.458251953125, -17.57763671875, -16.697021484375, -15.81640625, -14.935791015625, -14.05517578125, -13.174560546875, -12.2939453125, -11.413330078125, -10.53271484375, -9.652099609375, -8.771484375, -7.890869140625, -7.01025390625, -6.129638671875, -5.2490234375, -4.368408203125, -3.48779296875, -2.607177734375, -1.7265625, -0.845947265625, 0.03466796875, 0.915283203125, 1.7958984375, 2.676513671875, 3.55712890625, 4.437744140625, 5.318359375, 6.198974609375, 7.07958984375, 7.960205078125, 8.8408203125, 9.721435546875, 10.60205078125, 11.482666015625, 12.36328125, 13.243896484375, 14.12451171875, 15.005126953125, 15.8857421875, 16.766357421875, 17.64697265625, 18.527587890625, 19.408203125, 20.288818359375, 21.16943359375, 22.050048828125, 22.9306640625, 23.811279296875, 24.69189453125, 25.572509765625, 26.453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 9.0, 7.0, 13.0, 22.0, 45.0, 100.0, 237.0, 1181.0, 2043.0, 232.0, 82.0, 43.0, 29.0, 19.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.171875, -23.367919921875, -22.56396484375, -21.760009765625, -20.9560546875, -20.152099609375, -19.34814453125, -18.544189453125, -17.740234375, -16.936279296875, -16.13232421875, -15.328369140625, -14.5244140625, -13.720458984375, -12.91650390625, -12.112548828125, -11.30859375, -10.504638671875, -9.70068359375, -8.896728515625, -8.0927734375, -7.288818359375, -6.48486328125, -5.680908203125, -4.876953125, -4.072998046875, -3.26904296875, -2.465087890625, -1.6611328125, -0.857177734375, -0.05322265625, 0.750732421875, 1.5546875, 2.358642578125, 3.16259765625, 3.966552734375, 4.7705078125, 5.574462890625, 6.37841796875, 7.182373046875, 7.986328125, 8.790283203125, 9.59423828125, 10.398193359375, 11.2021484375, 12.006103515625, 12.81005859375, 13.614013671875, 14.41796875, 15.221923828125, 16.02587890625, 16.829833984375, 17.6337890625, 18.437744140625, 19.24169921875, 20.045654296875, 20.849609375, 21.653564453125, 22.45751953125, 23.261474609375, 24.0654296875, 24.869384765625, 25.67333984375, 26.477294921875, 27.28125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 14.0, 77.0, 375.0, 429.0, 90.0, 15.0, 4.0, 1.0, 2.0], "bins": [-420.2679443359375, -413.0373229980469, -405.8066711425781, -398.5760498046875, -391.34539794921875, -384.1147766113281, -376.8841552734375, -369.65350341796875, -362.4228820800781, -355.1922607421875, -347.96160888671875, -340.7309875488281, -333.5003356933594, -326.26971435546875, -319.0390625, -311.8084411621094, -304.57781982421875, -297.3471984863281, -290.1165466308594, -282.88592529296875, -275.6552734375, -268.4246520996094, -261.19403076171875, -253.96337890625, -246.73272705078125, -239.50209045410156, -232.27145385742188, -225.04083251953125, -217.81019592285156, -210.57955932617188, -203.3489227294922, -196.1182861328125, -188.88766479492188, -181.6570281982422, -174.4263916015625, -167.19577026367188, -159.9651336669922, -152.7344970703125, -145.5038604736328, -138.27322387695312, -131.0426025390625, -123.81196594238281, -116.58133697509766, -109.35070037841797, -102.12007141113281, -94.88943481445312, -87.65879821777344, -80.42816162109375, -73.1975326538086, -65.9668960571289, -58.73626708984375, -51.50563049316406, -44.27499771118164, -37.04436492919922, -29.81372833251953, -22.58309555053711, -15.352462768554688, -8.12182903289795, -0.8911952972412109, 6.339439392089844, 13.570072174072266, 20.800704956054688, 28.031341552734375, 35.2619743347168, 42.49260711669922]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 9.0, 7.0, 14.0, 12.0, 27.0, 21.0, 25.0, 45.0, 41.0, 42.0, 55.0, 53.0, 51.0, 71.0, 61.0, 47.0, 57.0, 49.0, 51.0, 55.0, 47.0, 28.0, 26.0, 22.0, 22.0, 12.0, 14.0, 13.0, 2.0, 3.0, 4.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.321712493896484, -50.57841873168945, -48.83512878417969, -47.091835021972656, -45.348541259765625, -43.60525131225586, -41.86195755004883, -40.11866760253906, -38.37537384033203, -36.632080078125, -34.888790130615234, -33.1454963684082, -31.402204513549805, -29.658912658691406, -27.915618896484375, -26.172327041625977, -24.429035186767578, -22.68574333190918, -20.94245147705078, -19.19915771484375, -17.45586585998535, -15.712574005126953, -13.969281196594238, -12.225988388061523, -10.482696533203125, -8.739404678344727, -6.996111869812012, -5.252819538116455, -3.5095272064208984, -1.7662353515625, -0.022942543029785156, 1.7203502655029297, 3.463642120361328, 5.206934452056885, 6.950226783752441, 8.693519592285156, 10.436811447143555, 12.180103302001953, 13.923396110534668, 15.666688919067383, 17.40998077392578, 19.15327262878418, 20.896564483642578, 22.63985824584961, 24.383150100708008, 26.126441955566406, 27.869735717773438, 29.613027572631836, 31.356319427490234, 33.099613189697266, 34.84290313720703, 36.58619689941406, 38.329490661621094, 40.07278060913086, 41.81607437133789, 43.559364318847656, 45.30265808105469, 47.04595184326172, 48.789241790771484, 50.532535552978516, 52.27582550048828, 54.01911926269531, 55.762413024902344, 57.505706787109375, 59.24899673461914]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 8.0, 18.0, 31.0, 30.0, 53.0, 84.0, 99.0, 151.0, 259.0, 500.0, 959.0, 2170.0, 6315.0, 19926.0, 75414.0, 295536.0, 465702.0, 131576.0, 33905.0, 9669.0, 3296.0, 1353.0, 571.0, 342.0, 208.0, 122.0, 64.0, 63.0, 39.0, 23.0, 15.0, 13.0, 9.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-29.109375, -28.232666015625, -27.35595703125, -26.479248046875, -25.6025390625, -24.725830078125, -23.84912109375, -22.972412109375, -22.095703125, -21.218994140625, -20.34228515625, -19.465576171875, -18.5888671875, -17.712158203125, -16.83544921875, -15.958740234375, -15.08203125, -14.205322265625, -13.32861328125, -12.451904296875, -11.5751953125, -10.698486328125, -9.82177734375, -8.945068359375, -8.068359375, -7.191650390625, -6.31494140625, -5.438232421875, -4.5615234375, -3.684814453125, -2.80810546875, -1.931396484375, -1.0546875, -0.177978515625, 0.69873046875, 1.575439453125, 2.4521484375, 3.328857421875, 4.20556640625, 5.082275390625, 5.958984375, 6.835693359375, 7.71240234375, 8.589111328125, 9.4658203125, 10.342529296875, 11.21923828125, 12.095947265625, 12.97265625, 13.849365234375, 14.72607421875, 15.602783203125, 16.4794921875, 17.356201171875, 18.23291015625, 19.109619140625, 19.986328125, 20.863037109375, 21.73974609375, 22.616455078125, 23.4931640625, 24.369873046875, 25.24658203125, 26.123291015625, 27.0]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 6.0, 15.0, 26.0, 38.0, 51.0, 69.0, 92.0, 91.0, 104.0, 104.0, 101.0, 82.0, 65.0, 49.0, 38.0, 20.0, 22.0, 11.0, 8.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.3677978515625, -10.930908203125, -10.4940185546875, -10.05712890625, -9.6202392578125, -9.183349609375, -8.7464599609375, -8.3095703125, -7.8726806640625, -7.435791015625, -6.9989013671875, -6.56201171875, -6.1251220703125, -5.688232421875, -5.2513427734375, -4.814453125, -4.3775634765625, -3.940673828125, -3.5037841796875, -3.06689453125, -2.6300048828125, -2.193115234375, -1.7562255859375, -1.3193359375, -0.8824462890625, -0.445556640625, -0.0086669921875, 0.42822265625, 0.8651123046875, 1.302001953125, 1.7388916015625, 2.17578125, 2.6126708984375, 3.049560546875, 3.4864501953125, 3.92333984375, 4.3602294921875, 4.797119140625, 5.2340087890625, 5.6708984375, 6.1077880859375, 6.544677734375, 6.9815673828125, 7.41845703125, 7.8553466796875, 8.292236328125, 8.7291259765625, 9.166015625, 9.6029052734375, 10.039794921875, 10.4766845703125, 10.91357421875, 11.3504638671875, 11.787353515625, 12.2242431640625, 12.6611328125, 13.0980224609375, 13.534912109375, 13.9718017578125, 14.40869140625, 14.8455810546875, 15.282470703125, 15.7193603515625, 16.15625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 9.0, 9.0, 23.0, 19.0, 22.0, 31.0, 54.0, 91.0, 119.0, 167.0, 295.0, 436.0, 748.0, 1482.0, 5211.0, 51155.0, 782590.0, 189290.0, 11949.0, 2345.0, 947.0, 514.0, 330.0, 221.0, 154.0, 116.0, 62.0, 46.0, 38.0, 26.0, 16.0, 14.0, 6.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-65.0625, -63.33740234375, -61.6123046875, -59.88720703125, -58.162109375, -56.43701171875, -54.7119140625, -52.98681640625, -51.26171875, -49.53662109375, -47.8115234375, -46.08642578125, -44.361328125, -42.63623046875, -40.9111328125, -39.18603515625, -37.4609375, -35.73583984375, -34.0107421875, -32.28564453125, -30.560546875, -28.83544921875, -27.1103515625, -25.38525390625, -23.66015625, -21.93505859375, -20.2099609375, -18.48486328125, -16.759765625, -15.03466796875, -13.3095703125, -11.58447265625, -9.859375, -8.13427734375, -6.4091796875, -4.68408203125, -2.958984375, -1.23388671875, 0.4912109375, 2.21630859375, 3.94140625, 5.66650390625, 7.3916015625, 9.11669921875, 10.841796875, 12.56689453125, 14.2919921875, 16.01708984375, 17.7421875, 19.46728515625, 21.1923828125, 22.91748046875, 24.642578125, 26.36767578125, 28.0927734375, 29.81787109375, 31.54296875, 33.26806640625, 34.9931640625, 36.71826171875, 38.443359375, 40.16845703125, 41.8935546875, 43.61865234375, 45.34375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 7.0, 3.0, 6.0, 14.0, 16.0, 19.0, 12.0, 23.0, 25.0, 29.0, 42.0, 33.0, 40.0, 43.0, 60.0, 65.0, 72.0, 69.0, 50.0, 44.0, 58.0, 48.0, 42.0, 33.0, 32.0, 20.0, 20.0, 9.0, 15.0, 14.0, 9.0, 6.0, 8.0, 7.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-45.28125, -44.013671875, -42.74609375, -41.478515625, -40.2109375, -38.943359375, -37.67578125, -36.408203125, -35.140625, -33.873046875, -32.60546875, -31.337890625, -30.0703125, -28.802734375, -27.53515625, -26.267578125, -25.0, -23.732421875, -22.46484375, -21.197265625, -19.9296875, -18.662109375, -17.39453125, -16.126953125, -14.859375, -13.591796875, -12.32421875, -11.056640625, -9.7890625, -8.521484375, -7.25390625, -5.986328125, -4.71875, -3.451171875, -2.18359375, -0.916015625, 0.3515625, 1.619140625, 2.88671875, 4.154296875, 5.421875, 6.689453125, 7.95703125, 9.224609375, 10.4921875, 11.759765625, 13.02734375, 14.294921875, 15.5625, 16.830078125, 18.09765625, 19.365234375, 20.6328125, 21.900390625, 23.16796875, 24.435546875, 25.703125, 26.970703125, 28.23828125, 29.505859375, 30.7734375, 32.041015625, 33.30859375, 34.576171875, 35.84375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 1.0, 0.0, 5.0, 8.0, 4.0, 8.0, 14.0, 18.0, 11.0, 33.0, 40.0, 59.0, 101.0, 158.0, 260.0, 481.0, 1001.0, 2284.0, 6416.0, 24962.0, 124529.0, 625029.0, 208753.0, 39373.0, 9376.0, 2957.0, 1303.0, 561.0, 306.0, 190.0, 99.0, 65.0, 41.0, 28.0, 23.0, 14.0, 7.0, 3.0, 5.0, 7.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-11.953125, -11.575439453125, -11.19775390625, -10.820068359375, -10.4423828125, -10.064697265625, -9.68701171875, -9.309326171875, -8.931640625, -8.553955078125, -8.17626953125, -7.798583984375, -7.4208984375, -7.043212890625, -6.66552734375, -6.287841796875, -5.91015625, -5.532470703125, -5.15478515625, -4.777099609375, -4.3994140625, -4.021728515625, -3.64404296875, -3.266357421875, -2.888671875, -2.510986328125, -2.13330078125, -1.755615234375, -1.3779296875, -1.000244140625, -0.62255859375, -0.244873046875, 0.1328125, 0.510498046875, 0.88818359375, 1.265869140625, 1.6435546875, 2.021240234375, 2.39892578125, 2.776611328125, 3.154296875, 3.531982421875, 3.90966796875, 4.287353515625, 4.6650390625, 5.042724609375, 5.42041015625, 5.798095703125, 6.17578125, 6.553466796875, 6.93115234375, 7.308837890625, 7.6865234375, 8.064208984375, 8.44189453125, 8.819580078125, 9.197265625, 9.574951171875, 9.95263671875, 10.330322265625, 10.7080078125, 11.085693359375, 11.46337890625, 11.841064453125, 12.21875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 15.0, 20.0, 30.0, 32.0, 27.0, 62.0, 63.0, 107.0, 196.0, 135.0, 71.0, 60.0, 40.0, 31.0, 19.0, 23.0, 16.0, 13.0, 12.0, 4.0, 3.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010499954223632812, -0.000993475317955017, -0.0009369552135467529, -0.0008804351091384888, -0.0008239150047302246, -0.0007673949003219604, -0.0007108747959136963, -0.0006543546915054321, -0.000597834587097168, -0.0005413144826889038, -0.00048479437828063965, -0.0004282742738723755, -0.00037175416946411133, -0.00031523406505584717, -0.000258713960647583, -0.00020219385623931885, -0.0001456737518310547, -8.915364742279053e-05, -3.263354301452637e-05, 2.3886561393737793e-05, 8.040666580200195e-05, 0.0001369267702102661, 0.00019344687461853027, 0.00024996697902679443, 0.0003064870834350586, 0.00036300718784332275, 0.0004195272922515869, 0.0004760473966598511, 0.0005325675010681152, 0.0005890876054763794, 0.0006456077098846436, 0.0007021278142929077, 0.0007586479187011719, 0.000815168023109436, 0.0008716881275177002, 0.0009282082319259644, 0.0009847283363342285, 0.0010412484407424927, 0.0010977685451507568, 0.001154288649559021, 0.0012108087539672852, 0.0012673288583755493, 0.0013238489627838135, 0.0013803690671920776, 0.0014368891716003418, 0.001493409276008606, 0.0015499293804168701, 0.0016064494848251343, 0.0016629695892333984, 0.0017194896936416626, 0.0017760097980499268, 0.001832529902458191, 0.001889050006866455, 0.0019455701112747192, 0.0020020902156829834, 0.0020586103200912476, 0.0021151304244995117, 0.002171650528907776, 0.00222817063331604, 0.002284690737724304, 0.0023412108421325684, 0.0023977309465408325, 0.0024542510509490967, 0.002510771155357361, 0.002567291259765625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 13.0, 10.0, 18.0, 30.0, 49.0, 65.0, 100.0, 159.0, 252.0, 462.0, 944.0, 2578.0, 14024.0, 329564.0, 668263.0, 26180.0, 3321.0, 1180.0, 562.0, 267.0, 150.0, 100.0, 79.0, 50.0, 37.0, 21.0, 24.0, 11.0, 8.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.96875, -20.294921875, -19.62109375, -18.947265625, -18.2734375, -17.599609375, -16.92578125, -16.251953125, -15.578125, -14.904296875, -14.23046875, -13.556640625, -12.8828125, -12.208984375, -11.53515625, -10.861328125, -10.1875, -9.513671875, -8.83984375, -8.166015625, -7.4921875, -6.818359375, -6.14453125, -5.470703125, -4.796875, -4.123046875, -3.44921875, -2.775390625, -2.1015625, -1.427734375, -0.75390625, -0.080078125, 0.59375, 1.267578125, 1.94140625, 2.615234375, 3.2890625, 3.962890625, 4.63671875, 5.310546875, 5.984375, 6.658203125, 7.33203125, 8.005859375, 8.6796875, 9.353515625, 10.02734375, 10.701171875, 11.375, 12.048828125, 12.72265625, 13.396484375, 14.0703125, 14.744140625, 15.41796875, 16.091796875, 16.765625, 17.439453125, 18.11328125, 18.787109375, 19.4609375, 20.134765625, 20.80859375, 21.482421875, 22.15625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 19.0, 20.0, 30.0, 32.0, 41.0, 45.0, 62.0, 72.0, 86.0, 99.0, 98.0, 91.0, 67.0, 55.0, 48.0, 30.0, 17.0, 19.0, 10.0, 6.0, 7.0, 5.0, 7.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.765625, -9.369873046875, -8.97412109375, -8.578369140625, -8.1826171875, -7.786865234375, -7.39111328125, -6.995361328125, -6.599609375, -6.203857421875, -5.80810546875, -5.412353515625, -5.0166015625, -4.620849609375, -4.22509765625, -3.829345703125, -3.43359375, -3.037841796875, -2.64208984375, -2.246337890625, -1.8505859375, -1.454833984375, -1.05908203125, -0.663330078125, -0.267578125, 0.128173828125, 0.52392578125, 0.919677734375, 1.3154296875, 1.711181640625, 2.10693359375, 2.502685546875, 2.8984375, 3.294189453125, 3.68994140625, 4.085693359375, 4.4814453125, 4.877197265625, 5.27294921875, 5.668701171875, 6.064453125, 6.460205078125, 6.85595703125, 7.251708984375, 7.6474609375, 8.043212890625, 8.43896484375, 8.834716796875, 9.23046875, 9.626220703125, 10.02197265625, 10.417724609375, 10.8134765625, 11.209228515625, 11.60498046875, 12.000732421875, 12.396484375, 12.792236328125, 13.18798828125, 13.583740234375, 13.9794921875, 14.375244140625, 14.77099609375, 15.166748046875, 15.5625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 75.0, 465.0, 372.0, 71.0, 17.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1122.242431640625, -1097.734130859375, -1073.2257080078125, -1048.7174072265625, -1024.2091064453125, -999.7007446289062, -975.1923828125, -950.68408203125, -926.17578125, -901.6674194335938, -877.1591186523438, -852.6507568359375, -828.1424560546875, -803.6340942382812, -779.125732421875, -754.617431640625, -730.1090698242188, -705.6007080078125, -681.0924072265625, -656.5840454101562, -632.0757446289062, -607.5673828125, -583.05908203125, -558.5507202148438, -534.0423583984375, -509.5340270996094, -485.02569580078125, -460.517333984375, -436.009033203125, -411.50067138671875, -386.9923400878906, -362.4840087890625, -337.9757385253906, -313.4674072265625, -288.9590759277344, -264.45074462890625, -239.94239807128906, -215.43406677246094, -190.92572021484375, -166.41738891601562, -141.9090576171875, -117.40072631835938, -92.89238739013672, -68.38404846191406, -43.87571716308594, -19.367385864257812, 5.140960693359375, 29.6492919921875, 54.157623291015625, 78.66595458984375, 103.1742935180664, 127.68263244628906, 152.1909637451172, 176.6992950439453, 201.2076416015625, 225.71597290039062, 250.22430419921875, 274.7326354980469, 299.240966796875, 323.74932861328125, 348.25762939453125, 372.7659912109375, 397.2743225097656, 421.78265380859375, 446.2909851074219]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 4.0, 8.0, 10.0, 7.0, 9.0, 18.0, 13.0, 16.0, 22.0, 23.0, 26.0, 32.0, 28.0, 37.0, 37.0, 32.0, 37.0, 36.0, 43.0, 41.0, 33.0, 42.0, 44.0, 33.0, 32.0, 32.0, 40.0, 39.0, 23.0, 30.0, 22.0, 22.0, 20.0, 17.0, 15.0, 16.0, 13.0, 10.0, 5.0, 6.0, 6.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-148.94924926757812, -144.28082275390625, -139.6123809814453, -134.94395446777344, -130.2755126953125, -125.60708618164062, -120.93865203857422, -116.27021789550781, -111.60179138183594, -106.93335723876953, -102.26492309570312, -97.59649658203125, -92.92806243896484, -88.25962829589844, -83.59119415283203, -78.92276000976562, -74.25432586669922, -69.58589172363281, -64.9174575805664, -60.249027252197266, -55.580596923828125, -50.91216278076172, -46.24372863769531, -41.57529830932617, -36.906864166259766, -32.23843002319336, -27.56999969482422, -22.901565551757812, -18.23313331604004, -13.564701080322266, -8.89626693725586, -4.227836608886719, 0.4405975341796875, 5.109030246734619, 9.77746295928955, 14.44589614868164, 19.114328384399414, 23.782760620117188, 28.451194763183594, 33.119625091552734, 37.78805923461914, 42.45649337768555, 47.12492370605469, 51.793357849121094, 56.4617919921875, 61.13022232055664, 65.79866027832031, 70.46708679199219, 75.1355209350586, 79.803955078125, 84.4723892211914, 89.14082336425781, 93.80924987792969, 98.4776840209961, 103.1461181640625, 107.81454467773438, 112.48298645019531, 117.15142059326172, 121.81985473632812, 126.48828125, 131.15672302246094, 135.8251495361328, 140.49359130859375, 145.16201782226562, 149.8304443359375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 9.0, 6.0, 17.0, 17.0, 19.0, 24.0, 46.0, 57.0, 103.0, 215.0, 410.0, 878.0, 2346.0, 6731.0, 23716.0, 143595.0, 3612607.0, 347987.0, 39576.0, 9897.0, 3330.0, 1308.0, 600.0, 295.0, 164.0, 102.0, 67.0, 33.0, 24.0, 15.0, 12.0, 19.0, 9.0, 5.0, 9.0, 6.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.5625, -32.3916015625, -31.220703125, -30.0498046875, -28.87890625, -27.7080078125, -26.537109375, -25.3662109375, -24.1953125, -23.0244140625, -21.853515625, -20.6826171875, -19.51171875, -18.3408203125, -17.169921875, -15.9990234375, -14.828125, -13.6572265625, -12.486328125, -11.3154296875, -10.14453125, -8.9736328125, -7.802734375, -6.6318359375, -5.4609375, -4.2900390625, -3.119140625, -1.9482421875, -0.77734375, 0.3935546875, 1.564453125, 2.7353515625, 3.90625, 5.0771484375, 6.248046875, 7.4189453125, 8.58984375, 9.7607421875, 10.931640625, 12.1025390625, 13.2734375, 14.4443359375, 15.615234375, 16.7861328125, 17.95703125, 19.1279296875, 20.298828125, 21.4697265625, 22.640625, 23.8115234375, 24.982421875, 26.1533203125, 27.32421875, 28.4951171875, 29.666015625, 30.8369140625, 32.0078125, 33.1787109375, 34.349609375, 35.5205078125, 36.69140625, 37.8623046875, 39.033203125, 40.2041015625, 41.375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 5.0, 16.0, 20.0, 24.0, 41.0, 72.0, 73.0, 75.0, 92.0, 94.0, 91.0, 100.0, 79.0, 68.0, 61.0, 30.0, 16.0, 15.0, 10.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.796875, -13.316650390625, -12.83642578125, -12.356201171875, -11.8759765625, -11.395751953125, -10.91552734375, -10.435302734375, -9.955078125, -9.474853515625, -8.99462890625, -8.514404296875, -8.0341796875, -7.553955078125, -7.07373046875, -6.593505859375, -6.11328125, -5.633056640625, -5.15283203125, -4.672607421875, -4.1923828125, -3.712158203125, -3.23193359375, -2.751708984375, -2.271484375, -1.791259765625, -1.31103515625, -0.830810546875, -0.3505859375, 0.129638671875, 0.60986328125, 1.090087890625, 1.5703125, 2.050537109375, 2.53076171875, 3.010986328125, 3.4912109375, 3.971435546875, 4.45166015625, 4.931884765625, 5.412109375, 5.892333984375, 6.37255859375, 6.852783203125, 7.3330078125, 7.813232421875, 8.29345703125, 8.773681640625, 9.25390625, 9.734130859375, 10.21435546875, 10.694580078125, 11.1748046875, 11.655029296875, 12.13525390625, 12.615478515625, 13.095703125, 13.575927734375, 14.05615234375, 14.536376953125, 15.0166015625, 15.496826171875, 15.97705078125, 16.457275390625, 16.9375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 10.0, 13.0, 6.0, 16.0, 29.0, 42.0, 62.0, 97.0, 135.0, 251.0, 386.0, 668.0, 1195.0, 2390.0, 5300.0, 12421.0, 33450.0, 117578.0, 876068.0, 2851359.0, 211127.0, 50490.0, 17474.0, 6967.0, 3130.0, 1512.0, 816.0, 527.0, 289.0, 173.0, 100.0, 73.0, 43.0, 28.0, 22.0, 14.0, 11.0, 6.0, 6.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.09375, -16.46484375, -15.8359375, -15.20703125, -14.578125, -13.94921875, -13.3203125, -12.69140625, -12.0625, -11.43359375, -10.8046875, -10.17578125, -9.546875, -8.91796875, -8.2890625, -7.66015625, -7.03125, -6.40234375, -5.7734375, -5.14453125, -4.515625, -3.88671875, -3.2578125, -2.62890625, -2.0, -1.37109375, -0.7421875, -0.11328125, 0.515625, 1.14453125, 1.7734375, 2.40234375, 3.03125, 3.66015625, 4.2890625, 4.91796875, 5.546875, 6.17578125, 6.8046875, 7.43359375, 8.0625, 8.69140625, 9.3203125, 9.94921875, 10.578125, 11.20703125, 11.8359375, 12.46484375, 13.09375, 13.72265625, 14.3515625, 14.98046875, 15.609375, 16.23828125, 16.8671875, 17.49609375, 18.125, 18.75390625, 19.3828125, 20.01171875, 20.640625, 21.26953125, 21.8984375, 22.52734375, 23.15625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 14.0, 18.0, 5.0, 21.0, 33.0, 43.0, 43.0, 100.0, 140.0, 266.0, 533.0, 1637.0, 602.0, 225.0, 138.0, 87.0, 47.0, 31.0, 16.0, 19.0, 11.0, 9.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6484375, -14.184326171875, -13.72021484375, -13.256103515625, -12.7919921875, -12.327880859375, -11.86376953125, -11.399658203125, -10.935546875, -10.471435546875, -10.00732421875, -9.543212890625, -9.0791015625, -8.614990234375, -8.15087890625, -7.686767578125, -7.22265625, -6.758544921875, -6.29443359375, -5.830322265625, -5.3662109375, -4.902099609375, -4.43798828125, -3.973876953125, -3.509765625, -3.045654296875, -2.58154296875, -2.117431640625, -1.6533203125, -1.189208984375, -0.72509765625, -0.260986328125, 0.203125, 0.667236328125, 1.13134765625, 1.595458984375, 2.0595703125, 2.523681640625, 2.98779296875, 3.451904296875, 3.916015625, 4.380126953125, 4.84423828125, 5.308349609375, 5.7724609375, 6.236572265625, 6.70068359375, 7.164794921875, 7.62890625, 8.093017578125, 8.55712890625, 9.021240234375, 9.4853515625, 9.949462890625, 10.41357421875, 10.877685546875, 11.341796875, 11.805908203125, 12.27001953125, 12.734130859375, 13.1982421875, 13.662353515625, 14.12646484375, 14.590576171875, 15.0546875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 34.0, 101.0, 391.0, 355.0, 100.0, 16.0, 0.0, 2.0], "bins": [-510.11517333984375, -501.5164794921875, -492.91778564453125, -484.3191223144531, -475.7204284667969, -467.1217346191406, -458.5230407714844, -449.9243469238281, -441.32568359375, -432.72698974609375, -424.1282958984375, -415.5296325683594, -406.9309387207031, -398.3322448730469, -389.7335510253906, -381.1348571777344, -372.5361633300781, -363.9374694824219, -355.3387756347656, -346.7401123046875, -338.14141845703125, -329.542724609375, -320.94403076171875, -312.3453369140625, -303.74664306640625, -295.14794921875, -286.54925537109375, -277.9505920410156, -269.3518981933594, -260.7532043457031, -252.15451049804688, -243.55581665039062, -234.95713806152344, -226.3584442138672, -217.759765625, -209.16107177734375, -200.5623779296875, -191.9636993408203, -183.36500549316406, -174.76632690429688, -166.16763305664062, -157.56893920898438, -148.9702606201172, -140.37156677246094, -131.77288818359375, -123.1741943359375, -114.57550048828125, -105.97681427001953, -97.37812805175781, -88.7794418334961, -80.18075561523438, -71.58206176757812, -62.983375549316406, -54.38468933105469, -45.7859992980957, -37.18730926513672, -28.588623046875, -19.98993492126465, -11.391246795654297, -2.7925586700439453, 5.806129455566406, 14.404815673828125, 23.00350570678711, 31.602195739746094, 40.20088195800781]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 4.0, 6.0, 3.0, 10.0, 7.0, 11.0, 20.0, 13.0, 15.0, 16.0, 24.0, 21.0, 22.0, 26.0, 27.0, 46.0, 33.0, 46.0, 37.0, 58.0, 40.0, 47.0, 46.0, 38.0, 37.0, 43.0, 36.0, 30.0, 38.0, 26.0, 30.0, 26.0, 24.0, 14.0, 14.0, 9.0, 13.0, 8.0, 11.0, 5.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-55.14617919921875, -53.54331588745117, -51.940452575683594, -50.33759307861328, -48.7347297668457, -47.131866455078125, -45.52900314331055, -43.92613983154297, -42.323280334472656, -40.72041702270508, -39.1175537109375, -37.51469421386719, -35.91183090209961, -34.30896759033203, -32.70610427856445, -31.103242874145508, -29.50037956237793, -27.89751625061035, -26.294654846191406, -24.691791534423828, -23.088930130004883, -21.486066818237305, -19.88320541381836, -18.28034210205078, -16.677478790283203, -15.074616432189941, -13.47175407409668, -11.868890762329102, -10.266029357910156, -8.663166046142578, -7.060303688049316, -5.457441329956055, -3.8545799255371094, -2.2517175674438477, -0.6488549709320068, 0.954007625579834, 2.5568699836730957, 4.159732818603516, 5.762595176696777, 7.365457534790039, 8.9683198928833, 10.571182250976562, 12.174044609069824, 13.776906967163086, 15.379770278930664, 16.98263168334961, 18.585494995117188, 20.188358306884766, 21.79121971130371, 23.39408302307129, 24.996944427490234, 26.599807739257812, 28.202669143676758, 29.805532455444336, 31.40839385986328, 33.01125717163086, 34.61412048339844, 36.216983795166016, 37.819847106933594, 39.422706604003906, 41.025569915771484, 42.62843322753906, 44.23129653930664, 45.83415985107422, 47.43701934814453]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 10.0, 10.0, 15.0, 22.0, 38.0, 69.0, 108.0, 183.0, 275.0, 537.0, 1196.0, 3162.0, 11580.0, 58666.0, 341090.0, 500347.0, 104545.0, 18947.0, 4524.0, 1555.0, 768.0, 357.0, 215.0, 127.0, 64.0, 44.0, 31.0, 20.0, 14.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.3125, -34.1015625, -32.890625, -31.6796875, -30.46875, -29.2578125, -28.046875, -26.8359375, -25.625, -24.4140625, -23.203125, -21.9921875, -20.78125, -19.5703125, -18.359375, -17.1484375, -15.9375, -14.7265625, -13.515625, -12.3046875, -11.09375, -9.8828125, -8.671875, -7.4609375, -6.25, -5.0390625, -3.828125, -2.6171875, -1.40625, -0.1953125, 1.015625, 2.2265625, 3.4375, 4.6484375, 5.859375, 7.0703125, 8.28125, 9.4921875, 10.703125, 11.9140625, 13.125, 14.3359375, 15.546875, 16.7578125, 17.96875, 19.1796875, 20.390625, 21.6015625, 22.8125, 24.0234375, 25.234375, 26.4453125, 27.65625, 28.8671875, 30.078125, 31.2890625, 32.5, 33.7109375, 34.921875, 36.1328125, 37.34375, 38.5546875, 39.765625, 40.9765625, 42.1875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 1.0, 8.0, 9.0, 9.0, 27.0, 30.0, 42.0, 53.0, 75.0, 89.0, 90.0, 92.0, 101.0, 82.0, 77.0, 74.0, 56.0, 27.0, 30.0, 13.0, 7.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0546875, -13.5643310546875, -13.073974609375, -12.5836181640625, -12.09326171875, -11.6029052734375, -11.112548828125, -10.6221923828125, -10.1318359375, -9.6414794921875, -9.151123046875, -8.6607666015625, -8.17041015625, -7.6800537109375, -7.189697265625, -6.6993408203125, -6.208984375, -5.7186279296875, -5.228271484375, -4.7379150390625, -4.24755859375, -3.7572021484375, -3.266845703125, -2.7764892578125, -2.2861328125, -1.7957763671875, -1.305419921875, -0.8150634765625, -0.32470703125, 0.1656494140625, 0.656005859375, 1.1463623046875, 1.63671875, 2.1270751953125, 2.617431640625, 3.1077880859375, 3.59814453125, 4.0885009765625, 4.578857421875, 5.0692138671875, 5.5595703125, 6.0499267578125, 6.540283203125, 7.0306396484375, 7.52099609375, 8.0113525390625, 8.501708984375, 8.9920654296875, 9.482421875, 9.9727783203125, 10.463134765625, 10.9534912109375, 11.44384765625, 11.9342041015625, 12.424560546875, 12.9149169921875, 13.4052734375, 13.8956298828125, 14.385986328125, 14.8763427734375, 15.36669921875, 15.8570556640625, 16.347412109375, 16.8377685546875, 17.328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 6.0, 7.0, 9.0, 10.0, 20.0, 29.0, 31.0, 49.0, 84.0, 129.0, 174.0, 378.0, 681.0, 1607.0, 6628.0, 123612.0, 875016.0, 33876.0, 3735.0, 1130.0, 565.0, 315.0, 171.0, 108.0, 57.0, 42.0, 34.0, 18.0, 10.0, 6.0, 4.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-116.875, -114.046875, -111.21875, -108.390625, -105.5625, -102.734375, -99.90625, -97.078125, -94.25, -91.421875, -88.59375, -85.765625, -82.9375, -80.109375, -77.28125, -74.453125, -71.625, -68.796875, -65.96875, -63.140625, -60.3125, -57.484375, -54.65625, -51.828125, -49.0, -46.171875, -43.34375, -40.515625, -37.6875, -34.859375, -32.03125, -29.203125, -26.375, -23.546875, -20.71875, -17.890625, -15.0625, -12.234375, -9.40625, -6.578125, -3.75, -0.921875, 1.90625, 4.734375, 7.5625, 10.390625, 13.21875, 16.046875, 18.875, 21.703125, 24.53125, 27.359375, 30.1875, 33.015625, 35.84375, 38.671875, 41.5, 44.328125, 47.15625, 49.984375, 52.8125, 55.640625, 58.46875, 61.296875, 64.125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 8.0, 8.0, 11.0, 13.0, 15.0, 22.0, 20.0, 24.0, 33.0, 39.0, 56.0, 55.0, 66.0, 70.0, 61.0, 70.0, 63.0, 79.0, 52.0, 47.0, 37.0, 27.0, 14.0, 14.0, 18.0, 17.0, 14.0, 10.0, 7.0, 3.0, 3.0, 5.0, 6.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.28125, -54.24560546875, -52.2099609375, -50.17431640625, -48.138671875, -46.10302734375, -44.0673828125, -42.03173828125, -39.99609375, -37.96044921875, -35.9248046875, -33.88916015625, -31.853515625, -29.81787109375, -27.7822265625, -25.74658203125, -23.7109375, -21.67529296875, -19.6396484375, -17.60400390625, -15.568359375, -13.53271484375, -11.4970703125, -9.46142578125, -7.42578125, -5.39013671875, -3.3544921875, -1.31884765625, 0.716796875, 2.75244140625, 4.7880859375, 6.82373046875, 8.859375, 10.89501953125, 12.9306640625, 14.96630859375, 17.001953125, 19.03759765625, 21.0732421875, 23.10888671875, 25.14453125, 27.18017578125, 29.2158203125, 31.25146484375, 33.287109375, 35.32275390625, 37.3583984375, 39.39404296875, 41.4296875, 43.46533203125, 45.5009765625, 47.53662109375, 49.572265625, 51.60791015625, 53.6435546875, 55.67919921875, 57.71484375, 59.75048828125, 61.7861328125, 63.82177734375, 65.857421875, 67.89306640625, 69.9287109375, 71.96435546875, 74.0]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 14.0, 14.0, 16.0, 20.0, 30.0, 52.0, 90.0, 163.0, 448.0, 1979.0, 41283.0, 940085.0, 60913.0, 2515.0, 477.0, 190.0, 93.0, 51.0, 43.0, 17.0, 16.0, 4.0, 12.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.6875, -38.50439453125, -37.3212890625, -36.13818359375, -34.955078125, -33.77197265625, -32.5888671875, -31.40576171875, -30.22265625, -29.03955078125, -27.8564453125, -26.67333984375, -25.490234375, -24.30712890625, -23.1240234375, -21.94091796875, -20.7578125, -19.57470703125, -18.3916015625, -17.20849609375, -16.025390625, -14.84228515625, -13.6591796875, -12.47607421875, -11.29296875, -10.10986328125, -8.9267578125, -7.74365234375, -6.560546875, -5.37744140625, -4.1943359375, -3.01123046875, -1.828125, -0.64501953125, 0.5380859375, 1.72119140625, 2.904296875, 4.08740234375, 5.2705078125, 6.45361328125, 7.63671875, 8.81982421875, 10.0029296875, 11.18603515625, 12.369140625, 13.55224609375, 14.7353515625, 15.91845703125, 17.1015625, 18.28466796875, 19.4677734375, 20.65087890625, 21.833984375, 23.01708984375, 24.2001953125, 25.38330078125, 26.56640625, 27.74951171875, 28.9326171875, 30.11572265625, 31.298828125, 32.48193359375, 33.6650390625, 34.84814453125, 36.03125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 6.0, 15.0, 23.0, 14.0, 18.0, 27.0, 49.0, 53.0, 37.0, 76.0, 64.0, 83.0, 81.0, 68.0, 81.0, 58.0, 45.0, 42.0, 30.0, 25.0, 19.0, 7.0, 13.0, 12.0, 8.0, 11.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.001323699951171875, -0.0012825578451156616, -0.0012414157390594482, -0.0012002736330032349, -0.0011591315269470215, -0.001117989420890808, -0.0010768473148345947, -0.0010357052087783813, -0.000994563102722168, -0.0009534209966659546, -0.0009122788906097412, -0.0008711367845535278, -0.0008299946784973145, -0.0007888525724411011, -0.0007477104663848877, -0.0007065683603286743, -0.0006654262542724609, -0.0006242841482162476, -0.0005831420421600342, -0.0005419999361038208, -0.0005008578300476074, -0.00045971572399139404, -0.00041857361793518066, -0.0003774315118789673, -0.0003362894058227539, -0.00029514729976654053, -0.00025400519371032715, -0.00021286308765411377, -0.0001717209815979004, -0.000130578875541687, -8.943676948547363e-05, -4.8294663429260254e-05, -7.152557373046875e-06, 3.3989548683166504e-05, 7.513165473937988e-05, 0.00011627376079559326, 0.00015741586685180664, 0.00019855797290802002, 0.0002397000789642334, 0.0002808421850204468, 0.00032198429107666016, 0.00036312639713287354, 0.0004042685031890869, 0.0004454106092453003, 0.00048655271530151367, 0.000527694821357727, 0.0005688369274139404, 0.0006099790334701538, 0.0006511211395263672, 0.0006922632455825806, 0.0007334053516387939, 0.0007745474576950073, 0.0008156895637512207, 0.0008568316698074341, 0.0008979737758636475, 0.0009391158819198608, 0.0009802579879760742, 0.0010214000940322876, 0.001062542200088501, 0.0011036843061447144, 0.0011448264122009277, 0.0011859685182571411, 0.0012271106243133545, 0.0012682527303695679, 0.0013093948364257812]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 8.0, 7.0, 23.0, 16.0, 21.0, 36.0, 47.0, 74.0, 111.0, 191.0, 309.0, 664.0, 1847.0, 10933.0, 340677.0, 672200.0, 17399.0, 2347.0, 743.0, 325.0, 196.0, 144.0, 67.0, 47.0, 34.0, 24.0, 19.0, 9.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.71875, -31.66650390625, -30.6142578125, -29.56201171875, -28.509765625, -27.45751953125, -26.4052734375, -25.35302734375, -24.30078125, -23.24853515625, -22.1962890625, -21.14404296875, -20.091796875, -19.03955078125, -17.9873046875, -16.93505859375, -15.8828125, -14.83056640625, -13.7783203125, -12.72607421875, -11.673828125, -10.62158203125, -9.5693359375, -8.51708984375, -7.46484375, -6.41259765625, -5.3603515625, -4.30810546875, -3.255859375, -2.20361328125, -1.1513671875, -0.09912109375, 0.953125, 2.00537109375, 3.0576171875, 4.10986328125, 5.162109375, 6.21435546875, 7.2666015625, 8.31884765625, 9.37109375, 10.42333984375, 11.4755859375, 12.52783203125, 13.580078125, 14.63232421875, 15.6845703125, 16.73681640625, 17.7890625, 18.84130859375, 19.8935546875, 20.94580078125, 21.998046875, 23.05029296875, 24.1025390625, 25.15478515625, 26.20703125, 27.25927734375, 28.3115234375, 29.36376953125, 30.416015625, 31.46826171875, 32.5205078125, 33.57275390625, 34.625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 13.0, 12.0, 10.0, 23.0, 43.0, 49.0, 79.0, 124.0, 147.0, 137.0, 97.0, 66.0, 52.0, 30.0, 10.0, 13.0, 11.0, 8.0, 10.0, 5.0, 6.0, 4.0, 3.0, 7.0, 2.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.015625, -20.354248046875, -19.69287109375, -19.031494140625, -18.3701171875, -17.708740234375, -17.04736328125, -16.385986328125, -15.724609375, -15.063232421875, -14.40185546875, -13.740478515625, -13.0791015625, -12.417724609375, -11.75634765625, -11.094970703125, -10.43359375, -9.772216796875, -9.11083984375, -8.449462890625, -7.7880859375, -7.126708984375, -6.46533203125, -5.803955078125, -5.142578125, -4.481201171875, -3.81982421875, -3.158447265625, -2.4970703125, -1.835693359375, -1.17431640625, -0.512939453125, 0.1484375, 0.809814453125, 1.47119140625, 2.132568359375, 2.7939453125, 3.455322265625, 4.11669921875, 4.778076171875, 5.439453125, 6.100830078125, 6.76220703125, 7.423583984375, 8.0849609375, 8.746337890625, 9.40771484375, 10.069091796875, 10.73046875, 11.391845703125, 12.05322265625, 12.714599609375, 13.3759765625, 14.037353515625, 14.69873046875, 15.360107421875, 16.021484375, 16.682861328125, 17.34423828125, 18.005615234375, 18.6669921875, 19.328369140625, 19.98974609375, 20.651123046875, 21.3125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 20.0, 101.0, 393.0, 377.0, 90.0, 16.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1009.714599609375, -986.197265625, -962.679931640625, -939.16259765625, -915.645263671875, -892.1278686523438, -868.6105346679688, -845.0932006835938, -821.5758666992188, -798.0585327148438, -774.5411987304688, -751.0238647460938, -727.5064697265625, -703.9891357421875, -680.4718017578125, -656.9544677734375, -633.4371337890625, -609.9197998046875, -586.4024658203125, -562.8851318359375, -539.3677978515625, -515.8504028320312, -492.33306884765625, -468.81573486328125, -445.29840087890625, -421.78106689453125, -398.26373291015625, -374.7463684082031, -351.2290344238281, -327.7117004394531, -304.1943359375, -280.677001953125, -257.15966796875, -233.642333984375, -210.12498474121094, -186.60763549804688, -163.09030151367188, -139.57296752929688, -116.05561828613281, -92.53826904296875, -69.02093505859375, -45.50359344482422, -21.986251831054688, 1.5310897827148438, 25.048431396484375, 48.565773010253906, 72.08311462402344, 95.6004638671875, 119.1177978515625, 142.6351318359375, 166.15248107910156, 189.66983032226562, 213.18716430664062, 236.70449829101562, 260.22186279296875, 283.73919677734375, 307.25653076171875, 330.77386474609375, 354.29119873046875, 377.8085632324219, 401.3258972167969, 424.8432312011719, 448.360595703125, 471.8779296875, 495.395263671875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 10.0, 13.0, 14.0, 27.0, 36.0, 37.0, 39.0, 52.0, 54.0, 56.0, 55.0, 59.0, 72.0, 64.0, 78.0, 65.0, 46.0, 48.0, 42.0, 28.0, 24.0, 22.0, 19.0, 7.0, 8.0, 5.0, 5.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-251.25509643554688, -241.0137481689453, -230.7724151611328, -220.53106689453125, -210.28973388671875, -200.0483856201172, -189.80703735351562, -179.56570434570312, -169.32437133789062, -159.08302307128906, -148.84169006347656, -138.600341796875, -128.3590087890625, -118.11766052246094, -107.8763198852539, -97.63497924804688, -87.39363098144531, -77.15229034423828, -66.91094970703125, -56.66960525512695, -46.42826461791992, -36.18692398071289, -25.945579528808594, -15.704238891601562, -5.462898254394531, 4.778443336486816, 15.019784927368164, 25.261127471923828, 35.50246810913086, 45.74380874633789, 55.98515319824219, 66.22649383544922, 76.46783447265625, 86.70917510986328, 96.95051574707031, 107.19186401367188, 117.43319702148438, 127.67454528808594, 137.9158935546875, 148.1572265625, 158.3985595703125, 168.63990783691406, 178.88124084472656, 189.12258911132812, 199.36392211914062, 209.6052703857422, 219.84661865234375, 230.08795166015625, 240.3292999267578, 250.57064819335938, 260.8119812011719, 271.0533142089844, 281.294677734375, 291.5360107421875, 301.77734375, 312.0186767578125, 322.2600402832031, 332.5013732910156, 342.74273681640625, 352.98406982421875, 363.22540283203125, 373.46673583984375, 383.7080993652344, 393.9494323730469, 404.1907653808594]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 14.0, 40.0, 60.0, 108.0, 254.0, 476.0, 1121.0, 3450.0, 17744.0, 3951801.0, 204647.0, 10220.0, 2542.0, 936.0, 433.0, 187.0, 117.0, 59.0, 36.0, 22.0, 8.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.5, -49.4287109375, -47.357421875, -45.2861328125, -43.21484375, -41.1435546875, -39.072265625, -37.0009765625, -34.9296875, -32.8583984375, -30.787109375, -28.7158203125, -26.64453125, -24.5732421875, -22.501953125, -20.4306640625, -18.359375, -16.2880859375, -14.216796875, -12.1455078125, -10.07421875, -8.0029296875, -5.931640625, -3.8603515625, -1.7890625, 0.2822265625, 2.353515625, 4.4248046875, 6.49609375, 8.5673828125, 10.638671875, 12.7099609375, 14.78125, 16.8525390625, 18.923828125, 20.9951171875, 23.06640625, 25.1376953125, 27.208984375, 29.2802734375, 31.3515625, 33.4228515625, 35.494140625, 37.5654296875, 39.63671875, 41.7080078125, 43.779296875, 45.8505859375, 47.921875, 49.9931640625, 52.064453125, 54.1357421875, 56.20703125, 58.2783203125, 60.349609375, 62.4208984375, 64.4921875, 66.5634765625, 68.634765625, 70.7060546875, 72.77734375, 74.8486328125, 76.919921875, 78.9912109375, 81.0625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 7.0, 13.0, 17.0, 33.0, 61.0, 72.0, 75.0, 107.0, 115.0, 106.0, 107.0, 71.0, 65.0, 63.0, 35.0, 22.0, 17.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.875, -19.139892578125, -18.40478515625, -17.669677734375, -16.9345703125, -16.199462890625, -15.46435546875, -14.729248046875, -13.994140625, -13.259033203125, -12.52392578125, -11.788818359375, -11.0537109375, -10.318603515625, -9.58349609375, -8.848388671875, -8.11328125, -7.378173828125, -6.64306640625, -5.907958984375, -5.1728515625, -4.437744140625, -3.70263671875, -2.967529296875, -2.232421875, -1.497314453125, -0.76220703125, -0.027099609375, 0.7080078125, 1.443115234375, 2.17822265625, 2.913330078125, 3.6484375, 4.383544921875, 5.11865234375, 5.853759765625, 6.5888671875, 7.323974609375, 8.05908203125, 8.794189453125, 9.529296875, 10.264404296875, 10.99951171875, 11.734619140625, 12.4697265625, 13.204833984375, 13.93994140625, 14.675048828125, 15.41015625, 16.145263671875, 16.88037109375, 17.615478515625, 18.3505859375, 19.085693359375, 19.82080078125, 20.555908203125, 21.291015625, 22.026123046875, 22.76123046875, 23.496337890625, 24.2314453125, 24.966552734375, 25.70166015625, 26.436767578125, 27.171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 7.0, 4.0, 13.0, 17.0, 29.0, 37.0, 58.0, 85.0, 141.0, 197.0, 289.0, 491.0, 794.0, 1266.0, 2683.0, 6503.0, 21998.0, 195297.0, 3883290.0, 59791.0, 12149.0, 4437.0, 1917.0, 987.0, 585.0, 386.0, 274.0, 182.0, 116.0, 69.0, 56.0, 42.0, 25.0, 23.0, 7.0, 13.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.984375, -25.126220703125, -24.26806640625, -23.409912109375, -22.5517578125, -21.693603515625, -20.83544921875, -19.977294921875, -19.119140625, -18.260986328125, -17.40283203125, -16.544677734375, -15.6865234375, -14.828369140625, -13.97021484375, -13.112060546875, -12.25390625, -11.395751953125, -10.53759765625, -9.679443359375, -8.8212890625, -7.963134765625, -7.10498046875, -6.246826171875, -5.388671875, -4.530517578125, -3.67236328125, -2.814208984375, -1.9560546875, -1.097900390625, -0.23974609375, 0.618408203125, 1.4765625, 2.334716796875, 3.19287109375, 4.051025390625, 4.9091796875, 5.767333984375, 6.62548828125, 7.483642578125, 8.341796875, 9.199951171875, 10.05810546875, 10.916259765625, 11.7744140625, 12.632568359375, 13.49072265625, 14.348876953125, 15.20703125, 16.065185546875, 16.92333984375, 17.781494140625, 18.6396484375, 19.497802734375, 20.35595703125, 21.214111328125, 22.072265625, 22.930419921875, 23.78857421875, 24.646728515625, 25.5048828125, 26.363037109375, 27.22119140625, 28.079345703125, 28.9375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 13.0, 12.0, 39.0, 74.0, 169.0, 3178.0, 368.0, 101.0, 48.0, 18.0, 13.0, 8.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.8359375, -7.59661865234375, -7.3572998046875, -7.11798095703125, -6.878662109375, -6.63934326171875, -6.4000244140625, -6.16070556640625, -5.92138671875, -5.68206787109375, -5.4427490234375, -5.20343017578125, -4.964111328125, -4.72479248046875, -4.4854736328125, -4.24615478515625, -4.0068359375, -3.76751708984375, -3.5281982421875, -3.28887939453125, -3.049560546875, -2.81024169921875, -2.5709228515625, -2.33160400390625, -2.09228515625, -1.85296630859375, -1.6136474609375, -1.37432861328125, -1.135009765625, -0.89569091796875, -0.6563720703125, -0.41705322265625, -0.177734375, 0.06158447265625, 0.3009033203125, 0.54022216796875, 0.779541015625, 1.01885986328125, 1.2581787109375, 1.49749755859375, 1.73681640625, 1.97613525390625, 2.2154541015625, 2.45477294921875, 2.694091796875, 2.93341064453125, 3.1727294921875, 3.41204833984375, 3.6513671875, 3.89068603515625, 4.1300048828125, 4.36932373046875, 4.608642578125, 4.84796142578125, 5.0872802734375, 5.32659912109375, 5.56591796875, 5.80523681640625, 6.0445556640625, 6.28387451171875, 6.523193359375, 6.76251220703125, 7.0018310546875, 7.24114990234375, 7.48046875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 22.0, 48.0, 99.0, 176.0, 222.0, 205.0, 103.0, 74.0, 18.0, 9.0, 10.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.972572326660156, -42.65672302246094, -41.34087371826172, -40.0250244140625, -38.70917510986328, -37.39332580566406, -36.077476501464844, -34.76162338256836, -33.44577407836914, -32.12992477416992, -30.814075469970703, -29.498226165771484, -28.182374954223633, -26.866525650024414, -25.550676345825195, -24.234825134277344, -22.918977737426758, -21.60312843322754, -20.28727912902832, -18.97142791748047, -17.65557861328125, -16.33972930908203, -15.023880004882812, -13.708029747009277, -12.392180442810059, -11.07633113861084, -9.760480880737305, -8.444631576538086, -7.128781795501709, -5.812932014465332, -4.497082710266113, -3.181232452392578, -1.8653831481933594, -0.549533486366272, 0.7663161754608154, 2.0821657180786133, 3.3980154991149902, 4.713865280151367, 6.029714584350586, 7.345564842224121, 8.66141414642334, 9.977263450622559, 11.293113708496094, 12.608963012695312, 13.924812316894531, 15.240662574768066, 16.55651092529297, 17.87236213684082, 19.18821144104004, 20.504060745239258, 21.819910049438477, 23.135761260986328, 24.451610565185547, 25.767459869384766, 27.083309173583984, 28.399158477783203, 29.715007781982422, 31.03085708618164, 32.34670639038086, 33.66255569458008, 34.9784049987793, 36.29425811767578, 37.610107421875, 38.92595672607422, 40.24180603027344]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 12.0, 12.0, 12.0, 9.0, 10.0, 8.0, 16.0, 17.0, 21.0, 24.0, 33.0, 36.0, 34.0, 39.0, 38.0, 54.0, 48.0, 49.0, 57.0, 56.0, 39.0, 37.0, 33.0, 47.0, 34.0, 21.0, 32.0, 23.0, 28.0, 17.0, 13.0, 15.0, 13.0, 15.0, 6.0, 6.0, 7.0, 6.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.272005081176758, -13.820244789123535, -13.368485450744629, -12.916725158691406, -12.4649658203125, -12.013205528259277, -11.561445236206055, -11.109685897827148, -10.657925605773926, -10.206165313720703, -9.754405975341797, -9.302645683288574, -8.850885391235352, -8.399126052856445, -7.947365760803223, -7.495605945587158, -7.043846130371094, -6.592086315155029, -6.140326499938965, -5.688566207885742, -5.236806392669678, -4.785046577453613, -4.333286285400391, -3.881526470184326, -3.4297666549682617, -2.9780068397521973, -2.5262467861175537, -2.07448673248291, -1.6227269172668457, -1.1709671020507812, -0.7192070484161377, -0.26744699478149414, 0.1843128204345703, 0.6360727548599243, 1.0878326892852783, 1.5395926237106323, 1.9913525581359863, 2.443112373352051, 2.8948724269866943, 3.346632480621338, 3.7983922958374023, 4.250152111053467, 4.701911926269531, 5.153672218322754, 5.605432033538818, 6.057191848754883, 6.5089521408081055, 6.96071195602417, 7.412471771240234, 7.864231586456299, 8.315991401672363, 8.767751693725586, 9.219511032104492, 9.671271324157715, 10.123031616210938, 10.574790954589844, 11.026551246643066, 11.478311538696289, 11.930070877075195, 12.381831169128418, 12.83359146118164, 13.285350799560547, 13.73711109161377, 14.188871383666992, 14.640630722045898]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 6.0, 17.0, 26.0, 51.0, 79.0, 140.0, 323.0, 569.0, 1442.0, 4525.0, 22490.0, 196716.0, 653133.0, 145401.0, 17499.0, 3791.0, 1216.0, 537.0, 259.0, 129.0, 96.0, 40.0, 24.0, 15.0, 11.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5, -37.04345703125, -35.5869140625, -34.13037109375, -32.673828125, -31.21728515625, -29.7607421875, -28.30419921875, -26.84765625, -25.39111328125, -23.9345703125, -22.47802734375, -21.021484375, -19.56494140625, -18.1083984375, -16.65185546875, -15.1953125, -13.73876953125, -12.2822265625, -10.82568359375, -9.369140625, -7.91259765625, -6.4560546875, -4.99951171875, -3.54296875, -2.08642578125, -0.6298828125, 0.82666015625, 2.283203125, 3.73974609375, 5.1962890625, 6.65283203125, 8.109375, 9.56591796875, 11.0224609375, 12.47900390625, 13.935546875, 15.39208984375, 16.8486328125, 18.30517578125, 19.76171875, 21.21826171875, 22.6748046875, 24.13134765625, 25.587890625, 27.04443359375, 28.5009765625, 29.95751953125, 31.4140625, 32.87060546875, 34.3271484375, 35.78369140625, 37.240234375, 38.69677734375, 40.1533203125, 41.60986328125, 43.06640625, 44.52294921875, 45.9794921875, 47.43603515625, 48.892578125, 50.34912109375, 51.8056640625, 53.26220703125, 54.71875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 7.0, 18.0, 20.0, 41.0, 66.0, 71.0, 84.0, 93.0, 116.0, 112.0, 93.0, 66.0, 80.0, 45.0, 37.0, 23.0, 6.0, 12.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.46875, -18.7431640625, -18.017578125, -17.2919921875, -16.56640625, -15.8408203125, -15.115234375, -14.3896484375, -13.6640625, -12.9384765625, -12.212890625, -11.4873046875, -10.76171875, -10.0361328125, -9.310546875, -8.5849609375, -7.859375, -7.1337890625, -6.408203125, -5.6826171875, -4.95703125, -4.2314453125, -3.505859375, -2.7802734375, -2.0546875, -1.3291015625, -0.603515625, 0.1220703125, 0.84765625, 1.5732421875, 2.298828125, 3.0244140625, 3.75, 4.4755859375, 5.201171875, 5.9267578125, 6.65234375, 7.3779296875, 8.103515625, 8.8291015625, 9.5546875, 10.2802734375, 11.005859375, 11.7314453125, 12.45703125, 13.1826171875, 13.908203125, 14.6337890625, 15.359375, 16.0849609375, 16.810546875, 17.5361328125, 18.26171875, 18.9873046875, 19.712890625, 20.4384765625, 21.1640625, 21.8896484375, 22.615234375, 23.3408203125, 24.06640625, 24.7919921875, 25.517578125, 26.2431640625, 26.96875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 1.0, 11.0, 4.0, 5.0, 12.0, 7.0, 13.0, 18.0, 21.0, 40.0, 49.0, 61.0, 111.0, 174.0, 274.0, 484.0, 894.0, 2208.0, 9952.0, 340629.0, 673868.0, 14638.0, 2653.0, 985.0, 573.0, 295.0, 170.0, 105.0, 101.0, 50.0, 37.0, 29.0, 19.0, 20.0, 10.0, 7.0, 4.0, 5.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-95.3125, -92.431640625, -89.55078125, -86.669921875, -83.7890625, -80.908203125, -78.02734375, -75.146484375, -72.265625, -69.384765625, -66.50390625, -63.623046875, -60.7421875, -57.861328125, -54.98046875, -52.099609375, -49.21875, -46.337890625, -43.45703125, -40.576171875, -37.6953125, -34.814453125, -31.93359375, -29.052734375, -26.171875, -23.291015625, -20.41015625, -17.529296875, -14.6484375, -11.767578125, -8.88671875, -6.005859375, -3.125, -0.244140625, 2.63671875, 5.517578125, 8.3984375, 11.279296875, 14.16015625, 17.041015625, 19.921875, 22.802734375, 25.68359375, 28.564453125, 31.4453125, 34.326171875, 37.20703125, 40.087890625, 42.96875, 45.849609375, 48.73046875, 51.611328125, 54.4921875, 57.373046875, 60.25390625, 63.134765625, 66.015625, 68.896484375, 71.77734375, 74.658203125, 77.5390625, 80.419921875, 83.30078125, 86.181640625, 89.0625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 11.0, 1.0, 4.0, 4.0, 6.0, 9.0, 19.0, 24.0, 29.0, 39.0, 39.0, 53.0, 62.0, 75.0, 81.0, 91.0, 95.0, 67.0, 56.0, 56.0, 41.0, 30.0, 18.0, 19.0, 9.0, 10.0, 10.0, 7.0, 2.0, 11.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.6875, -90.7900390625, -87.892578125, -84.9951171875, -82.09765625, -79.2001953125, -76.302734375, -73.4052734375, -70.5078125, -67.6103515625, -64.712890625, -61.8154296875, -58.91796875, -56.0205078125, -53.123046875, -50.2255859375, -47.328125, -44.4306640625, -41.533203125, -38.6357421875, -35.73828125, -32.8408203125, -29.943359375, -27.0458984375, -24.1484375, -21.2509765625, -18.353515625, -15.4560546875, -12.55859375, -9.6611328125, -6.763671875, -3.8662109375, -0.96875, 1.9287109375, 4.826171875, 7.7236328125, 10.62109375, 13.5185546875, 16.416015625, 19.3134765625, 22.2109375, 25.1083984375, 28.005859375, 30.9033203125, 33.80078125, 36.6982421875, 39.595703125, 42.4931640625, 45.390625, 48.2880859375, 51.185546875, 54.0830078125, 56.98046875, 59.8779296875, 62.775390625, 65.6728515625, 68.5703125, 71.4677734375, 74.365234375, 77.2626953125, 80.16015625, 83.0576171875, 85.955078125, 88.8525390625, 91.75]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 5.0, 6.0, 8.0, 4.0, 7.0, 11.0, 11.0, 14.0, 22.0, 27.0, 27.0, 38.0, 59.0, 73.0, 115.0, 244.0, 804.0, 9096.0, 923213.0, 111093.0, 2673.0, 460.0, 153.0, 89.0, 60.0, 53.0, 42.0, 20.0, 16.0, 17.0, 17.0, 16.0, 20.0, 15.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-56.34375, -54.45166015625, -52.5595703125, -50.66748046875, -48.775390625, -46.88330078125, -44.9912109375, -43.09912109375, -41.20703125, -39.31494140625, -37.4228515625, -35.53076171875, -33.638671875, -31.74658203125, -29.8544921875, -27.96240234375, -26.0703125, -24.17822265625, -22.2861328125, -20.39404296875, -18.501953125, -16.60986328125, -14.7177734375, -12.82568359375, -10.93359375, -9.04150390625, -7.1494140625, -5.25732421875, -3.365234375, -1.47314453125, 0.4189453125, 2.31103515625, 4.203125, 6.09521484375, 7.9873046875, 9.87939453125, 11.771484375, 13.66357421875, 15.5556640625, 17.44775390625, 19.33984375, 21.23193359375, 23.1240234375, 25.01611328125, 26.908203125, 28.80029296875, 30.6923828125, 32.58447265625, 34.4765625, 36.36865234375, 38.2607421875, 40.15283203125, 42.044921875, 43.93701171875, 45.8291015625, 47.72119140625, 49.61328125, 51.50537109375, 53.3974609375, 55.28955078125, 57.181640625, 59.07373046875, 60.9658203125, 62.85791015625, 64.75]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 9.0, 12.0, 26.0, 37.0, 58.0, 91.0, 148.0, 161.0, 137.0, 97.0, 87.0, 41.0, 31.0, 18.0, 17.0, 8.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002292633056640625, -0.002206563949584961, -0.002120494842529297, -0.002034425735473633, -0.0019483566284179688, -0.0018622875213623047, -0.0017762184143066406, -0.0016901493072509766, -0.0016040802001953125, -0.0015180110931396484, -0.0014319419860839844, -0.0013458728790283203, -0.0012598037719726562, -0.0011737346649169922, -0.0010876655578613281, -0.001001596450805664, -0.00091552734375, -0.0008294582366943359, -0.0007433891296386719, -0.0006573200225830078, -0.0005712509155273438, -0.0004851818084716797, -0.0003991127014160156, -0.00031304359436035156, -0.0002269744873046875, -0.00014090538024902344, -5.4836273193359375e-05, 3.123283386230469e-05, 0.00011730194091796875, 0.0002033710479736328, 0.0002894401550292969, 0.00037550926208496094, 0.000461578369140625, 0.0005476474761962891, 0.0006337165832519531, 0.0007197856903076172, 0.0008058547973632812, 0.0008919239044189453, 0.0009779930114746094, 0.0010640621185302734, 0.0011501312255859375, 0.0012362003326416016, 0.0013222694396972656, 0.0014083385467529297, 0.0014944076538085938, 0.0015804767608642578, 0.0016665458679199219, 0.001752614974975586, 0.00183868408203125, 0.001924753189086914, 0.002010822296142578, 0.002096891403198242, 0.0021829605102539062, 0.0022690296173095703, 0.0023550987243652344, 0.0024411678314208984, 0.0025272369384765625, 0.0026133060455322266, 0.0026993751525878906, 0.0027854442596435547, 0.0028715133666992188, 0.002957582473754883, 0.003043651580810547, 0.003129720687866211, 0.003215789794921875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 13.0, 15.0, 36.0, 66.0, 167.0, 933.0, 67933.0, 977591.0, 1413.0, 218.0, 76.0, 31.0, 16.0, 13.0, 7.0, 5.0, 6.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.0, -176.662109375, -171.32421875, -165.986328125, -160.6484375, -155.310546875, -149.97265625, -144.634765625, -139.296875, -133.958984375, -128.62109375, -123.283203125, -117.9453125, -112.607421875, -107.26953125, -101.931640625, -96.59375, -91.255859375, -85.91796875, -80.580078125, -75.2421875, -69.904296875, -64.56640625, -59.228515625, -53.890625, -48.552734375, -43.21484375, -37.876953125, -32.5390625, -27.201171875, -21.86328125, -16.525390625, -11.1875, -5.849609375, -0.51171875, 4.826171875, 10.1640625, 15.501953125, 20.83984375, 26.177734375, 31.515625, 36.853515625, 42.19140625, 47.529296875, 52.8671875, 58.205078125, 63.54296875, 68.880859375, 74.21875, 79.556640625, 84.89453125, 90.232421875, 95.5703125, 100.908203125, 106.24609375, 111.583984375, 116.921875, 122.259765625, 127.59765625, 132.935546875, 138.2734375, 143.611328125, 148.94921875, 154.287109375, 159.625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 13.0, 19.0, 48.0, 267.0, 471.0, 119.0, 29.0, 12.0, 4.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.6875, -103.15625, -99.625, -96.09375, -92.5625, -89.03125, -85.5, -81.96875, -78.4375, -74.90625, -71.375, -67.84375, -64.3125, -60.78125, -57.25, -53.71875, -50.1875, -46.65625, -43.125, -39.59375, -36.0625, -32.53125, -29.0, -25.46875, -21.9375, -18.40625, -14.875, -11.34375, -7.8125, -4.28125, -0.75, 2.78125, 6.3125, 9.84375, 13.375, 16.90625, 20.4375, 23.96875, 27.5, 31.03125, 34.5625, 38.09375, 41.625, 45.15625, 48.6875, 52.21875, 55.75, 59.28125, 62.8125, 66.34375, 69.875, 73.40625, 76.9375, 80.46875, 84.0, 87.53125, 91.0625, 94.59375, 98.125, 101.65625, 105.1875, 108.71875, 112.25, 115.78125, 119.3125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 13.0, 73.0, 488.0, 375.0, 45.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1467.86962890625, -1433.62548828125, -1399.3812255859375, -1365.1370849609375, -1330.8929443359375, -1296.648681640625, -1262.404541015625, -1228.160400390625, -1193.916259765625, -1159.672119140625, -1125.4278564453125, -1091.1837158203125, -1056.9395751953125, -1022.6953735351562, -988.451171875, -954.20703125, -919.9627685546875, -885.7185668945312, -851.4744262695312, -817.230224609375, -782.986083984375, -748.7418823242188, -714.4976806640625, -680.2535400390625, -646.0093383789062, -611.76513671875, -577.52099609375, -543.2767944335938, -509.0326232910156, -474.7884521484375, -440.54425048828125, -406.3000793457031, -372.055908203125, -337.8117370605469, -303.56756591796875, -269.3233642578125, -235.07919311523438, -200.83502197265625, -166.59083557128906, -132.34664916992188, -98.10247802734375, -63.858299255371094, -29.614120483398438, 4.630058288574219, 38.874237060546875, 73.118408203125, 107.36259460449219, 141.60678100585938, 175.8509521484375, 210.09512329101562, 244.3393096923828, 278.58349609375, 312.8276672363281, 347.07183837890625, 381.3160400390625, 415.5602111816406, 449.80438232421875, 484.0485534667969, 518.292724609375, 552.5369262695312, 586.7811279296875, 621.0252685546875, 655.2694702148438, 689.513671875, 723.7578125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 15.0, 8.0, 11.0, 13.0, 21.0, 18.0, 18.0, 16.0, 21.0, 33.0, 47.0, 48.0, 57.0, 50.0, 48.0, 51.0, 44.0, 47.0, 38.0, 56.0, 41.0, 48.0, 33.0, 32.0, 29.0, 24.0, 24.0, 19.0, 13.0, 13.0, 13.0, 11.0, 12.0, 2.0, 8.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-232.92453002929688, -223.71653747558594, -214.50856018066406, -205.30056762695312, -196.09259033203125, -186.8845977783203, -177.67660522460938, -168.4686279296875, -159.26063537597656, -150.05264282226562, -140.84466552734375, -131.6366729736328, -122.4286880493164, -113.220703125, -104.01271057128906, -94.80472564697266, -85.59674072265625, -76.38875579833984, -67.18077087402344, -57.9727783203125, -48.764793395996094, -39.55680847167969, -30.348819732666016, -21.140830993652344, -11.932846069335938, -2.7248592376708984, 6.483127593994141, 15.69111442565918, 24.89910125732422, 34.107086181640625, 43.3150749206543, 52.52306365966797, 61.7310791015625, 70.9390640258789, 80.14704895019531, 89.35504150390625, 98.56302642822266, 107.77101135253906, 116.97900390625, 126.1869888305664, 135.3949737548828, 144.60296630859375, 153.81094360351562, 163.01893615722656, 172.2269287109375, 181.43490600585938, 190.6428985595703, 199.85089111328125, 209.05886840820312, 218.26686096191406, 227.47483825683594, 236.68283081054688, 245.89080810546875, 255.0988006591797, 264.3067932128906, 273.5147705078125, 282.7227783203125, 291.9307556152344, 301.1387634277344, 310.34674072265625, 319.5547180175781, 328.7626953125, 337.970703125, 347.1786804199219, 356.38665771484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 0.0, 10.0, 20.0, 20.0, 38.0, 38.0, 75.0, 105.0, 165.0, 278.0, 436.0, 776.0, 1504.0, 3345.0, 9318.0, 40418.0, 3835853.0, 266060.0, 23578.0, 6729.0, 2558.0, 1228.0, 668.0, 406.0, 220.0, 128.0, 95.0, 73.0, 56.0, 31.0, 21.0, 9.0, 9.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.046875, -30.006591796875, -28.96630859375, -27.926025390625, -26.8857421875, -25.845458984375, -24.80517578125, -23.764892578125, -22.724609375, -21.684326171875, -20.64404296875, -19.603759765625, -18.5634765625, -17.523193359375, -16.48291015625, -15.442626953125, -14.40234375, -13.362060546875, -12.32177734375, -11.281494140625, -10.2412109375, -9.200927734375, -8.16064453125, -7.120361328125, -6.080078125, -5.039794921875, -3.99951171875, -2.959228515625, -1.9189453125, -0.878662109375, 0.16162109375, 1.201904296875, 2.2421875, 3.282470703125, 4.32275390625, 5.363037109375, 6.4033203125, 7.443603515625, 8.48388671875, 9.524169921875, 10.564453125, 11.604736328125, 12.64501953125, 13.685302734375, 14.7255859375, 15.765869140625, 16.80615234375, 17.846435546875, 18.88671875, 19.927001953125, 20.96728515625, 22.007568359375, 23.0478515625, 24.088134765625, 25.12841796875, 26.168701171875, 27.208984375, 28.249267578125, 29.28955078125, 30.329833984375, 31.3701171875, 32.410400390625, 33.45068359375, 34.490966796875, 35.53125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 6.0, 17.0, 17.0, 29.0, 59.0, 72.0, 94.0, 99.0, 125.0, 124.0, 106.0, 94.0, 53.0, 48.0, 27.0, 15.0, 6.0, 9.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.5380859375, -20.669921875, -19.8017578125, -18.93359375, -18.0654296875, -17.197265625, -16.3291015625, -15.4609375, -14.5927734375, -13.724609375, -12.8564453125, -11.98828125, -11.1201171875, -10.251953125, -9.3837890625, -8.515625, -7.6474609375, -6.779296875, -5.9111328125, -5.04296875, -4.1748046875, -3.306640625, -2.4384765625, -1.5703125, -0.7021484375, 0.166015625, 1.0341796875, 1.90234375, 2.7705078125, 3.638671875, 4.5068359375, 5.375, 6.2431640625, 7.111328125, 7.9794921875, 8.84765625, 9.7158203125, 10.583984375, 11.4521484375, 12.3203125, 13.1884765625, 14.056640625, 14.9248046875, 15.79296875, 16.6611328125, 17.529296875, 18.3974609375, 19.265625, 20.1337890625, 21.001953125, 21.8701171875, 22.73828125, 23.6064453125, 24.474609375, 25.3427734375, 26.2109375, 27.0791015625, 27.947265625, 28.8154296875, 29.68359375, 30.5517578125, 31.419921875, 32.2880859375, 33.15625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 12.0, 14.0, 16.0, 21.0, 42.0, 39.0, 64.0, 86.0, 116.0, 153.0, 207.0, 312.0, 483.0, 784.0, 1276.0, 2242.0, 4297.0, 9442.0, 23857.0, 96382.0, 3735816.0, 252039.0, 39800.0, 13611.0, 5820.0, 2996.0, 1563.0, 931.0, 572.0, 339.0, 274.0, 183.0, 135.0, 90.0, 60.0, 44.0, 45.0, 33.0, 26.0, 22.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.265625, -17.707275390625, -17.14892578125, -16.590576171875, -16.0322265625, -15.473876953125, -14.91552734375, -14.357177734375, -13.798828125, -13.240478515625, -12.68212890625, -12.123779296875, -11.5654296875, -11.007080078125, -10.44873046875, -9.890380859375, -9.33203125, -8.773681640625, -8.21533203125, -7.656982421875, -7.0986328125, -6.540283203125, -5.98193359375, -5.423583984375, -4.865234375, -4.306884765625, -3.74853515625, -3.190185546875, -2.6318359375, -2.073486328125, -1.51513671875, -0.956787109375, -0.3984375, 0.159912109375, 0.71826171875, 1.276611328125, 1.8349609375, 2.393310546875, 2.95166015625, 3.510009765625, 4.068359375, 4.626708984375, 5.18505859375, 5.743408203125, 6.3017578125, 6.860107421875, 7.41845703125, 7.976806640625, 8.53515625, 9.093505859375, 9.65185546875, 10.210205078125, 10.7685546875, 11.326904296875, 11.88525390625, 12.443603515625, 13.001953125, 13.560302734375, 14.11865234375, 14.677001953125, 15.2353515625, 15.793701171875, 16.35205078125, 16.910400390625, 17.46875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 9.0, 11.0, 13.0, 15.0, 31.0, 51.0, 59.0, 189.0, 2909.0, 506.0, 123.0, 52.0, 28.0, 23.0, 11.0, 9.0, 4.0, 8.0, 5.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8984375, -5.6865234375, -5.474609375, -5.2626953125, -5.05078125, -4.8388671875, -4.626953125, -4.4150390625, -4.203125, -3.9912109375, -3.779296875, -3.5673828125, -3.35546875, -3.1435546875, -2.931640625, -2.7197265625, -2.5078125, -2.2958984375, -2.083984375, -1.8720703125, -1.66015625, -1.4482421875, -1.236328125, -1.0244140625, -0.8125, -0.6005859375, -0.388671875, -0.1767578125, 0.03515625, 0.2470703125, 0.458984375, 0.6708984375, 0.8828125, 1.0947265625, 1.306640625, 1.5185546875, 1.73046875, 1.9423828125, 2.154296875, 2.3662109375, 2.578125, 2.7900390625, 3.001953125, 3.2138671875, 3.42578125, 3.6376953125, 3.849609375, 4.0615234375, 4.2734375, 4.4853515625, 4.697265625, 4.9091796875, 5.12109375, 5.3330078125, 5.544921875, 5.7568359375, 5.96875, 6.1806640625, 6.392578125, 6.6044921875, 6.81640625, 7.0283203125, 7.240234375, 7.4521484375, 7.6640625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 10.0, 18.0, 31.0, 76.0, 156.0, 230.0, 228.0, 164.0, 57.0, 19.0, 9.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.80000305175781, -74.1919937133789, -72.58397674560547, -70.97596740722656, -69.36795806884766, -67.75994873046875, -66.15193176269531, -64.5439224243164, -62.935909271240234, -61.32789611816406, -59.719886779785156, -58.111873626708984, -56.50386428833008, -54.895851135253906, -53.287841796875, -51.67982864379883, -50.071815490722656, -48.463802337646484, -46.85579299926758, -45.247779846191406, -43.6397705078125, -42.03175735473633, -40.423744201660156, -38.81573486328125, -37.207725524902344, -35.59971237182617, -33.991703033447266, -32.383689880371094, -30.775678634643555, -29.167667388916016, -27.559656143188477, -25.951644897460938, -24.343631744384766, -22.735620498657227, -21.127609252929688, -19.519596099853516, -17.911584854125977, -16.303573608398438, -14.695562362670898, -13.087550163269043, -11.479538917541504, -9.871527671813965, -8.26351547241211, -6.65550422668457, -5.047492504119873, -3.439480781555176, -1.8314695358276367, -0.22345733642578125, 1.3845539093017578, 2.992565631866455, 4.600577354431152, 6.208588600158691, 7.816600322723389, 9.424612045288086, 11.032623291015625, 12.64063549041748, 14.24864673614502, 15.856657981872559, 17.464670181274414, 19.072681427001953, 20.680692672729492, 22.28870391845703, 23.896717071533203, 25.504728317260742, 27.11273956298828]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 6.0, 7.0, 3.0, 9.0, 13.0, 11.0, 8.0, 19.0, 20.0, 36.0, 31.0, 29.0, 34.0, 29.0, 44.0, 40.0, 51.0, 48.0, 51.0, 45.0, 34.0, 49.0, 40.0, 31.0, 37.0, 50.0, 44.0, 27.0, 21.0, 26.0, 23.0, 8.0, 22.0, 9.0, 10.0, 6.0, 9.0, 7.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-14.383478164672852, -13.938672065734863, -13.493865966796875, -13.049059867858887, -12.604253768920898, -12.15944766998291, -11.714641571044922, -11.269835472106934, -10.825029373168945, -10.380223274230957, -9.935417175292969, -9.49061107635498, -9.045804977416992, -8.600998878479004, -8.156192779541016, -7.711386680603027, -7.266580581665039, -6.821774482727051, -6.3769683837890625, -5.932162284851074, -5.487356185913086, -5.042550086975098, -4.597743988037109, -4.152937889099121, -3.708131790161133, -3.2633256912231445, -2.8185195922851562, -2.373713493347168, -1.9289073944091797, -1.4841012954711914, -1.0392951965332031, -0.5944890975952148, -0.14968204498291016, 0.2951240539550781, 0.7399301528930664, 1.1847362518310547, 1.629542350769043, 2.0743484497070312, 2.5191545486450195, 2.963960647583008, 3.408766746520996, 3.8535728454589844, 4.298378944396973, 4.743185043334961, 5.187991142272949, 5.6327972412109375, 6.077603340148926, 6.522409439086914, 6.967215538024902, 7.412021636962891, 7.856827735900879, 8.301633834838867, 8.746439933776855, 9.191246032714844, 9.636052131652832, 10.08085823059082, 10.525664329528809, 10.970470428466797, 11.415276527404785, 11.860082626342773, 12.304888725280762, 12.74969482421875, 13.194500923156738, 13.639307022094727, 14.084113121032715]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 17.0, 25.0, 54.0, 53.0, 115.0, 227.0, 396.0, 810.0, 1946.0, 7586.0, 51852.0, 431182.0, 480652.0, 61191.0, 8443.0, 2235.0, 837.0, 425.0, 195.0, 120.0, 80.0, 41.0, 21.0, 17.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.71875, -38.47900390625, -37.2392578125, -35.99951171875, -34.759765625, -33.52001953125, -32.2802734375, -31.04052734375, -29.80078125, -28.56103515625, -27.3212890625, -26.08154296875, -24.841796875, -23.60205078125, -22.3623046875, -21.12255859375, -19.8828125, -18.64306640625, -17.4033203125, -16.16357421875, -14.923828125, -13.68408203125, -12.4443359375, -11.20458984375, -9.96484375, -8.72509765625, -7.4853515625, -6.24560546875, -5.005859375, -3.76611328125, -2.5263671875, -1.28662109375, -0.046875, 1.19287109375, 2.4326171875, 3.67236328125, 4.912109375, 6.15185546875, 7.3916015625, 8.63134765625, 9.87109375, 11.11083984375, 12.3505859375, 13.59033203125, 14.830078125, 16.06982421875, 17.3095703125, 18.54931640625, 19.7890625, 21.02880859375, 22.2685546875, 23.50830078125, 24.748046875, 25.98779296875, 27.2275390625, 28.46728515625, 29.70703125, 30.94677734375, 32.1865234375, 33.42626953125, 34.666015625, 35.90576171875, 37.1455078125, 38.38525390625, 39.625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 14.0, 22.0, 24.0, 54.0, 70.0, 86.0, 106.0, 110.0, 117.0, 118.0, 89.0, 79.0, 49.0, 25.0, 12.0, 14.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -21.81591796875, -20.9443359375, -20.07275390625, -19.201171875, -18.32958984375, -17.4580078125, -16.58642578125, -15.71484375, -14.84326171875, -13.9716796875, -13.10009765625, -12.228515625, -11.35693359375, -10.4853515625, -9.61376953125, -8.7421875, -7.87060546875, -6.9990234375, -6.12744140625, -5.255859375, -4.38427734375, -3.5126953125, -2.64111328125, -1.76953125, -0.89794921875, -0.0263671875, 0.84521484375, 1.716796875, 2.58837890625, 3.4599609375, 4.33154296875, 5.203125, 6.07470703125, 6.9462890625, 7.81787109375, 8.689453125, 9.56103515625, 10.4326171875, 11.30419921875, 12.17578125, 13.04736328125, 13.9189453125, 14.79052734375, 15.662109375, 16.53369140625, 17.4052734375, 18.27685546875, 19.1484375, 20.02001953125, 20.8916015625, 21.76318359375, 22.634765625, 23.50634765625, 24.3779296875, 25.24951171875, 26.12109375, 26.99267578125, 27.8642578125, 28.73583984375, 29.607421875, 30.47900390625, 31.3505859375, 32.22216796875, 33.09375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 6.0, 5.0, 2.0, 7.0, 12.0, 16.0, 24.0, 26.0, 40.0, 53.0, 71.0, 143.0, 248.0, 537.0, 1357.0, 5635.0, 395968.0, 635083.0, 6647.0, 1382.0, 610.0, 256.0, 168.0, 91.0, 46.0, 40.0, 24.0, 17.0, 10.0, 7.0, 5.0, 4.0, 6.0, 4.0, 1.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-163.625, -159.20703125, -154.7890625, -150.37109375, -145.953125, -141.53515625, -137.1171875, -132.69921875, -128.28125, -123.86328125, -119.4453125, -115.02734375, -110.609375, -106.19140625, -101.7734375, -97.35546875, -92.9375, -88.51953125, -84.1015625, -79.68359375, -75.265625, -70.84765625, -66.4296875, -62.01171875, -57.59375, -53.17578125, -48.7578125, -44.33984375, -39.921875, -35.50390625, -31.0859375, -26.66796875, -22.25, -17.83203125, -13.4140625, -8.99609375, -4.578125, -0.16015625, 4.2578125, 8.67578125, 13.09375, 17.51171875, 21.9296875, 26.34765625, 30.765625, 35.18359375, 39.6015625, 44.01953125, 48.4375, 52.85546875, 57.2734375, 61.69140625, 66.109375, 70.52734375, 74.9453125, 79.36328125, 83.78125, 88.19921875, 92.6171875, 97.03515625, 101.453125, 105.87109375, 110.2890625, 114.70703125, 119.125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 2.0, 8.0, 2.0, 8.0, 9.0, 10.0, 13.0, 26.0, 37.0, 38.0, 69.0, 72.0, 83.0, 109.0, 104.0, 98.0, 67.0, 59.0, 43.0, 37.0, 30.0, 15.0, 16.0, 7.0, 7.0, 6.0, 3.0, 3.0, 5.0, 4.0, 4.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.625, -126.275390625, -121.92578125, -117.576171875, -113.2265625, -108.876953125, -104.52734375, -100.177734375, -95.828125, -91.478515625, -87.12890625, -82.779296875, -78.4296875, -74.080078125, -69.73046875, -65.380859375, -61.03125, -56.681640625, -52.33203125, -47.982421875, -43.6328125, -39.283203125, -34.93359375, -30.583984375, -26.234375, -21.884765625, -17.53515625, -13.185546875, -8.8359375, -4.486328125, -0.13671875, 4.212890625, 8.5625, 12.912109375, 17.26171875, 21.611328125, 25.9609375, 30.310546875, 34.66015625, 39.009765625, 43.359375, 47.708984375, 52.05859375, 56.408203125, 60.7578125, 65.107421875, 69.45703125, 73.806640625, 78.15625, 82.505859375, 86.85546875, 91.205078125, 95.5546875, 99.904296875, 104.25390625, 108.603515625, 112.953125, 117.302734375, 121.65234375, 126.001953125, 130.3515625, 134.701171875, 139.05078125, 143.400390625, 147.75]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 4.0, 7.0, 6.0, 15.0, 15.0, 29.0, 27.0, 47.0, 48.0, 96.0, 175.0, 229.0, 428.0, 918.0, 3756.0, 72194.0, 944245.0, 22391.0, 2295.0, 706.0, 315.0, 205.0, 132.0, 94.0, 56.0, 29.0, 23.0, 21.0, 16.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.59375, -44.2265625, -42.859375, -41.4921875, -40.125, -38.7578125, -37.390625, -36.0234375, -34.65625, -33.2890625, -31.921875, -30.5546875, -29.1875, -27.8203125, -26.453125, -25.0859375, -23.71875, -22.3515625, -20.984375, -19.6171875, -18.25, -16.8828125, -15.515625, -14.1484375, -12.78125, -11.4140625, -10.046875, -8.6796875, -7.3125, -5.9453125, -4.578125, -3.2109375, -1.84375, -0.4765625, 0.890625, 2.2578125, 3.625, 4.9921875, 6.359375, 7.7265625, 9.09375, 10.4609375, 11.828125, 13.1953125, 14.5625, 15.9296875, 17.296875, 18.6640625, 20.03125, 21.3984375, 22.765625, 24.1328125, 25.5, 26.8671875, 28.234375, 29.6015625, 30.96875, 32.3359375, 33.703125, 35.0703125, 36.4375, 37.8046875, 39.171875, 40.5390625, 41.90625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 13.0, 12.0, 21.0, 26.0, 38.0, 85.0, 90.0, 120.0, 124.0, 130.0, 108.0, 72.0, 40.0, 38.0, 15.0, 16.0, 8.0, 11.0, 9.0, 3.0, 3.0, 4.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018720626831054688, -0.0017986148595809937, -0.0017251670360565186, -0.0016517192125320435, -0.0015782713890075684, -0.0015048235654830933, -0.0014313757419586182, -0.001357927918434143, -0.001284480094909668, -0.0012110322713851929, -0.0011375844478607178, -0.0010641366243362427, -0.0009906888008117676, -0.0009172409772872925, -0.0008437931537628174, -0.0007703453302383423, -0.0006968975067138672, -0.0006234496831893921, -0.000550001859664917, -0.0004765540361404419, -0.0004031062126159668, -0.0003296583890914917, -0.0002562105655670166, -0.0001827627420425415, -0.0001093149185180664, -3.586709499359131e-05, 3.758072853088379e-05, 0.00011102855205535889, 0.00018447637557983398, 0.0002579241991043091, 0.0003313720226287842, 0.0004048198461532593, 0.0004782676696777344, 0.0005517154932022095, 0.0006251633167266846, 0.0006986111402511597, 0.0007720589637756348, 0.0008455067873001099, 0.000918954610824585, 0.00099240243434906, 0.0010658502578735352, 0.0011392980813980103, 0.0012127459049224854, 0.0012861937284469604, 0.0013596415519714355, 0.0014330893754959106, 0.0015065371990203857, 0.0015799850225448608, 0.001653432846069336, 0.001726880669593811, 0.0018003284931182861, 0.0018737763166427612, 0.0019472241401672363, 0.0020206719636917114, 0.0020941197872161865, 0.0021675676107406616, 0.0022410154342651367, 0.002314463257789612, 0.002387911081314087, 0.002461358904838562, 0.002534806728363037, 0.002608254551887512, 0.0026817023754119873, 0.0027551501989364624, 0.0028285980224609375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 9.0, 9.0, 5.0, 9.0, 14.0, 20.0, 20.0, 46.0, 70.0, 103.0, 178.0, 289.0, 658.0, 1807.0, 10739.0, 701299.0, 322468.0, 7914.0, 1525.0, 607.0, 286.0, 160.0, 106.0, 66.0, 45.0, 26.0, 13.0, 9.0, 13.0, 3.0, 6.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.34375, -33.98095703125, -32.6181640625, -31.25537109375, -29.892578125, -28.52978515625, -27.1669921875, -25.80419921875, -24.44140625, -23.07861328125, -21.7158203125, -20.35302734375, -18.990234375, -17.62744140625, -16.2646484375, -14.90185546875, -13.5390625, -12.17626953125, -10.8134765625, -9.45068359375, -8.087890625, -6.72509765625, -5.3623046875, -3.99951171875, -2.63671875, -1.27392578125, 0.0888671875, 1.45166015625, 2.814453125, 4.17724609375, 5.5400390625, 6.90283203125, 8.265625, 9.62841796875, 10.9912109375, 12.35400390625, 13.716796875, 15.07958984375, 16.4423828125, 17.80517578125, 19.16796875, 20.53076171875, 21.8935546875, 23.25634765625, 24.619140625, 25.98193359375, 27.3447265625, 28.70751953125, 30.0703125, 31.43310546875, 32.7958984375, 34.15869140625, 35.521484375, 36.88427734375, 38.2470703125, 39.60986328125, 40.97265625, 42.33544921875, 43.6982421875, 45.06103515625, 46.423828125, 47.78662109375, 49.1494140625, 50.51220703125, 51.875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 5.0, 1.0, 9.0, 5.0, 9.0, 10.0, 12.0, 19.0, 24.0, 25.0, 49.0, 104.0, 172.0, 190.0, 128.0, 79.0, 40.0, 26.0, 21.0, 12.0, 5.0, 9.0, 9.0, 4.0, 5.0, 3.0, 3.0, 7.0, 2.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.84375, -42.671875, -41.5, -40.328125, -39.15625, -37.984375, -36.8125, -35.640625, -34.46875, -33.296875, -32.125, -30.953125, -29.78125, -28.609375, -27.4375, -26.265625, -25.09375, -23.921875, -22.75, -21.578125, -20.40625, -19.234375, -18.0625, -16.890625, -15.71875, -14.546875, -13.375, -12.203125, -11.03125, -9.859375, -8.6875, -7.515625, -6.34375, -5.171875, -4.0, -2.828125, -1.65625, -0.484375, 0.6875, 1.859375, 3.03125, 4.203125, 5.375, 6.546875, 7.71875, 8.890625, 10.0625, 11.234375, 12.40625, 13.578125, 14.75, 15.921875, 17.09375, 18.265625, 19.4375, 20.609375, 21.78125, 22.953125, 24.125, 25.296875, 26.46875, 27.640625, 28.8125, 29.984375, 31.15625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 10.0, 230.0, 714.0, 49.0, 8.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2713.180908203125, -2658.0625, -2602.9443359375, -2547.825927734375, -2492.70751953125, -2437.589111328125, -2382.470703125, -2327.3525390625, -2272.234130859375, -2217.11572265625, -2161.99755859375, -2106.879150390625, -2051.7607421875, -1996.642333984375, -1941.5240478515625, -1886.40576171875, -1831.287353515625, -1776.1689453125, -1721.0506591796875, -1665.932373046875, -1610.81396484375, -1555.695556640625, -1500.5772705078125, -1445.458984375, -1390.340576171875, -1335.22216796875, -1280.1038818359375, -1224.985595703125, -1169.8671875, -1114.748779296875, -1059.6304931640625, -1004.5121459960938, -949.3936767578125, -894.2753295898438, -839.156982421875, -784.0386352539062, -728.9202880859375, -673.8019409179688, -618.68359375, -563.5652465820312, -508.4468994140625, -453.32855224609375, -398.210205078125, -343.09185791015625, -287.9735107421875, -232.85516357421875, -177.73681640625, -122.61846923828125, -67.5001220703125, -12.38177490234375, 42.736572265625, 97.85491943359375, 152.9732666015625, 208.09161376953125, 263.2099609375, 318.32830810546875, 373.4466552734375, 428.56500244140625, 483.683349609375, 538.8016967773438, 593.9200439453125, 649.0383911132812, 704.15673828125, 759.2750854492188, 814.3934326171875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 8.0, 8.0, 7.0, 9.0, 13.0, 16.0, 17.0, 19.0, 26.0, 22.0, 33.0, 49.0, 28.0, 38.0, 38.0, 52.0, 59.0, 36.0, 53.0, 51.0, 42.0, 45.0, 41.0, 39.0, 27.0, 36.0, 35.0, 29.0, 16.0, 17.0, 18.0, 15.0, 22.0, 11.0, 6.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-259.5472717285156, -250.4111785888672, -241.2750701904297, -232.13897705078125, -223.00286865234375, -213.8667755126953, -204.73068237304688, -195.59457397460938, -186.45848083496094, -177.3223876953125, -168.186279296875, -159.05018615722656, -149.91409301757812, -140.77798461914062, -131.6418914794922, -122.50579071044922, -113.36968994140625, -104.23358917236328, -95.09748840332031, -85.96139526367188, -76.8252944946289, -67.68919372558594, -58.553096771240234, -49.41699981689453, -40.28089904785156, -31.144800186157227, -22.00870132446289, -12.872602462768555, -3.7365036010742188, 5.39959716796875, 14.535694122314453, 23.671791076660156, 32.80792236328125, 41.94402313232422, 51.08012008666992, 60.216217041015625, 69.3523178100586, 78.48841857910156, 87.62451171875, 96.76061248779297, 105.89671325683594, 115.0328140258789, 124.16891479492188, 133.3050079345703, 142.44110107421875, 151.57720947265625, 160.7133026123047, 169.84939575195312, 178.98550415039062, 188.12159729003906, 197.25770568847656, 206.393798828125, 215.5299072265625, 224.66600036621094, 233.80209350585938, 242.93820190429688, 252.0742950439453, 261.21038818359375, 270.34649658203125, 279.48260498046875, 288.6186828613281, 297.7547912597656, 306.8908996582031, 316.0269775390625, 325.1630859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 9.0, 6.0, 6.0, 18.0, 19.0, 37.0, 72.0, 96.0, 187.0, 290.0, 496.0, 864.0, 1898.0, 5821.0, 36979.0, 4100174.0, 37548.0, 5779.0, 1916.0, 852.0, 498.0, 262.0, 180.0, 117.0, 69.0, 30.0, 26.0, 10.0, 8.0, 9.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.21875, -41.587890625, -39.95703125, -38.326171875, -36.6953125, -35.064453125, -33.43359375, -31.802734375, -30.171875, -28.541015625, -26.91015625, -25.279296875, -23.6484375, -22.017578125, -20.38671875, -18.755859375, -17.125, -15.494140625, -13.86328125, -12.232421875, -10.6015625, -8.970703125, -7.33984375, -5.708984375, -4.078125, -2.447265625, -0.81640625, 0.814453125, 2.4453125, 4.076171875, 5.70703125, 7.337890625, 8.96875, 10.599609375, 12.23046875, 13.861328125, 15.4921875, 17.123046875, 18.75390625, 20.384765625, 22.015625, 23.646484375, 25.27734375, 26.908203125, 28.5390625, 30.169921875, 31.80078125, 33.431640625, 35.0625, 36.693359375, 38.32421875, 39.955078125, 41.5859375, 43.216796875, 44.84765625, 46.478515625, 48.109375, 49.740234375, 51.37109375, 53.001953125, 54.6328125, 56.263671875, 57.89453125, 59.525390625, 61.15625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 9.0, 16.0, 25.0, 25.0, 50.0, 92.0, 104.0, 125.0, 132.0, 110.0, 101.0, 91.0, 50.0, 24.0, 19.0, 14.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.984375, -23.963134765625, -22.94189453125, -21.920654296875, -20.8994140625, -19.878173828125, -18.85693359375, -17.835693359375, -16.814453125, -15.793212890625, -14.77197265625, -13.750732421875, -12.7294921875, -11.708251953125, -10.68701171875, -9.665771484375, -8.64453125, -7.623291015625, -6.60205078125, -5.580810546875, -4.5595703125, -3.538330078125, -2.51708984375, -1.495849609375, -0.474609375, 0.546630859375, 1.56787109375, 2.589111328125, 3.6103515625, 4.631591796875, 5.65283203125, 6.674072265625, 7.6953125, 8.716552734375, 9.73779296875, 10.759033203125, 11.7802734375, 12.801513671875, 13.82275390625, 14.843994140625, 15.865234375, 16.886474609375, 17.90771484375, 18.928955078125, 19.9501953125, 20.971435546875, 21.99267578125, 23.013916015625, 24.03515625, 25.056396484375, 26.07763671875, 27.098876953125, 28.1201171875, 29.141357421875, 30.16259765625, 31.183837890625, 32.205078125, 33.226318359375, 34.24755859375, 35.268798828125, 36.2900390625, 37.311279296875, 38.33251953125, 39.353759765625, 40.375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 16.0, 21.0, 21.0, 26.0, 44.0, 71.0, 94.0, 124.0, 185.0, 297.0, 450.0, 725.0, 1308.0, 3127.0, 9563.0, 57918.0, 4046538.0, 57813.0, 9583.0, 3007.0, 1335.0, 710.0, 451.0, 282.0, 185.0, 111.0, 78.0, 62.0, 30.0, 26.0, 16.0, 21.0, 12.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.796875, -26.821533203125, -25.84619140625, -24.870849609375, -23.8955078125, -22.920166015625, -21.94482421875, -20.969482421875, -19.994140625, -19.018798828125, -18.04345703125, -17.068115234375, -16.0927734375, -15.117431640625, -14.14208984375, -13.166748046875, -12.19140625, -11.216064453125, -10.24072265625, -9.265380859375, -8.2900390625, -7.314697265625, -6.33935546875, -5.364013671875, -4.388671875, -3.413330078125, -2.43798828125, -1.462646484375, -0.4873046875, 0.488037109375, 1.46337890625, 2.438720703125, 3.4140625, 4.389404296875, 5.36474609375, 6.340087890625, 7.3154296875, 8.290771484375, 9.26611328125, 10.241455078125, 11.216796875, 12.192138671875, 13.16748046875, 14.142822265625, 15.1181640625, 16.093505859375, 17.06884765625, 18.044189453125, 19.01953125, 19.994873046875, 20.97021484375, 21.945556640625, 22.9208984375, 23.896240234375, 24.87158203125, 25.846923828125, 26.822265625, 27.797607421875, 28.77294921875, 29.748291015625, 30.7236328125, 31.698974609375, 32.67431640625, 33.649658203125, 34.625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 8.0, 5.0, 10.0, 21.0, 13.0, 59.0, 120.0, 3367.0, 304.0, 65.0, 40.0, 20.0, 13.0, 8.0, 5.0, 8.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4765625, -8.24615478515625, -8.0157470703125, -7.78533935546875, -7.554931640625, -7.32452392578125, -7.0941162109375, -6.86370849609375, -6.63330078125, -6.40289306640625, -6.1724853515625, -5.94207763671875, -5.711669921875, -5.48126220703125, -5.2508544921875, -5.02044677734375, -4.7900390625, -4.55963134765625, -4.3292236328125, -4.09881591796875, -3.868408203125, -3.63800048828125, -3.4075927734375, -3.17718505859375, -2.94677734375, -2.71636962890625, -2.4859619140625, -2.25555419921875, -2.025146484375, -1.79473876953125, -1.5643310546875, -1.33392333984375, -1.103515625, -0.87310791015625, -0.6427001953125, -0.41229248046875, -0.181884765625, 0.04852294921875, 0.2789306640625, 0.50933837890625, 0.73974609375, 0.97015380859375, 1.2005615234375, 1.43096923828125, 1.661376953125, 1.89178466796875, 2.1221923828125, 2.35260009765625, 2.5830078125, 2.81341552734375, 3.0438232421875, 3.27423095703125, 3.504638671875, 3.73504638671875, 3.9654541015625, 4.19586181640625, 4.42626953125, 4.65667724609375, 4.8870849609375, 5.11749267578125, 5.347900390625, 5.57830810546875, 5.8087158203125, 6.03912353515625, 6.26953125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 5.0, 12.0, 21.0, 27.0, 42.0, 81.0, 140.0, 171.0, 159.0, 127.0, 79.0, 44.0, 33.0, 25.0, 15.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.32073974609375, -35.27613830566406, -34.23154067993164, -33.18693923950195, -32.142337799072266, -31.09773826599121, -30.053138732910156, -29.00853729248047, -27.963937759399414, -26.91933822631836, -25.874736785888672, -24.830137252807617, -23.785537719726562, -22.740936279296875, -21.69633674621582, -20.651737213134766, -19.607135772705078, -18.562536239624023, -17.517934799194336, -16.47333526611328, -15.42873477935791, -14.384134292602539, -13.339534759521484, -12.294934272766113, -11.250333786010742, -10.205733299255371, -9.1611328125, -8.116533279418945, -7.071932792663574, -6.027332305908203, -4.98273229598999, -3.9381322860717773, -2.8935279846191406, -1.8489277362823486, -0.8043274879455566, 0.24027276039123535, 1.2848730087280273, 2.3294734954833984, 3.3740735054016113, 4.418673515319824, 5.463274002075195, 6.507874488830566, 7.552474498748779, 8.597074508666992, 9.641674995422363, 10.686275482177734, 11.730875015258789, 12.77547550201416, 13.820075988769531, 14.864676475524902, 15.909276962280273, 16.953876495361328, 17.998477935791016, 19.04307746887207, 20.087677001953125, 21.132278442382812, 22.176877975463867, 23.221477508544922, 24.26607894897461, 25.310678482055664, 26.35527801513672, 27.399879455566406, 28.44447898864746, 29.489078521728516, 30.533679962158203]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 7.0, 9.0, 13.0, 10.0, 17.0, 27.0, 21.0, 31.0, 44.0, 35.0, 49.0, 66.0, 48.0, 55.0, 50.0, 64.0, 60.0, 51.0, 49.0, 58.0, 40.0, 38.0, 33.0, 27.0, 20.0, 19.0, 14.0, 13.0, 2.0, 2.0, 5.0, 9.0, 5.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.431556701660156, -22.84870147705078, -22.265844345092773, -21.6829891204834, -21.10013198852539, -20.517276763916016, -19.934419631958008, -19.351564407348633, -18.768707275390625, -18.18585205078125, -17.602994918823242, -17.020139694213867, -16.43728256225586, -15.854427337646484, -15.271571159362793, -14.688714981079102, -14.105859756469727, -13.523003578186035, -12.940147399902344, -12.357291221618652, -11.774435043334961, -11.191579818725586, -10.608723640441895, -10.025867462158203, -9.443011283874512, -8.86015510559082, -8.277298927307129, -7.694443225860596, -7.111587047576904, -6.528730869293213, -5.94587516784668, -5.363018989562988, -4.78016471862793, -4.197308540344238, -3.614452600479126, -3.0315966606140137, -2.4487404823303223, -1.8658843040466309, -1.2830283641815186, -0.7001724243164062, -0.11731624603271484, 0.465539813041687, 1.0483958721160889, 1.6312519311904907, 2.2141079902648926, 2.796964168548584, 3.3798201084136963, 3.9626760482788086, 4.5455322265625, 5.128388404846191, 5.711244583129883, 6.294100284576416, 6.876956462860107, 7.459812641143799, 8.042668342590332, 8.625524520874023, 9.208380699157715, 9.791236877441406, 10.374093055725098, 10.956949234008789, 11.539804458618164, 12.122661590576172, 12.705516815185547, 13.288372993469238, 13.87122917175293]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 6.0, 7.0, 6.0, 14.0, 13.0, 19.0, 27.0, 35.0, 55.0, 67.0, 99.0, 159.0, 225.0, 359.0, 649.0, 1057.0, 2307.0, 5784.0, 23268.0, 148861.0, 600394.0, 219179.0, 32686.0, 7427.0, 2693.0, 1236.0, 701.0, 443.0, 257.0, 179.0, 91.0, 77.0, 55.0, 35.0, 26.0, 20.0, 17.0, 8.0, 9.0, 2.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-44.09375, -42.951416015625, -41.80908203125, -40.666748046875, -39.5244140625, -38.382080078125, -37.23974609375, -36.097412109375, -34.955078125, -33.812744140625, -32.67041015625, -31.528076171875, -30.3857421875, -29.243408203125, -28.10107421875, -26.958740234375, -25.81640625, -24.674072265625, -23.53173828125, -22.389404296875, -21.2470703125, -20.104736328125, -18.96240234375, -17.820068359375, -16.677734375, -15.535400390625, -14.39306640625, -13.250732421875, -12.1083984375, -10.966064453125, -9.82373046875, -8.681396484375, -7.5390625, -6.396728515625, -5.25439453125, -4.112060546875, -2.9697265625, -1.827392578125, -0.68505859375, 0.457275390625, 1.599609375, 2.741943359375, 3.88427734375, 5.026611328125, 6.1689453125, 7.311279296875, 8.45361328125, 9.595947265625, 10.73828125, 11.880615234375, 13.02294921875, 14.165283203125, 15.3076171875, 16.449951171875, 17.59228515625, 18.734619140625, 19.876953125, 21.019287109375, 22.16162109375, 23.303955078125, 24.4462890625, 25.588623046875, 26.73095703125, 27.873291015625, 29.015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 11.0, 14.0, 24.0, 29.0, 47.0, 67.0, 103.0, 121.0, 134.0, 103.0, 129.0, 84.0, 49.0, 37.0, 25.0, 10.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.21875, -24.197265625, -23.17578125, -22.154296875, -21.1328125, -20.111328125, -19.08984375, -18.068359375, -17.046875, -16.025390625, -15.00390625, -13.982421875, -12.9609375, -11.939453125, -10.91796875, -9.896484375, -8.875, -7.853515625, -6.83203125, -5.810546875, -4.7890625, -3.767578125, -2.74609375, -1.724609375, -0.703125, 0.318359375, 1.33984375, 2.361328125, 3.3828125, 4.404296875, 5.42578125, 6.447265625, 7.46875, 8.490234375, 9.51171875, 10.533203125, 11.5546875, 12.576171875, 13.59765625, 14.619140625, 15.640625, 16.662109375, 17.68359375, 18.705078125, 19.7265625, 20.748046875, 21.76953125, 22.791015625, 23.8125, 24.833984375, 25.85546875, 26.876953125, 27.8984375, 28.919921875, 29.94140625, 30.962890625, 31.984375, 33.005859375, 34.02734375, 35.048828125, 36.0703125, 37.091796875, 38.11328125, 39.134765625, 40.15625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 9.0, 10.0, 11.0, 25.0, 28.0, 44.0, 59.0, 95.0, 160.0, 246.0, 505.0, 1215.0, 5013.0, 280087.0, 751798.0, 6598.0, 1359.0, 526.0, 264.0, 156.0, 98.0, 65.0, 53.0, 31.0, 27.0, 22.0, 5.0, 9.0, 4.0, 3.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-192.0, -186.36328125, -180.7265625, -175.08984375, -169.453125, -163.81640625, -158.1796875, -152.54296875, -146.90625, -141.26953125, -135.6328125, -129.99609375, -124.359375, -118.72265625, -113.0859375, -107.44921875, -101.8125, -96.17578125, -90.5390625, -84.90234375, -79.265625, -73.62890625, -67.9921875, -62.35546875, -56.71875, -51.08203125, -45.4453125, -39.80859375, -34.171875, -28.53515625, -22.8984375, -17.26171875, -11.625, -5.98828125, -0.3515625, 5.28515625, 10.921875, 16.55859375, 22.1953125, 27.83203125, 33.46875, 39.10546875, 44.7421875, 50.37890625, 56.015625, 61.65234375, 67.2890625, 72.92578125, 78.5625, 84.19921875, 89.8359375, 95.47265625, 101.109375, 106.74609375, 112.3828125, 118.01953125, 123.65625, 129.29296875, 134.9296875, 140.56640625, 146.203125, 151.83984375, 157.4765625, 163.11328125, 168.75]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 12.0, 15.0, 11.0, 11.0, 36.0, 56.0, 78.0, 151.0, 160.0, 156.0, 116.0, 63.0, 34.0, 22.0, 20.0, 17.0, 11.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-269.75, -260.9375, -252.125, -243.3125, -234.5, -225.6875, -216.875, -208.0625, -199.25, -190.4375, -181.625, -172.8125, -164.0, -155.1875, -146.375, -137.5625, -128.75, -119.9375, -111.125, -102.3125, -93.5, -84.6875, -75.875, -67.0625, -58.25, -49.4375, -40.625, -31.8125, -23.0, -14.1875, -5.375, 3.4375, 12.25, 21.0625, 29.875, 38.6875, 47.5, 56.3125, 65.125, 73.9375, 82.75, 91.5625, 100.375, 109.1875, 118.0, 126.8125, 135.625, 144.4375, 153.25, 162.0625, 170.875, 179.6875, 188.5, 197.3125, 206.125, 214.9375, 223.75, 232.5625, 241.375, 250.1875, 259.0, 267.8125, 276.625, 285.4375, 294.25]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 15.0, 16.0, 29.0, 29.0, 23.0, 57.0, 87.0, 91.0, 173.0, 315.0, 830.0, 6615.0, 1007732.0, 29987.0, 1457.0, 432.0, 204.0, 122.0, 76.0, 62.0, 40.0, 34.0, 23.0, 13.0, 12.0, 10.0, 14.0, 9.0, 12.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.25, -90.1083984375, -86.966796875, -83.8251953125, -80.68359375, -77.5419921875, -74.400390625, -71.2587890625, -68.1171875, -64.9755859375, -61.833984375, -58.6923828125, -55.55078125, -52.4091796875, -49.267578125, -46.1259765625, -42.984375, -39.8427734375, -36.701171875, -33.5595703125, -30.41796875, -27.2763671875, -24.134765625, -20.9931640625, -17.8515625, -14.7099609375, -11.568359375, -8.4267578125, -5.28515625, -2.1435546875, 0.998046875, 4.1396484375, 7.28125, 10.4228515625, 13.564453125, 16.7060546875, 19.84765625, 22.9892578125, 26.130859375, 29.2724609375, 32.4140625, 35.5556640625, 38.697265625, 41.8388671875, 44.98046875, 48.1220703125, 51.263671875, 54.4052734375, 57.546875, 60.6884765625, 63.830078125, 66.9716796875, 70.11328125, 73.2548828125, 76.396484375, 79.5380859375, 82.6796875, 85.8212890625, 88.962890625, 92.1044921875, 95.24609375, 98.3876953125, 101.529296875, 104.6708984375, 107.8125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 10.0, 13.0, 17.0, 34.0, 47.0, 97.0, 158.0, 197.0, 169.0, 95.0, 51.0, 36.0, 23.0, 12.0, 11.0, 6.0, 4.0, 7.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032711029052734375, -0.0031568706035614014, -0.0030426383018493652, -0.002928406000137329, -0.002814173698425293, -0.002699941396713257, -0.0025857090950012207, -0.0024714767932891846, -0.0023572444915771484, -0.0022430121898651123, -0.002128779888153076, -0.00201454758644104, -0.001900315284729004, -0.0017860829830169678, -0.0016718506813049316, -0.0015576183795928955, -0.0014433860778808594, -0.0013291537761688232, -0.0012149214744567871, -0.001100689172744751, -0.0009864568710327148, -0.0008722245693206787, -0.0007579922676086426, -0.0006437599658966064, -0.0005295276641845703, -0.0004152953624725342, -0.00030106306076049805, -0.00018683075904846191, -7.259845733642578e-05, 4.163384437561035e-05, 0.00015586614608764648, 0.0002700984477996826, 0.00038433074951171875, 0.0004985630512237549, 0.000612795352935791, 0.0007270276546478271, 0.0008412599563598633, 0.0009554922580718994, 0.0010697245597839355, 0.0011839568614959717, 0.0012981891632080078, 0.001412421464920044, 0.00152665376663208, 0.0016408860683441162, 0.0017551183700561523, 0.0018693506717681885, 0.0019835829734802246, 0.0020978152751922607, 0.002212047576904297, 0.002326279878616333, 0.002440512180328369, 0.0025547444820404053, 0.0026689767837524414, 0.0027832090854644775, 0.0028974413871765137, 0.00301167368888855, 0.003125905990600586, 0.003240138292312622, 0.003354370594024658, 0.0034686028957366943, 0.0035828351974487305, 0.0036970674991607666, 0.0038112998008728027, 0.003925532102584839, 0.004039764404296875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 7.0, 9.0, 17.0, 23.0, 26.0, 24.0, 72.0, 63.0, 105.0, 149.0, 225.0, 467.0, 1289.0, 6307.0, 361411.0, 668188.0, 7430.0, 1462.0, 545.0, 222.0, 138.0, 100.0, 73.0, 48.0, 43.0, 20.0, 22.0, 13.0, 6.0, 8.0, 11.0, 6.0, 2.0, 1.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.46875, -52.52587890625, -50.5830078125, -48.64013671875, -46.697265625, -44.75439453125, -42.8115234375, -40.86865234375, -38.92578125, -36.98291015625, -35.0400390625, -33.09716796875, -31.154296875, -29.21142578125, -27.2685546875, -25.32568359375, -23.3828125, -21.43994140625, -19.4970703125, -17.55419921875, -15.611328125, -13.66845703125, -11.7255859375, -9.78271484375, -7.83984375, -5.89697265625, -3.9541015625, -2.01123046875, -0.068359375, 1.87451171875, 3.8173828125, 5.76025390625, 7.703125, 9.64599609375, 11.5888671875, 13.53173828125, 15.474609375, 17.41748046875, 19.3603515625, 21.30322265625, 23.24609375, 25.18896484375, 27.1318359375, 29.07470703125, 31.017578125, 32.96044921875, 34.9033203125, 36.84619140625, 38.7890625, 40.73193359375, 42.6748046875, 44.61767578125, 46.560546875, 48.50341796875, 50.4462890625, 52.38916015625, 54.33203125, 56.27490234375, 58.2177734375, 60.16064453125, 62.103515625, 64.04638671875, 65.9892578125, 67.93212890625, 69.875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 14.0, 13.0, 23.0, 27.0, 66.0, 156.0, 311.0, 175.0, 73.0, 32.0, 26.0, 14.0, 9.0, 7.0, 9.0, 8.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-97.0, -94.6630859375, -92.326171875, -89.9892578125, -87.65234375, -85.3154296875, -82.978515625, -80.6416015625, -78.3046875, -75.9677734375, -73.630859375, -71.2939453125, -68.95703125, -66.6201171875, -64.283203125, -61.9462890625, -59.609375, -57.2724609375, -54.935546875, -52.5986328125, -50.26171875, -47.9248046875, -45.587890625, -43.2509765625, -40.9140625, -38.5771484375, -36.240234375, -33.9033203125, -31.56640625, -29.2294921875, -26.892578125, -24.5556640625, -22.21875, -19.8818359375, -17.544921875, -15.2080078125, -12.87109375, -10.5341796875, -8.197265625, -5.8603515625, -3.5234375, -1.1865234375, 1.150390625, 3.4873046875, 5.82421875, 8.1611328125, 10.498046875, 12.8349609375, 15.171875, 17.5087890625, 19.845703125, 22.1826171875, 24.51953125, 26.8564453125, 29.193359375, 31.5302734375, 33.8671875, 36.2041015625, 38.541015625, 40.8779296875, 43.21484375, 45.5517578125, 47.888671875, 50.2255859375, 52.5625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 17.0, 141.0, 624.0, 188.0, 20.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-778.3920288085938, -733.8359985351562, -689.2799682617188, -644.7239379882812, -600.1679077148438, -555.6118774414062, -511.0558776855469, -466.4998474121094, -421.9438171386719, -377.3877868652344, -332.8317565917969, -288.2757568359375, -243.71971130371094, -199.16368103027344, -154.607666015625, -110.0516357421875, -65.49560546875, -20.939579010009766, 23.61644744873047, 68.17247009277344, 112.72850036621094, 157.28453063964844, 201.84054565429688, 246.39657592773438, 290.9526062011719, 335.5086364746094, 380.0646667480469, 424.62066650390625, 469.17669677734375, 513.7327270507812, 558.2887573242188, 602.8447875976562, 647.4007568359375, 691.956787109375, 736.5128173828125, 781.06884765625, 825.6248779296875, 870.180908203125, 914.7369384765625, 959.29296875, 1003.8489990234375, 1048.405029296875, 1092.9610595703125, 1137.51708984375, 1182.0731201171875, 1226.629150390625, 1271.1851806640625, 1315.7412109375, 1360.297119140625, 1404.8531494140625, 1449.4091796875, 1493.9652099609375, 1538.521240234375, 1583.0772705078125, 1627.63330078125, 1672.1893310546875, 1716.745361328125, 1761.3013916015625, 1805.857421875, 1850.4134521484375, 1894.969482421875, 1939.5255126953125, 1984.08154296875, 2028.6375732421875, 2073.193603515625]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 9.0, 29.0, 28.0, 28.0, 49.0, 51.0, 73.0, 92.0, 105.0, 87.0, 73.0, 88.0, 77.0, 50.0, 47.0, 41.0, 30.0, 16.0, 10.0, 10.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-796.7935180664062, -776.0010375976562, -755.20849609375, -734.416015625, -713.6234741210938, -692.8309936523438, -672.0384521484375, -651.2459716796875, -630.4534912109375, -609.6610107421875, -588.8684692382812, -568.0759887695312, -547.283447265625, -526.490966796875, -505.6984558105469, -484.90594482421875, -464.1134033203125, -443.3208923339844, -422.52838134765625, -401.7358703613281, -380.943359375, -360.15087890625, -339.3583679199219, -318.56585693359375, -297.7733459472656, -276.9808349609375, -256.1883239746094, -235.3958282470703, -214.6033172607422, -193.81080627441406, -173.018310546875, -152.22579956054688, -131.433349609375, -110.64083862304688, -89.84833526611328, -69.05583190917969, -48.26332092285156, -27.470809936523438, -6.678306579589844, 14.11419677734375, 34.906707763671875, 55.699214935302734, 76.4917221069336, 97.28422546386719, 118.07673645019531, 138.86924743652344, 159.6617431640625, 180.45425415039062, 201.24676513671875, 222.03927612304688, 242.831787109375, 263.6242980957031, 284.41680908203125, 305.20928955078125, 326.0018005371094, 346.7943115234375, 367.5868225097656, 388.37933349609375, 409.1718444824219, 429.96435546875, 450.7568359375, 471.54937744140625, 492.34185791015625, 513.1343994140625, 533.9268798828125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 19.0, 58.0, 107.0, 386.0, 1631.0, 14854.0, 4116721.0, 56416.0, 3186.0, 609.0, 194.0, 53.0, 17.0, 15.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.9375, -37.6787109375, -35.419921875, -33.1611328125, -30.90234375, -28.6435546875, -26.384765625, -24.1259765625, -21.8671875, -19.6083984375, -17.349609375, -15.0908203125, -12.83203125, -10.5732421875, -8.314453125, -6.0556640625, -3.796875, -1.5380859375, 0.720703125, 2.9794921875, 5.23828125, 7.4970703125, 9.755859375, 12.0146484375, 14.2734375, 16.5322265625, 18.791015625, 21.0498046875, 23.30859375, 25.5673828125, 27.826171875, 30.0849609375, 32.34375, 34.6025390625, 36.861328125, 39.1201171875, 41.37890625, 43.6376953125, 45.896484375, 48.1552734375, 50.4140625, 52.6728515625, 54.931640625, 57.1904296875, 59.44921875, 61.7080078125, 63.966796875, 66.2255859375, 68.484375, 70.7431640625, 73.001953125, 75.2607421875, 77.51953125, 79.7783203125, 82.037109375, 84.2958984375, 86.5546875, 88.8134765625, 91.072265625, 93.3310546875, 95.58984375, 97.8486328125, 100.107421875, 102.3662109375, 104.625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 6.0, 13.0, 15.0, 21.0, 28.0, 34.0, 35.0, 58.0, 54.0, 77.0, 78.0, 90.0, 76.0, 71.0, 57.0, 56.0, 54.0, 33.0, 37.0, 23.0, 20.0, 10.0, 4.0, 13.0, 3.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.1875, -18.4990234375, -17.810546875, -17.1220703125, -16.43359375, -15.7451171875, -15.056640625, -14.3681640625, -13.6796875, -12.9912109375, -12.302734375, -11.6142578125, -10.92578125, -10.2373046875, -9.548828125, -8.8603515625, -8.171875, -7.4833984375, -6.794921875, -6.1064453125, -5.41796875, -4.7294921875, -4.041015625, -3.3525390625, -2.6640625, -1.9755859375, -1.287109375, -0.5986328125, 0.08984375, 0.7783203125, 1.466796875, 2.1552734375, 2.84375, 3.5322265625, 4.220703125, 4.9091796875, 5.59765625, 6.2861328125, 6.974609375, 7.6630859375, 8.3515625, 9.0400390625, 9.728515625, 10.4169921875, 11.10546875, 11.7939453125, 12.482421875, 13.1708984375, 13.859375, 14.5478515625, 15.236328125, 15.9248046875, 16.61328125, 17.3017578125, 17.990234375, 18.6787109375, 19.3671875, 20.0556640625, 20.744140625, 21.4326171875, 22.12109375, 22.8095703125, 23.498046875, 24.1865234375, 24.875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 12.0, 15.0, 21.0, 16.0, 32.0, 45.0, 53.0, 88.0, 109.0, 168.0, 290.0, 524.0, 1193.0, 3371.0, 14355.0, 359055.0, 3785190.0, 22397.0, 4360.0, 1430.0, 584.0, 303.0, 197.0, 140.0, 104.0, 60.0, 46.0, 40.0, 25.0, 16.0, 9.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-37.6875, -36.614013671875, -35.54052734375, -34.467041015625, -33.3935546875, -32.320068359375, -31.24658203125, -30.173095703125, -29.099609375, -28.026123046875, -26.95263671875, -25.879150390625, -24.8056640625, -23.732177734375, -22.65869140625, -21.585205078125, -20.51171875, -19.438232421875, -18.36474609375, -17.291259765625, -16.2177734375, -15.144287109375, -14.07080078125, -12.997314453125, -11.923828125, -10.850341796875, -9.77685546875, -8.703369140625, -7.6298828125, -6.556396484375, -5.48291015625, -4.409423828125, -3.3359375, -2.262451171875, -1.18896484375, -0.115478515625, 0.9580078125, 2.031494140625, 3.10498046875, 4.178466796875, 5.251953125, 6.325439453125, 7.39892578125, 8.472412109375, 9.5458984375, 10.619384765625, 11.69287109375, 12.766357421875, 13.83984375, 14.913330078125, 15.98681640625, 17.060302734375, 18.1337890625, 19.207275390625, 20.28076171875, 21.354248046875, 22.427734375, 23.501220703125, 24.57470703125, 25.648193359375, 26.7216796875, 27.795166015625, 28.86865234375, 29.942138671875, 31.015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 10.0, 13.0, 33.0, 140.0, 3172.0, 564.0, 84.0, 23.0, 22.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15625, -18.46826171875, -17.7802734375, -17.09228515625, -16.404296875, -15.71630859375, -15.0283203125, -14.34033203125, -13.65234375, -12.96435546875, -12.2763671875, -11.58837890625, -10.900390625, -10.21240234375, -9.5244140625, -8.83642578125, -8.1484375, -7.46044921875, -6.7724609375, -6.08447265625, -5.396484375, -4.70849609375, -4.0205078125, -3.33251953125, -2.64453125, -1.95654296875, -1.2685546875, -0.58056640625, 0.107421875, 0.79541015625, 1.4833984375, 2.17138671875, 2.859375, 3.54736328125, 4.2353515625, 4.92333984375, 5.611328125, 6.29931640625, 6.9873046875, 7.67529296875, 8.36328125, 9.05126953125, 9.7392578125, 10.42724609375, 11.115234375, 11.80322265625, 12.4912109375, 13.17919921875, 13.8671875, 14.55517578125, 15.2431640625, 15.93115234375, 16.619140625, 17.30712890625, 17.9951171875, 18.68310546875, 19.37109375, 20.05908203125, 20.7470703125, 21.43505859375, 22.123046875, 22.81103515625, 23.4990234375, 24.18701171875, 24.875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 8.0, 9.0, 25.0, 69.0, 168.0, 239.0, 269.0, 130.0, 51.0, 22.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.85598754882812, -81.0434341430664, -78.23088073730469, -75.41831970214844, -72.60576629638672, -69.793212890625, -66.98065948486328, -64.16810607910156, -61.35554885864258, -58.54299545288086, -55.730438232421875, -52.917884826660156, -50.10533142089844, -47.29277420043945, -44.480220794677734, -41.66766357421875, -38.85511016845703, -36.04255676269531, -33.22999954223633, -30.41744613647461, -27.604890823364258, -24.792335510253906, -21.979782104492188, -19.167226791381836, -16.354671478271484, -13.542116165161133, -10.729561805725098, -7.9170074462890625, -5.104452133178711, -2.2918968200683594, 0.5206565856933594, 3.333211898803711, 6.1457672119140625, 8.958322525024414, 11.77087688446045, 14.583431243896484, 17.395986557006836, 20.208541870117188, 23.021095275878906, 25.833650588989258, 28.64620590209961, 31.45876121520996, 34.27131652832031, 37.08386993408203, 39.89642333984375, 42.708980560302734, 45.52153396606445, 48.33409118652344, 51.146644592285156, 53.959197998046875, 56.77175521850586, 59.58430862426758, 62.39686584472656, 65.20941925048828, 68.02197265625, 70.83452606201172, 73.64707946777344, 76.45963287353516, 79.27218627929688, 82.08474731445312, 84.89730072021484, 87.70985412597656, 90.52240753173828, 93.3349609375, 96.14752197265625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 7.0, 1.0, 9.0, 12.0, 18.0, 20.0, 17.0, 25.0, 38.0, 41.0, 49.0, 45.0, 52.0, 62.0, 60.0, 65.0, 61.0, 72.0, 62.0, 40.0, 48.0, 40.0, 39.0, 26.0, 27.0, 14.0, 16.0, 11.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.14964294433594, -32.95511245727539, -31.760578155517578, -30.5660457611084, -29.37151336669922, -28.176982879638672, -26.982450485229492, -25.787918090820312, -24.593385696411133, -23.398853302001953, -22.204320907592773, -21.009788513183594, -19.815258026123047, -18.620723724365234, -17.426193237304688, -16.231660842895508, -15.037128448486328, -13.842596054077148, -12.648063659667969, -11.453532218933105, -10.258999824523926, -9.064467430114746, -7.869935512542725, -6.675403594970703, -5.480871200561523, -4.286338806152344, -3.0918068885803223, -1.8972747325897217, -0.7027425765991211, 0.4917898178100586, 1.68632173538208, 2.8808536529541016, 4.075386047363281, 5.269918441772461, 6.464450359344482, 7.658982276916504, 8.853514671325684, 10.048047065734863, 11.242578506469727, 12.437110900878906, 13.631643295288086, 14.826175689697266, 16.020708084106445, 17.215240478515625, 18.409770965576172, 19.604305267333984, 20.79883575439453, 21.99336814880371, 23.18790054321289, 24.38243293762207, 25.57696533203125, 26.77149772644043, 27.96603012084961, 29.160560607910156, 30.355093002319336, 31.549625396728516, 32.74415588378906, 33.93868637084961, 35.13322067260742, 36.32775115966797, 37.52228546142578, 38.71681594848633, 39.91135025024414, 41.10588073730469, 42.3004150390625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 11.0, 3.0, 14.0, 20.0, 22.0, 41.0, 69.0, 94.0, 170.0, 342.0, 614.0, 1438.0, 4291.0, 21736.0, 257095.0, 685734.0, 64088.0, 8456.0, 2376.0, 904.0, 437.0, 227.0, 133.0, 86.0, 57.0, 32.0, 21.0, 17.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.84375, -51.93701171875, -50.0302734375, -48.12353515625, -46.216796875, -44.31005859375, -42.4033203125, -40.49658203125, -38.58984375, -36.68310546875, -34.7763671875, -32.86962890625, -30.962890625, -29.05615234375, -27.1494140625, -25.24267578125, -23.3359375, -21.42919921875, -19.5224609375, -17.61572265625, -15.708984375, -13.80224609375, -11.8955078125, -9.98876953125, -8.08203125, -6.17529296875, -4.2685546875, -2.36181640625, -0.455078125, 1.45166015625, 3.3583984375, 5.26513671875, 7.171875, 9.07861328125, 10.9853515625, 12.89208984375, 14.798828125, 16.70556640625, 18.6123046875, 20.51904296875, 22.42578125, 24.33251953125, 26.2392578125, 28.14599609375, 30.052734375, 31.95947265625, 33.8662109375, 35.77294921875, 37.6796875, 39.58642578125, 41.4931640625, 43.39990234375, 45.306640625, 47.21337890625, 49.1201171875, 51.02685546875, 52.93359375, 54.84033203125, 56.7470703125, 58.65380859375, 60.560546875, 62.46728515625, 64.3740234375, 66.28076171875, 68.1875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 12.0, 6.0, 14.0, 24.0, 29.0, 37.0, 42.0, 51.0, 55.0, 58.0, 88.0, 90.0, 67.0, 72.0, 53.0, 53.0, 55.0, 48.0, 32.0, 21.0, 27.0, 14.0, 5.0, 7.0, 7.0, 7.0, 4.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.125, -18.4423828125, -17.759765625, -17.0771484375, -16.39453125, -15.7119140625, -15.029296875, -14.3466796875, -13.6640625, -12.9814453125, -12.298828125, -11.6162109375, -10.93359375, -10.2509765625, -9.568359375, -8.8857421875, -8.203125, -7.5205078125, -6.837890625, -6.1552734375, -5.47265625, -4.7900390625, -4.107421875, -3.4248046875, -2.7421875, -2.0595703125, -1.376953125, -0.6943359375, -0.01171875, 0.6708984375, 1.353515625, 2.0361328125, 2.71875, 3.4013671875, 4.083984375, 4.7666015625, 5.44921875, 6.1318359375, 6.814453125, 7.4970703125, 8.1796875, 8.8623046875, 9.544921875, 10.2275390625, 10.91015625, 11.5927734375, 12.275390625, 12.9580078125, 13.640625, 14.3232421875, 15.005859375, 15.6884765625, 16.37109375, 17.0537109375, 17.736328125, 18.4189453125, 19.1015625, 19.7841796875, 20.466796875, 21.1494140625, 21.83203125, 22.5146484375, 23.197265625, 23.8798828125, 24.5625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 2.0, 5.0, 6.0, 7.0, 10.0, 19.0, 23.0, 30.0, 38.0, 62.0, 125.0, 205.0, 398.0, 1068.0, 4731.0, 231777.0, 800610.0, 6998.0, 1393.0, 465.0, 223.0, 128.0, 73.0, 34.0, 32.0, 26.0, 17.0, 15.0, 2.0, 9.0, 5.0, 2.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.25, -168.984375, -163.71875, -158.453125, -153.1875, -147.921875, -142.65625, -137.390625, -132.125, -126.859375, -121.59375, -116.328125, -111.0625, -105.796875, -100.53125, -95.265625, -90.0, -84.734375, -79.46875, -74.203125, -68.9375, -63.671875, -58.40625, -53.140625, -47.875, -42.609375, -37.34375, -32.078125, -26.8125, -21.546875, -16.28125, -11.015625, -5.75, -0.484375, 4.78125, 10.046875, 15.3125, 20.578125, 25.84375, 31.109375, 36.375, 41.640625, 46.90625, 52.171875, 57.4375, 62.703125, 67.96875, 73.234375, 78.5, 83.765625, 89.03125, 94.296875, 99.5625, 104.828125, 110.09375, 115.359375, 120.625, 125.890625, 131.15625, 136.421875, 141.6875, 146.953125, 152.21875, 157.484375, 162.75]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 10.0, 10.0, 14.0, 33.0, 51.0, 60.0, 82.0, 111.0, 119.0, 125.0, 108.0, 83.0, 65.0, 36.0, 25.0, 20.0, 14.0, 10.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-197.0, -191.5, -186.0, -180.5, -175.0, -169.5, -164.0, -158.5, -153.0, -147.5, -142.0, -136.5, -131.0, -125.5, -120.0, -114.5, -109.0, -103.5, -98.0, -92.5, -87.0, -81.5, -76.0, -70.5, -65.0, -59.5, -54.0, -48.5, -43.0, -37.5, -32.0, -26.5, -21.0, -15.5, -10.0, -4.5, 1.0, 6.5, 12.0, 17.5, 23.0, 28.5, 34.0, 39.5, 45.0, 50.5, 56.0, 61.5, 67.0, 72.5, 78.0, 83.5, 89.0, 94.5, 100.0, 105.5, 111.0, 116.5, 122.0, 127.5, 133.0, 138.5, 144.0, 149.5, 155.0]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 11.0, 9.0, 15.0, 13.0, 23.0, 52.0, 69.0, 104.0, 206.0, 413.0, 1050.0, 4684.0, 76571.0, 943641.0, 17815.0, 2412.0, 742.0, 296.0, 169.0, 101.0, 58.0, 33.0, 25.0, 10.0, 11.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.03125, -42.708984375, -41.38671875, -40.064453125, -38.7421875, -37.419921875, -36.09765625, -34.775390625, -33.453125, -32.130859375, -30.80859375, -29.486328125, -28.1640625, -26.841796875, -25.51953125, -24.197265625, -22.875, -21.552734375, -20.23046875, -18.908203125, -17.5859375, -16.263671875, -14.94140625, -13.619140625, -12.296875, -10.974609375, -9.65234375, -8.330078125, -7.0078125, -5.685546875, -4.36328125, -3.041015625, -1.71875, -0.396484375, 0.92578125, 2.248046875, 3.5703125, 4.892578125, 6.21484375, 7.537109375, 8.859375, 10.181640625, 11.50390625, 12.826171875, 14.1484375, 15.470703125, 16.79296875, 18.115234375, 19.4375, 20.759765625, 22.08203125, 23.404296875, 24.7265625, 26.048828125, 27.37109375, 28.693359375, 30.015625, 31.337890625, 32.66015625, 33.982421875, 35.3046875, 36.626953125, 37.94921875, 39.271484375, 40.59375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 12.0, 3.0, 9.0, 18.0, 24.0, 47.0, 39.0, 62.0, 100.0, 139.0, 172.0, 92.0, 68.0, 58.0, 33.0, 34.0, 16.0, 18.0, 10.0, 6.0, 6.0, 4.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.003055572509765625, -0.0029730796813964844, -0.0028905868530273438, -0.002808094024658203, -0.0027256011962890625, -0.002643108367919922, -0.0025606155395507812, -0.0024781227111816406, -0.0023956298828125, -0.0023131370544433594, -0.0022306442260742188, -0.002148151397705078, -0.0020656585693359375, -0.001983165740966797, -0.0019006729125976562, -0.0018181800842285156, -0.001735687255859375, -0.0016531944274902344, -0.0015707015991210938, -0.0014882087707519531, -0.0014057159423828125, -0.0013232231140136719, -0.0012407302856445312, -0.0011582374572753906, -0.00107574462890625, -0.0009932518005371094, -0.0009107589721679688, -0.0008282661437988281, -0.0007457733154296875, -0.0006632804870605469, -0.0005807876586914062, -0.0004982948303222656, -0.000415802001953125, -0.0003333091735839844, -0.00025081634521484375, -0.00016832351684570312, -8.58306884765625e-05, -3.337860107421875e-06, 7.915496826171875e-05, 0.00016164779663085938, 0.000244140625, 0.0003266334533691406, 0.00040912628173828125, 0.0004916191101074219, 0.0005741119384765625, 0.0006566047668457031, 0.0007390975952148438, 0.0008215904235839844, 0.000904083251953125, 0.0009865760803222656, 0.0010690689086914062, 0.0011515617370605469, 0.0012340545654296875, 0.0013165473937988281, 0.0013990402221679688, 0.0014815330505371094, 0.00156402587890625, 0.0016465187072753906, 0.0017290115356445312, 0.0018115043640136719, 0.0018939971923828125, 0.001976490020751953, 0.0020589828491210938, 0.0021414756774902344, 0.002223968505859375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 9.0, 8.0, 12.0, 14.0, 18.0, 31.0, 54.0, 85.0, 161.0, 309.0, 780.0, 3659.0, 90687.0, 941162.0, 9209.0, 1388.0, 478.0, 200.0, 92.0, 45.0, 35.0, 21.0, 14.0, 5.0, 12.0, 11.0, 6.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.53125, -43.05712890625, -41.5830078125, -40.10888671875, -38.634765625, -37.16064453125, -35.6865234375, -34.21240234375, -32.73828125, -31.26416015625, -29.7900390625, -28.31591796875, -26.841796875, -25.36767578125, -23.8935546875, -22.41943359375, -20.9453125, -19.47119140625, -17.9970703125, -16.52294921875, -15.048828125, -13.57470703125, -12.1005859375, -10.62646484375, -9.15234375, -7.67822265625, -6.2041015625, -4.72998046875, -3.255859375, -1.78173828125, -0.3076171875, 1.16650390625, 2.640625, 4.11474609375, 5.5888671875, 7.06298828125, 8.537109375, 10.01123046875, 11.4853515625, 12.95947265625, 14.43359375, 15.90771484375, 17.3818359375, 18.85595703125, 20.330078125, 21.80419921875, 23.2783203125, 24.75244140625, 26.2265625, 27.70068359375, 29.1748046875, 30.64892578125, 32.123046875, 33.59716796875, 35.0712890625, 36.54541015625, 38.01953125, 39.49365234375, 40.9677734375, 42.44189453125, 43.916015625, 45.39013671875, 46.8642578125, 48.33837890625, 49.8125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 6.0, 7.0, 8.0, 26.0, 45.0, 48.0, 98.0, 138.0, 162.0, 148.0, 117.0, 62.0, 37.0, 22.0, 18.0, 9.0, 6.0, 3.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.796875, -28.857177734375, -27.91748046875, -26.977783203125, -26.0380859375, -25.098388671875, -24.15869140625, -23.218994140625, -22.279296875, -21.339599609375, -20.39990234375, -19.460205078125, -18.5205078125, -17.580810546875, -16.64111328125, -15.701416015625, -14.76171875, -13.822021484375, -12.88232421875, -11.942626953125, -11.0029296875, -10.063232421875, -9.12353515625, -8.183837890625, -7.244140625, -6.304443359375, -5.36474609375, -4.425048828125, -3.4853515625, -2.545654296875, -1.60595703125, -0.666259765625, 0.2734375, 1.213134765625, 2.15283203125, 3.092529296875, 4.0322265625, 4.971923828125, 5.91162109375, 6.851318359375, 7.791015625, 8.730712890625, 9.67041015625, 10.610107421875, 11.5498046875, 12.489501953125, 13.42919921875, 14.368896484375, 15.30859375, 16.248291015625, 17.18798828125, 18.127685546875, 19.0673828125, 20.007080078125, 20.94677734375, 21.886474609375, 22.826171875, 23.765869140625, 24.70556640625, 25.645263671875, 26.5849609375, 27.524658203125, 28.46435546875, 29.404052734375, 30.34375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 75.0, 584.0, 297.0, 35.0, 3.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1130.808349609375, -1083.1214599609375, -1035.4345703125, -987.7477416992188, -940.0609130859375, -892.3740234375, -844.6871337890625, -797.000244140625, -749.3134155273438, -701.6265258789062, -653.939697265625, -606.2528076171875, -558.56591796875, -510.87908935546875, -463.19219970703125, -415.5053405761719, -367.8184814453125, -320.1316223144531, -272.44476318359375, -224.75787353515625, -177.07101440429688, -129.3841552734375, -81.697265625, -34.010406494140625, 13.67645263671875, 61.363319396972656, 109.05018615722656, 156.737060546875, 204.42391967773438, 252.11077880859375, 299.79766845703125, 347.4845275878906, 395.1715087890625, 442.8583679199219, 490.54522705078125, 538.2321166992188, 585.9189453125, 633.6058349609375, 681.292724609375, 728.9796142578125, 776.6664428710938, 824.3533325195312, 872.0401611328125, 919.72705078125, 967.4139404296875, 1015.1007690429688, 1062.78759765625, 1110.4744873046875, 1158.161376953125, 1205.8482666015625, 1253.53515625, 1301.221923828125, 1348.9088134765625, 1396.595703125, 1444.2825927734375, 1491.969482421875, 1539.65625, 1587.3431396484375, 1635.030029296875, 1682.716796875, 1730.4036865234375, 1778.090576171875, 1825.7774658203125, 1873.46435546875, 1921.1512451171875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 11.0, 7.0, 8.0, 18.0, 24.0, 29.0, 19.0, 29.0, 45.0, 35.0, 38.0, 35.0, 37.0, 44.0, 43.0, 45.0, 64.0, 53.0, 41.0, 48.0, 54.0, 36.0, 36.0, 28.0, 37.0, 19.0, 23.0, 16.0, 12.0, 19.0, 6.0, 10.0, 2.0, 2.0, 5.0, 3.0, 2.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-357.4586486816406, -347.0057373046875, -336.5528564453125, -326.0999450683594, -315.64703369140625, -305.19415283203125, -294.7412414550781, -284.288330078125, -273.83544921875, -263.3825378417969, -252.92965698242188, -242.47674560546875, -232.0238494873047, -221.57095336914062, -211.1180419921875, -200.66514587402344, -190.21224975585938, -179.7593536376953, -169.30645751953125, -158.85354614257812, -148.40065002441406, -137.94775390625, -127.4948501586914, -117.04194641113281, -106.58905029296875, -96.13615417480469, -85.6832504272461, -75.2303466796875, -64.77745056152344, -54.32455062866211, -43.87165069580078, -33.41874694824219, -22.965850830078125, -12.512950897216797, -2.0600509643554688, 8.39284896850586, 18.845748901367188, 29.298648834228516, 39.751548767089844, 50.20445251464844, 60.6573486328125, 71.11024475097656, 81.56314849853516, 92.01605224609375, 102.46894836425781, 112.92184448242188, 123.37474822998047, 133.82765197753906, 144.28054809570312, 154.7334442138672, 165.18634033203125, 175.63925170898438, 186.09214782714844, 196.5450439453125, 206.99795532226562, 217.4508514404297, 227.90374755859375, 238.3566436767578, 248.80953979492188, 259.262451171875, 269.71533203125, 280.1682434082031, 290.62115478515625, 301.07403564453125, 311.5269470214844]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 15.0, 12.0, 23.0, 25.0, 76.0, 121.0, 206.0, 462.0, 1016.0, 2721.0, 9488.0, 72748.0, 3666735.0, 413302.0, 20200.0, 4356.0, 1450.0, 633.0, 317.0, 145.0, 81.0, 38.0, 38.0, 23.0, 7.0, 15.0, 5.0, 7.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.84375, -22.693359375, -21.54296875, -20.392578125, -19.2421875, -18.091796875, -16.94140625, -15.791015625, -14.640625, -13.490234375, -12.33984375, -11.189453125, -10.0390625, -8.888671875, -7.73828125, -6.587890625, -5.4375, -4.287109375, -3.13671875, -1.986328125, -0.8359375, 0.314453125, 1.46484375, 2.615234375, 3.765625, 4.916015625, 6.06640625, 7.216796875, 8.3671875, 9.517578125, 10.66796875, 11.818359375, 12.96875, 14.119140625, 15.26953125, 16.419921875, 17.5703125, 18.720703125, 19.87109375, 21.021484375, 22.171875, 23.322265625, 24.47265625, 25.623046875, 26.7734375, 27.923828125, 29.07421875, 30.224609375, 31.375, 32.525390625, 33.67578125, 34.826171875, 35.9765625, 37.126953125, 38.27734375, 39.427734375, 40.578125, 41.728515625, 42.87890625, 44.029296875, 45.1796875, 46.330078125, 47.48046875, 48.630859375, 49.78125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 10.0, 8.0, 10.0, 19.0, 12.0, 28.0, 30.0, 44.0, 59.0, 73.0, 73.0, 86.0, 88.0, 88.0, 60.0, 71.0, 65.0, 52.0, 43.0, 23.0, 18.0, 11.0, 6.0, 3.0, 6.0, 8.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.9375, -22.1318359375, -21.326171875, -20.5205078125, -19.71484375, -18.9091796875, -18.103515625, -17.2978515625, -16.4921875, -15.6865234375, -14.880859375, -14.0751953125, -13.26953125, -12.4638671875, -11.658203125, -10.8525390625, -10.046875, -9.2412109375, -8.435546875, -7.6298828125, -6.82421875, -6.0185546875, -5.212890625, -4.4072265625, -3.6015625, -2.7958984375, -1.990234375, -1.1845703125, -0.37890625, 0.4267578125, 1.232421875, 2.0380859375, 2.84375, 3.6494140625, 4.455078125, 5.2607421875, 6.06640625, 6.8720703125, 7.677734375, 8.4833984375, 9.2890625, 10.0947265625, 10.900390625, 11.7060546875, 12.51171875, 13.3173828125, 14.123046875, 14.9287109375, 15.734375, 16.5400390625, 17.345703125, 18.1513671875, 18.95703125, 19.7626953125, 20.568359375, 21.3740234375, 22.1796875, 22.9853515625, 23.791015625, 24.5966796875, 25.40234375, 26.2080078125, 27.013671875, 27.8193359375, 28.625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 6.0, 10.0, 7.0, 15.0, 20.0, 34.0, 56.0, 115.0, 300.0, 875.0, 2970.0, 16347.0, 332823.0, 3789565.0, 43632.0, 5438.0, 1298.0, 419.0, 132.0, 78.0, 41.0, 24.0, 17.0, 11.0, 8.0, 6.0, 5.0, 6.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-47.03125, -45.61572265625, -44.2001953125, -42.78466796875, -41.369140625, -39.95361328125, -38.5380859375, -37.12255859375, -35.70703125, -34.29150390625, -32.8759765625, -31.46044921875, -30.044921875, -28.62939453125, -27.2138671875, -25.79833984375, -24.3828125, -22.96728515625, -21.5517578125, -20.13623046875, -18.720703125, -17.30517578125, -15.8896484375, -14.47412109375, -13.05859375, -11.64306640625, -10.2275390625, -8.81201171875, -7.396484375, -5.98095703125, -4.5654296875, -3.14990234375, -1.734375, -0.31884765625, 1.0966796875, 2.51220703125, 3.927734375, 5.34326171875, 6.7587890625, 8.17431640625, 9.58984375, 11.00537109375, 12.4208984375, 13.83642578125, 15.251953125, 16.66748046875, 18.0830078125, 19.49853515625, 20.9140625, 22.32958984375, 23.7451171875, 25.16064453125, 26.576171875, 27.99169921875, 29.4072265625, 30.82275390625, 32.23828125, 33.65380859375, 35.0693359375, 36.48486328125, 37.900390625, 39.31591796875, 40.7314453125, 42.14697265625, 43.5625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 9.0, 8.0, 13.0, 14.0, 29.0, 24.0, 37.0, 92.0, 179.0, 494.0, 1506.0, 1092.0, 343.0, 96.0, 46.0, 23.0, 20.0, 8.0, 8.0, 4.0, 5.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.15625, -37.84375, -36.53125, -35.21875, -33.90625, -32.59375, -31.28125, -29.96875, -28.65625, -27.34375, -26.03125, -24.71875, -23.40625, -22.09375, -20.78125, -19.46875, -18.15625, -16.84375, -15.53125, -14.21875, -12.90625, -11.59375, -10.28125, -8.96875, -7.65625, -6.34375, -5.03125, -3.71875, -2.40625, -1.09375, 0.21875, 1.53125, 2.84375, 4.15625, 5.46875, 6.78125, 8.09375, 9.40625, 10.71875, 12.03125, 13.34375, 14.65625, 15.96875, 17.28125, 18.59375, 19.90625, 21.21875, 22.53125, 23.84375, 25.15625, 26.46875, 27.78125, 29.09375, 30.40625, 31.71875, 33.03125, 34.34375, 35.65625, 36.96875, 38.28125, 39.59375, 40.90625, 42.21875, 43.53125, 44.84375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 8.0, 11.0, 27.0, 58.0, 141.0, 327.0, 310.0, 78.0, 22.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-676.4151611328125, -662.9236450195312, -649.4321899414062, -635.940673828125, -622.4491577148438, -608.9576416015625, -595.4661865234375, -581.9746704101562, -568.483154296875, -554.9916381835938, -541.5001831054688, -528.0086669921875, -514.5171508789062, -501.0256652832031, -487.5341491699219, -474.04266357421875, -460.5511474609375, -447.0596618652344, -433.5681457519531, -420.07666015625, -406.58514404296875, -393.0936584472656, -379.6021423339844, -366.11065673828125, -352.6191711425781, -339.127685546875, -325.63616943359375, -312.1446838378906, -298.6531677246094, -285.16168212890625, -271.670166015625, -258.1786804199219, -244.68716430664062, -231.19566345214844, -217.70416259765625, -204.21266174316406, -190.72116088867188, -177.22967529296875, -163.7381591796875, -150.24667358398438, -136.75515747070312, -123.26365661621094, -109.77215576171875, -96.28065490722656, -82.78915405273438, -69.29766082763672, -55.80615997314453, -42.314659118652344, -28.823165893554688, -15.331665992736816, -1.8401660919189453, 11.65133285522461, 25.142833709716797, 38.63433074951172, 52.125831604003906, 65.6173324584961, 79.10883331298828, 92.60033416748047, 106.09183502197266, 119.58332824707031, 133.0748291015625, 146.5663299560547, 160.05783081054688, 173.54933166503906, 187.04083251953125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 10.0, 12.0, 7.0, 14.0, 18.0, 32.0, 24.0, 41.0, 56.0, 63.0, 64.0, 65.0, 73.0, 61.0, 54.0, 67.0, 72.0, 45.0, 49.0, 43.0, 30.0, 19.0, 14.0, 24.0, 10.0, 11.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-232.3013153076172, -225.70785522460938, -219.1143798828125, -212.52090454101562, -205.9274444580078, -199.333984375, -192.74050903320312, -186.14703369140625, -179.55357360839844, -172.96011352539062, -166.36663818359375, -159.77316284179688, -153.17970275878906, -146.58624267578125, -139.99276733398438, -133.3992919921875, -126.80583190917969, -120.21236419677734, -113.618896484375, -107.02542877197266, -100.43196105957031, -93.83849334716797, -87.24502563476562, -80.65155792236328, -74.05809020996094, -67.4646224975586, -60.87115478515625, -54.277687072753906, -47.68421936035156, -41.09075164794922, -34.497283935546875, -27.90381622314453, -21.310333251953125, -14.716865539550781, -8.123397827148438, -1.5299301147460938, 5.06353759765625, 11.657005310058594, 18.250473022460938, 24.84394073486328, 31.437408447265625, 38.03087615966797, 44.62434387207031, 51.217811584472656, 57.811279296875, 64.40474700927734, 70.99821472167969, 77.59168243408203, 84.18515014648438, 90.77861785888672, 97.37208557128906, 103.9655532836914, 110.55902099609375, 117.1524887084961, 123.74595642089844, 130.33941650390625, 136.93289184570312, 143.5263671875, 150.1198272705078, 156.71328735351562, 163.3067626953125, 169.90023803710938, 176.4936981201172, 183.087158203125, 189.68063354492188]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 6.0, 6.0, 5.0, 9.0, 14.0, 19.0, 27.0, 37.0, 53.0, 90.0, 120.0, 239.0, 353.0, 644.0, 1197.0, 2570.0, 6756.0, 23426.0, 113815.0, 619617.0, 223538.0, 38646.0, 10258.0, 3635.0, 1560.0, 721.0, 451.0, 259.0, 153.0, 102.0, 68.0, 44.0, 36.0, 24.0, 17.0, 12.0, 5.0, 10.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.3125, -35.0888671875, -33.865234375, -32.6416015625, -31.41796875, -30.1943359375, -28.970703125, -27.7470703125, -26.5234375, -25.2998046875, -24.076171875, -22.8525390625, -21.62890625, -20.4052734375, -19.181640625, -17.9580078125, -16.734375, -15.5107421875, -14.287109375, -13.0634765625, -11.83984375, -10.6162109375, -9.392578125, -8.1689453125, -6.9453125, -5.7216796875, -4.498046875, -3.2744140625, -2.05078125, -0.8271484375, 0.396484375, 1.6201171875, 2.84375, 4.0673828125, 5.291015625, 6.5146484375, 7.73828125, 8.9619140625, 10.185546875, 11.4091796875, 12.6328125, 13.8564453125, 15.080078125, 16.3037109375, 17.52734375, 18.7509765625, 19.974609375, 21.1982421875, 22.421875, 23.6455078125, 24.869140625, 26.0927734375, 27.31640625, 28.5400390625, 29.763671875, 30.9873046875, 32.2109375, 33.4345703125, 34.658203125, 35.8818359375, 37.10546875, 38.3291015625, 39.552734375, 40.7763671875, 42.0]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 5.0, 18.0, 15.0, 19.0, 20.0, 41.0, 51.0, 74.0, 69.0, 95.0, 92.0, 109.0, 68.0, 66.0, 68.0, 49.0, 46.0, 35.0, 16.0, 12.0, 8.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.28125, -22.4765625, -21.671875, -20.8671875, -20.0625, -19.2578125, -18.453125, -17.6484375, -16.84375, -16.0390625, -15.234375, -14.4296875, -13.625, -12.8203125, -12.015625, -11.2109375, -10.40625, -9.6015625, -8.796875, -7.9921875, -7.1875, -6.3828125, -5.578125, -4.7734375, -3.96875, -3.1640625, -2.359375, -1.5546875, -0.75, 0.0546875, 0.859375, 1.6640625, 2.46875, 3.2734375, 4.078125, 4.8828125, 5.6875, 6.4921875, 7.296875, 8.1015625, 8.90625, 9.7109375, 10.515625, 11.3203125, 12.125, 12.9296875, 13.734375, 14.5390625, 15.34375, 16.1484375, 16.953125, 17.7578125, 18.5625, 19.3671875, 20.171875, 20.9765625, 21.78125, 22.5859375, 23.390625, 24.1953125, 25.0, 25.8046875, 26.609375, 27.4140625, 28.21875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 12.0, 12.0, 18.0, 41.0, 34.0, 67.0, 99.0, 194.0, 389.0, 1350.0, 8918.0, 979397.0, 53767.0, 2939.0, 672.0, 269.0, 126.0, 88.0, 38.0, 34.0, 19.0, 13.0, 13.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-200.375, -194.4375, -188.5, -182.5625, -176.625, -170.6875, -164.75, -158.8125, -152.875, -146.9375, -141.0, -135.0625, -129.125, -123.1875, -117.25, -111.3125, -105.375, -99.4375, -93.5, -87.5625, -81.625, -75.6875, -69.75, -63.8125, -57.875, -51.9375, -46.0, -40.0625, -34.125, -28.1875, -22.25, -16.3125, -10.375, -4.4375, 1.5, 7.4375, 13.375, 19.3125, 25.25, 31.1875, 37.125, 43.0625, 49.0, 54.9375, 60.875, 66.8125, 72.75, 78.6875, 84.625, 90.5625, 96.5, 102.4375, 108.375, 114.3125, 120.25, 126.1875, 132.125, 138.0625, 144.0, 149.9375, 155.875, 161.8125, 167.75, 173.6875, 179.625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 8.0, 4.0, 4.0, 25.0, 21.0, 43.0, 72.0, 107.0, 130.0, 146.0, 128.0, 119.0, 83.0, 46.0, 23.0, 14.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-222.5, -216.587890625, -210.67578125, -204.763671875, -198.8515625, -192.939453125, -187.02734375, -181.115234375, -175.203125, -169.291015625, -163.37890625, -157.466796875, -151.5546875, -145.642578125, -139.73046875, -133.818359375, -127.90625, -121.994140625, -116.08203125, -110.169921875, -104.2578125, -98.345703125, -92.43359375, -86.521484375, -80.609375, -74.697265625, -68.78515625, -62.873046875, -56.9609375, -51.048828125, -45.13671875, -39.224609375, -33.3125, -27.400390625, -21.48828125, -15.576171875, -9.6640625, -3.751953125, 2.16015625, 8.072265625, 13.984375, 19.896484375, 25.80859375, 31.720703125, 37.6328125, 43.544921875, 49.45703125, 55.369140625, 61.28125, 67.193359375, 73.10546875, 79.017578125, 84.9296875, 90.841796875, 96.75390625, 102.666015625, 108.578125, 114.490234375, 120.40234375, 126.314453125, 132.2265625, 138.138671875, 144.05078125, 149.962890625, 155.875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 8.0, 11.0, 13.0, 12.0, 25.0, 30.0, 42.0, 81.0, 141.0, 228.0, 608.0, 2022.0, 14382.0, 988254.0, 38092.0, 3057.0, 793.0, 317.0, 150.0, 86.0, 54.0, 42.0, 29.0, 14.0, 17.0, 7.0, 8.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.875, -62.94677734375, -61.0185546875, -59.09033203125, -57.162109375, -55.23388671875, -53.3056640625, -51.37744140625, -49.44921875, -47.52099609375, -45.5927734375, -43.66455078125, -41.736328125, -39.80810546875, -37.8798828125, -35.95166015625, -34.0234375, -32.09521484375, -30.1669921875, -28.23876953125, -26.310546875, -24.38232421875, -22.4541015625, -20.52587890625, -18.59765625, -16.66943359375, -14.7412109375, -12.81298828125, -10.884765625, -8.95654296875, -7.0283203125, -5.10009765625, -3.171875, -1.24365234375, 0.6845703125, 2.61279296875, 4.541015625, 6.46923828125, 8.3974609375, 10.32568359375, 12.25390625, 14.18212890625, 16.1103515625, 18.03857421875, 19.966796875, 21.89501953125, 23.8232421875, 25.75146484375, 27.6796875, 29.60791015625, 31.5361328125, 33.46435546875, 35.392578125, 37.32080078125, 39.2490234375, 41.17724609375, 43.10546875, 45.03369140625, 46.9619140625, 48.89013671875, 50.818359375, 52.74658203125, 54.6748046875, 56.60302734375, 58.53125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 6.0, 15.0, 23.0, 21.0, 27.0, 35.0, 79.0, 133.0, 242.0, 172.0, 75.0, 41.0, 38.0, 22.0, 15.0, 12.0, 9.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.004375457763671875, -0.004262089729309082, -0.004148721694946289, -0.004035353660583496, -0.003921985626220703, -0.00380861759185791, -0.003695249557495117, -0.0035818815231323242, -0.0034685134887695312, -0.0033551454544067383, -0.0032417774200439453, -0.0031284093856811523, -0.0030150413513183594, -0.0029016733169555664, -0.0027883052825927734, -0.0026749372482299805, -0.0025615692138671875, -0.0024482011795043945, -0.0023348331451416016, -0.0022214651107788086, -0.0021080970764160156, -0.0019947290420532227, -0.0018813610076904297, -0.0017679929733276367, -0.0016546249389648438, -0.0015412569046020508, -0.0014278888702392578, -0.0013145208358764648, -0.0012011528015136719, -0.001087784767150879, -0.0009744167327880859, -0.000861048698425293, -0.0007476806640625, -0.000634312629699707, -0.0005209445953369141, -0.0004075765609741211, -0.0002942085266113281, -0.00018084049224853516, -6.747245788574219e-05, 4.589557647705078e-05, 0.00015926361083984375, 0.0002726316452026367, 0.0003859996795654297, 0.0004993677139282227, 0.0006127357482910156, 0.0007261037826538086, 0.0008394718170166016, 0.0009528398513793945, 0.0010662078857421875, 0.0011795759201049805, 0.0012929439544677734, 0.0014063119888305664, 0.0015196800231933594, 0.0016330480575561523, 0.0017464160919189453, 0.0018597841262817383, 0.0019731521606445312, 0.0020865201950073242, 0.002199888229370117, 0.00231325626373291, 0.002426624298095703, 0.002539992332458496, 0.002653360366821289, 0.002766728401184082, 0.002880096435546875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 5.0, 12.0, 27.0, 30.0, 39.0, 50.0, 55.0, 101.0, 154.0, 267.0, 503.0, 1326.0, 5466.0, 87583.0, 935833.0, 13127.0, 2249.0, 777.0, 356.0, 195.0, 111.0, 64.0, 58.0, 33.0, 29.0, 20.0, 16.0, 13.0, 8.0, 11.0, 3.0, 4.0, 3.0, 0.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.3125, -41.830078125, -40.34765625, -38.865234375, -37.3828125, -35.900390625, -34.41796875, -32.935546875, -31.453125, -29.970703125, -28.48828125, -27.005859375, -25.5234375, -24.041015625, -22.55859375, -21.076171875, -19.59375, -18.111328125, -16.62890625, -15.146484375, -13.6640625, -12.181640625, -10.69921875, -9.216796875, -7.734375, -6.251953125, -4.76953125, -3.287109375, -1.8046875, -0.322265625, 1.16015625, 2.642578125, 4.125, 5.607421875, 7.08984375, 8.572265625, 10.0546875, 11.537109375, 13.01953125, 14.501953125, 15.984375, 17.466796875, 18.94921875, 20.431640625, 21.9140625, 23.396484375, 24.87890625, 26.361328125, 27.84375, 29.326171875, 30.80859375, 32.291015625, 33.7734375, 35.255859375, 36.73828125, 38.220703125, 39.703125, 41.185546875, 42.66796875, 44.150390625, 45.6328125, 47.115234375, 48.59765625, 50.080078125, 51.5625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 6.0, 4.0, 10.0, 14.0, 13.0, 30.0, 53.0, 96.0, 191.0, 228.0, 140.0, 74.0, 44.0, 18.0, 13.0, 10.0, 13.0, 13.0, 3.0, 5.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.25, -35.09326171875, -33.9365234375, -32.77978515625, -31.623046875, -30.46630859375, -29.3095703125, -28.15283203125, -26.99609375, -25.83935546875, -24.6826171875, -23.52587890625, -22.369140625, -21.21240234375, -20.0556640625, -18.89892578125, -17.7421875, -16.58544921875, -15.4287109375, -14.27197265625, -13.115234375, -11.95849609375, -10.8017578125, -9.64501953125, -8.48828125, -7.33154296875, -6.1748046875, -5.01806640625, -3.861328125, -2.70458984375, -1.5478515625, -0.39111328125, 0.765625, 1.92236328125, 3.0791015625, 4.23583984375, 5.392578125, 6.54931640625, 7.7060546875, 8.86279296875, 10.01953125, 11.17626953125, 12.3330078125, 13.48974609375, 14.646484375, 15.80322265625, 16.9599609375, 18.11669921875, 19.2734375, 20.43017578125, 21.5869140625, 22.74365234375, 23.900390625, 25.05712890625, 26.2138671875, 27.37060546875, 28.52734375, 29.68408203125, 30.8408203125, 31.99755859375, 33.154296875, 34.31103515625, 35.4677734375, 36.62451171875, 37.78125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 28.0, 203.0, 483.0, 211.0, 36.0, 11.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-652.607666015625, -624.6851196289062, -596.7625732421875, -568.8400268554688, -540.91748046875, -512.9949340820312, -485.0724182128906, -457.1498718261719, -429.2273254394531, -401.3047790527344, -373.3822326660156, -345.459716796875, -317.53717041015625, -289.6146240234375, -261.69207763671875, -233.76953125, -205.84698486328125, -177.9244384765625, -150.00189208984375, -122.07936096191406, -94.15681457519531, -66.23426818847656, -38.311737060546875, -10.389190673828125, 17.533355712890625, 45.45589828491211, 73.3784408569336, 101.30097961425781, 129.22352600097656, 157.1460723876953, 185.068603515625, 212.99114990234375, 240.9136962890625, 268.83624267578125, 296.7587890625, 324.68133544921875, 352.6038818359375, 380.52642822265625, 408.4489440917969, 436.3714904785156, 464.2940368652344, 492.2165832519531, 520.1390991210938, 548.0616455078125, 575.9841918945312, 603.90673828125, 631.8292846679688, 659.7518310546875, 687.6743774414062, 715.596923828125, 743.5194702148438, 771.4420166015625, 799.3645629882812, 827.287109375, 855.2095947265625, 883.1322021484375, 911.0546875, 938.9772338867188, 966.8997802734375, 994.8223266601562, 1022.744873046875, 1050.6673583984375, 1078.5899658203125, 1106.512451171875, 1134.43505859375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 6.0, 15.0, 9.0, 18.0, 22.0, 26.0, 26.0, 27.0, 39.0, 30.0, 39.0, 44.0, 35.0, 33.0, 62.0, 57.0, 60.0, 57.0, 59.0, 52.0, 35.0, 45.0, 30.0, 27.0, 25.0, 28.0, 7.0, 11.0, 17.0, 11.0, 6.0, 5.0, 7.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-281.2420349121094, -271.57293701171875, -261.90380859375, -252.23471069335938, -242.56561279296875, -232.89651489257812, -223.22740173339844, -213.55828857421875, -203.88919067382812, -194.2200927734375, -184.5509796142578, -174.88186645507812, -165.2127685546875, -155.54367065429688, -145.8745574951172, -136.2054443359375, -126.53634643554688, -116.86724090576172, -107.19813537597656, -97.5290298461914, -87.85992431640625, -78.1908187866211, -68.52171325683594, -58.85260772705078, -49.183502197265625, -39.51439666748047, -29.845291137695312, -20.176185607910156, -10.507080078125, -0.8379745483398438, 8.831130981445312, 18.50023651123047, 28.16937255859375, 37.838478088378906, 47.50758361816406, 57.17668914794922, 66.84579467773438, 76.51490020751953, 86.18400573730469, 95.85311126708984, 105.522216796875, 115.19132232666016, 124.86042785644531, 134.529541015625, 144.19863891601562, 153.86773681640625, 163.53684997558594, 173.20596313476562, 182.87506103515625, 192.54415893554688, 202.21327209472656, 211.88238525390625, 221.55148315429688, 231.2205810546875, 240.8896942138672, 250.55880737304688, 260.2279052734375, 269.8970031738281, 279.56610107421875, 289.2352294921875, 298.9043273925781, 308.57342529296875, 318.2425537109375, 327.9116516113281, 337.58074951171875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 10.0, 11.0, 22.0, 41.0, 81.0, 190.0, 487.0, 1362.0, 4516.0, 26114.0, 3121207.0, 1018680.0, 16430.0, 3283.0, 1030.0, 423.0, 182.0, 99.0, 38.0, 32.0, 19.0, 11.0, 14.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-44.78125, -43.5341796875, -42.287109375, -41.0400390625, -39.79296875, -38.5458984375, -37.298828125, -36.0517578125, -34.8046875, -33.5576171875, -32.310546875, -31.0634765625, -29.81640625, -28.5693359375, -27.322265625, -26.0751953125, -24.828125, -23.5810546875, -22.333984375, -21.0869140625, -19.83984375, -18.5927734375, -17.345703125, -16.0986328125, -14.8515625, -13.6044921875, -12.357421875, -11.1103515625, -9.86328125, -8.6162109375, -7.369140625, -6.1220703125, -4.875, -3.6279296875, -2.380859375, -1.1337890625, 0.11328125, 1.3603515625, 2.607421875, 3.8544921875, 5.1015625, 6.3486328125, 7.595703125, 8.8427734375, 10.08984375, 11.3369140625, 12.583984375, 13.8310546875, 15.078125, 16.3251953125, 17.572265625, 18.8193359375, 20.06640625, 21.3134765625, 22.560546875, 23.8076171875, 25.0546875, 26.3017578125, 27.548828125, 28.7958984375, 30.04296875, 31.2900390625, 32.537109375, 33.7841796875, 35.03125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 8.0, 8.0, 12.0, 17.0, 11.0, 26.0, 38.0, 47.0, 46.0, 59.0, 67.0, 65.0, 76.0, 81.0, 70.0, 64.0, 43.0, 51.0, 53.0, 40.0, 25.0, 18.0, 21.0, 14.0, 11.0, 3.0, 5.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.125, -13.54150390625, -12.9580078125, -12.37451171875, -11.791015625, -11.20751953125, -10.6240234375, -10.04052734375, -9.45703125, -8.87353515625, -8.2900390625, -7.70654296875, -7.123046875, -6.53955078125, -5.9560546875, -5.37255859375, -4.7890625, -4.20556640625, -3.6220703125, -3.03857421875, -2.455078125, -1.87158203125, -1.2880859375, -0.70458984375, -0.12109375, 0.46240234375, 1.0458984375, 1.62939453125, 2.212890625, 2.79638671875, 3.3798828125, 3.96337890625, 4.546875, 5.13037109375, 5.7138671875, 6.29736328125, 6.880859375, 7.46435546875, 8.0478515625, 8.63134765625, 9.21484375, 9.79833984375, 10.3818359375, 10.96533203125, 11.548828125, 12.13232421875, 12.7158203125, 13.29931640625, 13.8828125, 14.46630859375, 15.0498046875, 15.63330078125, 16.216796875, 16.80029296875, 17.3837890625, 17.96728515625, 18.55078125, 19.13427734375, 19.7177734375, 20.30126953125, 20.884765625, 21.46826171875, 22.0517578125, 22.63525390625, 23.21875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 9.0, 12.0, 16.0, 32.0, 64.0, 134.0, 294.0, 735.0, 2084.0, 7545.0, 45121.0, 3242508.0, 862942.0, 25316.0, 4924.0, 1561.0, 570.0, 219.0, 87.0, 53.0, 18.0, 12.0, 3.0, 8.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.875, -36.847900390625, -35.82080078125, -34.793701171875, -33.7666015625, -32.739501953125, -31.71240234375, -30.685302734375, -29.658203125, -28.631103515625, -27.60400390625, -26.576904296875, -25.5498046875, -24.522705078125, -23.49560546875, -22.468505859375, -21.44140625, -20.414306640625, -19.38720703125, -18.360107421875, -17.3330078125, -16.305908203125, -15.27880859375, -14.251708984375, -13.224609375, -12.197509765625, -11.17041015625, -10.143310546875, -9.1162109375, -8.089111328125, -7.06201171875, -6.034912109375, -5.0078125, -3.980712890625, -2.95361328125, -1.926513671875, -0.8994140625, 0.127685546875, 1.15478515625, 2.181884765625, 3.208984375, 4.236083984375, 5.26318359375, 6.290283203125, 7.3173828125, 8.344482421875, 9.37158203125, 10.398681640625, 11.42578125, 12.452880859375, 13.47998046875, 14.507080078125, 15.5341796875, 16.561279296875, 17.58837890625, 18.615478515625, 19.642578125, 20.669677734375, 21.69677734375, 22.723876953125, 23.7509765625, 24.778076171875, 25.80517578125, 26.832275390625, 27.859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 9.0, 8.0, 5.0, 18.0, 19.0, 47.0, 104.0, 272.0, 795.0, 1473.0, 811.0, 251.0, 111.0, 47.0, 35.0, 22.0, 11.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.65625, -35.65478515625, -34.6533203125, -33.65185546875, -32.650390625, -31.64892578125, -30.6474609375, -29.64599609375, -28.64453125, -27.64306640625, -26.6416015625, -25.64013671875, -24.638671875, -23.63720703125, -22.6357421875, -21.63427734375, -20.6328125, -19.63134765625, -18.6298828125, -17.62841796875, -16.626953125, -15.62548828125, -14.6240234375, -13.62255859375, -12.62109375, -11.61962890625, -10.6181640625, -9.61669921875, -8.615234375, -7.61376953125, -6.6123046875, -5.61083984375, -4.609375, -3.60791015625, -2.6064453125, -1.60498046875, -0.603515625, 0.39794921875, 1.3994140625, 2.40087890625, 3.40234375, 4.40380859375, 5.4052734375, 6.40673828125, 7.408203125, 8.40966796875, 9.4111328125, 10.41259765625, 11.4140625, 12.41552734375, 13.4169921875, 14.41845703125, 15.419921875, 16.42138671875, 17.4228515625, 18.42431640625, 19.42578125, 20.42724609375, 21.4287109375, 22.43017578125, 23.431640625, 24.43310546875, 25.4345703125, 26.43603515625, 27.4375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 4.0, 9.0, 28.0, 34.0, 124.0, 235.0, 282.0, 168.0, 67.0, 21.0, 7.0, 8.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-300.57952880859375, -292.78155517578125, -284.9836120605469, -277.1856384277344, -269.3876647949219, -261.5897216796875, -253.791748046875, -245.99378967285156, -238.19583129882812, -230.3978729248047, -222.5998992919922, -214.80194091796875, -207.0039825439453, -199.20602416992188, -191.40805053710938, -183.61009216308594, -175.81211853027344, -168.01416015625, -160.2161865234375, -152.41822814941406, -144.62026977539062, -136.82229614257812, -129.0243377685547, -121.22637939453125, -113.42841339111328, -105.63044738769531, -97.83248901367188, -90.0345230102539, -82.23655700683594, -74.4385986328125, -66.64063262939453, -58.84267044067383, -51.04472351074219, -43.246761322021484, -35.44879913330078, -27.650833129882812, -19.85287094116211, -12.054908752441406, -4.2569427490234375, 3.5410194396972656, 11.338981628417969, 19.136943817138672, 26.934907913208008, 34.732872009277344, 42.53083419799805, 50.32879638671875, 58.12676239013672, 65.92472839355469, 73.72268676757812, 81.5206527709961, 89.31861114501953, 97.1165771484375, 104.91453552246094, 112.7125015258789, 120.51046752929688, 128.3084259033203, 136.10638427734375, 143.9043426513672, 151.7023162841797, 159.50027465820312, 167.29823303222656, 175.09619140625, 182.8941650390625, 190.69212341308594, 198.49009704589844]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 2.0, 2.0, 9.0, 10.0, 18.0, 12.0, 18.0, 23.0, 23.0, 31.0, 37.0, 42.0, 52.0, 46.0, 53.0, 45.0, 63.0, 54.0, 65.0, 67.0, 48.0, 50.0, 48.0, 39.0, 36.0, 19.0, 18.0, 13.0, 11.0, 12.0, 5.0, 5.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-140.1543426513672, -135.87466430664062, -131.59500122070312, -127.31532287597656, -123.03565216064453, -118.7559814453125, -114.47630310058594, -110.1966323852539, -105.91696166992188, -101.63729095458984, -97.35761260986328, -93.07794189453125, -88.79827117919922, -84.51860046386719, -80.23892211914062, -75.9592514038086, -71.67957305908203, -67.39990234375, -63.1202278137207, -58.840553283691406, -54.560882568359375, -50.28120803833008, -46.00153350830078, -41.72186279296875, -37.44218826293945, -33.162513732910156, -28.882843017578125, -24.603168487548828, -20.323495864868164, -16.0438232421875, -11.764148712158203, -7.484476089477539, -3.204803466796875, 1.0748696327209473, 5.3545427322387695, 9.63421630859375, 13.913888931274414, 18.193561553955078, 22.473236083984375, 26.75290870666504, 31.032581329345703, 35.312255859375, 39.59192657470703, 43.87160110473633, 48.151275634765625, 52.430946350097656, 56.71062088012695, 60.99029541015625, 65.26996612548828, 69.54963684082031, 73.82931518554688, 78.1089859008789, 82.38865661621094, 86.6683349609375, 90.94800567626953, 95.22767639160156, 99.50735473632812, 103.78702545166016, 108.06670379638672, 112.34637451171875, 116.62604522705078, 120.90571594238281, 125.18539428710938, 129.46507263183594, 133.74473571777344]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 6.0, 6.0, 8.0, 15.0, 23.0, 26.0, 37.0, 40.0, 66.0, 107.0, 173.0, 245.0, 431.0, 835.0, 1737.0, 4306.0, 12966.0, 51363.0, 291896.0, 547653.0, 102197.0, 22615.0, 6688.0, 2457.0, 1091.0, 579.0, 350.0, 194.0, 150.0, 77.0, 68.0, 42.0, 29.0, 20.0, 18.0, 14.0, 3.0, 9.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-31.171875, -30.28662109375, -29.4013671875, -28.51611328125, -27.630859375, -26.74560546875, -25.8603515625, -24.97509765625, -24.08984375, -23.20458984375, -22.3193359375, -21.43408203125, -20.548828125, -19.66357421875, -18.7783203125, -17.89306640625, -17.0078125, -16.12255859375, -15.2373046875, -14.35205078125, -13.466796875, -12.58154296875, -11.6962890625, -10.81103515625, -9.92578125, -9.04052734375, -8.1552734375, -7.27001953125, -6.384765625, -5.49951171875, -4.6142578125, -3.72900390625, -2.84375, -1.95849609375, -1.0732421875, -0.18798828125, 0.697265625, 1.58251953125, 2.4677734375, 3.35302734375, 4.23828125, 5.12353515625, 6.0087890625, 6.89404296875, 7.779296875, 8.66455078125, 9.5498046875, 10.43505859375, 11.3203125, 12.20556640625, 13.0908203125, 13.97607421875, 14.861328125, 15.74658203125, 16.6318359375, 17.51708984375, 18.40234375, 19.28759765625, 20.1728515625, 21.05810546875, 21.943359375, 22.82861328125, 23.7138671875, 24.59912109375, 25.484375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 10.0, 10.0, 5.0, 13.0, 15.0, 17.0, 31.0, 45.0, 39.0, 48.0, 51.0, 61.0, 63.0, 60.0, 73.0, 68.0, 64.0, 61.0, 60.0, 42.0, 47.0, 24.0, 16.0, 20.0, 14.0, 14.0, 4.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.4921875, -12.9346923828125, -12.377197265625, -11.8197021484375, -11.26220703125, -10.7047119140625, -10.147216796875, -9.5897216796875, -9.0322265625, -8.4747314453125, -7.917236328125, -7.3597412109375, -6.80224609375, -6.2447509765625, -5.687255859375, -5.1297607421875, -4.572265625, -4.0147705078125, -3.457275390625, -2.8997802734375, -2.34228515625, -1.7847900390625, -1.227294921875, -0.6697998046875, -0.1123046875, 0.4451904296875, 1.002685546875, 1.5601806640625, 2.11767578125, 2.6751708984375, 3.232666015625, 3.7901611328125, 4.34765625, 4.9051513671875, 5.462646484375, 6.0201416015625, 6.57763671875, 7.1351318359375, 7.692626953125, 8.2501220703125, 8.8076171875, 9.3651123046875, 9.922607421875, 10.4801025390625, 11.03759765625, 11.5950927734375, 12.152587890625, 12.7100830078125, 13.267578125, 13.8250732421875, 14.382568359375, 14.9400634765625, 15.49755859375, 16.0550537109375, 16.612548828125, 17.1700439453125, 17.7275390625, 18.2850341796875, 18.842529296875, 19.4000244140625, 19.95751953125, 20.5150146484375, 21.072509765625, 21.6300048828125, 22.1875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 5.0, 7.0, 6.0, 17.0, 16.0, 26.0, 31.0, 55.0, 79.0, 160.0, 226.0, 466.0, 1040.0, 3498.0, 19828.0, 726895.0, 279090.0, 12607.0, 2649.0, 872.0, 415.0, 182.0, 127.0, 76.0, 55.0, 36.0, 32.0, 15.0, 12.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.375, -69.205078125, -67.03515625, -64.865234375, -62.6953125, -60.525390625, -58.35546875, -56.185546875, -54.015625, -51.845703125, -49.67578125, -47.505859375, -45.3359375, -43.166015625, -40.99609375, -38.826171875, -36.65625, -34.486328125, -32.31640625, -30.146484375, -27.9765625, -25.806640625, -23.63671875, -21.466796875, -19.296875, -17.126953125, -14.95703125, -12.787109375, -10.6171875, -8.447265625, -6.27734375, -4.107421875, -1.9375, 0.232421875, 2.40234375, 4.572265625, 6.7421875, 8.912109375, 11.08203125, 13.251953125, 15.421875, 17.591796875, 19.76171875, 21.931640625, 24.1015625, 26.271484375, 28.44140625, 30.611328125, 32.78125, 34.951171875, 37.12109375, 39.291015625, 41.4609375, 43.630859375, 45.80078125, 47.970703125, 50.140625, 52.310546875, 54.48046875, 56.650390625, 58.8203125, 60.990234375, 63.16015625, 65.330078125, 67.5]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 6.0, 7.0, 15.0, 9.0, 12.0, 23.0, 16.0, 37.0, 41.0, 45.0, 61.0, 61.0, 68.0, 77.0, 66.0, 67.0, 76.0, 62.0, 50.0, 39.0, 34.0, 32.0, 24.0, 18.0, 16.0, 13.0, 10.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.0, -62.748046875, -60.49609375, -58.244140625, -55.9921875, -53.740234375, -51.48828125, -49.236328125, -46.984375, -44.732421875, -42.48046875, -40.228515625, -37.9765625, -35.724609375, -33.47265625, -31.220703125, -28.96875, -26.716796875, -24.46484375, -22.212890625, -19.9609375, -17.708984375, -15.45703125, -13.205078125, -10.953125, -8.701171875, -6.44921875, -4.197265625, -1.9453125, 0.306640625, 2.55859375, 4.810546875, 7.0625, 9.314453125, 11.56640625, 13.818359375, 16.0703125, 18.322265625, 20.57421875, 22.826171875, 25.078125, 27.330078125, 29.58203125, 31.833984375, 34.0859375, 36.337890625, 38.58984375, 40.841796875, 43.09375, 45.345703125, 47.59765625, 49.849609375, 52.1015625, 54.353515625, 56.60546875, 58.857421875, 61.109375, 63.361328125, 65.61328125, 67.865234375, 70.1171875, 72.369140625, 74.62109375, 76.873046875, 79.125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 6.0, 6.0, 8.0, 15.0, 24.0, 55.0, 71.0, 162.0, 665.0, 5262.0, 1011060.0, 29058.0, 1589.0, 333.0, 106.0, 49.0, 25.0, 21.0, 4.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.125, -70.10595703125, -68.0869140625, -66.06787109375, -64.048828125, -62.02978515625, -60.0107421875, -57.99169921875, -55.97265625, -53.95361328125, -51.9345703125, -49.91552734375, -47.896484375, -45.87744140625, -43.8583984375, -41.83935546875, -39.8203125, -37.80126953125, -35.7822265625, -33.76318359375, -31.744140625, -29.72509765625, -27.7060546875, -25.68701171875, -23.66796875, -21.64892578125, -19.6298828125, -17.61083984375, -15.591796875, -13.57275390625, -11.5537109375, -9.53466796875, -7.515625, -5.49658203125, -3.4775390625, -1.45849609375, 0.560546875, 2.57958984375, 4.5986328125, 6.61767578125, 8.63671875, 10.65576171875, 12.6748046875, 14.69384765625, 16.712890625, 18.73193359375, 20.7509765625, 22.77001953125, 24.7890625, 26.80810546875, 28.8271484375, 30.84619140625, 32.865234375, 34.88427734375, 36.9033203125, 38.92236328125, 40.94140625, 42.96044921875, 44.9794921875, 46.99853515625, 49.017578125, 51.03662109375, 53.0556640625, 55.07470703125, 57.09375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 11.0, 15.0, 14.0, 23.0, 24.0, 50.0, 94.0, 169.0, 228.0, 139.0, 72.0, 46.0, 23.0, 18.0, 14.0, 12.0, 11.0, 7.0, 9.0, 2.0, 3.0, 1.0, 1.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00281524658203125, -0.0027283430099487305, -0.002641439437866211, -0.0025545358657836914, -0.002467632293701172, -0.0023807287216186523, -0.002293825149536133, -0.0022069215774536133, -0.0021200180053710938, -0.0020331144332885742, -0.0019462108612060547, -0.0018593072891235352, -0.0017724037170410156, -0.001685500144958496, -0.0015985965728759766, -0.001511693000793457, -0.0014247894287109375, -0.001337885856628418, -0.0012509822845458984, -0.001164078712463379, -0.0010771751403808594, -0.0009902715682983398, -0.0009033679962158203, -0.0008164644241333008, -0.0007295608520507812, -0.0006426572799682617, -0.0005557537078857422, -0.00046885013580322266, -0.0003819465637207031, -0.0002950429916381836, -0.00020813941955566406, -0.00012123584747314453, -3.4332275390625e-05, 5.257129669189453e-05, 0.00013947486877441406, 0.0002263784408569336, 0.0003132820129394531, 0.00040018558502197266, 0.0004870891571044922, 0.0005739927291870117, 0.0006608963012695312, 0.0007477998733520508, 0.0008347034454345703, 0.0009216070175170898, 0.0010085105895996094, 0.001095414161682129, 0.0011823177337646484, 0.001269221305847168, 0.0013561248779296875, 0.001443028450012207, 0.0015299320220947266, 0.001616835594177246, 0.0017037391662597656, 0.0017906427383422852, 0.0018775463104248047, 0.0019644498825073242, 0.0020513534545898438, 0.0021382570266723633, 0.002225160598754883, 0.0023120641708374023, 0.002398967742919922, 0.0024858713150024414, 0.002572774887084961, 0.0026596784591674805, 0.00274658203125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 6.0, 3.0, 5.0, 17.0, 20.0, 28.0, 51.0, 87.0, 128.0, 249.0, 475.0, 1162.0, 3948.0, 24939.0, 925235.0, 82410.0, 6720.0, 1742.0, 598.0, 314.0, 161.0, 81.0, 67.0, 38.0, 18.0, 15.0, 8.0, 9.0, 6.0, 8.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.84375, -30.025146484375, -29.20654296875, -28.387939453125, -27.5693359375, -26.750732421875, -25.93212890625, -25.113525390625, -24.294921875, -23.476318359375, -22.65771484375, -21.839111328125, -21.0205078125, -20.201904296875, -19.38330078125, -18.564697265625, -17.74609375, -16.927490234375, -16.10888671875, -15.290283203125, -14.4716796875, -13.653076171875, -12.83447265625, -12.015869140625, -11.197265625, -10.378662109375, -9.56005859375, -8.741455078125, -7.9228515625, -7.104248046875, -6.28564453125, -5.467041015625, -4.6484375, -3.829833984375, -3.01123046875, -2.192626953125, -1.3740234375, -0.555419921875, 0.26318359375, 1.081787109375, 1.900390625, 2.718994140625, 3.53759765625, 4.356201171875, 5.1748046875, 5.993408203125, 6.81201171875, 7.630615234375, 8.44921875, 9.267822265625, 10.08642578125, 10.905029296875, 11.7236328125, 12.542236328125, 13.36083984375, 14.179443359375, 14.998046875, 15.816650390625, 16.63525390625, 17.453857421875, 18.2724609375, 19.091064453125, 19.90966796875, 20.728271484375, 21.546875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 7.0, 12.0, 11.0, 32.0, 64.0, 94.0, 153.0, 200.0, 164.0, 100.0, 66.0, 31.0, 19.0, 15.0, 8.0, 6.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.140625, -23.39990234375, -22.6591796875, -21.91845703125, -21.177734375, -20.43701171875, -19.6962890625, -18.95556640625, -18.21484375, -17.47412109375, -16.7333984375, -15.99267578125, -15.251953125, -14.51123046875, -13.7705078125, -13.02978515625, -12.2890625, -11.54833984375, -10.8076171875, -10.06689453125, -9.326171875, -8.58544921875, -7.8447265625, -7.10400390625, -6.36328125, -5.62255859375, -4.8818359375, -4.14111328125, -3.400390625, -2.65966796875, -1.9189453125, -1.17822265625, -0.4375, 0.30322265625, 1.0439453125, 1.78466796875, 2.525390625, 3.26611328125, 4.0068359375, 4.74755859375, 5.48828125, 6.22900390625, 6.9697265625, 7.71044921875, 8.451171875, 9.19189453125, 9.9326171875, 10.67333984375, 11.4140625, 12.15478515625, 12.8955078125, 13.63623046875, 14.376953125, 15.11767578125, 15.8583984375, 16.59912109375, 17.33984375, 18.08056640625, 18.8212890625, 19.56201171875, 20.302734375, 21.04345703125, 21.7841796875, 22.52490234375, 23.265625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 8.0, 5.0, 14.0, 67.0, 224.0, 381.0, 209.0, 48.0, 13.0, 5.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-292.90435791015625, -277.8301086425781, -262.7558898925781, -247.681640625, -232.60740661621094, -217.53317260742188, -202.45892333984375, -187.3846893310547, -172.31045532226562, -157.23622131347656, -142.1619873046875, -127.08773803710938, -112.01350402832031, -96.93927001953125, -81.86502838134766, -66.79078674316406, -51.716552734375, -36.64231491088867, -21.568077087402344, -6.493839263916016, 8.580398559570312, 23.654632568359375, 38.72887420654297, 53.80311584472656, 68.87734985351562, 83.95158386230469, 99.02582550048828, 114.10006713867188, 129.17430114746094, 144.24853515625, 159.32278442382812, 174.3970184326172, 189.47125244140625, 204.5454864501953, 219.61972045898438, 234.6939697265625, 249.76820373535156, 264.8424377441406, 279.91668701171875, 294.99090576171875, 310.0651550292969, 325.139404296875, 340.213623046875, 355.2878723144531, 370.36212158203125, 385.43634033203125, 400.5105895996094, 415.5848388671875, 430.6590576171875, 445.7333068847656, 460.8075256347656, 475.88177490234375, 490.95599365234375, 506.0302429199219, 521.1044921875, 536.1787109375, 551.2529296875, 566.3271484375, 581.4014282226562, 596.4756469726562, 611.5498657226562, 626.6241455078125, 641.6983642578125, 656.7725830078125, 671.8468627929688]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 7.0, 9.0, 17.0, 8.0, 17.0, 25.0, 26.0, 30.0, 38.0, 34.0, 42.0, 51.0, 42.0, 62.0, 63.0, 67.0, 62.0, 54.0, 54.0, 40.0, 40.0, 41.0, 30.0, 26.0, 22.0, 21.0, 11.0, 11.0, 10.0, 7.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.97264099121094, -185.02105712890625, -177.0694580078125, -169.11785888671875, -161.16627502441406, -153.21469116210938, -145.26309204101562, -137.31149291992188, -129.3599090576172, -121.40831756591797, -113.45672607421875, -105.50513458251953, -97.55354309082031, -89.6019515991211, -81.65036010742188, -73.69876861572266, -65.74717712402344, -57.79558563232422, -49.843994140625, -41.89240264892578, -33.94081115722656, -25.989219665527344, -18.037628173828125, -10.086036682128906, -2.1344451904296875, 5.817146301269531, 13.76873779296875, 21.72032928466797, 29.671920776367188, 37.623512268066406, 45.575103759765625, 53.526695251464844, 61.478271484375, 69.42986297607422, 77.38145446777344, 85.33304595947266, 93.28463745117188, 101.2362289428711, 109.18782043457031, 117.13941192626953, 125.09100341796875, 133.0426025390625, 140.9941864013672, 148.94577026367188, 156.89736938476562, 164.84896850585938, 172.80055236816406, 180.75213623046875, 188.7037353515625, 196.65533447265625, 204.60691833496094, 212.55850219726562, 220.51010131835938, 228.46170043945312, 236.4132843017578, 244.3648681640625, 252.31646728515625, 260.26806640625, 268.21966552734375, 276.1712341308594, 284.1228332519531, 292.0744323730469, 300.0260009765625, 307.97760009765625, 315.92919921875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 8.0, 17.0, 13.0, 29.0, 47.0, 60.0, 93.0, 186.0, 282.0, 430.0, 767.0, 1412.0, 3092.0, 7475.0, 21660.0, 100062.0, 1035664.0, 2674870.0, 287741.0, 40499.0, 10985.0, 4217.0, 1993.0, 1025.0, 601.0, 329.0, 226.0, 141.0, 83.0, 77.0, 46.0, 36.0, 28.0, 25.0, 13.0, 8.0, 8.0, 7.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0], "bins": [-17.796875, -17.2919921875, -16.787109375, -16.2822265625, -15.77734375, -15.2724609375, -14.767578125, -14.2626953125, -13.7578125, -13.2529296875, -12.748046875, -12.2431640625, -11.73828125, -11.2333984375, -10.728515625, -10.2236328125, -9.71875, -9.2138671875, -8.708984375, -8.2041015625, -7.69921875, -7.1943359375, -6.689453125, -6.1845703125, -5.6796875, -5.1748046875, -4.669921875, -4.1650390625, -3.66015625, -3.1552734375, -2.650390625, -2.1455078125, -1.640625, -1.1357421875, -0.630859375, -0.1259765625, 0.37890625, 0.8837890625, 1.388671875, 1.8935546875, 2.3984375, 2.9033203125, 3.408203125, 3.9130859375, 4.41796875, 4.9228515625, 5.427734375, 5.9326171875, 6.4375, 6.9423828125, 7.447265625, 7.9521484375, 8.45703125, 8.9619140625, 9.466796875, 9.9716796875, 10.4765625, 10.9814453125, 11.486328125, 11.9912109375, 12.49609375, 13.0009765625, 13.505859375, 14.0107421875, 14.515625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 6.0, 11.0, 6.0, 10.0, 15.0, 22.0, 28.0, 42.0, 51.0, 42.0, 64.0, 67.0, 76.0, 83.0, 69.0, 75.0, 52.0, 53.0, 31.0, 46.0, 30.0, 31.0, 20.0, 22.0, 13.0, 14.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.5836181640625, -11.081298828125, -10.5789794921875, -10.07666015625, -9.5743408203125, -9.072021484375, -8.5697021484375, -8.0673828125, -7.5650634765625, -7.062744140625, -6.5604248046875, -6.05810546875, -5.5557861328125, -5.053466796875, -4.5511474609375, -4.048828125, -3.5465087890625, -3.044189453125, -2.5418701171875, -2.03955078125, -1.5372314453125, -1.034912109375, -0.5325927734375, -0.0302734375, 0.4720458984375, 0.974365234375, 1.4766845703125, 1.97900390625, 2.4813232421875, 2.983642578125, 3.4859619140625, 3.98828125, 4.4906005859375, 4.992919921875, 5.4952392578125, 5.99755859375, 6.4998779296875, 7.002197265625, 7.5045166015625, 8.0068359375, 8.5091552734375, 9.011474609375, 9.5137939453125, 10.01611328125, 10.5184326171875, 11.020751953125, 11.5230712890625, 12.025390625, 12.5277099609375, 13.030029296875, 13.5323486328125, 14.03466796875, 14.5369873046875, 15.039306640625, 15.5416259765625, 16.0439453125, 16.5462646484375, 17.048583984375, 17.5509033203125, 18.05322265625, 18.5555419921875, 19.057861328125, 19.5601806640625, 20.0625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 8.0, 13.0, 24.0, 58.0, 141.0, 323.0, 659.0, 3265.0, 113342.0, 4029940.0, 43593.0, 2227.0, 433.0, 140.0, 63.0, 29.0, 15.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.90625, -45.310546875, -43.71484375, -42.119140625, -40.5234375, -38.927734375, -37.33203125, -35.736328125, -34.140625, -32.544921875, -30.94921875, -29.353515625, -27.7578125, -26.162109375, -24.56640625, -22.970703125, -21.375, -19.779296875, -18.18359375, -16.587890625, -14.9921875, -13.396484375, -11.80078125, -10.205078125, -8.609375, -7.013671875, -5.41796875, -3.822265625, -2.2265625, -0.630859375, 0.96484375, 2.560546875, 4.15625, 5.751953125, 7.34765625, 8.943359375, 10.5390625, 12.134765625, 13.73046875, 15.326171875, 16.921875, 18.517578125, 20.11328125, 21.708984375, 23.3046875, 24.900390625, 26.49609375, 28.091796875, 29.6875, 31.283203125, 32.87890625, 34.474609375, 36.0703125, 37.666015625, 39.26171875, 40.857421875, 42.453125, 44.048828125, 45.64453125, 47.240234375, 48.8359375, 50.431640625, 52.02734375, 53.623046875, 55.21875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 6.0, 7.0, 12.0, 25.0, 39.0, 70.0, 152.0, 455.0, 1229.0, 1224.0, 489.0, 179.0, 97.0, 41.0, 17.0, 12.0, 8.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.8125, -54.45361328125, -53.0947265625, -51.73583984375, -50.376953125, -49.01806640625, -47.6591796875, -46.30029296875, -44.94140625, -43.58251953125, -42.2236328125, -40.86474609375, -39.505859375, -38.14697265625, -36.7880859375, -35.42919921875, -34.0703125, -32.71142578125, -31.3525390625, -29.99365234375, -28.634765625, -27.27587890625, -25.9169921875, -24.55810546875, -23.19921875, -21.84033203125, -20.4814453125, -19.12255859375, -17.763671875, -16.40478515625, -15.0458984375, -13.68701171875, -12.328125, -10.96923828125, -9.6103515625, -8.25146484375, -6.892578125, -5.53369140625, -4.1748046875, -2.81591796875, -1.45703125, -0.09814453125, 1.2607421875, 2.61962890625, 3.978515625, 5.33740234375, 6.6962890625, 8.05517578125, 9.4140625, 10.77294921875, 12.1318359375, 13.49072265625, 14.849609375, 16.20849609375, 17.5673828125, 18.92626953125, 20.28515625, 21.64404296875, 23.0029296875, 24.36181640625, 25.720703125, 27.07958984375, 28.4384765625, 29.79736328125, 31.15625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 5.0, 3.0, 8.0, 16.0, 41.0, 107.0, 180.0, 237.0, 203.0, 110.0, 43.0, 20.0, 7.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-294.5251159667969, -286.91607666015625, -279.3070068359375, -271.6979675292969, -264.08892822265625, -256.4798889160156, -248.87083435058594, -241.26177978515625, -233.65274047851562, -226.04368591308594, -218.4346466064453, -210.82559204101562, -203.216552734375, -195.6074981689453, -187.9984588623047, -180.389404296875, -172.78036499023438, -165.1713104248047, -157.56227111816406, -149.95321655273438, -142.34417724609375, -134.73512268066406, -127.12608337402344, -119.51702880859375, -111.90797424316406, -104.2989273071289, -96.68988037109375, -89.0808334350586, -81.47178649902344, -73.86273193359375, -66.25369262695312, -58.6446418762207, -51.03559875488281, -43.426551818847656, -35.8175048828125, -28.20845603942871, -20.599409103393555, -12.990360260009766, -5.381313323974609, 2.227733612060547, 9.836780548095703, 17.44582748413086, 25.054874420166016, 32.66392517089844, 40.272972106933594, 47.88201904296875, 55.491065979003906, 63.10011291503906, 70.70915985107422, 78.31820678710938, 85.92725372314453, 93.53630065917969, 101.14534759521484, 108.75439453125, 116.36344909667969, 123.97248840332031, 131.58154296875, 139.1905975341797, 146.7996368408203, 154.40869140625, 162.01773071289062, 169.6267852783203, 177.23582458496094, 184.84487915039062, 192.45391845703125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 6.0, 11.0, 14.0, 18.0, 14.0, 18.0, 23.0, 22.0, 38.0, 49.0, 51.0, 44.0, 44.0, 59.0, 73.0, 56.0, 49.0, 47.0, 62.0, 56.0, 44.0, 41.0, 33.0, 27.0, 16.0, 23.0, 13.0, 6.0, 10.0, 6.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-162.22637939453125, -157.39866638183594, -152.5709686279297, -147.74325561523438, -142.91555786132812, -138.0878448486328, -133.2601318359375, -128.43243408203125, -123.60472106933594, -118.77701568603516, -113.94931030273438, -109.12159729003906, -104.29389190673828, -99.4661865234375, -94.63847351074219, -89.8107681274414, -84.98306274414062, -80.15535736083984, -75.32765197753906, -70.49993896484375, -65.67223358154297, -60.84452819824219, -56.01681900024414, -51.189109802246094, -46.36140441894531, -41.53369903564453, -36.705989837646484, -31.87828254699707, -27.050575256347656, -22.222867965698242, -17.395160675048828, -12.567451477050781, -7.73974609375, -2.912038803100586, 1.9156684875488281, 6.743375778198242, 11.571083068847656, 16.39879035949707, 21.226497650146484, 26.05420684814453, 30.881912231445312, 35.709617614746094, 40.53732681274414, 45.36503601074219, 50.19274139404297, 55.02044677734375, 59.8481559753418, 64.67586517333984, 69.50357055664062, 74.3312759399414, 79.15898132324219, 83.9866943359375, 88.81439971923828, 93.64210510253906, 98.46981811523438, 103.29752349853516, 108.12522888183594, 112.95293426513672, 117.7806396484375, 122.60835266113281, 127.4360580444336, 132.26376342773438, 137.0914764404297, 141.919189453125, 146.74688720703125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 7.0, 13.0, 8.0, 15.0, 16.0, 26.0, 44.0, 87.0, 133.0, 279.0, 578.0, 1483.0, 5339.0, 38307.0, 536955.0, 427513.0, 30505.0, 4796.0, 1371.0, 517.0, 250.0, 123.0, 59.0, 44.0, 33.0, 13.0, 11.0, 8.0, 9.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.0625, -56.4912109375, -54.919921875, -53.3486328125, -51.77734375, -50.2060546875, -48.634765625, -47.0634765625, -45.4921875, -43.9208984375, -42.349609375, -40.7783203125, -39.20703125, -37.6357421875, -36.064453125, -34.4931640625, -32.921875, -31.3505859375, -29.779296875, -28.2080078125, -26.63671875, -25.0654296875, -23.494140625, -21.9228515625, -20.3515625, -18.7802734375, -17.208984375, -15.6376953125, -14.06640625, -12.4951171875, -10.923828125, -9.3525390625, -7.78125, -6.2099609375, -4.638671875, -3.0673828125, -1.49609375, 0.0751953125, 1.646484375, 3.2177734375, 4.7890625, 6.3603515625, 7.931640625, 9.5029296875, 11.07421875, 12.6455078125, 14.216796875, 15.7880859375, 17.359375, 18.9306640625, 20.501953125, 22.0732421875, 23.64453125, 25.2158203125, 26.787109375, 28.3583984375, 29.9296875, 31.5009765625, 33.072265625, 34.6435546875, 36.21484375, 37.7861328125, 39.357421875, 40.9287109375, 42.5]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 9.0, 11.0, 14.0, 10.0, 25.0, 32.0, 35.0, 51.0, 42.0, 62.0, 71.0, 69.0, 57.0, 68.0, 81.0, 63.0, 57.0, 51.0, 38.0, 37.0, 35.0, 19.0, 20.0, 11.0, 10.0, 10.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.28125, -10.79248046875, -10.3037109375, -9.81494140625, -9.326171875, -8.83740234375, -8.3486328125, -7.85986328125, -7.37109375, -6.88232421875, -6.3935546875, -5.90478515625, -5.416015625, -4.92724609375, -4.4384765625, -3.94970703125, -3.4609375, -2.97216796875, -2.4833984375, -1.99462890625, -1.505859375, -1.01708984375, -0.5283203125, -0.03955078125, 0.44921875, 0.93798828125, 1.4267578125, 1.91552734375, 2.404296875, 2.89306640625, 3.3818359375, 3.87060546875, 4.359375, 4.84814453125, 5.3369140625, 5.82568359375, 6.314453125, 6.80322265625, 7.2919921875, 7.78076171875, 8.26953125, 8.75830078125, 9.2470703125, 9.73583984375, 10.224609375, 10.71337890625, 11.2021484375, 11.69091796875, 12.1796875, 12.66845703125, 13.1572265625, 13.64599609375, 14.134765625, 14.62353515625, 15.1123046875, 15.60107421875, 16.08984375, 16.57861328125, 17.0673828125, 17.55615234375, 18.044921875, 18.53369140625, 19.0224609375, 19.51123046875, 20.0]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 7.0, 3.0, 5.0, 11.0, 20.0, 30.0, 34.0, 63.0, 114.0, 206.0, 411.0, 1122.0, 4246.0, 87517.0, 940754.0, 10728.0, 1929.0, 687.0, 276.0, 148.0, 86.0, 56.0, 40.0, 18.0, 15.0, 8.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-145.5, -141.4833984375, -137.466796875, -133.4501953125, -129.43359375, -125.4169921875, -121.400390625, -117.3837890625, -113.3671875, -109.3505859375, -105.333984375, -101.3173828125, -97.30078125, -93.2841796875, -89.267578125, -85.2509765625, -81.234375, -77.2177734375, -73.201171875, -69.1845703125, -65.16796875, -61.1513671875, -57.134765625, -53.1181640625, -49.1015625, -45.0849609375, -41.068359375, -37.0517578125, -33.03515625, -29.0185546875, -25.001953125, -20.9853515625, -16.96875, -12.9521484375, -8.935546875, -4.9189453125, -0.90234375, 3.1142578125, 7.130859375, 11.1474609375, 15.1640625, 19.1806640625, 23.197265625, 27.2138671875, 31.23046875, 35.2470703125, 39.263671875, 43.2802734375, 47.296875, 51.3134765625, 55.330078125, 59.3466796875, 63.36328125, 67.3798828125, 71.396484375, 75.4130859375, 79.4296875, 83.4462890625, 87.462890625, 91.4794921875, 95.49609375, 99.5126953125, 103.529296875, 107.5458984375, 111.5625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 14.0, 10.0, 13.0, 26.0, 28.0, 33.0, 51.0, 58.0, 82.0, 58.0, 74.0, 64.0, 72.0, 70.0, 47.0, 56.0, 47.0, 43.0, 31.0, 26.0, 16.0, 16.0, 15.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-82.375, -80.24365234375, -78.1123046875, -75.98095703125, -73.849609375, -71.71826171875, -69.5869140625, -67.45556640625, -65.32421875, -63.19287109375, -61.0615234375, -58.93017578125, -56.798828125, -54.66748046875, -52.5361328125, -50.40478515625, -48.2734375, -46.14208984375, -44.0107421875, -41.87939453125, -39.748046875, -37.61669921875, -35.4853515625, -33.35400390625, -31.22265625, -29.09130859375, -26.9599609375, -24.82861328125, -22.697265625, -20.56591796875, -18.4345703125, -16.30322265625, -14.171875, -12.04052734375, -9.9091796875, -7.77783203125, -5.646484375, -3.51513671875, -1.3837890625, 0.74755859375, 2.87890625, 5.01025390625, 7.1416015625, 9.27294921875, 11.404296875, 13.53564453125, 15.6669921875, 17.79833984375, 19.9296875, 22.06103515625, 24.1923828125, 26.32373046875, 28.455078125, 30.58642578125, 32.7177734375, 34.84912109375, 36.98046875, 39.11181640625, 41.2431640625, 43.37451171875, 45.505859375, 47.63720703125, 49.7685546875, 51.89990234375, 54.03125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 11.0, 16.0, 14.0, 19.0, 34.0, 36.0, 49.0, 100.0, 115.0, 220.0, 483.0, 1582.0, 8168.0, 261947.0, 760973.0, 11503.0, 1954.0, 564.0, 266.0, 157.0, 82.0, 52.0, 52.0, 35.0, 23.0, 11.0, 18.0, 10.0, 9.0, 6.0, 3.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.484375, -25.573486328125, -24.66259765625, -23.751708984375, -22.8408203125, -21.929931640625, -21.01904296875, -20.108154296875, -19.197265625, -18.286376953125, -17.37548828125, -16.464599609375, -15.5537109375, -14.642822265625, -13.73193359375, -12.821044921875, -11.91015625, -10.999267578125, -10.08837890625, -9.177490234375, -8.2666015625, -7.355712890625, -6.44482421875, -5.533935546875, -4.623046875, -3.712158203125, -2.80126953125, -1.890380859375, -0.9794921875, -0.068603515625, 0.84228515625, 1.753173828125, 2.6640625, 3.574951171875, 4.48583984375, 5.396728515625, 6.3076171875, 7.218505859375, 8.12939453125, 9.040283203125, 9.951171875, 10.862060546875, 11.77294921875, 12.683837890625, 13.5947265625, 14.505615234375, 15.41650390625, 16.327392578125, 17.23828125, 18.149169921875, 19.06005859375, 19.970947265625, 20.8818359375, 21.792724609375, 22.70361328125, 23.614501953125, 24.525390625, 25.436279296875, 26.34716796875, 27.258056640625, 28.1689453125, 29.079833984375, 29.99072265625, 30.901611328125, 31.8125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 3.0, 7.0, 7.0, 11.0, 12.0, 19.0, 19.0, 26.0, 30.0, 57.0, 69.0, 139.0, 186.0, 120.0, 83.0, 53.0, 30.0, 36.0, 26.0, 16.0, 13.0, 16.0, 8.0, 3.0, 1.0, 8.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003078460693359375, -0.002986311912536621, -0.002894163131713867, -0.0028020143508911133, -0.0027098655700683594, -0.0026177167892456055, -0.0025255680084228516, -0.0024334192276000977, -0.0023412704467773438, -0.00224912166595459, -0.002156972885131836, -0.002064824104309082, -0.001972675323486328, -0.0018805265426635742, -0.0017883777618408203, -0.0016962289810180664, -0.0016040802001953125, -0.0015119314193725586, -0.0014197826385498047, -0.0013276338577270508, -0.0012354850769042969, -0.001143336296081543, -0.001051187515258789, -0.0009590387344360352, -0.0008668899536132812, -0.0007747411727905273, -0.0006825923919677734, -0.0005904436111450195, -0.0004982948303222656, -0.0004061460494995117, -0.0003139972686767578, -0.0002218484878540039, -0.00012969970703125, -3.7550926208496094e-05, 5.459785461425781e-05, 0.00014674663543701172, 0.00023889541625976562, 0.00033104419708251953, 0.00042319297790527344, 0.0005153417587280273, 0.0006074905395507812, 0.0006996393203735352, 0.0007917881011962891, 0.000883936882019043, 0.0009760856628417969, 0.0010682344436645508, 0.0011603832244873047, 0.0012525320053100586, 0.0013446807861328125, 0.0014368295669555664, 0.0015289783477783203, 0.0016211271286010742, 0.0017132759094238281, 0.001805424690246582, 0.001897573471069336, 0.00198972225189209, 0.0020818710327148438, 0.0021740198135375977, 0.0022661685943603516, 0.0023583173751831055, 0.0024504661560058594, 0.0025426149368286133, 0.002634763717651367, 0.002726912498474121, 0.002819061279296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 0.0, 4.0, 6.0, 4.0, 6.0, 8.0, 9.0, 12.0, 19.0, 25.0, 32.0, 38.0, 50.0, 89.0, 155.0, 211.0, 378.0, 891.0, 2802.0, 14229.0, 831851.0, 185017.0, 9110.0, 1973.0, 707.0, 366.0, 186.0, 120.0, 68.0, 52.0, 38.0, 27.0, 18.0, 7.0, 5.0, 10.0, 9.0, 6.0, 4.0, 1.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.890625, -28.037841796875, -27.18505859375, -26.332275390625, -25.4794921875, -24.626708984375, -23.77392578125, -22.921142578125, -22.068359375, -21.215576171875, -20.36279296875, -19.510009765625, -18.6572265625, -17.804443359375, -16.95166015625, -16.098876953125, -15.24609375, -14.393310546875, -13.54052734375, -12.687744140625, -11.8349609375, -10.982177734375, -10.12939453125, -9.276611328125, -8.423828125, -7.571044921875, -6.71826171875, -5.865478515625, -5.0126953125, -4.159912109375, -3.30712890625, -2.454345703125, -1.6015625, -0.748779296875, 0.10400390625, 0.956787109375, 1.8095703125, 2.662353515625, 3.51513671875, 4.367919921875, 5.220703125, 6.073486328125, 6.92626953125, 7.779052734375, 8.6318359375, 9.484619140625, 10.33740234375, 11.190185546875, 12.04296875, 12.895751953125, 13.74853515625, 14.601318359375, 15.4541015625, 16.306884765625, 17.15966796875, 18.012451171875, 18.865234375, 19.718017578125, 20.57080078125, 21.423583984375, 22.2763671875, 23.129150390625, 23.98193359375, 24.834716796875, 25.6875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 14.0, 10.0, 22.0, 42.0, 44.0, 71.0, 115.0, 170.0, 184.0, 117.0, 80.0, 33.0, 30.0, 17.0, 5.0, 9.0, 6.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.609375, -14.00146484375, -13.3935546875, -12.78564453125, -12.177734375, -11.56982421875, -10.9619140625, -10.35400390625, -9.74609375, -9.13818359375, -8.5302734375, -7.92236328125, -7.314453125, -6.70654296875, -6.0986328125, -5.49072265625, -4.8828125, -4.27490234375, -3.6669921875, -3.05908203125, -2.451171875, -1.84326171875, -1.2353515625, -0.62744140625, -0.01953125, 0.58837890625, 1.1962890625, 1.80419921875, 2.412109375, 3.02001953125, 3.6279296875, 4.23583984375, 4.84375, 5.45166015625, 6.0595703125, 6.66748046875, 7.275390625, 7.88330078125, 8.4912109375, 9.09912109375, 9.70703125, 10.31494140625, 10.9228515625, 11.53076171875, 12.138671875, 12.74658203125, 13.3544921875, 13.96240234375, 14.5703125, 15.17822265625, 15.7861328125, 16.39404296875, 17.001953125, 17.60986328125, 18.2177734375, 18.82568359375, 19.43359375, 20.04150390625, 20.6494140625, 21.25732421875, 21.865234375, 22.47314453125, 23.0810546875, 23.68896484375, 24.296875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 8.0, 22.0, 73.0, 182.0, 404.0, 204.0, 59.0, 19.0, 2.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-518.3729248046875, -504.5660705566406, -490.7591857910156, -476.95233154296875, -463.14544677734375, -449.3385925292969, -435.53173828125, -421.724853515625, -407.9179992675781, -394.11114501953125, -380.30426025390625, -366.4974060058594, -352.6905517578125, -338.8836669921875, -325.0768127441406, -311.26995849609375, -297.46307373046875, -283.6562194824219, -269.8493347167969, -256.04248046875, -242.23561096191406, -228.42874145507812, -214.62188720703125, -200.8150177001953, -187.00814819335938, -173.20127868652344, -159.3944091796875, -145.58755493164062, -131.7806854248047, -117.97381591796875, -104.16695404052734, -90.36009216308594, -76.55319213867188, -62.7463264465332, -48.93946075439453, -35.13259506225586, -21.325729370117188, -7.51885986328125, 6.288002014160156, 20.094863891601562, 33.9017333984375, 47.70859909057617, 61.515464782714844, 75.32232666015625, 89.12919616699219, 102.93606567382812, 116.74292755126953, 130.54978942871094, 144.35665893554688, 158.1635284423828, 171.97039794921875, 185.77725219726562, 199.58412170410156, 213.3909912109375, 227.19784545898438, 241.0047149658203, 254.81158447265625, 268.6184387207031, 282.4253234863281, 296.232177734375, 310.0390625, 323.8459167480469, 337.65277099609375, 351.45965576171875, 365.2665100097656]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 10.0, 4.0, 11.0, 7.0, 8.0, 14.0, 21.0, 10.0, 20.0, 22.0, 20.0, 20.0, 25.0, 32.0, 26.0, 22.0, 29.0, 37.0, 56.0, 56.0, 58.0, 61.0, 50.0, 36.0, 39.0, 35.0, 35.0, 36.0, 27.0, 23.0, 24.0, 19.0, 20.0, 14.0, 15.0, 8.0, 9.0, 7.0, 9.0, 5.0, 9.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-146.6016082763672, -141.68582153320312, -136.77003479003906, -131.85426330566406, -126.9384765625, -122.02268981933594, -117.10690307617188, -112.19111633300781, -107.27533721923828, -102.35955047607422, -97.44377136230469, -92.52798461914062, -87.61219787597656, -82.69641876220703, -77.78063201904297, -72.86485290527344, -67.94906616210938, -63.03328323364258, -58.11750030517578, -53.20171356201172, -48.28593063354492, -43.370147705078125, -38.45436096191406, -33.538578033447266, -28.62279510498047, -23.707012176513672, -18.791227340698242, -13.875443458557129, -8.959659576416016, -4.043876647949219, 0.8719081878662109, 5.787693023681641, 10.7034912109375, 15.619275093078613, 20.535058975219727, 25.450843811035156, 30.366626739501953, 35.28240966796875, 40.19819641113281, 45.11397933959961, 50.029762268066406, 54.9455451965332, 59.861328125, 64.77711486816406, 69.69290161132812, 74.60868072509766, 79.52446746826172, 84.44024658203125, 89.35603332519531, 94.27182006835938, 99.1875991821289, 104.10338592529297, 109.0191650390625, 113.93495178222656, 118.85073852539062, 123.76652526855469, 128.68231201171875, 133.5980987548828, 138.51388549804688, 143.42965698242188, 148.34544372558594, 153.26123046875, 158.17701721191406, 163.09280395507812, 168.00857543945312]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 4.0, 4.0, 10.0, 18.0, 24.0, 34.0, 62.0, 98.0, 175.0, 321.0, 660.0, 1633.0, 5187.0, 23972.0, 632558.0, 3424947.0, 90542.0, 9407.0, 2566.0, 971.0, 464.0, 235.0, 142.0, 81.0, 64.0, 29.0, 17.0, 20.0, 9.0, 1.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.1875, -27.41015625, -26.6328125, -25.85546875, -25.078125, -24.30078125, -23.5234375, -22.74609375, -21.96875, -21.19140625, -20.4140625, -19.63671875, -18.859375, -18.08203125, -17.3046875, -16.52734375, -15.75, -14.97265625, -14.1953125, -13.41796875, -12.640625, -11.86328125, -11.0859375, -10.30859375, -9.53125, -8.75390625, -7.9765625, -7.19921875, -6.421875, -5.64453125, -4.8671875, -4.08984375, -3.3125, -2.53515625, -1.7578125, -0.98046875, -0.203125, 0.57421875, 1.3515625, 2.12890625, 2.90625, 3.68359375, 4.4609375, 5.23828125, 6.015625, 6.79296875, 7.5703125, 8.34765625, 9.125, 9.90234375, 10.6796875, 11.45703125, 12.234375, 13.01171875, 13.7890625, 14.56640625, 15.34375, 16.12109375, 16.8984375, 17.67578125, 18.453125, 19.23046875, 20.0078125, 20.78515625, 21.5625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 12.0, 5.0, 10.0, 15.0, 22.0, 30.0, 43.0, 56.0, 60.0, 112.0, 90.0, 82.0, 97.0, 79.0, 74.0, 68.0, 51.0, 43.0, 16.0, 25.0, 7.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8203125, -14.1951904296875, -13.570068359375, -12.9449462890625, -12.31982421875, -11.6947021484375, -11.069580078125, -10.4444580078125, -9.8193359375, -9.1942138671875, -8.569091796875, -7.9439697265625, -7.31884765625, -6.6937255859375, -6.068603515625, -5.4434814453125, -4.818359375, -4.1932373046875, -3.568115234375, -2.9429931640625, -2.31787109375, -1.6927490234375, -1.067626953125, -0.4425048828125, 0.1826171875, 0.8077392578125, 1.432861328125, 2.0579833984375, 2.68310546875, 3.3082275390625, 3.933349609375, 4.5584716796875, 5.18359375, 5.8087158203125, 6.433837890625, 7.0589599609375, 7.68408203125, 8.3092041015625, 8.934326171875, 9.5594482421875, 10.1845703125, 10.8096923828125, 11.434814453125, 12.0599365234375, 12.68505859375, 13.3101806640625, 13.935302734375, 14.5604248046875, 15.185546875, 15.8106689453125, 16.435791015625, 17.0609130859375, 17.68603515625, 18.3111572265625, 18.936279296875, 19.5614013671875, 20.1865234375, 20.8116455078125, 21.436767578125, 22.0618896484375, 22.68701171875, 23.3121337890625, 23.937255859375, 24.5623779296875, 25.1875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 14.0, 18.0, 43.0, 60.0, 135.0, 284.0, 571.0, 1123.0, 2923.0, 14443.0, 276135.0, 3813310.0, 74151.0, 7504.0, 1853.0, 716.0, 356.0, 238.0, 129.0, 92.0, 63.0, 27.0, 25.0, 18.0, 8.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.484375, -20.522705078125, -19.56103515625, -18.599365234375, -17.6376953125, -16.676025390625, -15.71435546875, -14.752685546875, -13.791015625, -12.829345703125, -11.86767578125, -10.906005859375, -9.9443359375, -8.982666015625, -8.02099609375, -7.059326171875, -6.09765625, -5.135986328125, -4.17431640625, -3.212646484375, -2.2509765625, -1.289306640625, -0.32763671875, 0.634033203125, 1.595703125, 2.557373046875, 3.51904296875, 4.480712890625, 5.4423828125, 6.404052734375, 7.36572265625, 8.327392578125, 9.2890625, 10.250732421875, 11.21240234375, 12.174072265625, 13.1357421875, 14.097412109375, 15.05908203125, 16.020751953125, 16.982421875, 17.944091796875, 18.90576171875, 19.867431640625, 20.8291015625, 21.790771484375, 22.75244140625, 23.714111328125, 24.67578125, 25.637451171875, 26.59912109375, 27.560791015625, 28.5224609375, 29.484130859375, 30.44580078125, 31.407470703125, 32.369140625, 33.330810546875, 34.29248046875, 35.254150390625, 36.2158203125, 37.177490234375, 38.13916015625, 39.100830078125, 40.0625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 8.0, 7.0, 7.0, 22.0, 18.0, 42.0, 67.0, 144.0, 430.0, 997.0, 1362.0, 607.0, 198.0, 64.0, 41.0, 22.0, 15.0, 8.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.21875, -33.0869140625, -31.955078125, -30.8232421875, -29.69140625, -28.5595703125, -27.427734375, -26.2958984375, -25.1640625, -24.0322265625, -22.900390625, -21.7685546875, -20.63671875, -19.5048828125, -18.373046875, -17.2412109375, -16.109375, -14.9775390625, -13.845703125, -12.7138671875, -11.58203125, -10.4501953125, -9.318359375, -8.1865234375, -7.0546875, -5.9228515625, -4.791015625, -3.6591796875, -2.52734375, -1.3955078125, -0.263671875, 0.8681640625, 2.0, 3.1318359375, 4.263671875, 5.3955078125, 6.52734375, 7.6591796875, 8.791015625, 9.9228515625, 11.0546875, 12.1865234375, 13.318359375, 14.4501953125, 15.58203125, 16.7138671875, 17.845703125, 18.9775390625, 20.109375, 21.2412109375, 22.373046875, 23.5048828125, 24.63671875, 25.7685546875, 26.900390625, 28.0322265625, 29.1640625, 30.2958984375, 31.427734375, 32.5595703125, 33.69140625, 34.8232421875, 35.955078125, 37.0869140625, 38.21875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 10.0, 18.0, 76.0, 348.0, 399.0, 106.0, 18.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-390.8502197265625, -378.28790283203125, -365.7255859375, -353.16326904296875, -340.6009216308594, -328.0386047363281, -315.4762878417969, -302.9139709472656, -290.35162353515625, -277.789306640625, -265.22698974609375, -252.66465759277344, -240.10232543945312, -227.54000854492188, -214.97769165039062, -202.41537475585938, -189.85305786132812, -177.29074096679688, -164.72840881347656, -152.1660919189453, -139.603759765625, -127.04144287109375, -114.4791259765625, -101.91680145263672, -89.35447692871094, -76.79215240478516, -64.22982788085938, -51.667510986328125, -39.105186462402344, -26.542861938476562, -13.980545043945312, -1.4182205200195312, 11.144134521484375, 23.706457138061523, 36.26877975463867, 48.83110046386719, 61.39342498779297, 73.95574951171875, 86.51806640625, 99.08039093017578, 111.64271545410156, 124.20503997802734, 136.76736450195312, 149.32968139648438, 161.89199829101562, 174.45433044433594, 187.0166473388672, 199.5789794921875, 212.14129638671875, 224.70361328125, 237.2659454345703, 249.82826232910156, 262.3905944824219, 274.9529113769531, 287.5152282714844, 300.0775451660156, 312.639892578125, 325.20220947265625, 337.7645263671875, 350.32684326171875, 362.8891906738281, 375.4515075683594, 388.0138244628906, 400.5761413574219, 413.1384582519531]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 8.0, 14.0, 13.0, 30.0, 17.0, 36.0, 36.0, 79.0, 71.0, 83.0, 77.0, 95.0, 81.0, 84.0, 80.0, 46.0, 42.0, 35.0, 20.0, 15.0, 16.0, 7.0, 10.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.0839385986328, -241.26461791992188, -235.44529724121094, -229.6259765625, -223.80667114257812, -217.9873504638672, -212.16802978515625, -206.3487091064453, -200.52938842773438, -194.71006774902344, -188.8907470703125, -183.07144165039062, -177.2521209716797, -171.43280029296875, -165.6134796142578, -159.79415893554688, -153.974853515625, -148.15553283691406, -142.33621215820312, -136.51690673828125, -130.6975860595703, -124.87826538085938, -119.05894470214844, -113.2396240234375, -107.42030334472656, -101.60098266601562, -95.78166961669922, -89.96234893798828, -84.14302825927734, -78.32371520996094, -72.50439453125, -66.68507385253906, -60.865760803222656, -55.046443939208984, -49.22712326049805, -43.407806396484375, -37.58848571777344, -31.769168853759766, -25.949851989746094, -20.130531311035156, -14.311214447021484, -8.49189567565918, -2.6725778579711914, 3.146739959716797, 8.966058731079102, 14.785377502441406, 20.604694366455078, 26.424015045166016, 32.24333190917969, 38.06264877319336, 43.8819694519043, 49.70128631591797, 55.520606994628906, 61.33992385864258, 67.15924072265625, 72.97856140136719, 78.79788208007812, 84.61720275878906, 90.43651580810547, 96.2558364868164, 102.07515716552734, 107.89447021484375, 113.71379089355469, 119.53311157226562, 125.35242462158203]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 10.0, 9.0, 17.0, 14.0, 18.0, 22.0, 28.0, 50.0, 51.0, 75.0, 129.0, 185.0, 298.0, 513.0, 1167.0, 3099.0, 11483.0, 66380.0, 635630.0, 286480.0, 32044.0, 6679.0, 2105.0, 857.0, 439.0, 239.0, 158.0, 88.0, 68.0, 46.0, 42.0, 26.0, 17.0, 18.0, 12.0, 6.0, 12.0, 10.0, 6.0, 4.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-32.125, -31.04736328125, -29.9697265625, -28.89208984375, -27.814453125, -26.73681640625, -25.6591796875, -24.58154296875, -23.50390625, -22.42626953125, -21.3486328125, -20.27099609375, -19.193359375, -18.11572265625, -17.0380859375, -15.96044921875, -14.8828125, -13.80517578125, -12.7275390625, -11.64990234375, -10.572265625, -9.49462890625, -8.4169921875, -7.33935546875, -6.26171875, -5.18408203125, -4.1064453125, -3.02880859375, -1.951171875, -0.87353515625, 0.2041015625, 1.28173828125, 2.359375, 3.43701171875, 4.5146484375, 5.59228515625, 6.669921875, 7.74755859375, 8.8251953125, 9.90283203125, 10.98046875, 12.05810546875, 13.1357421875, 14.21337890625, 15.291015625, 16.36865234375, 17.4462890625, 18.52392578125, 19.6015625, 20.67919921875, 21.7568359375, 22.83447265625, 23.912109375, 24.98974609375, 26.0673828125, 27.14501953125, 28.22265625, 29.30029296875, 30.3779296875, 31.45556640625, 32.533203125, 33.61083984375, 34.6884765625, 35.76611328125, 36.84375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 6.0, 6.0, 12.0, 14.0, 10.0, 24.0, 31.0, 45.0, 60.0, 68.0, 73.0, 74.0, 86.0, 85.0, 77.0, 67.0, 70.0, 57.0, 33.0, 41.0, 20.0, 13.0, 10.0, 6.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.4453125, -13.9268798828125, -13.408447265625, -12.8900146484375, -12.37158203125, -11.8531494140625, -11.334716796875, -10.8162841796875, -10.2978515625, -9.7794189453125, -9.260986328125, -8.7425537109375, -8.22412109375, -7.7056884765625, -7.187255859375, -6.6688232421875, -6.150390625, -5.6319580078125, -5.113525390625, -4.5950927734375, -4.07666015625, -3.5582275390625, -3.039794921875, -2.5213623046875, -2.0029296875, -1.4844970703125, -0.966064453125, -0.4476318359375, 0.07080078125, 0.5892333984375, 1.107666015625, 1.6260986328125, 2.14453125, 2.6629638671875, 3.181396484375, 3.6998291015625, 4.21826171875, 4.7366943359375, 5.255126953125, 5.7735595703125, 6.2919921875, 6.8104248046875, 7.328857421875, 7.8472900390625, 8.36572265625, 8.8841552734375, 9.402587890625, 9.9210205078125, 10.439453125, 10.9578857421875, 11.476318359375, 11.9947509765625, 12.51318359375, 13.0316162109375, 13.550048828125, 14.0684814453125, 14.5869140625, 15.1053466796875, 15.623779296875, 16.1422119140625, 16.66064453125, 17.1790771484375, 17.697509765625, 18.2159423828125, 18.734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 4.0, 2.0, 0.0, 5.0, 7.0, 7.0, 16.0, 17.0, 20.0, 27.0, 41.0, 74.0, 91.0, 204.0, 393.0, 966.0, 2995.0, 20987.0, 964083.0, 51804.0, 4435.0, 1295.0, 492.0, 236.0, 113.0, 64.0, 45.0, 39.0, 25.0, 16.0, 14.0, 11.0, 4.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-90.0625, -87.21484375, -84.3671875, -81.51953125, -78.671875, -75.82421875, -72.9765625, -70.12890625, -67.28125, -64.43359375, -61.5859375, -58.73828125, -55.890625, -53.04296875, -50.1953125, -47.34765625, -44.5, -41.65234375, -38.8046875, -35.95703125, -33.109375, -30.26171875, -27.4140625, -24.56640625, -21.71875, -18.87109375, -16.0234375, -13.17578125, -10.328125, -7.48046875, -4.6328125, -1.78515625, 1.0625, 3.91015625, 6.7578125, 9.60546875, 12.453125, 15.30078125, 18.1484375, 20.99609375, 23.84375, 26.69140625, 29.5390625, 32.38671875, 35.234375, 38.08203125, 40.9296875, 43.77734375, 46.625, 49.47265625, 52.3203125, 55.16796875, 58.015625, 60.86328125, 63.7109375, 66.55859375, 69.40625, 72.25390625, 75.1015625, 77.94921875, 80.796875, 83.64453125, 86.4921875, 89.33984375, 92.1875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 14.0, 18.0, 26.0, 34.0, 45.0, 48.0, 60.0, 84.0, 94.0, 86.0, 83.0, 77.0, 72.0, 60.0, 42.0, 32.0, 28.0, 23.0, 11.0, 15.0, 6.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.5, -69.3671875, -67.234375, -65.1015625, -62.96875, -60.8359375, -58.703125, -56.5703125, -54.4375, -52.3046875, -50.171875, -48.0390625, -45.90625, -43.7734375, -41.640625, -39.5078125, -37.375, -35.2421875, -33.109375, -30.9765625, -28.84375, -26.7109375, -24.578125, -22.4453125, -20.3125, -18.1796875, -16.046875, -13.9140625, -11.78125, -9.6484375, -7.515625, -5.3828125, -3.25, -1.1171875, 1.015625, 3.1484375, 5.28125, 7.4140625, 9.546875, 11.6796875, 13.8125, 15.9453125, 18.078125, 20.2109375, 22.34375, 24.4765625, 26.609375, 28.7421875, 30.875, 33.0078125, 35.140625, 37.2734375, 39.40625, 41.5390625, 43.671875, 45.8046875, 47.9375, 50.0703125, 52.203125, 54.3359375, 56.46875, 58.6015625, 60.734375, 62.8671875, 65.0]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 10.0, 7.0, 14.0, 19.0, 22.0, 29.0, 35.0, 59.0, 91.0, 108.0, 211.0, 385.0, 920.0, 2598.0, 11814.0, 866088.0, 154510.0, 7954.0, 2044.0, 706.0, 306.0, 220.0, 104.0, 74.0, 54.0, 38.0, 34.0, 22.0, 8.0, 13.0, 8.0, 10.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.25, -29.30126953125, -28.3525390625, -27.40380859375, -26.455078125, -25.50634765625, -24.5576171875, -23.60888671875, -22.66015625, -21.71142578125, -20.7626953125, -19.81396484375, -18.865234375, -17.91650390625, -16.9677734375, -16.01904296875, -15.0703125, -14.12158203125, -13.1728515625, -12.22412109375, -11.275390625, -10.32666015625, -9.3779296875, -8.42919921875, -7.48046875, -6.53173828125, -5.5830078125, -4.63427734375, -3.685546875, -2.73681640625, -1.7880859375, -0.83935546875, 0.109375, 1.05810546875, 2.0068359375, 2.95556640625, 3.904296875, 4.85302734375, 5.8017578125, 6.75048828125, 7.69921875, 8.64794921875, 9.5966796875, 10.54541015625, 11.494140625, 12.44287109375, 13.3916015625, 14.34033203125, 15.2890625, 16.23779296875, 17.1865234375, 18.13525390625, 19.083984375, 20.03271484375, 20.9814453125, 21.93017578125, 22.87890625, 23.82763671875, 24.7763671875, 25.72509765625, 26.673828125, 27.62255859375, 28.5712890625, 29.52001953125, 30.46875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 5.0, 10.0, 22.0, 43.0, 69.0, 157.0, 351.0, 185.0, 57.0, 25.0, 16.0, 20.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.003997802734375, -0.003852665424346924, -0.0037075281143188477, -0.0035623908042907715, -0.0034172534942626953, -0.003272116184234619, -0.003126978874206543, -0.002981841564178467, -0.0028367042541503906, -0.0026915669441223145, -0.0025464296340942383, -0.002401292324066162, -0.002256155014038086, -0.0021110177040100098, -0.0019658803939819336, -0.0018207430839538574, -0.0016756057739257812, -0.001530468463897705, -0.001385331153869629, -0.0012401938438415527, -0.0010950565338134766, -0.0009499192237854004, -0.0008047819137573242, -0.000659644603729248, -0.0005145072937011719, -0.0003693699836730957, -0.00022423267364501953, -7.909536361694336e-05, 6.604194641113281e-05, 0.00021117925643920898, 0.00035631656646728516, 0.0005014538764953613, 0.0006465911865234375, 0.0007917284965515137, 0.0009368658065795898, 0.001082003116607666, 0.0012271404266357422, 0.0013722777366638184, 0.0015174150466918945, 0.0016625523567199707, 0.0018076896667480469, 0.001952826976776123, 0.0020979642868041992, 0.0022431015968322754, 0.0023882389068603516, 0.0025333762168884277, 0.002678513526916504, 0.00282365083694458, 0.0029687881469726562, 0.0031139254570007324, 0.0032590627670288086, 0.0034042000770568848, 0.003549337387084961, 0.003694474697113037, 0.0038396120071411133, 0.0039847493171691895, 0.004129886627197266, 0.004275023937225342, 0.004420161247253418, 0.004565298557281494, 0.00471043586730957, 0.0048555731773376465, 0.005000710487365723, 0.005145847797393799, 0.005290985107421875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 11.0, 22.0, 32.0, 58.0, 79.0, 132.0, 294.0, 648.0, 2993.0, 30300.0, 991404.0, 19266.0, 2120.0, 612.0, 230.0, 125.0, 77.0, 50.0, 32.0, 17.0, 13.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.375, -33.43115234375, -32.4873046875, -31.54345703125, -30.599609375, -29.65576171875, -28.7119140625, -27.76806640625, -26.82421875, -25.88037109375, -24.9365234375, -23.99267578125, -23.048828125, -22.10498046875, -21.1611328125, -20.21728515625, -19.2734375, -18.32958984375, -17.3857421875, -16.44189453125, -15.498046875, -14.55419921875, -13.6103515625, -12.66650390625, -11.72265625, -10.77880859375, -9.8349609375, -8.89111328125, -7.947265625, -7.00341796875, -6.0595703125, -5.11572265625, -4.171875, -3.22802734375, -2.2841796875, -1.34033203125, -0.396484375, 0.54736328125, 1.4912109375, 2.43505859375, 3.37890625, 4.32275390625, 5.2666015625, 6.21044921875, 7.154296875, 8.09814453125, 9.0419921875, 9.98583984375, 10.9296875, 11.87353515625, 12.8173828125, 13.76123046875, 14.705078125, 15.64892578125, 16.5927734375, 17.53662109375, 18.48046875, 19.42431640625, 20.3681640625, 21.31201171875, 22.255859375, 23.19970703125, 24.1435546875, 25.08740234375, 26.03125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 6.0, 6.0, 8.0, 4.0, 9.0, 13.0, 32.0, 69.0, 189.0, 315.0, 189.0, 72.0, 31.0, 11.0, 14.0, 5.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.078125, -21.39892578125, -20.7197265625, -20.04052734375, -19.361328125, -18.68212890625, -18.0029296875, -17.32373046875, -16.64453125, -15.96533203125, -15.2861328125, -14.60693359375, -13.927734375, -13.24853515625, -12.5693359375, -11.89013671875, -11.2109375, -10.53173828125, -9.8525390625, -9.17333984375, -8.494140625, -7.81494140625, -7.1357421875, -6.45654296875, -5.77734375, -5.09814453125, -4.4189453125, -3.73974609375, -3.060546875, -2.38134765625, -1.7021484375, -1.02294921875, -0.34375, 0.33544921875, 1.0146484375, 1.69384765625, 2.373046875, 3.05224609375, 3.7314453125, 4.41064453125, 5.08984375, 5.76904296875, 6.4482421875, 7.12744140625, 7.806640625, 8.48583984375, 9.1650390625, 9.84423828125, 10.5234375, 11.20263671875, 11.8818359375, 12.56103515625, 13.240234375, 13.91943359375, 14.5986328125, 15.27783203125, 15.95703125, 16.63623046875, 17.3154296875, 17.99462890625, 18.673828125, 19.35302734375, 20.0322265625, 20.71142578125, 21.390625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 9.0, 46.0, 340.0, 504.0, 66.0, 12.0, 3.0, 5.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-575.5166015625, -552.5615234375, -529.6063842773438, -506.65130615234375, -483.69622802734375, -460.7411193847656, -437.7860107421875, -414.8309326171875, -391.8758239746094, -368.92071533203125, -345.96563720703125, -323.0105285644531, -300.055419921875, -277.100341796875, -254.14523315429688, -231.1901397705078, -208.23504638671875, -185.2799530029297, -162.32485961914062, -139.3697509765625, -116.41465759277344, -93.45956420898438, -70.50445556640625, -47.54936218261719, -24.594268798828125, -1.6391716003417969, 21.31592559814453, 44.271026611328125, 67.22611999511719, 90.18121337890625, 113.13632202148438, 136.09141540527344, 159.0465087890625, 182.00160217285156, 204.95669555664062, 227.91180419921875, 250.8668975830078, 273.8219909667969, 296.777099609375, 319.732177734375, 342.6872863769531, 365.64239501953125, 388.59747314453125, 411.5525817871094, 434.5076904296875, 457.4627685546875, 480.4178771972656, 503.37298583984375, 526.3280639648438, 549.2831420898438, 572.23828125, 595.193359375, 618.1484375, 641.103515625, 664.0586547851562, 687.0137329101562, 709.9688720703125, 732.9239501953125, 755.8790893554688, 778.8341674804688, 801.7892456054688, 824.744384765625, 847.699462890625, 870.654541015625, 893.609619140625]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 8.0, 9.0, 15.0, 11.0, 22.0, 14.0, 20.0, 22.0, 34.0, 39.0, 48.0, 35.0, 55.0, 67.0, 81.0, 58.0, 83.0, 61.0, 41.0, 41.0, 34.0, 28.0, 32.0, 25.0, 25.0, 14.0, 17.0, 7.0, 9.0, 10.0, 6.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-167.3512420654297, -161.45753479003906, -155.5638427734375, -149.67013549804688, -143.7764434814453, -137.8827362060547, -131.98904418945312, -126.0953369140625, -120.2016372680664, -114.30793762207031, -108.41423797607422, -102.52053833007812, -96.6268310546875, -90.73313903808594, -84.83943176269531, -78.94573211669922, -73.05203247070312, -67.15833282470703, -61.26463317871094, -55.37092971801758, -49.477230072021484, -43.58353042602539, -37.68982696533203, -31.796127319335938, -25.902427673339844, -20.00872802734375, -14.115026473999023, -8.221324920654297, -2.327625274658203, 3.5660743713378906, 9.45977783203125, 15.353477478027344, 21.247177124023438, 27.14087677001953, 33.034576416015625, 38.928279876708984, 44.82197952270508, 50.71567916870117, 56.60938262939453, 62.503082275390625, 68.39678192138672, 74.29048156738281, 80.1841812133789, 86.077880859375, 91.97158813476562, 97.86528015136719, 103.75898742675781, 109.6526870727539, 115.54638671875, 121.4400863647461, 127.33378601074219, 133.2274932861328, 139.12118530273438, 145.014892578125, 150.90859985351562, 156.8022918701172, 162.69598388671875, 168.58969116210938, 174.48338317871094, 180.37709045410156, 186.27078247070312, 192.16448974609375, 198.05819702148438, 203.95188903808594, 209.84559631347656]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 6.0, 9.0, 23.0, 15.0, 25.0, 56.0, 102.0, 187.0, 695.0, 2310.0, 14514.0, 3124510.0, 1038999.0, 9751.0, 1955.0, 621.0, 225.0, 95.0, 64.0, 35.0, 23.0, 18.0, 6.0, 7.0, 6.0, 0.0, 6.0, 2.0, 0.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.21875, -43.80224609375, -42.3857421875, -40.96923828125, -39.552734375, -38.13623046875, -36.7197265625, -35.30322265625, -33.88671875, -32.47021484375, -31.0537109375, -29.63720703125, -28.220703125, -26.80419921875, -25.3876953125, -23.97119140625, -22.5546875, -21.13818359375, -19.7216796875, -18.30517578125, -16.888671875, -15.47216796875, -14.0556640625, -12.63916015625, -11.22265625, -9.80615234375, -8.3896484375, -6.97314453125, -5.556640625, -4.14013671875, -2.7236328125, -1.30712890625, 0.109375, 1.52587890625, 2.9423828125, 4.35888671875, 5.775390625, 7.19189453125, 8.6083984375, 10.02490234375, 11.44140625, 12.85791015625, 14.2744140625, 15.69091796875, 17.107421875, 18.52392578125, 19.9404296875, 21.35693359375, 22.7734375, 24.18994140625, 25.6064453125, 27.02294921875, 28.439453125, 29.85595703125, 31.2724609375, 32.68896484375, 34.10546875, 35.52197265625, 36.9384765625, 38.35498046875, 39.771484375, 41.18798828125, 42.6044921875, 44.02099609375, 45.4375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 16.0, 27.0, 66.0, 104.0, 135.0, 164.0, 163.0, 125.0, 100.0, 52.0, 28.0, 11.0, 6.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.65625, -31.6650390625, -30.673828125, -29.6826171875, -28.69140625, -27.7001953125, -26.708984375, -25.7177734375, -24.7265625, -23.7353515625, -22.744140625, -21.7529296875, -20.76171875, -19.7705078125, -18.779296875, -17.7880859375, -16.796875, -15.8056640625, -14.814453125, -13.8232421875, -12.83203125, -11.8408203125, -10.849609375, -9.8583984375, -8.8671875, -7.8759765625, -6.884765625, -5.8935546875, -4.90234375, -3.9111328125, -2.919921875, -1.9287109375, -0.9375, 0.0537109375, 1.044921875, 2.0361328125, 3.02734375, 4.0185546875, 5.009765625, 6.0009765625, 6.9921875, 7.9833984375, 8.974609375, 9.9658203125, 10.95703125, 11.9482421875, 12.939453125, 13.9306640625, 14.921875, 15.9130859375, 16.904296875, 17.8955078125, 18.88671875, 19.8779296875, 20.869140625, 21.8603515625, 22.8515625, 23.8427734375, 24.833984375, 25.8251953125, 26.81640625, 27.8076171875, 28.798828125, 29.7900390625, 30.78125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 0.0, 2.0, 6.0, 13.0, 15.0, 16.0, 39.0, 40.0, 98.0, 158.0, 254.0, 522.0, 992.0, 1838.0, 3879.0, 16746.0, 3936742.0, 221046.0, 7307.0, 2372.0, 1098.0, 522.0, 258.0, 108.0, 78.0, 52.0, 29.0, 21.0, 6.0, 12.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.46875, -37.87744140625, -36.2861328125, -34.69482421875, -33.103515625, -31.51220703125, -29.9208984375, -28.32958984375, -26.73828125, -25.14697265625, -23.5556640625, -21.96435546875, -20.373046875, -18.78173828125, -17.1904296875, -15.59912109375, -14.0078125, -12.41650390625, -10.8251953125, -9.23388671875, -7.642578125, -6.05126953125, -4.4599609375, -2.86865234375, -1.27734375, 0.31396484375, 1.9052734375, 3.49658203125, 5.087890625, 6.67919921875, 8.2705078125, 9.86181640625, 11.453125, 13.04443359375, 14.6357421875, 16.22705078125, 17.818359375, 19.40966796875, 21.0009765625, 22.59228515625, 24.18359375, 25.77490234375, 27.3662109375, 28.95751953125, 30.548828125, 32.14013671875, 33.7314453125, 35.32275390625, 36.9140625, 38.50537109375, 40.0966796875, 41.68798828125, 43.279296875, 44.87060546875, 46.4619140625, 48.05322265625, 49.64453125, 51.23583984375, 52.8271484375, 54.41845703125, 56.009765625, 57.60107421875, 59.1923828125, 60.78369140625, 62.375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 6.0, 8.0, 23.0, 32.0, 208.0, 1489.0, 1908.0, 271.0, 74.0, 19.0, 13.0, 7.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.0, -74.05810546875, -72.1162109375, -70.17431640625, -68.232421875, -66.29052734375, -64.3486328125, -62.40673828125, -60.46484375, -58.52294921875, -56.5810546875, -54.63916015625, -52.697265625, -50.75537109375, -48.8134765625, -46.87158203125, -44.9296875, -42.98779296875, -41.0458984375, -39.10400390625, -37.162109375, -35.22021484375, -33.2783203125, -31.33642578125, -29.39453125, -27.45263671875, -25.5107421875, -23.56884765625, -21.626953125, -19.68505859375, -17.7431640625, -15.80126953125, -13.859375, -11.91748046875, -9.9755859375, -8.03369140625, -6.091796875, -4.14990234375, -2.2080078125, -0.26611328125, 1.67578125, 3.61767578125, 5.5595703125, 7.50146484375, 9.443359375, 11.38525390625, 13.3271484375, 15.26904296875, 17.2109375, 19.15283203125, 21.0947265625, 23.03662109375, 24.978515625, 26.92041015625, 28.8623046875, 30.80419921875, 32.74609375, 34.68798828125, 36.6298828125, 38.57177734375, 40.513671875, 42.45556640625, 44.3974609375, 46.33935546875, 48.28125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 11.0, 11.0, 30.0, 267.0, 590.0, 60.0, 15.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-927.4464111328125, -908.6227416992188, -889.7991333007812, -870.9754638671875, -852.15185546875, -833.3281860351562, -814.5045166015625, -795.680908203125, -776.8572387695312, -758.0335693359375, -739.2099609375, -720.3862915039062, -701.5626220703125, -682.739013671875, -663.9153442382812, -645.0916748046875, -626.26806640625, -607.4443969726562, -588.6207885742188, -569.797119140625, -550.9735107421875, -532.1498413085938, -513.326171875, -494.5025329589844, -475.67889404296875, -456.8552551269531, -438.0316162109375, -419.20794677734375, -400.3843078613281, -381.5606689453125, -362.73699951171875, -343.9133605957031, -325.08966064453125, -306.2660217285156, -287.4423828125, -268.61871337890625, -249.79507446289062, -230.971435546875, -212.1477813720703, -193.32412719726562, -174.50048828125, -155.67684936523438, -136.8531951904297, -118.02954864501953, -99.20590209960938, -80.38225555419922, -61.55860900878906, -42.734954833984375, -23.91131591796875, -5.087669372558594, 13.735977172851562, 32.55962371826172, 51.383270263671875, 70.20691680908203, 89.03056335449219, 107.85421752929688, 126.6778564453125, 145.50149536132812, 164.3251495361328, 183.1488037109375, 201.97244262695312, 220.79608154296875, 239.61973571777344, 258.4433898925781, 277.26702880859375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 11.0, 26.0, 30.0, 78.0, 75.0, 130.0, 137.0, 133.0, 132.0, 101.0, 63.0, 40.0, 21.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-261.275390625, -252.9762725830078, -244.6771697998047, -236.3780517578125, -228.0789337158203, -219.77981567382812, -211.480712890625, -203.1815948486328, -194.88247680664062, -186.58335876464844, -178.2842559814453, -169.98513793945312, -161.68601989746094, -153.38690185546875, -145.08779907226562, -136.78868103027344, -128.4895782470703, -120.19046783447266, -111.89134979248047, -103.59223937988281, -95.29312133789062, -86.99401092529297, -78.69490051269531, -70.39578247070312, -62.09667205810547, -53.79755783081055, -45.498443603515625, -37.19933319091797, -28.900218963623047, -20.601104736328125, -12.301994323730469, -4.002880096435547, 4.296234130859375, 12.59534740447998, 20.894460678100586, 29.193572998046875, 37.4926872253418, 45.79180145263672, 54.090911865234375, 62.3900260925293, 70.68914031982422, 78.98825073242188, 87.28736877441406, 95.58647918701172, 103.88558959960938, 112.18470764160156, 120.48381805419922, 128.78292846679688, 137.08204650878906, 145.38116455078125, 153.68026733398438, 161.97938537597656, 170.27850341796875, 178.57760620117188, 186.87672424316406, 195.17584228515625, 203.47494506835938, 211.77406311035156, 220.0731658935547, 228.37228393554688, 236.67140197753906, 244.97052001953125, 253.26962280273438, 261.5687255859375, 269.86785888671875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 4.0, 4.0, 11.0, 13.0, 11.0, 16.0, 27.0, 53.0, 84.0, 168.0, 298.0, 552.0, 1579.0, 10603.0, 358202.0, 655853.0, 17634.0, 2075.0, 663.0, 277.0, 154.0, 90.0, 76.0, 24.0, 21.0, 15.0, 13.0, 16.0, 6.0, 2.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.0625, -44.75, -43.4375, -42.125, -40.8125, -39.5, -38.1875, -36.875, -35.5625, -34.25, -32.9375, -31.625, -30.3125, -29.0, -27.6875, -26.375, -25.0625, -23.75, -22.4375, -21.125, -19.8125, -18.5, -17.1875, -15.875, -14.5625, -13.25, -11.9375, -10.625, -9.3125, -8.0, -6.6875, -5.375, -4.0625, -2.75, -1.4375, -0.125, 1.1875, 2.5, 3.8125, 5.125, 6.4375, 7.75, 9.0625, 10.375, 11.6875, 13.0, 14.3125, 15.625, 16.9375, 18.25, 19.5625, 20.875, 22.1875, 23.5, 24.8125, 26.125, 27.4375, 28.75, 30.0625, 31.375, 32.6875, 34.0, 35.3125, 36.625, 37.9375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 7.0, 27.0, 35.0, 70.0, 106.0, 156.0, 142.0, 155.0, 124.0, 85.0, 49.0, 26.0, 13.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.046875, -26.104736328125, -25.16259765625, -24.220458984375, -23.2783203125, -22.336181640625, -21.39404296875, -20.451904296875, -19.509765625, -18.567626953125, -17.62548828125, -16.683349609375, -15.7412109375, -14.799072265625, -13.85693359375, -12.914794921875, -11.97265625, -11.030517578125, -10.08837890625, -9.146240234375, -8.2041015625, -7.261962890625, -6.31982421875, -5.377685546875, -4.435546875, -3.493408203125, -2.55126953125, -1.609130859375, -0.6669921875, 0.275146484375, 1.21728515625, 2.159423828125, 3.1015625, 4.043701171875, 4.98583984375, 5.927978515625, 6.8701171875, 7.812255859375, 8.75439453125, 9.696533203125, 10.638671875, 11.580810546875, 12.52294921875, 13.465087890625, 14.4072265625, 15.349365234375, 16.29150390625, 17.233642578125, 18.17578125, 19.117919921875, 20.06005859375, 21.002197265625, 21.9443359375, 22.886474609375, 23.82861328125, 24.770751953125, 25.712890625, 26.655029296875, 27.59716796875, 28.539306640625, 29.4814453125, 30.423583984375, 31.36572265625, 32.307861328125, 33.25]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 10.0, 7.0, 16.0, 26.0, 25.0, 50.0, 91.0, 169.0, 382.0, 1055.0, 4184.0, 32903.0, 704183.0, 283897.0, 17211.0, 2882.0, 785.0, 298.0, 160.0, 75.0, 51.0, 24.0, 23.0, 13.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.79736328125, -29.8603515625, -28.92333984375, -27.986328125, -27.04931640625, -26.1123046875, -25.17529296875, -24.23828125, -23.30126953125, -22.3642578125, -21.42724609375, -20.490234375, -19.55322265625, -18.6162109375, -17.67919921875, -16.7421875, -15.80517578125, -14.8681640625, -13.93115234375, -12.994140625, -12.05712890625, -11.1201171875, -10.18310546875, -9.24609375, -8.30908203125, -7.3720703125, -6.43505859375, -5.498046875, -4.56103515625, -3.6240234375, -2.68701171875, -1.75, -0.81298828125, 0.1240234375, 1.06103515625, 1.998046875, 2.93505859375, 3.8720703125, 4.80908203125, 5.74609375, 6.68310546875, 7.6201171875, 8.55712890625, 9.494140625, 10.43115234375, 11.3681640625, 12.30517578125, 13.2421875, 14.17919921875, 15.1162109375, 16.05322265625, 16.990234375, 17.92724609375, 18.8642578125, 19.80126953125, 20.73828125, 21.67529296875, 22.6123046875, 23.54931640625, 24.486328125, 25.42333984375, 26.3603515625, 27.29736328125, 28.234375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 11.0, 10.0, 19.0, 18.0, 17.0, 22.0, 31.0, 36.0, 34.0, 35.0, 55.0, 52.0, 52.0, 46.0, 58.0, 50.0, 54.0, 52.0, 48.0, 53.0, 38.0, 37.0, 31.0, 26.0, 17.0, 24.0, 11.0, 13.0, 9.0, 7.0, 8.0, 5.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.71875, -39.598876953125, -38.47900390625, -37.359130859375, -36.2392578125, -35.119384765625, -33.99951171875, -32.879638671875, -31.759765625, -30.639892578125, -29.52001953125, -28.400146484375, -27.2802734375, -26.160400390625, -25.04052734375, -23.920654296875, -22.80078125, -21.680908203125, -20.56103515625, -19.441162109375, -18.3212890625, -17.201416015625, -16.08154296875, -14.961669921875, -13.841796875, -12.721923828125, -11.60205078125, -10.482177734375, -9.3623046875, -8.242431640625, -7.12255859375, -6.002685546875, -4.8828125, -3.762939453125, -2.64306640625, -1.523193359375, -0.4033203125, 0.716552734375, 1.83642578125, 2.956298828125, 4.076171875, 5.196044921875, 6.31591796875, 7.435791015625, 8.5556640625, 9.675537109375, 10.79541015625, 11.915283203125, 13.03515625, 14.155029296875, 15.27490234375, 16.394775390625, 17.5146484375, 18.634521484375, 19.75439453125, 20.874267578125, 21.994140625, 23.114013671875, 24.23388671875, 25.353759765625, 26.4736328125, 27.593505859375, 28.71337890625, 29.833251953125, 30.953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 8.0, 7.0, 12.0, 19.0, 17.0, 38.0, 56.0, 81.0, 185.0, 443.0, 1053.0, 3716.0, 18730.0, 227191.0, 744782.0, 42864.0, 6448.0, 1676.0, 560.0, 272.0, 132.0, 75.0, 46.0, 28.0, 14.0, 21.0, 12.0, 8.0, 9.0, 5.0, 9.0, 7.0, 8.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.6640625, -6.443359375, -6.22265625, -6.001953125, -5.78125, -5.560546875, -5.33984375, -5.119140625, -4.8984375, -4.677734375, -4.45703125, -4.236328125, -4.015625, -3.794921875, -3.57421875, -3.353515625, -3.1328125, -2.912109375, -2.69140625, -2.470703125, -2.25, -2.029296875, -1.80859375, -1.587890625, -1.3671875, -1.146484375, -0.92578125, -0.705078125, -0.484375, -0.263671875, -0.04296875, 0.177734375, 0.3984375, 0.619140625, 0.83984375, 1.060546875, 1.28125, 1.501953125, 1.72265625, 1.943359375, 2.1640625, 2.384765625, 2.60546875, 2.826171875, 3.046875, 3.267578125, 3.48828125, 3.708984375, 3.9296875, 4.150390625, 4.37109375, 4.591796875, 4.8125, 5.033203125, 5.25390625, 5.474609375, 5.6953125, 5.916015625, 6.13671875, 6.357421875, 6.578125, 6.798828125, 7.01953125, 7.240234375, 7.4609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 11.0, 15.0, 22.0, 30.0, 30.0, 50.0, 65.0, 126.0, 146.0, 154.0, 115.0, 77.0, 44.0, 35.0, 18.0, 11.0, 8.0, 5.0, 9.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012359619140625, -0.0011984705924987793, -0.0011609792709350586, -0.0011234879493713379, -0.0010859966278076172, -0.0010485053062438965, -0.0010110139846801758, -0.0009735226631164551, -0.0009360313415527344, -0.0008985400199890137, -0.000861048698425293, -0.0008235573768615723, -0.0007860660552978516, -0.0007485747337341309, -0.0007110834121704102, -0.0006735920906066895, -0.0006361007690429688, -0.000598609447479248, -0.0005611181259155273, -0.0005236268043518066, -0.00048613548278808594, -0.00044864416122436523, -0.00041115283966064453, -0.00037366151809692383, -0.0003361701965332031, -0.0002986788749694824, -0.0002611875534057617, -0.00022369623184204102, -0.0001862049102783203, -0.0001487135887145996, -0.0001112222671508789, -7.37309455871582e-05, -3.62396240234375e-05, 1.2516975402832031e-06, 3.8743019104003906e-05, 7.623434066772461e-05, 0.00011372566223144531, 0.00015121698379516602, 0.00018870830535888672, 0.00022619962692260742, 0.0002636909484863281, 0.00030118227005004883, 0.00033867359161376953, 0.00037616491317749023, 0.00041365623474121094, 0.00045114755630493164, 0.0004886388778686523, 0.000526130199432373, 0.0005636215209960938, 0.0006011128425598145, 0.0006386041641235352, 0.0006760954856872559, 0.0007135868072509766, 0.0007510781288146973, 0.000788569450378418, 0.0008260607719421387, 0.0008635520935058594, 0.0009010434150695801, 0.0009385347366333008, 0.0009760260581970215, 0.0010135173797607422, 0.0010510087013244629, 0.0010885000228881836, 0.0011259913444519043, 0.001163482666015625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 8.0, 9.0, 11.0, 13.0, 32.0, 48.0, 87.0, 121.0, 273.0, 564.0, 1496.0, 4340.0, 18328.0, 201375.0, 760562.0, 48945.0, 8116.0, 2477.0, 908.0, 408.0, 166.0, 92.0, 49.0, 28.0, 24.0, 21.0, 10.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.37890625, -7.1500244140625, -6.921142578125, -6.6922607421875, -6.46337890625, -6.2344970703125, -6.005615234375, -5.7767333984375, -5.5478515625, -5.3189697265625, -5.090087890625, -4.8612060546875, -4.63232421875, -4.4034423828125, -4.174560546875, -3.9456787109375, -3.716796875, -3.4879150390625, -3.259033203125, -3.0301513671875, -2.80126953125, -2.5723876953125, -2.343505859375, -2.1146240234375, -1.8857421875, -1.6568603515625, -1.427978515625, -1.1990966796875, -0.97021484375, -0.7413330078125, -0.512451171875, -0.2835693359375, -0.0546875, 0.1741943359375, 0.403076171875, 0.6319580078125, 0.86083984375, 1.0897216796875, 1.318603515625, 1.5474853515625, 1.7763671875, 2.0052490234375, 2.234130859375, 2.4630126953125, 2.69189453125, 2.9207763671875, 3.149658203125, 3.3785400390625, 3.607421875, 3.8363037109375, 4.065185546875, 4.2940673828125, 4.52294921875, 4.7518310546875, 4.980712890625, 5.2095947265625, 5.4384765625, 5.6673583984375, 5.896240234375, 6.1251220703125, 6.35400390625, 6.5828857421875, 6.811767578125, 7.0406494140625, 7.26953125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 6.0, 7.0, 10.0, 18.0, 20.0, 33.0, 46.0, 71.0, 73.0, 107.0, 107.0, 116.0, 105.0, 70.0, 55.0, 39.0, 32.0, 28.0, 17.0, 8.0, 5.0, 5.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9375, -4.75408935546875, -4.5706787109375, -4.38726806640625, -4.203857421875, -4.02044677734375, -3.8370361328125, -3.65362548828125, -3.47021484375, -3.28680419921875, -3.1033935546875, -2.91998291015625, -2.736572265625, -2.55316162109375, -2.3697509765625, -2.18634033203125, -2.0029296875, -1.81951904296875, -1.6361083984375, -1.45269775390625, -1.269287109375, -1.08587646484375, -0.9024658203125, -0.71905517578125, -0.53564453125, -0.35223388671875, -0.1688232421875, 0.01458740234375, 0.197998046875, 0.38140869140625, 0.5648193359375, 0.74822998046875, 0.931640625, 1.11505126953125, 1.2984619140625, 1.48187255859375, 1.665283203125, 1.84869384765625, 2.0321044921875, 2.21551513671875, 2.39892578125, 2.58233642578125, 2.7657470703125, 2.94915771484375, 3.132568359375, 3.31597900390625, 3.4993896484375, 3.68280029296875, 3.8662109375, 4.04962158203125, 4.2330322265625, 4.41644287109375, 4.599853515625, 4.78326416015625, 4.9666748046875, 5.15008544921875, 5.33349609375, 5.51690673828125, 5.7003173828125, 5.88372802734375, 6.067138671875, 6.25054931640625, 6.4339599609375, 6.61737060546875, 6.80078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 12.0, 16.0, 149.0, 570.0, 197.0, 35.0, 10.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-261.16143798828125, -249.56187438964844, -237.96231079101562, -226.36276245117188, -214.76318359375, -203.16363525390625, -191.56407165527344, -179.96450805664062, -168.3649444580078, -156.765380859375, -145.1658172607422, -133.56625366210938, -121.9666976928711, -110.36713409423828, -98.767578125, -87.16801452636719, -75.56845092773438, -63.96888732910156, -52.369327545166016, -40.76976776123047, -29.170204162597656, -17.570640563964844, -5.9710845947265625, 5.62847900390625, 17.228042602539062, 28.827604293823242, 40.42716598510742, 52.02672576904297, 63.62628936767578, 75.2258529663086, 86.82540893554688, 98.42497253417969, 110.0245361328125, 121.62409973144531, 133.22366333007812, 144.82321166992188, 156.42279052734375, 168.0223388671875, 179.6219024658203, 191.22146606445312, 202.82102966308594, 214.42059326171875, 226.02015686035156, 237.61972045898438, 249.21926879882812, 260.81884765625, 272.41839599609375, 284.0179443359375, 295.6175231933594, 307.2170715332031, 318.816650390625, 330.41619873046875, 342.0157775878906, 353.6153259277344, 365.21490478515625, 376.814453125, 388.41400146484375, 400.0135498046875, 411.6131286621094, 423.2126770019531, 434.812255859375, 446.41180419921875, 458.0113525390625, 469.6109313964844, 481.21051025390625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 12.0, 14.0, 19.0, 15.0, 37.0, 38.0, 53.0, 51.0, 60.0, 92.0, 147.0, 113.0, 71.0, 45.0, 60.0, 37.0, 35.0, 24.0, 27.0, 14.0, 7.0, 15.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-184.95297241210938, -178.7249298095703, -172.4968719482422, -166.26882934570312, -160.04078674316406, -153.81272888183594, -147.58468627929688, -141.35662841796875, -135.1285858154297, -128.90054321289062, -122.67249298095703, -116.44444274902344, -110.21639251708984, -103.98834228515625, -97.76029968261719, -91.5322494506836, -85.30420684814453, -79.07615661621094, -72.84811401367188, -66.62006378173828, -60.39201354980469, -54.16396713256836, -47.93592071533203, -41.70787048339844, -35.47982406616211, -29.25177574157715, -23.023727416992188, -16.79568099975586, -10.567632675170898, -4.3395843505859375, 1.8884620666503906, 8.116512298583984, 14.344558715820312, 20.572607040405273, 26.800655364990234, 33.02870178222656, 39.256752014160156, 45.484798431396484, 51.71284484863281, 57.940895080566406, 64.1689453125, 70.3969955444336, 76.62503814697266, 82.85308837890625, 89.08113861083984, 95.30918884277344, 101.5372314453125, 107.7652816772461, 113.99332427978516, 120.22137451171875, 126.44941711425781, 132.67745971679688, 138.905517578125, 145.13356018066406, 151.36160278320312, 157.58966064453125, 163.8177032470703, 170.04574584960938, 176.2738037109375, 182.50184631347656, 188.72988891601562, 194.95794677734375, 201.1859893798828, 207.41403198242188, 213.64208984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 16.0, 20.0, 29.0, 48.0, 97.0, 151.0, 327.0, 620.0, 1386.0, 3357.0, 11404.0, 166375.0, 3812491.0, 184554.0, 9539.0, 2240.0, 846.0, 364.0, 184.0, 89.0, 38.0, 29.0, 21.0, 14.0, 7.0, 4.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.84375, -13.168701171875, -12.49365234375, -11.818603515625, -11.1435546875, -10.468505859375, -9.79345703125, -9.118408203125, -8.443359375, -7.768310546875, -7.09326171875, -6.418212890625, -5.7431640625, -5.068115234375, -4.39306640625, -3.718017578125, -3.04296875, -2.367919921875, -1.69287109375, -1.017822265625, -0.3427734375, 0.332275390625, 1.00732421875, 1.682373046875, 2.357421875, 3.032470703125, 3.70751953125, 4.382568359375, 5.0576171875, 5.732666015625, 6.40771484375, 7.082763671875, 7.7578125, 8.432861328125, 9.10791015625, 9.782958984375, 10.4580078125, 11.133056640625, 11.80810546875, 12.483154296875, 13.158203125, 13.833251953125, 14.50830078125, 15.183349609375, 15.8583984375, 16.533447265625, 17.20849609375, 17.883544921875, 18.55859375, 19.233642578125, 19.90869140625, 20.583740234375, 21.2587890625, 21.933837890625, 22.60888671875, 23.283935546875, 23.958984375, 24.634033203125, 25.30908203125, 25.984130859375, 26.6591796875, 27.334228515625, 28.00927734375, 28.684326171875, 29.359375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 10.0, 18.0, 48.0, 56.0, 90.0, 119.0, 125.0, 135.0, 120.0, 125.0, 75.0, 38.0, 18.0, 16.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5390625, -13.7840576171875, -13.029052734375, -12.2740478515625, -11.51904296875, -10.7640380859375, -10.009033203125, -9.2540283203125, -8.4990234375, -7.7440185546875, -6.989013671875, -6.2340087890625, -5.47900390625, -4.7239990234375, -3.968994140625, -3.2139892578125, -2.458984375, -1.7039794921875, -0.948974609375, -0.1939697265625, 0.56103515625, 1.3160400390625, 2.071044921875, 2.8260498046875, 3.5810546875, 4.3360595703125, 5.091064453125, 5.8460693359375, 6.60107421875, 7.3560791015625, 8.111083984375, 8.8660888671875, 9.62109375, 10.3760986328125, 11.131103515625, 11.8861083984375, 12.64111328125, 13.3961181640625, 14.151123046875, 14.9061279296875, 15.6611328125, 16.4161376953125, 17.171142578125, 17.9261474609375, 18.68115234375, 19.4361572265625, 20.191162109375, 20.9461669921875, 21.701171875, 22.4561767578125, 23.211181640625, 23.9661865234375, 24.72119140625, 25.4761962890625, 26.231201171875, 26.9862060546875, 27.7412109375, 28.4962158203125, 29.251220703125, 30.0062255859375, 30.76123046875, 31.5162353515625, 32.271240234375, 33.0262451171875, 33.78125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 3.0, 7.0, 10.0, 10.0, 19.0, 26.0, 31.0, 51.0, 103.0, 198.0, 564.0, 1861.0, 8956.0, 92127.0, 3744105.0, 325019.0, 16807.0, 2915.0, 849.0, 289.0, 114.0, 70.0, 42.0, 31.0, 24.0, 8.0, 8.0, 7.0, 11.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-22.671875, -22.08544921875, -21.4990234375, -20.91259765625, -20.326171875, -19.73974609375, -19.1533203125, -18.56689453125, -17.98046875, -17.39404296875, -16.8076171875, -16.22119140625, -15.634765625, -15.04833984375, -14.4619140625, -13.87548828125, -13.2890625, -12.70263671875, -12.1162109375, -11.52978515625, -10.943359375, -10.35693359375, -9.7705078125, -9.18408203125, -8.59765625, -8.01123046875, -7.4248046875, -6.83837890625, -6.251953125, -5.66552734375, -5.0791015625, -4.49267578125, -3.90625, -3.31982421875, -2.7333984375, -2.14697265625, -1.560546875, -0.97412109375, -0.3876953125, 0.19873046875, 0.78515625, 1.37158203125, 1.9580078125, 2.54443359375, 3.130859375, 3.71728515625, 4.3037109375, 4.89013671875, 5.4765625, 6.06298828125, 6.6494140625, 7.23583984375, 7.822265625, 8.40869140625, 8.9951171875, 9.58154296875, 10.16796875, 10.75439453125, 11.3408203125, 11.92724609375, 12.513671875, 13.10009765625, 13.6865234375, 14.27294921875, 14.859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 7.0, 6.0, 11.0, 9.0, 13.0, 15.0, 27.0, 40.0, 75.0, 174.0, 268.0, 494.0, 692.0, 792.0, 576.0, 363.0, 184.0, 102.0, 64.0, 41.0, 31.0, 20.0, 20.0, 15.0, 8.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2265625, -12.7896728515625, -12.352783203125, -11.9158935546875, -11.47900390625, -11.0421142578125, -10.605224609375, -10.1683349609375, -9.7314453125, -9.2945556640625, -8.857666015625, -8.4207763671875, -7.98388671875, -7.5469970703125, -7.110107421875, -6.6732177734375, -6.236328125, -5.7994384765625, -5.362548828125, -4.9256591796875, -4.48876953125, -4.0518798828125, -3.614990234375, -3.1781005859375, -2.7412109375, -2.3043212890625, -1.867431640625, -1.4305419921875, -0.99365234375, -0.5567626953125, -0.119873046875, 0.3170166015625, 0.75390625, 1.1907958984375, 1.627685546875, 2.0645751953125, 2.50146484375, 2.9383544921875, 3.375244140625, 3.8121337890625, 4.2490234375, 4.6859130859375, 5.122802734375, 5.5596923828125, 5.99658203125, 6.4334716796875, 6.870361328125, 7.3072509765625, 7.744140625, 8.1810302734375, 8.617919921875, 9.0548095703125, 9.49169921875, 9.9285888671875, 10.365478515625, 10.8023681640625, 11.2392578125, 11.6761474609375, 12.113037109375, 12.5499267578125, 12.98681640625, 13.4237060546875, 13.860595703125, 14.2974853515625, 14.734375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 11.0, 45.0, 310.0, 503.0, 114.0, 15.0, 11.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.47637939453125, -191.0307159423828, -181.58506774902344, -172.139404296875, -162.69375610351562, -153.2480926513672, -143.80242919921875, -134.35678100585938, -124.91112518310547, -115.46546936035156, -106.01981353759766, -96.57415771484375, -87.12849426269531, -77.68284606933594, -68.2371826171875, -58.791526794433594, -49.34587097167969, -39.90021514892578, -30.454557418823242, -21.008899688720703, -11.563243865966797, -2.1175880432128906, 7.328071594238281, 16.773727416992188, 26.219383239746094, 35.6650390625, 45.110694885253906, 54.55635452270508, 64.00201416015625, 73.44766235351562, 82.89332580566406, 92.33898162841797, 101.78463745117188, 111.23029327392578, 120.67594909667969, 130.12161254882812, 139.5672607421875, 149.01292419433594, 158.45858764648438, 167.90423583984375, 177.34988403320312, 186.79554748535156, 196.24119567871094, 205.68685913085938, 215.13250732421875, 224.5781707763672, 234.02383422851562, 243.469482421875, 252.91514587402344, 262.3608093261719, 271.80645751953125, 281.2521057128906, 290.6977844238281, 300.1434326171875, 309.5890808105469, 319.03472900390625, 328.48040771484375, 337.9260559082031, 347.3717346191406, 356.8173828125, 366.2630310058594, 375.70867919921875, 385.15435791015625, 394.6000061035156, 404.045654296875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 5.0, 7.0, 4.0, 8.0, 9.0, 15.0, 22.0, 18.0, 26.0, 31.0, 31.0, 42.0, 41.0, 44.0, 55.0, 47.0, 46.0, 50.0, 58.0, 48.0, 47.0, 54.0, 37.0, 37.0, 38.0, 40.0, 23.0, 16.0, 23.0, 27.0, 9.0, 14.0, 10.0, 3.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.53143310546875, -57.66530227661133, -55.79916763305664, -53.93303680419922, -52.06690216064453, -50.20077133178711, -48.33464050292969, -46.468505859375, -44.60237503051758, -42.736244201660156, -40.87010955810547, -39.00397872924805, -37.13784408569336, -35.27171325683594, -33.40557861328125, -31.539447784423828, -29.673315048217773, -27.80718231201172, -25.941049575805664, -24.07491683959961, -22.208786010742188, -20.342653274536133, -18.476520538330078, -16.610389709472656, -14.744256019592285, -12.87812328338623, -11.011991500854492, -9.145858764648438, -7.279726505279541, -5.4135942459106445, -3.54746150970459, -1.6813297271728516, 0.18480300903320312, 2.0509352684020996, 3.917067766189575, 5.783200263977051, 7.649332523345947, 9.515464782714844, 11.381597518920898, 13.247729301452637, 15.113862037658691, 16.97999382019043, 18.846126556396484, 20.71225929260254, 22.578392028808594, 24.444522857666016, 26.310657501220703, 28.176788330078125, 30.04292106628418, 31.909053802490234, 33.775184631347656, 35.641319274902344, 37.507450103759766, 39.37358093261719, 41.239715576171875, 43.1058464050293, 44.971981048583984, 46.838111877441406, 48.704246520996094, 50.570377349853516, 52.4365119934082, 54.302642822265625, 56.16877746582031, 58.034908294677734, 59.901039123535156]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 11.0, 8.0, 19.0, 18.0, 24.0, 42.0, 48.0, 84.0, 140.0, 254.0, 499.0, 1398.0, 6419.0, 87060.0, 872321.0, 72132.0, 5708.0, 1315.0, 450.0, 227.0, 128.0, 84.0, 55.0, 29.0, 13.0, 18.0, 13.0, 10.0, 8.0, 6.0, 3.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.765625, -27.718505859375, -26.67138671875, -25.624267578125, -24.5771484375, -23.530029296875, -22.48291015625, -21.435791015625, -20.388671875, -19.341552734375, -18.29443359375, -17.247314453125, -16.2001953125, -15.153076171875, -14.10595703125, -13.058837890625, -12.01171875, -10.964599609375, -9.91748046875, -8.870361328125, -7.8232421875, -6.776123046875, -5.72900390625, -4.681884765625, -3.634765625, -2.587646484375, -1.54052734375, -0.493408203125, 0.5537109375, 1.600830078125, 2.64794921875, 3.695068359375, 4.7421875, 5.789306640625, 6.83642578125, 7.883544921875, 8.9306640625, 9.977783203125, 11.02490234375, 12.072021484375, 13.119140625, 14.166259765625, 15.21337890625, 16.260498046875, 17.3076171875, 18.354736328125, 19.40185546875, 20.448974609375, 21.49609375, 22.543212890625, 23.59033203125, 24.637451171875, 25.6845703125, 26.731689453125, 27.77880859375, 28.825927734375, 29.873046875, 30.920166015625, 31.96728515625, 33.014404296875, 34.0615234375, 35.108642578125, 36.15576171875, 37.202880859375, 38.25]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 13.0, 25.0, 43.0, 48.0, 91.0, 119.0, 134.0, 143.0, 115.0, 101.0, 72.0, 52.0, 21.0, 13.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5625, -13.80615234375, -13.0498046875, -12.29345703125, -11.537109375, -10.78076171875, -10.0244140625, -9.26806640625, -8.51171875, -7.75537109375, -6.9990234375, -6.24267578125, -5.486328125, -4.72998046875, -3.9736328125, -3.21728515625, -2.4609375, -1.70458984375, -0.9482421875, -0.19189453125, 0.564453125, 1.32080078125, 2.0771484375, 2.83349609375, 3.58984375, 4.34619140625, 5.1025390625, 5.85888671875, 6.615234375, 7.37158203125, 8.1279296875, 8.88427734375, 9.640625, 10.39697265625, 11.1533203125, 11.90966796875, 12.666015625, 13.42236328125, 14.1787109375, 14.93505859375, 15.69140625, 16.44775390625, 17.2041015625, 17.96044921875, 18.716796875, 19.47314453125, 20.2294921875, 20.98583984375, 21.7421875, 22.49853515625, 23.2548828125, 24.01123046875, 24.767578125, 25.52392578125, 26.2802734375, 27.03662109375, 27.79296875, 28.54931640625, 29.3056640625, 30.06201171875, 30.818359375, 31.57470703125, 32.3310546875, 33.08740234375, 33.84375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 8.0, 8.0, 8.0, 1.0, 7.0, 8.0, 7.0, 17.0, 18.0, 29.0, 31.0, 47.0, 80.0, 118.0, 211.0, 501.0, 1365.0, 5417.0, 71528.0, 931744.0, 31546.0, 3783.0, 1083.0, 426.0, 206.0, 118.0, 75.0, 32.0, 30.0, 30.0, 17.0, 12.0, 11.0, 10.0, 6.0, 4.0, 5.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.125, -37.83740234375, -36.5498046875, -35.26220703125, -33.974609375, -32.68701171875, -31.3994140625, -30.11181640625, -28.82421875, -27.53662109375, -26.2490234375, -24.96142578125, -23.673828125, -22.38623046875, -21.0986328125, -19.81103515625, -18.5234375, -17.23583984375, -15.9482421875, -14.66064453125, -13.373046875, -12.08544921875, -10.7978515625, -9.51025390625, -8.22265625, -6.93505859375, -5.6474609375, -4.35986328125, -3.072265625, -1.78466796875, -0.4970703125, 0.79052734375, 2.078125, 3.36572265625, 4.6533203125, 5.94091796875, 7.228515625, 8.51611328125, 9.8037109375, 11.09130859375, 12.37890625, 13.66650390625, 14.9541015625, 16.24169921875, 17.529296875, 18.81689453125, 20.1044921875, 21.39208984375, 22.6796875, 23.96728515625, 25.2548828125, 26.54248046875, 27.830078125, 29.11767578125, 30.4052734375, 31.69287109375, 32.98046875, 34.26806640625, 35.5556640625, 36.84326171875, 38.130859375, 39.41845703125, 40.7060546875, 41.99365234375, 43.28125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 1.0, 6.0, 4.0, 10.0, 11.0, 11.0, 11.0, 16.0, 23.0, 29.0, 32.0, 42.0, 45.0, 41.0, 45.0, 70.0, 57.0, 52.0, 56.0, 49.0, 44.0, 50.0, 44.0, 37.0, 36.0, 28.0, 25.0, 22.0, 17.0, 15.0, 15.0, 14.0, 9.0, 8.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.0625, -33.9638671875, -32.865234375, -31.7666015625, -30.66796875, -29.5693359375, -28.470703125, -27.3720703125, -26.2734375, -25.1748046875, -24.076171875, -22.9775390625, -21.87890625, -20.7802734375, -19.681640625, -18.5830078125, -17.484375, -16.3857421875, -15.287109375, -14.1884765625, -13.08984375, -11.9912109375, -10.892578125, -9.7939453125, -8.6953125, -7.5966796875, -6.498046875, -5.3994140625, -4.30078125, -3.2021484375, -2.103515625, -1.0048828125, 0.09375, 1.1923828125, 2.291015625, 3.3896484375, 4.48828125, 5.5869140625, 6.685546875, 7.7841796875, 8.8828125, 9.9814453125, 11.080078125, 12.1787109375, 13.27734375, 14.3759765625, 15.474609375, 16.5732421875, 17.671875, 18.7705078125, 19.869140625, 20.9677734375, 22.06640625, 23.1650390625, 24.263671875, 25.3623046875, 26.4609375, 27.5595703125, 28.658203125, 29.7568359375, 30.85546875, 31.9541015625, 33.052734375, 34.1513671875, 35.25]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 4.0, 13.0, 9.0, 6.0, 15.0, 26.0, 25.0, 26.0, 57.0, 96.0, 163.0, 385.0, 926.0, 2693.0, 12179.0, 907826.0, 114416.0, 6597.0, 1755.0, 651.0, 268.0, 138.0, 84.0, 48.0, 39.0, 22.0, 22.0, 13.0, 14.0, 4.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-15.484375, -15.0638427734375, -14.643310546875, -14.2227783203125, -13.80224609375, -13.3817138671875, -12.961181640625, -12.5406494140625, -12.1201171875, -11.6995849609375, -11.279052734375, -10.8585205078125, -10.43798828125, -10.0174560546875, -9.596923828125, -9.1763916015625, -8.755859375, -8.3353271484375, -7.914794921875, -7.4942626953125, -7.07373046875, -6.6531982421875, -6.232666015625, -5.8121337890625, -5.3916015625, -4.9710693359375, -4.550537109375, -4.1300048828125, -3.70947265625, -3.2889404296875, -2.868408203125, -2.4478759765625, -2.02734375, -1.6068115234375, -1.186279296875, -0.7657470703125, -0.34521484375, 0.0753173828125, 0.495849609375, 0.9163818359375, 1.3369140625, 1.7574462890625, 2.177978515625, 2.5985107421875, 3.01904296875, 3.4395751953125, 3.860107421875, 4.2806396484375, 4.701171875, 5.1217041015625, 5.542236328125, 5.9627685546875, 6.38330078125, 6.8038330078125, 7.224365234375, 7.6448974609375, 8.0654296875, 8.4859619140625, 8.906494140625, 9.3270263671875, 9.74755859375, 10.1680908203125, 10.588623046875, 11.0091552734375, 11.4296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 8.0, 10.0, 21.0, 30.0, 78.0, 230.0, 338.0, 142.0, 61.0, 22.0, 19.0, 13.0, 6.0, 4.0, 5.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00201416015625, -0.0019429028034210205, -0.001871645450592041, -0.0018003880977630615, -0.001729130744934082, -0.0016578733921051025, -0.001586616039276123, -0.0015153586864471436, -0.001444101333618164, -0.0013728439807891846, -0.001301586627960205, -0.0012303292751312256, -0.001159071922302246, -0.0010878145694732666, -0.0010165572166442871, -0.0009452998638153076, -0.0008740425109863281, -0.0008027851581573486, -0.0007315278053283691, -0.0006602704524993896, -0.0005890130996704102, -0.0005177557468414307, -0.00044649839401245117, -0.0003752410411834717, -0.0003039836883544922, -0.0002327263355255127, -0.0001614689826965332, -9.021162986755371e-05, -1.895427703857422e-05, 5.2303075790405273e-05, 0.00012356042861938477, 0.00019481778144836426, 0.00026607513427734375, 0.00033733248710632324, 0.00040858983993530273, 0.0004798471927642822, 0.0005511045455932617, 0.0006223618984222412, 0.0006936192512512207, 0.0007648766040802002, 0.0008361339569091797, 0.0009073913097381592, 0.0009786486625671387, 0.0010499060153961182, 0.0011211633682250977, 0.0011924207210540771, 0.0012636780738830566, 0.0013349354267120361, 0.0014061927795410156, 0.0014774501323699951, 0.0015487074851989746, 0.001619964838027954, 0.0016912221908569336, 0.001762479543685913, 0.0018337368965148926, 0.001904994249343872, 0.0019762516021728516, 0.002047508955001831, 0.0021187663078308105, 0.00219002366065979, 0.0022612810134887695, 0.002332538366317749, 0.0024037957191467285, 0.002475053071975708, 0.0025463104248046875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 7.0, 6.0, 8.0, 8.0, 12.0, 15.0, 24.0, 16.0, 23.0, 38.0, 49.0, 99.0, 125.0, 224.0, 404.0, 768.0, 1477.0, 3584.0, 11454.0, 112349.0, 870315.0, 35550.0, 6906.0, 2552.0, 1133.0, 553.0, 286.0, 190.0, 113.0, 60.0, 48.0, 46.0, 27.0, 14.0, 19.0, 11.0, 10.0, 9.0, 7.0, 8.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.6015625, -7.3507080078125, -7.099853515625, -6.8489990234375, -6.59814453125, -6.3472900390625, -6.096435546875, -5.8455810546875, -5.5947265625, -5.3438720703125, -5.093017578125, -4.8421630859375, -4.59130859375, -4.3404541015625, -4.089599609375, -3.8387451171875, -3.587890625, -3.3370361328125, -3.086181640625, -2.8353271484375, -2.58447265625, -2.3336181640625, -2.082763671875, -1.8319091796875, -1.5810546875, -1.3302001953125, -1.079345703125, -0.8284912109375, -0.57763671875, -0.3267822265625, -0.075927734375, 0.1749267578125, 0.42578125, 0.6766357421875, 0.927490234375, 1.1783447265625, 1.42919921875, 1.6800537109375, 1.930908203125, 2.1817626953125, 2.4326171875, 2.6834716796875, 2.934326171875, 3.1851806640625, 3.43603515625, 3.6868896484375, 3.937744140625, 4.1885986328125, 4.439453125, 4.6903076171875, 4.941162109375, 5.1920166015625, 5.44287109375, 5.6937255859375, 5.944580078125, 6.1954345703125, 6.4462890625, 6.6971435546875, 6.947998046875, 7.1988525390625, 7.44970703125, 7.7005615234375, 7.951416015625, 8.2022705078125, 8.453125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 1.0, 0.0, 5.0, 2.0, 10.0, 36.0, 82.0, 358.0, 359.0, 92.0, 27.0, 13.0, 7.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.9619140625, -24.267578125, -23.5732421875, -22.87890625, -22.1845703125, -21.490234375, -20.7958984375, -20.1015625, -19.4072265625, -18.712890625, -18.0185546875, -17.32421875, -16.6298828125, -15.935546875, -15.2412109375, -14.546875, -13.8525390625, -13.158203125, -12.4638671875, -11.76953125, -11.0751953125, -10.380859375, -9.6865234375, -8.9921875, -8.2978515625, -7.603515625, -6.9091796875, -6.21484375, -5.5205078125, -4.826171875, -4.1318359375, -3.4375, -2.7431640625, -2.048828125, -1.3544921875, -0.66015625, 0.0341796875, 0.728515625, 1.4228515625, 2.1171875, 2.8115234375, 3.505859375, 4.2001953125, 4.89453125, 5.5888671875, 6.283203125, 6.9775390625, 7.671875, 8.3662109375, 9.060546875, 9.7548828125, 10.44921875, 11.1435546875, 11.837890625, 12.5322265625, 13.2265625, 13.9208984375, 14.615234375, 15.3095703125, 16.00390625, 16.6982421875, 17.392578125, 18.0869140625, 18.78125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 1.0, 10.0, 31.0, 78.0, 412.0, 355.0, 78.0, 12.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-403.9385070800781, -393.5765686035156, -383.2146301269531, -372.85272216796875, -362.49078369140625, -352.12884521484375, -341.76690673828125, -331.40496826171875, -321.0430603027344, -310.6811218261719, -300.3191833496094, -289.957275390625, -279.5953369140625, -269.2333984375, -258.8714599609375, -248.50953674316406, -238.14759826660156, -227.78565979003906, -217.42373657226562, -207.06179809570312, -196.6998748779297, -186.3379364013672, -175.97601318359375, -165.61407470703125, -155.25213623046875, -144.89019775390625, -134.5282745361328, -124.16633605957031, -113.80441284179688, -103.44247436523438, -93.0805435180664, -82.71861267089844, -72.356689453125, -61.99475860595703, -51.63282775878906, -41.27089309692383, -30.90896224975586, -20.54703140258789, -10.185096740722656, 0.1768341064453125, 10.538764953613281, 20.90069580078125, 31.26262855529785, 41.62456130981445, 51.98649215698242, 62.34842300415039, 72.71035766601562, 83.0722885131836, 93.43421936035156, 103.79615020751953, 114.1580810546875, 124.52001953125, 134.88194274902344, 145.24388122558594, 155.60580444335938, 165.96774291992188, 176.32968139648438, 186.69161987304688, 197.0535430908203, 207.4154815673828, 217.77740478515625, 228.13934326171875, 238.50128173828125, 248.8632049560547, 259.2251281738281]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 11.0, 11.0, 24.0, 26.0, 22.0, 25.0, 36.0, 37.0, 41.0, 52.0, 54.0, 141.0, 113.0, 84.0, 67.0, 39.0, 44.0, 34.0, 38.0, 26.0, 17.0, 10.0, 19.0, 10.0, 4.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.90231323242188, -174.29664611816406, -168.69097900390625, -163.08531188964844, -157.47964477539062, -151.8739776611328, -146.268310546875, -140.66265869140625, -135.05697631835938, -129.45130920410156, -123.84564208984375, -118.23997497558594, -112.63430786132812, -107.02864074707031, -101.42298126220703, -95.81731414794922, -90.21165466308594, -84.60598754882812, -79.00032043457031, -73.3946533203125, -67.78898620605469, -62.18332290649414, -56.577659606933594, -50.97199249267578, -45.36632537841797, -39.760658264160156, -34.154991149902344, -28.549327850341797, -22.943660736083984, -17.337993621826172, -11.732330322265625, -6.1266632080078125, -0.52099609375, 5.084670066833496, 10.690336227416992, 16.296001434326172, 21.901668548583984, 27.507335662841797, 33.112998962402344, 38.718666076660156, 44.32433319091797, 49.93000030517578, 55.535667419433594, 61.14133071899414, 66.74699401855469, 72.3526611328125, 77.95832824707031, 83.56399536132812, 89.16966247558594, 94.77532958984375, 100.38099670410156, 105.98666381835938, 111.59233093261719, 117.197998046875, 122.80365753173828, 128.40933227539062, 134.01498413085938, 139.6206512451172, 145.226318359375, 150.8319854736328, 156.43765258789062, 162.04331970214844, 167.64898681640625, 173.254638671875, 178.86032104492188]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 12.0, 10.0, 13.0, 3.0, 21.0, 25.0, 50.0, 76.0, 130.0, 158.0, 308.0, 464.0, 800.0, 1334.0, 2605.0, 6486.0, 24880.0, 290221.0, 3248684.0, 576112.0, 31850.0, 6115.0, 2075.0, 789.0, 428.0, 233.0, 116.0, 81.0, 58.0, 46.0, 21.0, 22.0, 6.0, 13.0, 5.0, 6.0, 9.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.390625, -13.9351806640625, -13.479736328125, -13.0242919921875, -12.56884765625, -12.1134033203125, -11.657958984375, -11.2025146484375, -10.7470703125, -10.2916259765625, -9.836181640625, -9.3807373046875, -8.92529296875, -8.4698486328125, -8.014404296875, -7.5589599609375, -7.103515625, -6.6480712890625, -6.192626953125, -5.7371826171875, -5.28173828125, -4.8262939453125, -4.370849609375, -3.9154052734375, -3.4599609375, -3.0045166015625, -2.549072265625, -2.0936279296875, -1.63818359375, -1.1827392578125, -0.727294921875, -0.2718505859375, 0.18359375, 0.6390380859375, 1.094482421875, 1.5499267578125, 2.00537109375, 2.4608154296875, 2.916259765625, 3.3717041015625, 3.8271484375, 4.2825927734375, 4.738037109375, 5.1934814453125, 5.64892578125, 6.1043701171875, 6.559814453125, 7.0152587890625, 7.470703125, 7.9261474609375, 8.381591796875, 8.8370361328125, 9.29248046875, 9.7479248046875, 10.203369140625, 10.6588134765625, 11.1142578125, 11.5697021484375, 12.025146484375, 12.4805908203125, 12.93603515625, 13.3914794921875, 13.846923828125, 14.3023681640625, 14.7578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 11.0, 23.0, 34.0, 44.0, 54.0, 95.0, 104.0, 96.0, 105.0, 119.0, 105.0, 61.0, 49.0, 47.0, 23.0, 12.0, 11.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.5546875, -11.9388427734375, -11.322998046875, -10.7071533203125, -10.09130859375, -9.4754638671875, -8.859619140625, -8.2437744140625, -7.6279296875, -7.0120849609375, -6.396240234375, -5.7803955078125, -5.16455078125, -4.5487060546875, -3.932861328125, -3.3170166015625, -2.701171875, -2.0853271484375, -1.469482421875, -0.8536376953125, -0.23779296875, 0.3780517578125, 0.993896484375, 1.6097412109375, 2.2255859375, 2.8414306640625, 3.457275390625, 4.0731201171875, 4.68896484375, 5.3048095703125, 5.920654296875, 6.5364990234375, 7.15234375, 7.7681884765625, 8.384033203125, 8.9998779296875, 9.61572265625, 10.2315673828125, 10.847412109375, 11.4632568359375, 12.0791015625, 12.6949462890625, 13.310791015625, 13.9266357421875, 14.54248046875, 15.1583251953125, 15.774169921875, 16.3900146484375, 17.005859375, 17.6217041015625, 18.237548828125, 18.8533935546875, 19.46923828125, 20.0850830078125, 20.700927734375, 21.3167724609375, 21.9326171875, 22.5484619140625, 23.164306640625, 23.7801513671875, 24.39599609375, 25.0118408203125, 25.627685546875, 26.2435302734375, 26.859375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 6.0, 13.0, 6.0, 17.0, 24.0, 22.0, 59.0, 78.0, 164.0, 328.0, 892.0, 3734.0, 20887.0, 610998.0, 3483403.0, 63503.0, 7290.0, 1787.0, 482.0, 235.0, 116.0, 74.0, 37.0, 31.0, 26.0, 18.0, 7.0, 11.0, 5.0, 8.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.4375, -19.857177734375, -19.27685546875, -18.696533203125, -18.1162109375, -17.535888671875, -16.95556640625, -16.375244140625, -15.794921875, -15.214599609375, -14.63427734375, -14.053955078125, -13.4736328125, -12.893310546875, -12.31298828125, -11.732666015625, -11.15234375, -10.572021484375, -9.99169921875, -9.411376953125, -8.8310546875, -8.250732421875, -7.67041015625, -7.090087890625, -6.509765625, -5.929443359375, -5.34912109375, -4.768798828125, -4.1884765625, -3.608154296875, -3.02783203125, -2.447509765625, -1.8671875, -1.286865234375, -0.70654296875, -0.126220703125, 0.4541015625, 1.034423828125, 1.61474609375, 2.195068359375, 2.775390625, 3.355712890625, 3.93603515625, 4.516357421875, 5.0966796875, 5.677001953125, 6.25732421875, 6.837646484375, 7.41796875, 7.998291015625, 8.57861328125, 9.158935546875, 9.7392578125, 10.319580078125, 10.89990234375, 11.480224609375, 12.060546875, 12.640869140625, 13.22119140625, 13.801513671875, 14.3818359375, 14.962158203125, 15.54248046875, 16.122802734375, 16.703125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 7.0, 5.0, 19.0, 17.0, 31.0, 40.0, 72.0, 105.0, 213.0, 387.0, 662.0, 827.0, 645.0, 456.0, 240.0, 117.0, 72.0, 39.0, 29.0, 23.0, 16.0, 12.0, 5.0, 9.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-19.25, -18.7645263671875, -18.279052734375, -17.7935791015625, -17.30810546875, -16.8226318359375, -16.337158203125, -15.8516845703125, -15.3662109375, -14.8807373046875, -14.395263671875, -13.9097900390625, -13.42431640625, -12.9388427734375, -12.453369140625, -11.9678955078125, -11.482421875, -10.9969482421875, -10.511474609375, -10.0260009765625, -9.54052734375, -9.0550537109375, -8.569580078125, -8.0841064453125, -7.5986328125, -7.1131591796875, -6.627685546875, -6.1422119140625, -5.65673828125, -5.1712646484375, -4.685791015625, -4.2003173828125, -3.71484375, -3.2293701171875, -2.743896484375, -2.2584228515625, -1.77294921875, -1.2874755859375, -0.802001953125, -0.3165283203125, 0.1689453125, 0.6544189453125, 1.139892578125, 1.6253662109375, 2.11083984375, 2.5963134765625, 3.081787109375, 3.5672607421875, 4.052734375, 4.5382080078125, 5.023681640625, 5.5091552734375, 5.99462890625, 6.4801025390625, 6.965576171875, 7.4510498046875, 7.9365234375, 8.4219970703125, 8.907470703125, 9.3929443359375, 9.87841796875, 10.3638916015625, 10.849365234375, 11.3348388671875, 11.8203125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 8.0, 7.0, 15.0, 34.0, 70.0, 129.0, 180.0, 209.0, 162.0, 86.0, 35.0, 23.0, 15.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-134.03045654296875, -130.5371856689453, -127.04390716552734, -123.5506362915039, -120.05736541748047, -116.5640869140625, -113.07081604003906, -109.57754516601562, -106.08427429199219, -102.59100341796875, -99.09772491455078, -95.60445404052734, -92.1111831665039, -88.61790466308594, -85.1246337890625, -81.63136291503906, -78.13809204101562, -74.64482116699219, -71.15154266357422, -67.65827178955078, -64.16500091552734, -60.67172622680664, -57.17845153808594, -53.6851806640625, -50.19190216064453, -46.69862747192383, -43.20535659790039, -39.71208190917969, -36.21881103515625, -32.72553634643555, -29.232263565063477, -25.738990783691406, -22.24571990966797, -18.7524471282959, -15.259174346923828, -11.765900611877441, -8.272627830505371, -4.779354095458984, -1.286081314086914, 2.2071914672851562, 5.700464248657227, 9.193737030029297, 12.687009811401367, 16.180282592773438, 19.67355728149414, 23.16683006286621, 26.66010284423828, 30.15337562561035, 33.64664840698242, 37.139923095703125, 40.63319396972656, 44.126468658447266, 47.6197395324707, 51.113014221191406, 54.606285095214844, 58.09955978393555, 61.59283447265625, 65.08610534667969, 68.57938385009766, 72.0726547241211, 75.56592559814453, 79.0592041015625, 82.55247497558594, 86.04574584960938, 89.53901672363281]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 9.0, 13.0, 9.0, 10.0, 12.0, 13.0, 21.0, 22.0, 22.0, 33.0, 32.0, 37.0, 36.0, 28.0, 29.0, 53.0, 41.0, 41.0, 35.0, 57.0, 37.0, 46.0, 41.0, 36.0, 39.0, 32.0, 36.0, 26.0, 25.0, 23.0, 16.0, 18.0, 7.0, 9.0, 14.0, 6.0, 8.0, 6.0, 5.0, 2.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0], "bins": [-53.862239837646484, -52.25047302246094, -50.63870620727539, -49.026939392089844, -47.41516876220703, -45.80340576171875, -44.19163513183594, -42.57986831665039, -40.968101501464844, -39.3563346862793, -37.74456787109375, -36.1328010559082, -34.521034240722656, -32.909263610839844, -31.297496795654297, -29.68572998046875, -28.073963165283203, -26.462196350097656, -24.85042953491211, -23.23866081237793, -21.626893997192383, -20.015127182006836, -18.403358459472656, -16.79159164428711, -15.179824829101562, -13.568058013916016, -11.956290245056152, -10.344522476196289, -8.732755661010742, -7.120988845825195, -5.509221076965332, -3.8974533081054688, -2.2856826782226562, -0.6739153861999512, 0.9378519058227539, 2.549619197845459, 4.161386489868164, 5.773153305053711, 7.384921073913574, 8.996688842773438, 10.608455657958984, 12.220222473144531, 13.831990242004395, 15.443758010864258, 17.055524826049805, 18.66729164123535, 20.27906036376953, 21.890827178955078, 23.502593994140625, 25.114360809326172, 26.72612762451172, 28.3378963470459, 29.949663162231445, 31.561429977416992, 33.17319869995117, 34.78496551513672, 36.396732330322266, 38.00849914550781, 39.62026596069336, 41.232032775878906, 42.84380340576172, 44.45556640625, 46.06733703613281, 47.67910385131836, 49.290870666503906]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 10.0, 16.0, 19.0, 29.0, 51.0, 106.0, 175.0, 310.0, 798.0, 2921.0, 23544.0, 610054.0, 390748.0, 16206.0, 2256.0, 652.0, 264.0, 156.0, 69.0, 56.0, 41.0, 25.0, 11.0, 12.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.75, -37.60791015625, -36.4658203125, -35.32373046875, -34.181640625, -33.03955078125, -31.8974609375, -30.75537109375, -29.61328125, -28.47119140625, -27.3291015625, -26.18701171875, -25.044921875, -23.90283203125, -22.7607421875, -21.61865234375, -20.4765625, -19.33447265625, -18.1923828125, -17.05029296875, -15.908203125, -14.76611328125, -13.6240234375, -12.48193359375, -11.33984375, -10.19775390625, -9.0556640625, -7.91357421875, -6.771484375, -5.62939453125, -4.4873046875, -3.34521484375, -2.203125, -1.06103515625, 0.0810546875, 1.22314453125, 2.365234375, 3.50732421875, 4.6494140625, 5.79150390625, 6.93359375, 8.07568359375, 9.2177734375, 10.35986328125, 11.501953125, 12.64404296875, 13.7861328125, 14.92822265625, 16.0703125, 17.21240234375, 18.3544921875, 19.49658203125, 20.638671875, 21.78076171875, 22.9228515625, 24.06494140625, 25.20703125, 26.34912109375, 27.4912109375, 28.63330078125, 29.775390625, 30.91748046875, 32.0595703125, 33.20166015625, 34.34375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 15.0, 23.0, 35.0, 37.0, 68.0, 72.0, 104.0, 113.0, 106.0, 114.0, 95.0, 69.0, 43.0, 51.0, 29.0, 14.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.5546875, -11.9388427734375, -11.322998046875, -10.7071533203125, -10.09130859375, -9.4754638671875, -8.859619140625, -8.2437744140625, -7.6279296875, -7.0120849609375, -6.396240234375, -5.7803955078125, -5.16455078125, -4.5487060546875, -3.932861328125, -3.3170166015625, -2.701171875, -2.0853271484375, -1.469482421875, -0.8536376953125, -0.23779296875, 0.3780517578125, 0.993896484375, 1.6097412109375, 2.2255859375, 2.8414306640625, 3.457275390625, 4.0731201171875, 4.68896484375, 5.3048095703125, 5.920654296875, 6.5364990234375, 7.15234375, 7.7681884765625, 8.384033203125, 8.9998779296875, 9.61572265625, 10.2315673828125, 10.847412109375, 11.4632568359375, 12.0791015625, 12.6949462890625, 13.310791015625, 13.9266357421875, 14.54248046875, 15.1583251953125, 15.774169921875, 16.3900146484375, 17.005859375, 17.6217041015625, 18.237548828125, 18.8533935546875, 19.46923828125, 20.0850830078125, 20.700927734375, 21.3167724609375, 21.9326171875, 22.5484619140625, 23.164306640625, 23.7801513671875, 24.39599609375, 25.0118408203125, 25.627685546875, 26.2435302734375, 26.859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 15.0, 4.0, 6.0, 15.0, 21.0, 27.0, 32.0, 24.0, 32.0, 46.0, 79.0, 132.0, 162.0, 325.0, 504.0, 885.0, 1914.0, 4653.0, 19236.0, 256342.0, 724006.0, 29251.0, 5977.0, 2158.0, 1079.0, 579.0, 360.0, 231.0, 143.0, 77.0, 75.0, 44.0, 23.0, 24.0, 15.0, 9.0, 6.0, 9.0, 6.0, 8.0, 1.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-26.9375, -26.071533203125, -25.20556640625, -24.339599609375, -23.4736328125, -22.607666015625, -21.74169921875, -20.875732421875, -20.009765625, -19.143798828125, -18.27783203125, -17.411865234375, -16.5458984375, -15.679931640625, -14.81396484375, -13.947998046875, -13.08203125, -12.216064453125, -11.35009765625, -10.484130859375, -9.6181640625, -8.752197265625, -7.88623046875, -7.020263671875, -6.154296875, -5.288330078125, -4.42236328125, -3.556396484375, -2.6904296875, -1.824462890625, -0.95849609375, -0.092529296875, 0.7734375, 1.639404296875, 2.50537109375, 3.371337890625, 4.2373046875, 5.103271484375, 5.96923828125, 6.835205078125, 7.701171875, 8.567138671875, 9.43310546875, 10.299072265625, 11.1650390625, 12.031005859375, 12.89697265625, 13.762939453125, 14.62890625, 15.494873046875, 16.36083984375, 17.226806640625, 18.0927734375, 18.958740234375, 19.82470703125, 20.690673828125, 21.556640625, 22.422607421875, 23.28857421875, 24.154541015625, 25.0205078125, 25.886474609375, 26.75244140625, 27.618408203125, 28.484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 19.0, 11.0, 31.0, 29.0, 52.0, 73.0, 95.0, 94.0, 128.0, 94.0, 87.0, 77.0, 70.0, 44.0, 22.0, 19.0, 19.0, 7.0, 9.0, 8.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.375, -63.3125, -61.25, -59.1875, -57.125, -55.0625, -53.0, -50.9375, -48.875, -46.8125, -44.75, -42.6875, -40.625, -38.5625, -36.5, -34.4375, -32.375, -30.3125, -28.25, -26.1875, -24.125, -22.0625, -20.0, -17.9375, -15.875, -13.8125, -11.75, -9.6875, -7.625, -5.5625, -3.5, -1.4375, 0.625, 2.6875, 4.75, 6.8125, 8.875, 10.9375, 13.0, 15.0625, 17.125, 19.1875, 21.25, 23.3125, 25.375, 27.4375, 29.5, 31.5625, 33.625, 35.6875, 37.75, 39.8125, 41.875, 43.9375, 46.0, 48.0625, 50.125, 52.1875, 54.25, 56.3125, 58.375, 60.4375, 62.5, 64.5625, 66.625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 4.0, 15.0, 16.0, 13.0, 28.0, 44.0, 59.0, 65.0, 123.0, 199.0, 411.0, 945.0, 2899.0, 10773.0, 909701.0, 113041.0, 6558.0, 2097.0, 754.0, 301.0, 178.0, 112.0, 65.0, 35.0, 34.0, 20.0, 11.0, 11.0, 8.0, 8.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6875, -12.276123046875, -11.86474609375, -11.453369140625, -11.0419921875, -10.630615234375, -10.21923828125, -9.807861328125, -9.396484375, -8.985107421875, -8.57373046875, -8.162353515625, -7.7509765625, -7.339599609375, -6.92822265625, -6.516845703125, -6.10546875, -5.694091796875, -5.28271484375, -4.871337890625, -4.4599609375, -4.048583984375, -3.63720703125, -3.225830078125, -2.814453125, -2.403076171875, -1.99169921875, -1.580322265625, -1.1689453125, -0.757568359375, -0.34619140625, 0.065185546875, 0.4765625, 0.887939453125, 1.29931640625, 1.710693359375, 2.1220703125, 2.533447265625, 2.94482421875, 3.356201171875, 3.767578125, 4.178955078125, 4.59033203125, 5.001708984375, 5.4130859375, 5.824462890625, 6.23583984375, 6.647216796875, 7.05859375, 7.469970703125, 7.88134765625, 8.292724609375, 8.7041015625, 9.115478515625, 9.52685546875, 9.938232421875, 10.349609375, 10.760986328125, 11.17236328125, 11.583740234375, 11.9951171875, 12.406494140625, 12.81787109375, 13.229248046875, 13.640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 6.0, 14.0, 19.0, 33.0, 78.0, 206.0, 323.0, 140.0, 62.0, 32.0, 15.0, 12.0, 14.0, 3.0, 7.0, 4.0, 3.0, 0.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026149749755859375, -0.0025449544191360474, -0.0024749338626861572, -0.002404913306236267, -0.002334892749786377, -0.002264872193336487, -0.0021948516368865967, -0.0021248310804367065, -0.0020548105239868164, -0.0019847899675369263, -0.0019147694110870361, -0.001844748854637146, -0.0017747282981872559, -0.0017047077417373657, -0.0016346871852874756, -0.0015646666288375854, -0.0014946460723876953, -0.0014246255159378052, -0.001354604959487915, -0.001284584403038025, -0.0012145638465881348, -0.0011445432901382446, -0.0010745227336883545, -0.0010045021772384644, -0.0009344816207885742, -0.0008644610643386841, -0.0007944405078887939, -0.0007244199514389038, -0.0006543993949890137, -0.0005843788385391235, -0.0005143582820892334, -0.00044433772563934326, -0.0003743171691894531, -0.000304296612739563, -0.00023427605628967285, -0.00016425549983978271, -9.423494338989258e-05, -2.421438694000244e-05, 4.5806169509887695e-05, 0.00011582672595977783, 0.00018584728240966797, 0.0002558678388595581, 0.00032588839530944824, 0.0003959089517593384, 0.0004659295082092285, 0.0005359500646591187, 0.0006059706211090088, 0.0006759911775588989, 0.0007460117340087891, 0.0008160322904586792, 0.0008860528469085693, 0.0009560734033584595, 0.0010260939598083496, 0.0010961145162582397, 0.0011661350727081299, 0.00123615562915802, 0.0013061761856079102, 0.0013761967420578003, 0.0014462172985076904, 0.0015162378549575806, 0.0015862584114074707, 0.0016562789678573608, 0.001726299524307251, 0.0017963200807571411, 0.0018663406372070312]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 0.0, 9.0, 3.0, 9.0, 10.0, 11.0, 14.0, 16.0, 23.0, 39.0, 45.0, 63.0, 107.0, 158.0, 252.0, 439.0, 896.0, 1983.0, 5036.0, 18330.0, 798459.0, 203342.0, 12015.0, 3786.0, 1644.0, 736.0, 378.0, 234.0, 141.0, 84.0, 57.0, 47.0, 41.0, 36.0, 27.0, 24.0, 13.0, 12.0, 10.0, 3.0, 3.0, 2.0, 3.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.359375, -8.1051025390625, -7.850830078125, -7.5965576171875, -7.34228515625, -7.0880126953125, -6.833740234375, -6.5794677734375, -6.3251953125, -6.0709228515625, -5.816650390625, -5.5623779296875, -5.30810546875, -5.0538330078125, -4.799560546875, -4.5452880859375, -4.291015625, -4.0367431640625, -3.782470703125, -3.5281982421875, -3.27392578125, -3.0196533203125, -2.765380859375, -2.5111083984375, -2.2568359375, -2.0025634765625, -1.748291015625, -1.4940185546875, -1.23974609375, -0.9854736328125, -0.731201171875, -0.4769287109375, -0.22265625, 0.0316162109375, 0.285888671875, 0.5401611328125, 0.79443359375, 1.0487060546875, 1.302978515625, 1.5572509765625, 1.8115234375, 2.0657958984375, 2.320068359375, 2.5743408203125, 2.82861328125, 3.0828857421875, 3.337158203125, 3.5914306640625, 3.845703125, 4.0999755859375, 4.354248046875, 4.6085205078125, 4.86279296875, 5.1170654296875, 5.371337890625, 5.6256103515625, 5.8798828125, 6.1341552734375, 6.388427734375, 6.6427001953125, 6.89697265625, 7.1512451171875, 7.405517578125, 7.6597900390625, 7.9140625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 9.0, 7.0, 10.0, 14.0, 19.0, 41.0, 54.0, 86.0, 160.0, 169.0, 131.0, 93.0, 59.0, 36.0, 33.0, 18.0, 14.0, 14.0, 10.0, 7.0, 5.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.109375, -4.892822265625, -4.67626953125, -4.459716796875, -4.2431640625, -4.026611328125, -3.81005859375, -3.593505859375, -3.376953125, -3.160400390625, -2.94384765625, -2.727294921875, -2.5107421875, -2.294189453125, -2.07763671875, -1.861083984375, -1.64453125, -1.427978515625, -1.21142578125, -0.994873046875, -0.7783203125, -0.561767578125, -0.34521484375, -0.128662109375, 0.087890625, 0.304443359375, 0.52099609375, 0.737548828125, 0.9541015625, 1.170654296875, 1.38720703125, 1.603759765625, 1.8203125, 2.036865234375, 2.25341796875, 2.469970703125, 2.6865234375, 2.903076171875, 3.11962890625, 3.336181640625, 3.552734375, 3.769287109375, 3.98583984375, 4.202392578125, 4.4189453125, 4.635498046875, 4.85205078125, 5.068603515625, 5.28515625, 5.501708984375, 5.71826171875, 5.934814453125, 6.1513671875, 6.367919921875, 6.58447265625, 6.801025390625, 7.017578125, 7.234130859375, 7.45068359375, 7.667236328125, 7.8837890625, 8.100341796875, 8.31689453125, 8.533447265625, 8.75]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 23.0, 136.0, 760.0, 62.0, 10.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-793.3284912109375, -770.2240600585938, -747.11962890625, -724.0151977539062, -700.9107666015625, -677.8062744140625, -654.7018432617188, -631.597412109375, -608.4929809570312, -585.3885498046875, -562.2841186523438, -539.1796875, -516.0751953125, -492.9707946777344, -469.8663330078125, -446.76190185546875, -423.657470703125, -400.55303955078125, -377.4486083984375, -354.3441467285156, -331.2397155761719, -308.1352844238281, -285.03082275390625, -261.9263916015625, -238.82196044921875, -215.717529296875, -192.6130828857422, -169.50863647460938, -146.40420532226562, -123.29976654052734, -100.19532775878906, -77.09088134765625, -53.98651123046875, -30.88207244873047, -7.7776336669921875, 15.326805114746094, 38.431243896484375, 61.535682678222656, 84.64012145996094, 107.74456787109375, 130.8489990234375, 153.95343017578125, 177.05787658691406, 200.16232299804688, 223.26675415039062, 246.37118530273438, 269.47564697265625, 292.580078125, 315.68450927734375, 338.7889404296875, 361.89337158203125, 384.9978332519531, 408.1022644042969, 431.2066955566406, 454.3111572265625, 477.41558837890625, 500.52001953125, 523.6244506835938, 546.7288818359375, 569.8333129882812, 592.937744140625, 616.042236328125, 639.1466674804688, 662.2510986328125, 685.3555297851562]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 10.0, 20.0, 13.0, 31.0, 20.0, 44.0, 50.0, 43.0, 64.0, 112.0, 162.0, 103.0, 61.0, 49.0, 29.0, 32.0, 30.0, 37.0, 18.0, 25.0, 13.0, 8.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0], "bins": [-259.38421630859375, -253.55169677734375, -247.71917724609375, -241.88665771484375, -236.05413818359375, -230.2216339111328, -224.3891143798828, -218.5565948486328, -212.7240753173828, -206.8915557861328, -201.0590362548828, -195.2265167236328, -189.39401245117188, -183.56149291992188, -177.72897338867188, -171.89645385742188, -166.06393432617188, -160.23141479492188, -154.39889526367188, -148.56637573242188, -142.73385620117188, -136.90135192871094, -131.06883239746094, -125.23631286621094, -119.40379333496094, -113.57127380371094, -107.73875427246094, -101.90624237060547, -96.07372283935547, -90.24120330810547, -84.40869140625, -78.576171875, -72.74366760253906, -66.91114807128906, -61.07863235473633, -55.246116638183594, -49.413597106933594, -43.581077575683594, -37.74856185913086, -31.916046142578125, -26.083526611328125, -20.251008987426758, -14.41849136352539, -8.585973739624023, -2.7534561157226562, 3.079061508178711, 8.911579132080078, 14.744094848632812, 20.576614379882812, 26.40913200378418, 32.24164962768555, 38.07416534423828, 43.90668487548828, 49.73920440673828, 55.571720123291016, 61.40423583984375, 67.23675537109375, 73.06927490234375, 78.90179443359375, 84.73430633544922, 90.56682586669922, 96.39934539794922, 102.23185729980469, 108.06437683105469, 113.89689636230469]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 6.0, 10.0, 18.0, 17.0, 34.0, 75.0, 140.0, 380.0, 1221.0, 4177.0, 23946.0, 2748309.0, 1398306.0, 14035.0, 2351.0, 708.0, 252.0, 114.0, 64.0, 33.0, 28.0, 13.0, 10.0, 11.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.8125, -26.41650390625, -25.0205078125, -23.62451171875, -22.228515625, -20.83251953125, -19.4365234375, -18.04052734375, -16.64453125, -15.24853515625, -13.8525390625, -12.45654296875, -11.060546875, -9.66455078125, -8.2685546875, -6.87255859375, -5.4765625, -4.08056640625, -2.6845703125, -1.28857421875, 0.107421875, 1.50341796875, 2.8994140625, 4.29541015625, 5.69140625, 7.08740234375, 8.4833984375, 9.87939453125, 11.275390625, 12.67138671875, 14.0673828125, 15.46337890625, 16.859375, 18.25537109375, 19.6513671875, 21.04736328125, 22.443359375, 23.83935546875, 25.2353515625, 26.63134765625, 28.02734375, 29.42333984375, 30.8193359375, 32.21533203125, 33.611328125, 35.00732421875, 36.4033203125, 37.79931640625, 39.1953125, 40.59130859375, 41.9873046875, 43.38330078125, 44.779296875, 46.17529296875, 47.5712890625, 48.96728515625, 50.36328125, 51.75927734375, 53.1552734375, 54.55126953125, 55.947265625, 57.34326171875, 58.7392578125, 60.13525390625, 61.53125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 9.0, 15.0, 26.0, 33.0, 69.0, 65.0, 109.0, 101.0, 113.0, 115.0, 107.0, 77.0, 58.0, 41.0, 35.0, 19.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.890625, -11.287109375, -10.68359375, -10.080078125, -9.4765625, -8.873046875, -8.26953125, -7.666015625, -7.0625, -6.458984375, -5.85546875, -5.251953125, -4.6484375, -4.044921875, -3.44140625, -2.837890625, -2.234375, -1.630859375, -1.02734375, -0.423828125, 0.1796875, 0.783203125, 1.38671875, 1.990234375, 2.59375, 3.197265625, 3.80078125, 4.404296875, 5.0078125, 5.611328125, 6.21484375, 6.818359375, 7.421875, 8.025390625, 8.62890625, 9.232421875, 9.8359375, 10.439453125, 11.04296875, 11.646484375, 12.25, 12.853515625, 13.45703125, 14.060546875, 14.6640625, 15.267578125, 15.87109375, 16.474609375, 17.078125, 17.681640625, 18.28515625, 18.888671875, 19.4921875, 20.095703125, 20.69921875, 21.302734375, 21.90625, 22.509765625, 23.11328125, 23.716796875, 24.3203125, 24.923828125, 25.52734375, 26.130859375, 26.734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 2.0, 5.0, 6.0, 7.0, 9.0, 17.0, 32.0, 69.0, 112.0, 271.0, 892.0, 3909.0, 112026.0, 4065676.0, 8894.0, 1551.0, 430.0, 166.0, 75.0, 49.0, 31.0, 19.0, 14.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.4375, -70.833984375, -68.23046875, -65.626953125, -63.0234375, -60.419921875, -57.81640625, -55.212890625, -52.609375, -50.005859375, -47.40234375, -44.798828125, -42.1953125, -39.591796875, -36.98828125, -34.384765625, -31.78125, -29.177734375, -26.57421875, -23.970703125, -21.3671875, -18.763671875, -16.16015625, -13.556640625, -10.953125, -8.349609375, -5.74609375, -3.142578125, -0.5390625, 2.064453125, 4.66796875, 7.271484375, 9.875, 12.478515625, 15.08203125, 17.685546875, 20.2890625, 22.892578125, 25.49609375, 28.099609375, 30.703125, 33.306640625, 35.91015625, 38.513671875, 41.1171875, 43.720703125, 46.32421875, 48.927734375, 51.53125, 54.134765625, 56.73828125, 59.341796875, 61.9453125, 64.548828125, 67.15234375, 69.755859375, 72.359375, 74.962890625, 77.56640625, 80.169921875, 82.7734375, 85.376953125, 87.98046875, 90.583984375, 93.1875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 8.0, 8.0, 15.0, 20.0, 47.0, 70.0, 160.0, 351.0, 780.0, 1296.0, 757.0, 291.0, 142.0, 61.0, 20.0, 22.0, 9.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-63.5625, -62.068359375, -60.57421875, -59.080078125, -57.5859375, -56.091796875, -54.59765625, -53.103515625, -51.609375, -50.115234375, -48.62109375, -47.126953125, -45.6328125, -44.138671875, -42.64453125, -41.150390625, -39.65625, -38.162109375, -36.66796875, -35.173828125, -33.6796875, -32.185546875, -30.69140625, -29.197265625, -27.703125, -26.208984375, -24.71484375, -23.220703125, -21.7265625, -20.232421875, -18.73828125, -17.244140625, -15.75, -14.255859375, -12.76171875, -11.267578125, -9.7734375, -8.279296875, -6.78515625, -5.291015625, -3.796875, -2.302734375, -0.80859375, 0.685546875, 2.1796875, 3.673828125, 5.16796875, 6.662109375, 8.15625, 9.650390625, 11.14453125, 12.638671875, 14.1328125, 15.626953125, 17.12109375, 18.615234375, 20.109375, 21.603515625, 23.09765625, 24.591796875, 26.0859375, 27.580078125, 29.07421875, 30.568359375, 32.0625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 11.0, 21.0, 29.0, 73.0, 168.0, 309.0, 201.0, 80.0, 44.0, 15.0, 10.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-437.33099365234375, -425.4548034667969, -413.5786437988281, -401.70245361328125, -389.8262939453125, -377.9501037597656, -366.07391357421875, -354.19775390625, -342.3215637207031, -330.44537353515625, -318.5692138671875, -306.6930236816406, -294.8168640136719, -282.940673828125, -271.06451416015625, -259.1883239746094, -247.31214904785156, -235.43597412109375, -223.55979919433594, -211.68362426757812, -199.80743408203125, -187.93125915527344, -176.05508422851562, -164.17889404296875, -152.302734375, -140.4265594482422, -128.55038452148438, -116.67420196533203, -104.79801940917969, -92.92184448242188, -81.04566955566406, -69.16948699951172, -57.293304443359375, -45.4171257019043, -33.54094696044922, -21.664772033691406, -9.788593292236328, 2.08758544921875, 13.963760375976562, 25.839942932128906, 37.71611785888672, 49.5922966003418, 61.468475341796875, 73.34465026855469, 85.2208251953125, 97.09700775146484, 108.97318267822266, 120.849365234375, 132.7255401611328, 144.60171508789062, 156.47789001464844, 168.35406494140625, 180.23025512695312, 192.10643005371094, 203.98260498046875, 215.85879516601562, 227.73495483398438, 239.6111297607422, 251.4873046875, 263.3634948730469, 275.2396545410156, 287.1158447265625, 298.99200439453125, 310.8681945800781, 322.744384765625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 1.0, 6.0, 10.0, 23.0, 38.0, 34.0, 56.0, 63.0, 80.0, 94.0, 104.0, 114.0, 73.0, 72.0, 69.0, 42.0, 25.0, 34.0, 20.0, 21.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-253.4017333984375, -245.37399291992188, -237.34625244140625, -229.3185272216797, -221.29078674316406, -213.26304626464844, -205.23532104492188, -197.20758056640625, -189.17984008789062, -181.152099609375, -173.12435913085938, -165.0966339111328, -157.0688934326172, -149.04115295410156, -141.013427734375, -132.98568725585938, -124.95794677734375, -116.93020629882812, -108.90247344970703, -100.87474060058594, -92.84700012207031, -84.81925964355469, -76.7915267944336, -68.7637939453125, -60.736053466796875, -52.708316802978516, -44.680580139160156, -36.6528434753418, -28.625106811523438, -20.597370147705078, -12.569633483886719, -4.541896820068359, 3.48583984375, 11.51357650756836, 19.54131317138672, 27.569049835205078, 35.59678649902344, 43.6245231628418, 51.652259826660156, 59.679996490478516, 67.70773315429688, 75.7354736328125, 83.7632064819336, 91.79093933105469, 99.81867980957031, 107.84642028808594, 115.87415313720703, 123.90188598632812, 131.92962646484375, 139.95736694335938, 147.985107421875, 156.01283264160156, 164.0405731201172, 172.0683135986328, 180.09603881835938, 188.123779296875, 196.15151977539062, 204.17926025390625, 212.20700073242188, 220.23472595214844, 228.26246643066406, 236.2902069091797, 244.31793212890625, 252.34567260742188, 260.3734130859375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 17.0, 15.0, 28.0, 28.0, 45.0, 69.0, 111.0, 192.0, 353.0, 762.0, 1713.0, 5656.0, 27772.0, 407978.0, 560774.0, 33072.0, 6440.0, 1958.0, 732.0, 341.0, 174.0, 127.0, 63.0, 31.0, 21.0, 13.0, 22.0, 13.0, 3.0, 8.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.46875, -25.691162109375, -24.91357421875, -24.135986328125, -23.3583984375, -22.580810546875, -21.80322265625, -21.025634765625, -20.248046875, -19.470458984375, -18.69287109375, -17.915283203125, -17.1376953125, -16.360107421875, -15.58251953125, -14.804931640625, -14.02734375, -13.249755859375, -12.47216796875, -11.694580078125, -10.9169921875, -10.139404296875, -9.36181640625, -8.584228515625, -7.806640625, -7.029052734375, -6.25146484375, -5.473876953125, -4.6962890625, -3.918701171875, -3.14111328125, -2.363525390625, -1.5859375, -0.808349609375, -0.03076171875, 0.746826171875, 1.5244140625, 2.302001953125, 3.07958984375, 3.857177734375, 4.634765625, 5.412353515625, 6.18994140625, 6.967529296875, 7.7451171875, 8.522705078125, 9.30029296875, 10.077880859375, 10.85546875, 11.633056640625, 12.41064453125, 13.188232421875, 13.9658203125, 14.743408203125, 15.52099609375, 16.298583984375, 17.076171875, 17.853759765625, 18.63134765625, 19.408935546875, 20.1865234375, 20.964111328125, 21.74169921875, 22.519287109375, 23.296875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 10.0, 10.0, 22.0, 22.0, 31.0, 50.0, 79.0, 74.0, 108.0, 82.0, 92.0, 120.0, 71.0, 68.0, 51.0, 40.0, 29.0, 17.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.859375, -11.2724609375, -10.685546875, -10.0986328125, -9.51171875, -8.9248046875, -8.337890625, -7.7509765625, -7.1640625, -6.5771484375, -5.990234375, -5.4033203125, -4.81640625, -4.2294921875, -3.642578125, -3.0556640625, -2.46875, -1.8818359375, -1.294921875, -0.7080078125, -0.12109375, 0.4658203125, 1.052734375, 1.6396484375, 2.2265625, 2.8134765625, 3.400390625, 3.9873046875, 4.57421875, 5.1611328125, 5.748046875, 6.3349609375, 6.921875, 7.5087890625, 8.095703125, 8.6826171875, 9.26953125, 9.8564453125, 10.443359375, 11.0302734375, 11.6171875, 12.2041015625, 12.791015625, 13.3779296875, 13.96484375, 14.5517578125, 15.138671875, 15.7255859375, 16.3125, 16.8994140625, 17.486328125, 18.0732421875, 18.66015625, 19.2470703125, 19.833984375, 20.4208984375, 21.0078125, 21.5947265625, 22.181640625, 22.7685546875, 23.35546875, 23.9423828125, 24.529296875, 25.1162109375, 25.703125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 14.0, 11.0, 13.0, 16.0, 23.0, 42.0, 48.0, 66.0, 113.0, 148.0, 248.0, 352.0, 673.0, 1499.0, 5408.0, 41395.0, 912727.0, 74064.0, 7833.0, 1972.0, 712.0, 348.0, 264.0, 145.0, 109.0, 71.0, 54.0, 54.0, 29.0, 20.0, 24.0, 14.0, 10.0, 6.0, 7.0, 2.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.71875, -22.042724609375, -21.36669921875, -20.690673828125, -20.0146484375, -19.338623046875, -18.66259765625, -17.986572265625, -17.310546875, -16.634521484375, -15.95849609375, -15.282470703125, -14.6064453125, -13.930419921875, -13.25439453125, -12.578369140625, -11.90234375, -11.226318359375, -10.55029296875, -9.874267578125, -9.1982421875, -8.522216796875, -7.84619140625, -7.170166015625, -6.494140625, -5.818115234375, -5.14208984375, -4.466064453125, -3.7900390625, -3.114013671875, -2.43798828125, -1.761962890625, -1.0859375, -0.409912109375, 0.26611328125, 0.942138671875, 1.6181640625, 2.294189453125, 2.97021484375, 3.646240234375, 4.322265625, 4.998291015625, 5.67431640625, 6.350341796875, 7.0263671875, 7.702392578125, 8.37841796875, 9.054443359375, 9.73046875, 10.406494140625, 11.08251953125, 11.758544921875, 12.4345703125, 13.110595703125, 13.78662109375, 14.462646484375, 15.138671875, 15.814697265625, 16.49072265625, 17.166748046875, 17.8427734375, 18.518798828125, 19.19482421875, 19.870849609375, 20.546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 2.0, 14.0, 8.0, 18.0, 14.0, 16.0, 18.0, 22.0, 29.0, 31.0, 44.0, 43.0, 53.0, 66.0, 63.0, 94.0, 67.0, 59.0, 64.0, 42.0, 33.0, 43.0, 29.0, 17.0, 18.0, 21.0, 15.0, 6.0, 9.0, 7.0, 8.0, 10.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-43.28125, -41.95458984375, -40.6279296875, -39.30126953125, -37.974609375, -36.64794921875, -35.3212890625, -33.99462890625, -32.66796875, -31.34130859375, -30.0146484375, -28.68798828125, -27.361328125, -26.03466796875, -24.7080078125, -23.38134765625, -22.0546875, -20.72802734375, -19.4013671875, -18.07470703125, -16.748046875, -15.42138671875, -14.0947265625, -12.76806640625, -11.44140625, -10.11474609375, -8.7880859375, -7.46142578125, -6.134765625, -4.80810546875, -3.4814453125, -2.15478515625, -0.828125, 0.49853515625, 1.8251953125, 3.15185546875, 4.478515625, 5.80517578125, 7.1318359375, 8.45849609375, 9.78515625, 11.11181640625, 12.4384765625, 13.76513671875, 15.091796875, 16.41845703125, 17.7451171875, 19.07177734375, 20.3984375, 21.72509765625, 23.0517578125, 24.37841796875, 25.705078125, 27.03173828125, 28.3583984375, 29.68505859375, 31.01171875, 32.33837890625, 33.6650390625, 34.99169921875, 36.318359375, 37.64501953125, 38.9716796875, 40.29833984375, 41.625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 10.0, 15.0, 13.0, 9.0, 16.0, 37.0, 55.0, 86.0, 162.0, 337.0, 1040.0, 3808.0, 29048.0, 953670.0, 52785.0, 5240.0, 1286.0, 455.0, 203.0, 105.0, 47.0, 45.0, 20.0, 20.0, 11.0, 12.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.0535888671875, -3.911865234375, -3.7701416015625, -3.62841796875, -3.4866943359375, -3.344970703125, -3.2032470703125, -3.0615234375, -2.9197998046875, -2.778076171875, -2.6363525390625, -2.49462890625, -2.3529052734375, -2.211181640625, -2.0694580078125, -1.927734375, -1.7860107421875, -1.644287109375, -1.5025634765625, -1.36083984375, -1.2191162109375, -1.077392578125, -0.9356689453125, -0.7939453125, -0.6522216796875, -0.510498046875, -0.3687744140625, -0.22705078125, -0.0853271484375, 0.056396484375, 0.1981201171875, 0.33984375, 0.4815673828125, 0.623291015625, 0.7650146484375, 0.90673828125, 1.0484619140625, 1.190185546875, 1.3319091796875, 1.4736328125, 1.6153564453125, 1.757080078125, 1.8988037109375, 2.04052734375, 2.1822509765625, 2.323974609375, 2.4656982421875, 2.607421875, 2.7491455078125, 2.890869140625, 3.0325927734375, 3.17431640625, 3.3160400390625, 3.457763671875, 3.5994873046875, 3.7412109375, 3.8829345703125, 4.024658203125, 4.1663818359375, 4.30810546875, 4.4498291015625, 4.591552734375, 4.7332763671875, 4.875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 6.0, 6.0, 9.0, 4.0, 10.0, 9.0, 14.0, 17.0, 18.0, 17.0, 17.0, 30.0, 50.0, 76.0, 87.0, 94.0, 107.0, 92.0, 72.0, 54.0, 50.0, 32.0, 23.0, 22.0, 14.0, 13.0, 7.0, 5.0, 9.0, 7.0, 8.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0005636215209960938, -0.0005484633147716522, -0.0005333051085472107, -0.0005181469023227692, -0.0005029886960983276, -0.0004878304898738861, -0.0004726722836494446, -0.00045751407742500305, -0.0004423558712005615, -0.00042719766497612, -0.00041203945875167847, -0.00039688125252723694, -0.0003817230463027954, -0.0003665648400783539, -0.00035140663385391235, -0.0003362484276294708, -0.0003210902214050293, -0.00030593201518058777, -0.00029077380895614624, -0.0002756156027317047, -0.0002604573965072632, -0.00024529919028282166, -0.00023014098405838013, -0.0002149827778339386, -0.00019982457160949707, -0.00018466636538505554, -0.00016950815916061401, -0.00015434995293617249, -0.00013919174671173096, -0.00012403354048728943, -0.0001088753342628479, -9.371712803840637e-05, -7.855892181396484e-05, -6.340071558952332e-05, -4.824250936508179e-05, -3.308430314064026e-05, -1.792609691619873e-05, -2.767890691757202e-06, 1.2390315532684326e-05, 2.7548521757125854e-05, 4.270672798156738e-05, 5.786493420600891e-05, 7.302314043045044e-05, 8.818134665489197e-05, 0.0001033395528793335, 0.00011849775910377502, 0.00013365596532821655, 0.00014881417155265808, 0.0001639723777770996, 0.00017913058400154114, 0.00019428879022598267, 0.0002094469964504242, 0.00022460520267486572, 0.00023976340889930725, 0.0002549216151237488, 0.0002700798213481903, 0.00028523802757263184, 0.00030039623379707336, 0.0003155544400215149, 0.0003307126462459564, 0.00034587085247039795, 0.0003610290586948395, 0.000376187264919281, 0.00039134547114372253, 0.00040650367736816406]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 12.0, 11.0, 36.0, 28.0, 66.0, 150.0, 286.0, 659.0, 1964.0, 8422.0, 69181.0, 915431.0, 43523.0, 6081.0, 1606.0, 534.0, 232.0, 132.0, 66.0, 51.0, 26.0, 20.0, 9.0, 12.0, 1.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -1.99700927734375, -1.8885498046875, -1.78009033203125, -1.671630859375, -1.56317138671875, -1.4547119140625, -1.34625244140625, -1.23779296875, -1.12933349609375, -1.0208740234375, -0.91241455078125, -0.803955078125, -0.69549560546875, -0.5870361328125, -0.47857666015625, -0.3701171875, -0.26165771484375, -0.1531982421875, -0.04473876953125, 0.063720703125, 0.17218017578125, 0.2806396484375, 0.38909912109375, 0.49755859375, 0.60601806640625, 0.7144775390625, 0.82293701171875, 0.931396484375, 1.03985595703125, 1.1483154296875, 1.25677490234375, 1.365234375, 1.47369384765625, 1.5821533203125, 1.69061279296875, 1.799072265625, 1.90753173828125, 2.0159912109375, 2.12445068359375, 2.23291015625, 2.34136962890625, 2.4498291015625, 2.55828857421875, 2.666748046875, 2.77520751953125, 2.8836669921875, 2.99212646484375, 3.1005859375, 3.20904541015625, 3.3175048828125, 3.42596435546875, 3.534423828125, 3.64288330078125, 3.7513427734375, 3.85980224609375, 3.96826171875, 4.07672119140625, 4.1851806640625, 4.29364013671875, 4.402099609375, 4.51055908203125, 4.6190185546875, 4.72747802734375, 4.8359375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 5.0, 4.0, 6.0, 2.0, 8.0, 6.0, 6.0, 15.0, 20.0, 16.0, 22.0, 20.0, 34.0, 52.0, 72.0, 87.0, 119.0, 104.0, 103.0, 68.0, 53.0, 19.0, 30.0, 28.0, 15.0, 13.0, 16.0, 11.0, 5.0, 9.0, 8.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.73046875, -3.62127685546875, -3.5120849609375, -3.40289306640625, -3.293701171875, -3.18450927734375, -3.0753173828125, -2.96612548828125, -2.85693359375, -2.74774169921875, -2.6385498046875, -2.52935791015625, -2.420166015625, -2.31097412109375, -2.2017822265625, -2.09259033203125, -1.9833984375, -1.87420654296875, -1.7650146484375, -1.65582275390625, -1.546630859375, -1.43743896484375, -1.3282470703125, -1.21905517578125, -1.10986328125, -1.00067138671875, -0.8914794921875, -0.78228759765625, -0.673095703125, -0.56390380859375, -0.4547119140625, -0.34552001953125, -0.236328125, -0.12713623046875, -0.0179443359375, 0.09124755859375, 0.200439453125, 0.30963134765625, 0.4188232421875, 0.52801513671875, 0.63720703125, 0.74639892578125, 0.8555908203125, 0.96478271484375, 1.073974609375, 1.18316650390625, 1.2923583984375, 1.40155029296875, 1.5107421875, 1.61993408203125, 1.7291259765625, 1.83831787109375, 1.947509765625, 2.05670166015625, 2.1658935546875, 2.27508544921875, 2.38427734375, 2.49346923828125, 2.6026611328125, 2.71185302734375, 2.821044921875, 2.93023681640625, 3.0394287109375, 3.14862060546875, 3.2578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 15.0, 37.0, 117.0, 602.0, 131.0, 54.0, 27.0, 10.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.75347900390625, -281.3962097167969, -273.0389404296875, -264.681640625, -256.3243713378906, -247.96710205078125, -239.60983276367188, -231.2525634765625, -222.89527893066406, -214.5380096435547, -206.18072509765625, -197.82345581054688, -189.4661865234375, -181.10890197753906, -172.7516326904297, -164.39434814453125, -156.03707885742188, -147.6798095703125, -139.32252502441406, -130.9652557373047, -122.60797882080078, -114.25070190429688, -105.8934326171875, -97.5361557006836, -89.17887878417969, -80.82160186767578, -72.46432495117188, -64.1070556640625, -55.749778747558594, -47.39250183105469, -39.03522872924805, -30.677955627441406, -22.3206787109375, -13.963403701782227, -5.606128692626953, 2.7511463165283203, 11.108421325683594, 19.4656982421875, 27.82297134399414, 36.18024444580078, 44.53752136230469, 52.894798278808594, 61.252071380615234, 69.60934448242188, 77.96662139892578, 86.32389831542969, 94.68116760253906, 103.03844451904297, 111.39572143554688, 119.75299835205078, 128.1102752685547, 136.46754455566406, 144.8248291015625, 153.18209838867188, 161.53936767578125, 169.89663696289062, 178.25392150878906, 186.61119079589844, 194.96847534179688, 203.32574462890625, 211.68301391601562, 220.04029846191406, 228.39756774902344, 236.75485229492188, 245.11212158203125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 14.0, 19.0, 29.0, 38.0, 55.0, 49.0, 66.0, 369.0, 151.0, 63.0, 50.0, 35.0, 16.0, 14.0, 17.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-133.61251831054688, -125.6063461303711, -117.60017395019531, -109.593994140625, -101.58782196044922, -93.58164978027344, -85.57546997070312, -77.56929779052734, -69.56312561035156, -61.55695343017578, -53.550777435302734, -45.54460144042969, -37.538429260253906, -29.532257080078125, -21.526081085205078, -13.519905090332031, -5.51373291015625, 2.492441177368164, 10.498615264892578, 18.504789352416992, 26.510963439941406, 34.51713562011719, 42.523311614990234, 50.52948760986328, 58.53565979003906, 66.54183197021484, 74.54800415039062, 82.55418395996094, 90.56035614013672, 98.5665283203125, 106.57270812988281, 114.5788803100586, 122.5850830078125, 130.5912628173828, 138.59742736816406, 146.60360717773438, 154.60977172851562, 162.61595153808594, 170.62213134765625, 178.6282958984375, 186.6344757080078, 194.64065551757812, 202.64682006835938, 210.6529998779297, 218.6591796875, 226.66534423828125, 234.67152404785156, 242.67770385742188, 250.68386840820312, 258.6900329589844, 266.69622802734375, 274.702392578125, 282.70855712890625, 290.7147216796875, 298.7209167480469, 306.7270812988281, 314.7332763671875, 322.73944091796875, 330.7456359863281, 338.7518005371094, 346.7579650878906, 354.76416015625, 362.77032470703125, 370.7764892578125, 378.78265380859375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 6.0, 4.0, 10.0, 15.0, 24.0, 19.0, 40.0, 50.0, 47.0, 77.0, 177.0, 312.0, 52.0, 54.0, 35.0, 36.0, 19.0, 9.0, 4.0, 8.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.177734375, -10.62109375, -10.064453125, -9.5078125, -8.951171875, -8.39453125, -7.837890625, -7.28125, -6.724609375, -6.16796875, -5.611328125, -5.0546875, -4.498046875, -3.94140625, -3.384765625, -2.828125, -2.271484375, -1.71484375, -1.158203125, -0.6015625, -0.044921875, 0.51171875, 1.068359375, 1.625, 2.181640625, 2.73828125, 3.294921875, 3.8515625, 4.408203125, 4.96484375, 5.521484375, 6.078125, 6.634765625, 7.19140625, 7.748046875, 8.3046875, 8.861328125, 9.41796875, 9.974609375, 10.53125, 11.087890625, 11.64453125, 12.201171875, 12.7578125, 13.314453125, 13.87109375, 14.427734375, 14.984375, 15.541015625, 16.09765625, 16.654296875, 17.2109375, 17.767578125, 18.32421875, 18.880859375, 19.4375, 19.994140625, 20.55078125, 21.107421875, 21.6640625, 22.220703125, 22.77734375, 23.333984375, 23.890625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 2.0, 5.0, 3.0, 7.0, 17.0, 15.0, 10.0, 15.0, 20.0, 45.0, 53.0, 145.0, 283.0, 1177.0, 25972.0, 8357535.0, 2387.0, 472.0, 169.0, 66.0, 54.0, 28.0, 12.0, 26.0, 13.0, 1.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-240.01898193359375, -232.9963836669922, -225.97378540039062, -218.951171875, -211.92857360839844, -204.90597534179688, -197.8833770751953, -190.86077880859375, -183.8381805419922, -176.81558227539062, -169.79298400878906, -162.7703857421875, -155.74777221679688, -148.7251739501953, -141.70257568359375, -134.6799774169922, -127.6573715209961, -120.63477325439453, -113.61216735839844, -106.58956909179688, -99.56697082519531, -92.54437255859375, -85.52176666259766, -78.4991683959961, -71.4765625, -64.45396423339844, -57.43136215209961, -50.40876007080078, -43.38616180419922, -36.36355972290039, -29.340957641601562, -22.318359375, -15.295761108398438, -8.273160934448242, -1.2505598068237305, 5.772041320800781, 12.794641494750977, 19.817241668701172, 26.83984375, 33.86244201660156, 40.88504409790039, 47.90764617919922, 54.93024444580078, 61.95284652709961, 68.97544860839844, 75.998046875, 83.02064514160156, 90.04324340820312, 97.06584930419922, 104.08844757080078, 111.11105346679688, 118.13365173339844, 125.15625, 132.17884826660156, 139.20144653320312, 146.22406005859375, 153.2466583251953, 160.26925659179688, 167.29185485839844, 174.314453125, 181.33706665039062, 188.3596649169922, 195.38226318359375, 202.4048614501953, 209.42745971679688]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 5.0, 12.0, 7.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-395.9598083496094, -386.100830078125, -376.2418518066406, -366.38287353515625, -356.52386474609375, -346.6648864746094, -336.805908203125, -326.9469299316406, -317.08795166015625, -307.2289733886719, -297.3699951171875, -287.5110168457031, -277.65203857421875, -267.79302978515625, -257.9340515136719, -248.0750732421875, -238.21609497070312, -228.35711669921875, -218.49813842773438, -208.63914489746094, -198.78016662597656, -188.9211883544922, -179.06219482421875, -169.20321655273438, -159.34423828125, -149.48526000976562, -139.62628173828125, -129.7672882080078, -119.90830993652344, -110.04933166503906, -100.19034576416016, -90.33135986328125, -80.472412109375, -70.61343383789062, -60.75444793701172, -50.89546585083008, -41.03648376464844, -31.177501678466797, -21.318519592285156, -11.45953369140625, -1.600555419921875, 8.258426666259766, 18.117408752441406, 27.976390838623047, 37.83537292480469, 47.69435501098633, 57.55333709716797, 67.41232299804688, 77.27130126953125, 87.13027954101562, 96.98926544189453, 106.84825134277344, 116.70722961425781, 126.56620788574219, 136.42520141601562, 146.2841796875, 156.14315795898438, 166.00213623046875, 175.86111450195312, 185.72010803222656, 195.57908630371094, 205.4380645751953, 215.29705810546875, 225.15603637695312, 235.0150146484375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 6.0, 2.0, 3.0, 4.0, 11.0, 12.0, 19.0, 25.0, 28.0, 41.0, 88.0, 125.0, 239.0, 454.0, 1087.0, 3568.0, 14954.0, 80272.0, 286764.0, 107935.0, 20454.0, 4985.0, 1615.0, 695.0, 311.0, 185.0, 130.0, 59.0, 56.0, 34.0, 23.0, 19.0, 18.0, 10.0, 11.0, 8.0, 12.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.375, -73.5009765625, -70.626953125, -67.7529296875, -64.87890625, -62.0048828125, -59.130859375, -56.2568359375, -53.3828125, -50.5087890625, -47.634765625, -44.7607421875, -41.88671875, -39.0126953125, -36.138671875, -33.2646484375, -30.390625, -27.5166015625, -24.642578125, -21.7685546875, -18.89453125, -16.0205078125, -13.146484375, -10.2724609375, -7.3984375, -4.5244140625, -1.650390625, 1.2236328125, 4.09765625, 6.9716796875, 9.845703125, 12.7197265625, 15.59375, 18.4677734375, 21.341796875, 24.2158203125, 27.08984375, 29.9638671875, 32.837890625, 35.7119140625, 38.5859375, 41.4599609375, 44.333984375, 47.2080078125, 50.08203125, 52.9560546875, 55.830078125, 58.7041015625, 61.578125, 64.4521484375, 67.326171875, 70.2001953125, 73.07421875, 75.9482421875, 78.822265625, 81.6962890625, 84.5703125, 87.4443359375, 90.318359375, 93.1923828125, 96.06640625, 98.9404296875, 101.814453125, 104.6884765625, 107.5625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 9.0, 17.0, 38.0, 36.0, 60.0, 86.0, 112.0, 125.0, 129.0, 103.0, 80.0, 57.0, 35.0, 32.0, 24.0, 16.0, 13.0, 13.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3046875, -10.5943603515625, -9.884033203125, -9.1737060546875, -8.46337890625, -7.7530517578125, -7.042724609375, -6.3323974609375, -5.6220703125, -4.9117431640625, -4.201416015625, -3.4910888671875, -2.78076171875, -2.0704345703125, -1.360107421875, -0.6497802734375, 0.060546875, 0.7708740234375, 1.481201171875, 2.1915283203125, 2.90185546875, 3.6121826171875, 4.322509765625, 5.0328369140625, 5.7431640625, 6.4534912109375, 7.163818359375, 7.8741455078125, 8.58447265625, 9.2947998046875, 10.005126953125, 10.7154541015625, 11.42578125, 12.1361083984375, 12.846435546875, 13.5567626953125, 14.26708984375, 14.9774169921875, 15.687744140625, 16.3980712890625, 17.1083984375, 17.8187255859375, 18.529052734375, 19.2393798828125, 19.94970703125, 20.6600341796875, 21.370361328125, 22.0806884765625, 22.791015625, 23.5013427734375, 24.211669921875, 24.9219970703125, 25.63232421875, 26.3426513671875, 27.052978515625, 27.7633056640625, 28.4736328125, 29.1839599609375, 29.894287109375, 30.6046142578125, 31.31494140625, 32.0252685546875, 32.735595703125, 33.4459228515625, 34.15625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 25.0, 30.0, 64.0, 78.0, 93.0, 77.0, 50.0, 23.0, 10.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.19784545898438, -118.62834930419922, -115.05884552001953, -111.48934936523438, -107.91985321044922, -104.35035705566406, -100.78085327148438, -97.21135711669922, -93.64186096191406, -90.0723648071289, -86.50286102294922, -82.93336486816406, -79.3638687133789, -75.79437255859375, -72.22486877441406, -68.6553726196289, -65.08587646484375, -61.51637649536133, -57.94688034057617, -54.37738037109375, -50.807884216308594, -47.23838424682617, -43.66888427734375, -40.099388122558594, -36.529884338378906, -32.960384368896484, -29.390888214111328, -25.821388244628906, -22.25189208984375, -18.682392120361328, -15.112894058227539, -11.54339599609375, -7.973899841308594, -4.404401779174805, -0.8349032402038574, 2.73459529876709, 6.304093360900879, 9.873592376708984, 13.443090438842773, 17.012588500976562, 20.58208656311035, 24.15158462524414, 27.72108268737793, 31.29058074951172, 34.86008071899414, 38.42958068847656, 41.99907684326172, 45.568572998046875, 49.1380729675293, 52.70757293701172, 56.277069091796875, 59.8465690612793, 63.41606521606445, 66.98556518554688, 70.55506134033203, 74.12455749511719, 77.69406127929688, 81.26355743408203, 84.83306121826172, 88.40255737304688, 91.97205352783203, 95.54154968261719, 99.11105346679688, 102.68054962158203, 106.25004577636719]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 13.0, 16.0, 28.0, 48.0, 74.0, 85.0, 67.0, 49.0, 21.0, 13.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.279029846191406, -60.375274658203125, -58.471519470214844, -56.56776428222656, -54.66400909423828, -52.76025390625, -50.85649871826172, -48.95274353027344, -47.048988342285156, -45.145233154296875, -43.241477966308594, -41.33772277832031, -39.43396759033203, -37.53021240234375, -35.62645721435547, -33.72270202636719, -31.818946838378906, -29.915191650390625, -28.011436462402344, -26.107681274414062, -24.20392608642578, -22.3001708984375, -20.39641571044922, -18.492660522460938, -16.588905334472656, -14.685150146484375, -12.781394958496094, -10.877639770507812, -8.973884582519531, -7.07012939453125, -5.166374206542969, -3.2626190185546875, -1.3588676452636719, 0.5448875427246094, 2.4486427307128906, 4.352397918701172, 6.256153106689453, 8.159908294677734, 10.063663482666016, 11.967418670654297, 13.871173858642578, 15.77492904663086, 17.67868423461914, 19.582439422607422, 21.486194610595703, 23.389949798583984, 25.293704986572266, 27.197460174560547, 29.101215362548828, 31.00497055053711, 32.90872573852539, 34.81248092651367, 36.71623611450195, 38.619991302490234, 40.523746490478516, 42.4275016784668, 44.33125686645508, 46.23501205444336, 48.13876724243164, 50.04252243041992, 51.9462776184082, 53.850032806396484, 55.753787994384766, 57.65754318237305, 59.56129837036133]}, "eval/loss": 5.7725830078125, "eval/wer": 0.7927852848383833, "eval/runtime": 1037.3103, "eval/samples_per_second": 2.547, "eval/steps_per_second": 0.319, "train/train_runtime": 29013.0161, "train/train_samples_per_second": 4.918, "train/train_steps_per_second": 0.154, "train/total_flos": 0.0, "train/train_loss": 6.2593836770463955} \ No newline at end of file +{"train/loss": 3.5204, "train/learning_rate": 5.780346820809249e-08, "train/epoch": 5.0, "train/global_step": 4460, "_runtime": 30356, "_timestamp": 1646288237, "_step": 4463, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 26.0, 74.0, 15.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 29845.0, 341.0, 77.0, 31.0, 17.0, 12.0, 11.0, 2.0, 8.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.0625, -95.99365234375, -93.9248046875, -91.85595703125, -89.787109375, -87.71826171875, -85.6494140625, -83.58056640625, -81.51171875, -79.44287109375, -77.3740234375, -75.30517578125, -73.236328125, -71.16748046875, -69.0986328125, -67.02978515625, -64.9609375, -62.89208984375, -60.8232421875, -58.75439453125, -56.685546875, -54.61669921875, -52.5478515625, -50.47900390625, -48.41015625, -46.34130859375, -44.2724609375, -42.20361328125, -40.134765625, -38.06591796875, -35.9970703125, -33.92822265625, -31.859375, -29.79052734375, -27.7216796875, -25.65283203125, -23.583984375, -21.51513671875, -19.4462890625, -17.37744140625, -15.30859375, -13.23974609375, -11.1708984375, -9.10205078125, -7.033203125, -4.96435546875, -2.8955078125, -0.82666015625, 1.2421875, 3.31103515625, 5.3798828125, 7.44873046875, 9.517578125, 11.58642578125, 13.6552734375, 15.72412109375, 17.79296875, 19.86181640625, 21.9306640625, 23.99951171875, 26.068359375, 28.13720703125, 30.2060546875, 32.27490234375, 34.34375]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 6.0, 8.0, 7.0, 7.0, 15.0, 13.0, 22.0, 20.0, 29.0, 26.0, 25.0, 42.0, 35.0, 45.0, 45.0, 55.0, 51.0, 55.0, 69.0, 56.0, 61.0, 48.0, 56.0, 31.0, 43.0, 33.0, 24.0, 14.0, 22.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-47.140663146972656, -46.067935943603516, -44.995208740234375, -43.922481536865234, -42.849754333496094, -41.77703094482422, -40.70430374145508, -39.63157653808594, -38.5588493347168, -37.486122131347656, -36.413394927978516, -35.340667724609375, -34.2679443359375, -33.19521713256836, -32.12248992919922, -31.049762725830078, -29.977035522460938, -28.904308319091797, -27.831581115722656, -26.75885581970215, -25.686128616333008, -24.613401412963867, -23.54067611694336, -22.46794891357422, -21.395221710205078, -20.322494506835938, -19.249767303466797, -18.17704200744629, -17.10431480407715, -16.031587600708008, -14.958861351013184, -13.88613510131836, -12.813411712646484, -11.740684509277344, -10.66795825958252, -9.595232009887695, -8.522504806518555, -7.449778079986572, -6.37705135345459, -5.304324626922607, -4.231597900390625, -3.1588711738586426, -2.08614444732666, -1.0134177207946777, 0.05930900573730469, 1.132035732269287, 2.2047624588012695, 3.277489185333252, 4.350215911865234, 5.422942638397217, 6.495669364929199, 7.568396091461182, 8.641122817993164, 9.713850021362305, 10.786576271057129, 11.859302520751953, 12.932029724121094, 14.004756927490234, 15.077483177185059, 16.150209426879883, 17.222936630249023, 18.295663833618164, 19.368389129638672, 20.441116333007812, 21.513843536376953]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 5.0, 11.0, 12.0, 13.0, 12.0, 17.0, 21.0, 21.0, 27.0, 23.0, 38.0, 30.0, 35.0, 38.0, 39.0, 41.0, 41.0, 29.0, 34.0, 43.0, 44.0, 41.0, 35.0, 34.0, 47.0, 36.0, 23.0, 32.0, 25.0, 25.0, 20.0, 23.0, 11.0, 10.0, 13.0, 8.0, 7.0, 5.0, 4.0, 5.0, 3.0, 7.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-27.810733795166016, -26.96071434020996, -26.110692977905273, -25.26067352294922, -24.41065216064453, -23.560632705688477, -22.710613250732422, -21.860591888427734, -21.010570526123047, -20.160551071166992, -19.310529708862305, -18.46051025390625, -17.610488891601562, -16.760469436645508, -15.910449028015137, -15.060428619384766, -14.210409164428711, -13.36038875579834, -12.510368347167969, -11.660348892211914, -10.810327529907227, -9.960308074951172, -9.1102876663208, -8.26026725769043, -7.410246849060059, -6.5602264404296875, -5.710206031799316, -4.8601861000061035, -4.010165691375732, -3.1601452827453613, -2.3101253509521484, -1.4601049423217773, -0.6100864410400391, 0.23993384838104248, 1.089954137802124, 1.939974308013916, 2.789994716644287, 3.640015125274658, 4.490035057067871, 5.340055465698242, 6.190075874328613, 7.040096282958984, 7.8901166915893555, 8.740137100219727, 9.590156555175781, 10.440177917480469, 11.290197372436523, 12.140217781066895, 12.990238189697266, 13.840258598327637, 14.690279006958008, 15.540298461914062, 16.39031982421875, 17.240339279174805, 18.09035873413086, 18.940380096435547, 19.790401458740234, 20.64042091369629, 21.490442276000977, 22.34046173095703, 23.19048309326172, 24.040502548217773, 24.890522003173828, 25.740543365478516, 26.59056282043457]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 10.0, 13.0, 23.0, 36.0, 47.0, 61.0, 97.0, 185.0, 279.0, 417.0, 699.0, 1105.0, 1899.0, 2858.0, 4604.0, 7230.0, 11395.0, 17506.0, 26139.0, 38377.0, 54357.0, 75168.0, 104453.0, 168303.0, 175372.0, 107937.0, 77328.0, 56011.0, 39384.0, 27044.0, 18022.0, 11798.0, 7626.0, 4813.0, 2994.0, 1853.0, 1114.0, 759.0, 447.0, 284.0, 176.0, 107.0, 66.0, 64.0, 33.0, 20.0, 17.0, 7.0, 10.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.8125, -66.595703125, -64.37890625, -62.162109375, -59.9453125, -57.728515625, -55.51171875, -53.294921875, -51.078125, -48.861328125, -46.64453125, -44.427734375, -42.2109375, -39.994140625, -37.77734375, -35.560546875, -33.34375, -31.126953125, -28.91015625, -26.693359375, -24.4765625, -22.259765625, -20.04296875, -17.826171875, -15.609375, -13.392578125, -11.17578125, -8.958984375, -6.7421875, -4.525390625, -2.30859375, -0.091796875, 2.125, 4.341796875, 6.55859375, 8.775390625, 10.9921875, 13.208984375, 15.42578125, 17.642578125, 19.859375, 22.076171875, 24.29296875, 26.509765625, 28.7265625, 30.943359375, 33.16015625, 35.376953125, 37.59375, 39.810546875, 42.02734375, 44.244140625, 46.4609375, 48.677734375, 50.89453125, 53.111328125, 55.328125, 57.544921875, 59.76171875, 61.978515625, 64.1953125, 66.412109375, 68.62890625, 70.845703125, 73.0625]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 11.0, 12.0, 7.0, 7.0, 10.0, 13.0, 15.0, 22.0, 11.0, 23.0, 38.0, 33.0, 28.0, 39.0, 45.0, 42.0, 69.0, 83.0, 72.0, 59.0, 56.0, 35.0, 44.0, 35.0, 24.0, 26.0, 24.0, 16.0, 14.0, 16.0, 18.0, 9.0, 9.0, 8.0, 7.0, 1.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.453125, -27.559326171875, -26.66552734375, -25.771728515625, -24.8779296875, -23.984130859375, -23.09033203125, -22.196533203125, -21.302734375, -20.408935546875, -19.51513671875, -18.621337890625, -17.7275390625, -16.833740234375, -15.93994140625, -15.046142578125, -14.15234375, -13.258544921875, -12.36474609375, -11.470947265625, -10.5771484375, -9.683349609375, -8.78955078125, -7.895751953125, -7.001953125, -6.108154296875, -5.21435546875, -4.320556640625, -3.4267578125, -2.532958984375, -1.63916015625, -0.745361328125, 0.1484375, 1.042236328125, 1.93603515625, 2.829833984375, 3.7236328125, 4.617431640625, 5.51123046875, 6.405029296875, 7.298828125, 8.192626953125, 9.08642578125, 9.980224609375, 10.8740234375, 11.767822265625, 12.66162109375, 13.555419921875, 14.44921875, 15.343017578125, 16.23681640625, 17.130615234375, 18.0244140625, 18.918212890625, 19.81201171875, 20.705810546875, 21.599609375, 22.493408203125, 23.38720703125, 24.281005859375, 25.1748046875, 26.068603515625, 26.96240234375, 27.856201171875, 28.75]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 6.0, 6.0, 8.0, 14.0, 12.0, 9.0, 20.0, 19.0, 32.0, 24.0, 34.0, 32.0, 31.0, 24.0, 35.0, 43.0, 49.0, 37.0, 50.0, 41.0, 41.0, 47.0, 49.0, 35.0, 40.0, 28.0, 34.0, 27.0, 25.0, 14.0, 23.0, 13.0, 19.0, 15.0, 14.0, 5.0, 8.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.58609676361084, -15.049652099609375, -14.51320743560791, -13.976762771606445, -13.440317153930664, -12.9038724899292, -12.367427825927734, -11.83098316192627, -11.294538497924805, -10.75809383392334, -10.221649169921875, -9.685203552246094, -9.148758888244629, -8.612314224243164, -8.0758695602417, -7.539424896240234, -7.002979278564453, -6.466534614562988, -5.930089473724365, -5.3936448097229, -4.857199668884277, -4.3207550048828125, -3.7843103408813477, -3.2478654384613037, -2.7114205360412598, -2.174975633621216, -1.6385308504104614, -1.102086067199707, -0.5656411647796631, -0.02919626235961914, 0.5072484016418457, 1.0436933040618896, 1.58013916015625, 2.116584062576294, 2.653028964996338, 3.1894736289978027, 3.7259185314178467, 4.262363433837891, 4.7988080978393555, 5.33525276184082, 5.871697902679443, 6.408142566680908, 6.944587707519531, 7.481032371520996, 8.017477035522461, 8.553922653198242, 9.09036636352539, 9.626811981201172, 10.163256645202637, 10.699701309204102, 11.236145973205566, 11.772590637207031, 12.309036254882812, 12.845480918884277, 13.381925582885742, 13.918370246887207, 14.454814910888672, 14.991259574890137, 15.527704238891602, 16.064149856567383, 16.60059356689453, 17.137039184570312, 17.673484802246094, 18.209928512573242, 18.746374130249023]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 8.0, 8.0, 3.0, 6.0, 9.0, 8.0, 12.0, 13.0, 25.0, 22.0, 25.0, 25.0, 22.0, 26.0, 22.0, 29.0, 43.0, 30.0, 43.0, 51.0, 44.0, 44.0, 49.0, 37.0, 34.0, 37.0, 35.0, 35.0, 26.0, 26.0, 29.0, 26.0, 27.0, 18.0, 22.0, 17.0, 13.0, 10.0, 9.0, 4.0, 6.0, 4.0, 1.0, 7.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-16.44671630859375, -15.948348045349121, -15.449978828430176, -14.951610565185547, -14.453241348266602, -13.954873085021973, -13.456504821777344, -12.958135604858398, -12.45976734161377, -11.96139907836914, -11.463029861450195, -10.964661598205566, -10.466293334960938, -9.967924118041992, -9.469555854797363, -8.971187591552734, -8.472818374633789, -7.974449634552002, -7.476080894470215, -6.977712631225586, -6.479343891143799, -5.980975151062012, -5.482606887817383, -4.984238147735596, -4.485869407653809, -3.9875006675720215, -3.4891321659088135, -2.9907636642456055, -2.4923949241638184, -1.9940261840820312, -1.4956576824188232, -0.9972891807556152, -0.4989204406738281, -0.0005518198013305664, 0.497816801071167, 0.9961854219436646, 1.494554042816162, 1.9929227828979492, 2.4912912845611572, 2.9896597862243652, 3.4880285263061523, 3.9863972663879395, 4.484766006469727, 4.9831342697143555, 5.481503009796143, 5.97987174987793, 6.478240013122559, 6.976608753204346, 7.474977493286133, 7.97334623336792, 8.471714973449707, 8.970083236694336, 9.468452453613281, 9.96682071685791, 10.465188980102539, 10.963558197021484, 11.461926460266113, 11.960294723510742, 12.458663940429688, 12.957032203674316, 13.455400466918945, 13.95376968383789, 14.45213794708252, 14.950506210327148, 15.448875427246094]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 2.0, 4.0, 8.0, 15.0, 12.0, 19.0, 25.0, 35.0, 66.0, 105.0, 185.0, 341.0, 567.0, 1158.0, 2227.0, 4543.0, 9617.0, 21755.0, 51677.0, 135006.0, 399320.0, 1160400.0, 1479153.0, 598464.0, 200068.0, 74061.0, 30175.0, 13092.0, 5989.0, 2871.0, 1504.0, 776.0, 412.0, 254.0, 138.0, 69.0, 60.0, 30.0, 31.0, 16.0, 8.0, 7.0, 5.0, 3.0, 3.0, 5.0, 2.0, 3.0], "bins": [-40.8125, -39.74365234375, -38.6748046875, -37.60595703125, -36.537109375, -35.46826171875, -34.3994140625, -33.33056640625, -32.26171875, -31.19287109375, -30.1240234375, -29.05517578125, -27.986328125, -26.91748046875, -25.8486328125, -24.77978515625, -23.7109375, -22.64208984375, -21.5732421875, -20.50439453125, -19.435546875, -18.36669921875, -17.2978515625, -16.22900390625, -15.16015625, -14.09130859375, -13.0224609375, -11.95361328125, -10.884765625, -9.81591796875, -8.7470703125, -7.67822265625, -6.609375, -5.54052734375, -4.4716796875, -3.40283203125, -2.333984375, -1.26513671875, -0.1962890625, 0.87255859375, 1.94140625, 3.01025390625, 4.0791015625, 5.14794921875, 6.216796875, 7.28564453125, 8.3544921875, 9.42333984375, 10.4921875, 11.56103515625, 12.6298828125, 13.69873046875, 14.767578125, 15.83642578125, 16.9052734375, 17.97412109375, 19.04296875, 20.11181640625, 21.1806640625, 22.24951171875, 23.318359375, 24.38720703125, 25.4560546875, 26.52490234375, 27.59375]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 1.0, 1.0, 5.0, 2.0, 4.0, 10.0, 7.0, 8.0, 5.0, 13.0, 18.0, 12.0, 17.0, 21.0, 24.0, 25.0, 23.0, 42.0, 36.0, 34.0, 31.0, 36.0, 39.0, 36.0, 48.0, 48.0, 52.0, 41.0, 30.0, 33.0, 33.0, 37.0, 29.0, 27.0, 26.0, 19.0, 28.0, 18.0, 15.0, 16.0, 13.0, 7.0, 6.0, 6.0, 7.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.265625, -13.8173828125, -13.369140625, -12.9208984375, -12.47265625, -12.0244140625, -11.576171875, -11.1279296875, -10.6796875, -10.2314453125, -9.783203125, -9.3349609375, -8.88671875, -8.4384765625, -7.990234375, -7.5419921875, -7.09375, -6.6455078125, -6.197265625, -5.7490234375, -5.30078125, -4.8525390625, -4.404296875, -3.9560546875, -3.5078125, -3.0595703125, -2.611328125, -2.1630859375, -1.71484375, -1.2666015625, -0.818359375, -0.3701171875, 0.078125, 0.5263671875, 0.974609375, 1.4228515625, 1.87109375, 2.3193359375, 2.767578125, 3.2158203125, 3.6640625, 4.1123046875, 4.560546875, 5.0087890625, 5.45703125, 5.9052734375, 6.353515625, 6.8017578125, 7.25, 7.6982421875, 8.146484375, 8.5947265625, 9.04296875, 9.4912109375, 9.939453125, 10.3876953125, 10.8359375, 11.2841796875, 11.732421875, 12.1806640625, 12.62890625, 13.0771484375, 13.525390625, 13.9736328125, 14.421875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 11.0, 10.0, 17.0, 27.0, 44.0, 47.0, 99.0, 148.0, 296.0, 467.0, 828.0, 1470.0, 2754.0, 5287.0, 10157.0, 21992.0, 48979.0, 115171.0, 281655.0, 692035.0, 1380355.0, 951061.0, 396105.0, 160315.0, 67318.0, 29282.0, 13749.0, 6752.0, 3433.0, 1849.0, 1026.0, 603.0, 370.0, 225.0, 141.0, 70.0, 53.0, 27.0, 19.0, 16.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-33.78125, -32.807373046875, -31.83349609375, -30.859619140625, -29.8857421875, -28.911865234375, -27.93798828125, -26.964111328125, -25.990234375, -25.016357421875, -24.04248046875, -23.068603515625, -22.0947265625, -21.120849609375, -20.14697265625, -19.173095703125, -18.19921875, -17.225341796875, -16.25146484375, -15.277587890625, -14.3037109375, -13.329833984375, -12.35595703125, -11.382080078125, -10.408203125, -9.434326171875, -8.46044921875, -7.486572265625, -6.5126953125, -5.538818359375, -4.56494140625, -3.591064453125, -2.6171875, -1.643310546875, -0.66943359375, 0.304443359375, 1.2783203125, 2.252197265625, 3.22607421875, 4.199951171875, 5.173828125, 6.147705078125, 7.12158203125, 8.095458984375, 9.0693359375, 10.043212890625, 11.01708984375, 11.990966796875, 12.96484375, 13.938720703125, 14.91259765625, 15.886474609375, 16.8603515625, 17.834228515625, 18.80810546875, 19.781982421875, 20.755859375, 21.729736328125, 22.70361328125, 23.677490234375, 24.6513671875, 25.625244140625, 26.59912109375, 27.572998046875, 28.546875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 13.0, 9.0, 16.0, 16.0, 16.0, 23.0, 30.0, 39.0, 45.0, 57.0, 67.0, 99.0, 115.0, 117.0, 171.0, 222.0, 257.0, 311.0, 319.0, 365.0, 344.0, 266.0, 255.0, 198.0, 158.0, 120.0, 108.0, 86.0, 55.0, 38.0, 32.0, 18.0, 23.0, 22.0, 13.0, 11.0, 7.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.661865234375, -7.39404296875, -7.126220703125, -6.8583984375, -6.590576171875, -6.32275390625, -6.054931640625, -5.787109375, -5.519287109375, -5.25146484375, -4.983642578125, -4.7158203125, -4.447998046875, -4.18017578125, -3.912353515625, -3.64453125, -3.376708984375, -3.10888671875, -2.841064453125, -2.5732421875, -2.305419921875, -2.03759765625, -1.769775390625, -1.501953125, -1.234130859375, -0.96630859375, -0.698486328125, -0.4306640625, -0.162841796875, 0.10498046875, 0.372802734375, 0.640625, 0.908447265625, 1.17626953125, 1.444091796875, 1.7119140625, 1.979736328125, 2.24755859375, 2.515380859375, 2.783203125, 3.051025390625, 3.31884765625, 3.586669921875, 3.8544921875, 4.122314453125, 4.39013671875, 4.657958984375, 4.92578125, 5.193603515625, 5.46142578125, 5.729248046875, 5.9970703125, 6.264892578125, 6.53271484375, 6.800537109375, 7.068359375, 7.336181640625, 7.60400390625, 7.871826171875, 8.1396484375, 8.407470703125, 8.67529296875, 8.943115234375, 9.2109375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 9.0, 5.0, 7.0, 11.0, 8.0, 17.0, 19.0, 28.0, 32.0, 28.0, 44.0, 42.0, 55.0, 58.0, 55.0, 67.0, 49.0, 68.0, 50.0, 57.0, 50.0, 46.0, 36.0, 22.0, 27.0, 22.0, 20.0, 16.0, 10.0, 6.0, 7.0, 3.0, 4.0, 4.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.66727066040039, -15.98918342590332, -15.31109619140625, -14.63300895690918, -13.95492172241211, -13.276834487915039, -12.598746299743652, -11.920659065246582, -11.242571830749512, -10.564484596252441, -9.886397361755371, -9.208309173583984, -8.530221939086914, -7.852135181427002, -7.174047470092773, -6.495960235595703, -5.817873001098633, -5.1397857666015625, -4.461698532104492, -3.7836108207702637, -3.1055235862731934, -2.427436351776123, -1.7493486404418945, -1.0712614059448242, -0.3931741714477539, 0.28491318225860596, 0.9630005359649658, 1.6410880088806152, 2.3191752433776855, 2.997262477874756, 3.6753501892089844, 4.353437423706055, 5.031524658203125, 5.709611892700195, 6.387699127197266, 7.065786838531494, 7.7438740730285645, 8.421960830688477, 9.100049018859863, 9.778136253356934, 10.456223487854004, 11.134310722351074, 11.812397956848145, 12.490486145019531, 13.168573379516602, 13.846660614013672, 14.524747848510742, 15.202835083007812, 15.880922317504883, 16.559009552001953, 17.237096786499023, 17.915184020996094, 18.593271255493164, 19.271358489990234, 19.949447631835938, 20.627532958984375, 21.305622100830078, 21.98370933532715, 22.66179656982422, 23.33988380432129, 24.01797103881836, 24.69605827331543, 25.3741455078125, 26.052234649658203, 26.73031997680664]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 6.0, 4.0, 12.0, 6.0, 5.0, 12.0, 12.0, 12.0, 14.0, 23.0, 23.0, 16.0, 23.0, 34.0, 29.0, 29.0, 49.0, 50.0, 45.0, 46.0, 47.0, 46.0, 48.0, 46.0, 32.0, 28.0, 44.0, 32.0, 22.0, 31.0, 29.0, 26.0, 21.0, 18.0, 12.0, 9.0, 14.0, 9.0, 13.0, 5.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.349449157714844, -18.798690795898438, -18.247934341430664, -17.697175979614258, -17.14641761779785, -16.595661163330078, -16.044902801513672, -15.494144439697266, -14.943387031555176, -14.392629623413086, -13.84187126159668, -13.29111385345459, -12.7403564453125, -12.189598083496094, -11.638840675354004, -11.088083267211914, -10.537324905395508, -9.986567497253418, -9.435809135437012, -8.885051727294922, -8.334293365478516, -7.783535957336426, -7.232778549194336, -6.682020664215088, -6.13126277923584, -5.580504894256592, -5.029747009277344, -4.478989601135254, -3.928231716156006, -3.377473831176758, -2.826716184616089, -2.27595853805542, -1.7251996994018555, -1.174441933631897, -0.6236841678619385, -0.07292640209197998, 0.4778313636779785, 1.0285892486572266, 1.5793468952178955, 2.1301045417785645, 2.6808624267578125, 3.2316203117370605, 3.7823779582977295, 4.333135604858398, 4.8838934898376465, 5.4346513748168945, 5.985408782958984, 6.536166667938232, 7.0869245529174805, 7.6376824378967285, 8.188440322875977, 8.739197731018066, 9.289955139160156, 9.840713500976562, 10.391470909118652, 10.942228317260742, 11.492986679077148, 12.043744087219238, 12.594502449035645, 13.145259857177734, 13.69601821899414, 14.24677562713623, 14.79753303527832, 15.348291397094727, 15.899048805236816]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 7.0, 4.0, 21.0, 38.0, 42.0, 69.0, 80.0, 137.0, 239.0, 354.0, 553.0, 858.0, 1337.0, 2108.0, 3239.0, 5077.0, 7771.0, 11889.0, 17783.0, 26921.0, 39920.0, 57111.0, 81108.0, 108010.0, 132106.0, 137480.0, 118694.0, 91148.0, 65582.0, 46169.0, 31322.0, 21487.0, 13786.0, 9236.0, 5939.0, 3802.0, 2545.0, 1621.0, 1050.0, 683.0, 438.0, 274.0, 154.0, 130.0, 85.0, 45.0, 38.0, 23.0, 16.0, 6.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-32.125, -31.127197265625, -30.12939453125, -29.131591796875, -28.1337890625, -27.135986328125, -26.13818359375, -25.140380859375, -24.142578125, -23.144775390625, -22.14697265625, -21.149169921875, -20.1513671875, -19.153564453125, -18.15576171875, -17.157958984375, -16.16015625, -15.162353515625, -14.16455078125, -13.166748046875, -12.1689453125, -11.171142578125, -10.17333984375, -9.175537109375, -8.177734375, -7.179931640625, -6.18212890625, -5.184326171875, -4.1865234375, -3.188720703125, -2.19091796875, -1.193115234375, -0.1953125, 0.802490234375, 1.80029296875, 2.798095703125, 3.7958984375, 4.793701171875, 5.79150390625, 6.789306640625, 7.787109375, 8.784912109375, 9.78271484375, 10.780517578125, 11.7783203125, 12.776123046875, 13.77392578125, 14.771728515625, 15.76953125, 16.767333984375, 17.76513671875, 18.762939453125, 19.7607421875, 20.758544921875, 21.75634765625, 22.754150390625, 23.751953125, 24.749755859375, 25.74755859375, 26.745361328125, 27.7431640625, 28.740966796875, 29.73876953125, 30.736572265625, 31.734375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 0.0, 3.0, 6.0, 6.0, 4.0, 5.0, 10.0, 11.0, 13.0, 12.0, 11.0, 17.0, 20.0, 25.0, 29.0, 30.0, 33.0, 36.0, 40.0, 31.0, 51.0, 46.0, 56.0, 55.0, 56.0, 46.0, 41.0, 34.0, 39.0, 39.0, 27.0, 28.0, 27.0, 22.0, 18.0, 16.0, 12.0, 14.0, 6.0, 6.0, 7.0, 7.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.734375, -15.22509765625, -14.7158203125, -14.20654296875, -13.697265625, -13.18798828125, -12.6787109375, -12.16943359375, -11.66015625, -11.15087890625, -10.6416015625, -10.13232421875, -9.623046875, -9.11376953125, -8.6044921875, -8.09521484375, -7.5859375, -7.07666015625, -6.5673828125, -6.05810546875, -5.548828125, -5.03955078125, -4.5302734375, -4.02099609375, -3.51171875, -3.00244140625, -2.4931640625, -1.98388671875, -1.474609375, -0.96533203125, -0.4560546875, 0.05322265625, 0.5625, 1.07177734375, 1.5810546875, 2.09033203125, 2.599609375, 3.10888671875, 3.6181640625, 4.12744140625, 4.63671875, 5.14599609375, 5.6552734375, 6.16455078125, 6.673828125, 7.18310546875, 7.6923828125, 8.20166015625, 8.7109375, 9.22021484375, 9.7294921875, 10.23876953125, 10.748046875, 11.25732421875, 11.7666015625, 12.27587890625, 12.78515625, 13.29443359375, 13.8037109375, 14.31298828125, 14.822265625, 15.33154296875, 15.8408203125, 16.35009765625, 16.859375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 9.0, 28.0, 18.0, 34.0, 42.0, 73.0, 101.0, 130.0, 216.0, 276.0, 367.0, 514.0, 767.0, 1084.0, 1612.0, 2541.0, 4186.0, 7090.0, 12501.0, 25783.0, 65036.0, 218725.0, 438930.0, 166569.0, 52165.0, 21560.0, 11055.0, 6215.0, 3735.0, 2350.0, 1521.0, 961.0, 742.0, 476.0, 351.0, 211.0, 158.0, 115.0, 70.0, 73.0, 51.0, 37.0, 25.0, 22.0, 8.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.78125, -57.876953125, -55.97265625, -54.068359375, -52.1640625, -50.259765625, -48.35546875, -46.451171875, -44.546875, -42.642578125, -40.73828125, -38.833984375, -36.9296875, -35.025390625, -33.12109375, -31.216796875, -29.3125, -27.408203125, -25.50390625, -23.599609375, -21.6953125, -19.791015625, -17.88671875, -15.982421875, -14.078125, -12.173828125, -10.26953125, -8.365234375, -6.4609375, -4.556640625, -2.65234375, -0.748046875, 1.15625, 3.060546875, 4.96484375, 6.869140625, 8.7734375, 10.677734375, 12.58203125, 14.486328125, 16.390625, 18.294921875, 20.19921875, 22.103515625, 24.0078125, 25.912109375, 27.81640625, 29.720703125, 31.625, 33.529296875, 35.43359375, 37.337890625, 39.2421875, 41.146484375, 43.05078125, 44.955078125, 46.859375, 48.763671875, 50.66796875, 52.572265625, 54.4765625, 56.380859375, 58.28515625, 60.189453125, 62.09375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 6.0, 4.0, 12.0, 15.0, 15.0, 20.0, 24.0, 31.0, 25.0, 23.0, 31.0, 36.0, 39.0, 32.0, 39.0, 42.0, 50.0, 47.0, 41.0, 45.0, 52.0, 46.0, 35.0, 31.0, 39.0, 25.0, 22.0, 18.0, 12.0, 22.0, 24.0, 17.0, 7.0, 10.0, 10.0, 4.0, 7.0, 3.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5, -13.008056640625, -12.51611328125, -12.024169921875, -11.5322265625, -11.040283203125, -10.54833984375, -10.056396484375, -9.564453125, -9.072509765625, -8.58056640625, -8.088623046875, -7.5966796875, -7.104736328125, -6.61279296875, -6.120849609375, -5.62890625, -5.136962890625, -4.64501953125, -4.153076171875, -3.6611328125, -3.169189453125, -2.67724609375, -2.185302734375, -1.693359375, -1.201416015625, -0.70947265625, -0.217529296875, 0.2744140625, 0.766357421875, 1.25830078125, 1.750244140625, 2.2421875, 2.734130859375, 3.22607421875, 3.718017578125, 4.2099609375, 4.701904296875, 5.19384765625, 5.685791015625, 6.177734375, 6.669677734375, 7.16162109375, 7.653564453125, 8.1455078125, 8.637451171875, 9.12939453125, 9.621337890625, 10.11328125, 10.605224609375, 11.09716796875, 11.589111328125, 12.0810546875, 12.572998046875, 13.06494140625, 13.556884765625, 14.048828125, 14.540771484375, 15.03271484375, 15.524658203125, 16.0166015625, 16.508544921875, 17.00048828125, 17.492431640625, 17.984375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 5.0, 10.0, 6.0, 3.0, 12.0, 11.0, 19.0, 27.0, 21.0, 38.0, 72.0, 91.0, 150.0, 235.0, 371.0, 723.0, 1342.0, 2520.0, 5643.0, 16741.0, 76278.0, 756506.0, 148052.0, 25013.0, 7684.0, 3211.0, 1598.0, 840.0, 499.0, 299.0, 166.0, 101.0, 66.0, 51.0, 39.0, 26.0, 20.0, 16.0, 14.0, 9.0, 9.0, 3.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-259.0, -250.55078125, -242.1015625, -233.65234375, -225.203125, -216.75390625, -208.3046875, -199.85546875, -191.40625, -182.95703125, -174.5078125, -166.05859375, -157.609375, -149.16015625, -140.7109375, -132.26171875, -123.8125, -115.36328125, -106.9140625, -98.46484375, -90.015625, -81.56640625, -73.1171875, -64.66796875, -56.21875, -47.76953125, -39.3203125, -30.87109375, -22.421875, -13.97265625, -5.5234375, 2.92578125, 11.375, 19.82421875, 28.2734375, 36.72265625, 45.171875, 53.62109375, 62.0703125, 70.51953125, 78.96875, 87.41796875, 95.8671875, 104.31640625, 112.765625, 121.21484375, 129.6640625, 138.11328125, 146.5625, 155.01171875, 163.4609375, 171.91015625, 180.359375, 188.80859375, 197.2578125, 205.70703125, 214.15625, 222.60546875, 231.0546875, 239.50390625, 247.953125, 256.40234375, 264.8515625, 273.30078125, 281.75]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 6.0, 9.0, 12.0, 13.0, 24.0, 21.0, 29.0, 35.0, 44.0, 68.0, 104.0, 200.0, 110.0, 72.0, 61.0, 39.0, 39.0, 26.0, 17.0, 13.0, 13.0, 4.0, 11.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023284912109375, -0.022525787353515625, -0.02176666259765625, -0.021007537841796875, -0.0202484130859375, -0.019489288330078125, -0.01873016357421875, -0.017971038818359375, -0.0172119140625, -0.016452789306640625, -0.01569366455078125, -0.014934539794921875, -0.0141754150390625, -0.013416290283203125, -0.01265716552734375, -0.011898040771484375, -0.011138916015625, -0.010379791259765625, -0.00962066650390625, -0.008861541748046875, -0.0081024169921875, -0.007343292236328125, -0.00658416748046875, -0.005825042724609375, -0.00506591796875, -0.004306793212890625, -0.00354766845703125, -0.002788543701171875, -0.0020294189453125, -0.001270294189453125, -0.00051116943359375, 0.000247955322265625, 0.001007080078125, 0.001766204833984375, 0.00252532958984375, 0.003284454345703125, 0.0040435791015625, 0.004802703857421875, 0.00556182861328125, 0.006320953369140625, 0.007080078125, 0.007839202880859375, 0.00859832763671875, 0.009357452392578125, 0.0101165771484375, 0.010875701904296875, 0.01163482666015625, 0.012393951416015625, 0.013153076171875, 0.013912200927734375, 0.01467132568359375, 0.015430450439453125, 0.0161895751953125, 0.016948699951171875, 0.01770782470703125, 0.018466949462890625, 0.01922607421875, 0.019985198974609375, 0.02074432373046875, 0.021503448486328125, 0.0222625732421875, 0.023021697998046875, 0.02378082275390625, 0.024539947509765625, 0.025299072265625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 5.0, 5.0, 13.0, 11.0, 10.0, 24.0, 35.0, 45.0, 55.0, 73.0, 104.0, 147.0, 216.0, 342.0, 466.0, 710.0, 1041.0, 1525.0, 2415.0, 4081.0, 7097.0, 13551.0, 29046.0, 79767.0, 360085.0, 397983.0, 85587.0, 30762.0, 14198.0, 7448.0, 4193.0, 2527.0, 1682.0, 1044.0, 671.0, 484.0, 294.0, 219.0, 147.0, 120.0, 97.0, 70.0, 45.0, 29.0, 24.0, 21.0, 14.0, 10.0, 6.0, 8.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-62.0, -60.123046875, -58.24609375, -56.369140625, -54.4921875, -52.615234375, -50.73828125, -48.861328125, -46.984375, -45.107421875, -43.23046875, -41.353515625, -39.4765625, -37.599609375, -35.72265625, -33.845703125, -31.96875, -30.091796875, -28.21484375, -26.337890625, -24.4609375, -22.583984375, -20.70703125, -18.830078125, -16.953125, -15.076171875, -13.19921875, -11.322265625, -9.4453125, -7.568359375, -5.69140625, -3.814453125, -1.9375, -0.060546875, 1.81640625, 3.693359375, 5.5703125, 7.447265625, 9.32421875, 11.201171875, 13.078125, 14.955078125, 16.83203125, 18.708984375, 20.5859375, 22.462890625, 24.33984375, 26.216796875, 28.09375, 29.970703125, 31.84765625, 33.724609375, 35.6015625, 37.478515625, 39.35546875, 41.232421875, 43.109375, 44.986328125, 46.86328125, 48.740234375, 50.6171875, 52.494140625, 54.37109375, 56.248046875, 58.125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 0.0, 6.0, 5.0, 8.0, 10.0, 10.0, 12.0, 15.0, 14.0, 14.0, 28.0, 44.0, 34.0, 49.0, 40.0, 67.0, 92.0, 106.0, 82.0, 60.0, 49.0, 36.0, 42.0, 24.0, 29.0, 21.0, 23.0, 10.0, 8.0, 8.0, 8.0, 6.0, 10.0, 9.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-14.0859375, -13.6749267578125, -13.263916015625, -12.8529052734375, -12.44189453125, -12.0308837890625, -11.619873046875, -11.2088623046875, -10.7978515625, -10.3868408203125, -9.975830078125, -9.5648193359375, -9.15380859375, -8.7427978515625, -8.331787109375, -7.9207763671875, -7.509765625, -7.0987548828125, -6.687744140625, -6.2767333984375, -5.86572265625, -5.4547119140625, -5.043701171875, -4.6326904296875, -4.2216796875, -3.8106689453125, -3.399658203125, -2.9886474609375, -2.57763671875, -2.1666259765625, -1.755615234375, -1.3446044921875, -0.93359375, -0.5225830078125, -0.111572265625, 0.2994384765625, 0.71044921875, 1.1214599609375, 1.532470703125, 1.9434814453125, 2.3544921875, 2.7655029296875, 3.176513671875, 3.5875244140625, 3.99853515625, 4.4095458984375, 4.820556640625, 5.2315673828125, 5.642578125, 6.0535888671875, 6.464599609375, 6.8756103515625, 7.28662109375, 7.6976318359375, 8.108642578125, 8.5196533203125, 8.9306640625, 9.3416748046875, 9.752685546875, 10.1636962890625, 10.57470703125, 10.9857177734375, 11.396728515625, 11.8077392578125, 12.21875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 7.0, 1.0, 8.0, 7.0, 5.0, 11.0, 15.0, 16.0, 22.0, 24.0, 39.0, 39.0, 52.0, 91.0, 90.0, 104.0, 97.0, 82.0, 58.0, 45.0, 39.0, 34.0, 29.0, 18.0, 12.0, 10.0, 7.0, 6.0, 9.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-35.681339263916016, -34.799903869628906, -33.9184684753418, -33.03703308105469, -32.15559387207031, -31.274158477783203, -30.392723083496094, -29.511287689208984, -28.629850387573242, -27.748414993286133, -26.86697769165039, -25.98554229736328, -25.104106903076172, -24.22266960144043, -23.34123420715332, -22.459796905517578, -21.57836151123047, -20.69692611694336, -19.815488815307617, -18.934053421020508, -18.0526180267334, -17.171180725097656, -16.289745330810547, -15.408308982849121, -14.526874542236328, -13.645438194274902, -12.764002799987793, -11.882566452026367, -11.001130104064941, -10.119693756103516, -9.238258361816406, -8.35682201385498, -7.475385665893555, -6.593949794769287, -5.712513446807861, -4.831077575683594, -3.949641466140747, -3.0682053565979004, -2.186769485473633, -1.305333137512207, -0.42389726638793945, 0.45753878355026245, 1.3389748334884644, 2.2204108238220215, 3.101846933364868, 3.983283042907715, 4.864718914031982, 5.746155261993408, 6.627591133117676, 7.509027004241943, 8.390462875366211, 9.271899223327637, 10.153335571289062, 11.034770965576172, 11.916207313537598, 12.797643661499023, 13.679079055786133, 14.560515403747559, 15.441950798034668, 16.323387145996094, 17.204822540283203, 18.086259841918945, 18.967695236206055, 19.849132537841797, 20.730567932128906]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 9.0, 10.0, 8.0, 14.0, 19.0, 17.0, 17.0, 25.0, 19.0, 27.0, 21.0, 36.0, 30.0, 42.0, 29.0, 40.0, 33.0, 49.0, 46.0, 44.0, 47.0, 41.0, 38.0, 36.0, 42.0, 36.0, 24.0, 27.0, 24.0, 28.0, 17.0, 12.0, 20.0, 14.0, 15.0, 7.0, 11.0, 9.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.817935943603516, -22.118282318115234, -21.418628692626953, -20.718975067138672, -20.01932144165039, -19.31966781616211, -18.620014190673828, -17.920360565185547, -17.220706939697266, -16.521053314208984, -15.821399688720703, -15.121746063232422, -14.42209243774414, -13.72243881225586, -13.022786140441895, -12.323132514953613, -11.623479843139648, -10.923826217651367, -10.224172592163086, -9.524518966674805, -8.824865341186523, -8.125211715698242, -7.425559043884277, -6.725905418395996, -6.026251792907715, -5.326598167419434, -4.626944541931152, -3.9272913932800293, -3.227637767791748, -2.527984142303467, -1.8283309936523438, -1.1286773681640625, -0.42902374267578125, 0.27062976360321045, 0.9702832698822021, 1.6699366569519043, 2.3695902824401855, 3.069243907928467, 3.76889705657959, 4.468550682067871, 5.168204307556152, 5.867857933044434, 6.567511558532715, 7.267164707183838, 7.966818332672119, 8.666471481323242, 9.366125106811523, 10.065778732299805, 10.765432357788086, 11.465085983276367, 12.164739608764648, 12.86439323425293, 13.564046859741211, 14.263700485229492, 14.963353157043457, 15.663006782531738, 16.362659454345703, 17.062313079833984, 17.761966705322266, 18.461620330810547, 19.161273956298828, 19.86092758178711, 20.56058120727539, 21.260234832763672, 21.959888458251953]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 8.0, 6.0, 24.0, 22.0, 41.0, 48.0, 77.0, 85.0, 136.0, 204.0, 327.0, 490.0, 734.0, 1181.0, 1897.0, 3230.0, 5625.0, 10420.0, 21276.0, 46800.0, 118080.0, 301143.0, 314073.0, 125312.0, 49490.0, 22250.0, 10891.0, 5865.0, 3302.0, 1929.0, 1217.0, 812.0, 503.0, 337.0, 239.0, 132.0, 96.0, 70.0, 45.0, 30.0, 30.0, 10.0, 16.0, 7.0, 10.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-48.125, -46.62255859375, -45.1201171875, -43.61767578125, -42.115234375, -40.61279296875, -39.1103515625, -37.60791015625, -36.10546875, -34.60302734375, -33.1005859375, -31.59814453125, -30.095703125, -28.59326171875, -27.0908203125, -25.58837890625, -24.0859375, -22.58349609375, -21.0810546875, -19.57861328125, -18.076171875, -16.57373046875, -15.0712890625, -13.56884765625, -12.06640625, -10.56396484375, -9.0615234375, -7.55908203125, -6.056640625, -4.55419921875, -3.0517578125, -1.54931640625, -0.046875, 1.45556640625, 2.9580078125, 4.46044921875, 5.962890625, 7.46533203125, 8.9677734375, 10.47021484375, 11.97265625, 13.47509765625, 14.9775390625, 16.47998046875, 17.982421875, 19.48486328125, 20.9873046875, 22.48974609375, 23.9921875, 25.49462890625, 26.9970703125, 28.49951171875, 30.001953125, 31.50439453125, 33.0068359375, 34.50927734375, 36.01171875, 37.51416015625, 39.0166015625, 40.51904296875, 42.021484375, 43.52392578125, 45.0263671875, 46.52880859375, 48.03125]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 10.0, 10.0, 9.0, 15.0, 14.0, 20.0, 18.0, 16.0, 22.0, 26.0, 29.0, 40.0, 32.0, 25.0, 52.0, 38.0, 42.0, 49.0, 51.0, 39.0, 54.0, 45.0, 29.0, 31.0, 34.0, 35.0, 31.0, 23.0, 21.0, 21.0, 18.0, 11.0, 19.0, 13.0, 11.0, 8.0, 10.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.984375, -13.5386962890625, -13.093017578125, -12.6473388671875, -12.20166015625, -11.7559814453125, -11.310302734375, -10.8646240234375, -10.4189453125, -9.9732666015625, -9.527587890625, -9.0819091796875, -8.63623046875, -8.1905517578125, -7.744873046875, -7.2991943359375, -6.853515625, -6.4078369140625, -5.962158203125, -5.5164794921875, -5.07080078125, -4.6251220703125, -4.179443359375, -3.7337646484375, -3.2880859375, -2.8424072265625, -2.396728515625, -1.9510498046875, -1.50537109375, -1.0596923828125, -0.614013671875, -0.1683349609375, 0.27734375, 0.7230224609375, 1.168701171875, 1.6143798828125, 2.06005859375, 2.5057373046875, 2.951416015625, 3.3970947265625, 3.8427734375, 4.2884521484375, 4.734130859375, 5.1798095703125, 5.62548828125, 6.0711669921875, 6.516845703125, 6.9625244140625, 7.408203125, 7.8538818359375, 8.299560546875, 8.7452392578125, 9.19091796875, 9.6365966796875, 10.082275390625, 10.5279541015625, 10.9736328125, 11.4193115234375, 11.864990234375, 12.3106689453125, 12.75634765625, 13.2020263671875, 13.647705078125, 14.0933837890625, 14.5390625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 8.0, 10.0, 5.0, 17.0, 17.0, 24.0, 32.0, 55.0, 60.0, 84.0, 102.0, 157.0, 228.0, 330.0, 498.0, 764.0, 1100.0, 2068.0, 3248.0, 6058.0, 12427.0, 28918.0, 85821.0, 403852.0, 368334.0, 80326.0, 27772.0, 11890.0, 5785.0, 3170.0, 1892.0, 1171.0, 703.0, 509.0, 357.0, 203.0, 143.0, 118.0, 72.0, 63.0, 53.0, 35.0, 17.0, 13.0, 10.0, 14.0, 5.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-76.6875, -74.12890625, -71.5703125, -69.01171875, -66.453125, -63.89453125, -61.3359375, -58.77734375, -56.21875, -53.66015625, -51.1015625, -48.54296875, -45.984375, -43.42578125, -40.8671875, -38.30859375, -35.75, -33.19140625, -30.6328125, -28.07421875, -25.515625, -22.95703125, -20.3984375, -17.83984375, -15.28125, -12.72265625, -10.1640625, -7.60546875, -5.046875, -2.48828125, 0.0703125, 2.62890625, 5.1875, 7.74609375, 10.3046875, 12.86328125, 15.421875, 17.98046875, 20.5390625, 23.09765625, 25.65625, 28.21484375, 30.7734375, 33.33203125, 35.890625, 38.44921875, 41.0078125, 43.56640625, 46.125, 48.68359375, 51.2421875, 53.80078125, 56.359375, 58.91796875, 61.4765625, 64.03515625, 66.59375, 69.15234375, 71.7109375, 74.26953125, 76.828125, 79.38671875, 81.9453125, 84.50390625, 87.0625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 2.0, 8.0, 3.0, 7.0, 8.0, 9.0, 8.0, 11.0, 10.0, 18.0, 22.0, 29.0, 32.0, 39.0, 57.0, 49.0, 66.0, 75.0, 74.0, 64.0, 62.0, 59.0, 62.0, 41.0, 44.0, 29.0, 18.0, 13.0, 14.0, 9.0, 7.0, 12.0, 9.0, 6.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.171875, -20.576171875, -19.98046875, -19.384765625, -18.7890625, -18.193359375, -17.59765625, -17.001953125, -16.40625, -15.810546875, -15.21484375, -14.619140625, -14.0234375, -13.427734375, -12.83203125, -12.236328125, -11.640625, -11.044921875, -10.44921875, -9.853515625, -9.2578125, -8.662109375, -8.06640625, -7.470703125, -6.875, -6.279296875, -5.68359375, -5.087890625, -4.4921875, -3.896484375, -3.30078125, -2.705078125, -2.109375, -1.513671875, -0.91796875, -0.322265625, 0.2734375, 0.869140625, 1.46484375, 2.060546875, 2.65625, 3.251953125, 3.84765625, 4.443359375, 5.0390625, 5.634765625, 6.23046875, 6.826171875, 7.421875, 8.017578125, 8.61328125, 9.208984375, 9.8046875, 10.400390625, 10.99609375, 11.591796875, 12.1875, 12.783203125, 13.37890625, 13.974609375, 14.5703125, 15.166015625, 15.76171875, 16.357421875, 16.953125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 3.0, 6.0, 4.0, 8.0, 3.0, 3.0, 17.0, 17.0, 15.0, 27.0, 38.0, 67.0, 87.0, 148.0, 181.0, 295.0, 527.0, 1023.0, 2145.0, 5267.0, 16578.0, 82798.0, 836639.0, 77005.0, 15861.0, 5270.0, 2106.0, 960.0, 540.0, 305.0, 170.0, 124.0, 86.0, 60.0, 40.0, 31.0, 18.0, 21.0, 13.0, 11.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-91.5, -88.59375, -85.6875, -82.78125, -79.875, -76.96875, -74.0625, -71.15625, -68.25, -65.34375, -62.4375, -59.53125, -56.625, -53.71875, -50.8125, -47.90625, -45.0, -42.09375, -39.1875, -36.28125, -33.375, -30.46875, -27.5625, -24.65625, -21.75, -18.84375, -15.9375, -13.03125, -10.125, -7.21875, -4.3125, -1.40625, 1.5, 4.40625, 7.3125, 10.21875, 13.125, 16.03125, 18.9375, 21.84375, 24.75, 27.65625, 30.5625, 33.46875, 36.375, 39.28125, 42.1875, 45.09375, 48.0, 50.90625, 53.8125, 56.71875, 59.625, 62.53125, 65.4375, 68.34375, 71.25, 74.15625, 77.0625, 79.96875, 82.875, 85.78125, 88.6875, 91.59375, 94.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 12.0, 11.0, 22.0, 44.0, 86.0, 301.0, 307.0, 109.0, 47.0, 30.0, 12.0, 5.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00382232666015625, -0.0036489367485046387, -0.0034755468368530273, -0.003302156925201416, -0.0031287670135498047, -0.0029553771018981934, -0.002781987190246582, -0.0026085972785949707, -0.0024352073669433594, -0.002261817455291748, -0.0020884275436401367, -0.0019150376319885254, -0.001741647720336914, -0.0015682578086853027, -0.0013948678970336914, -0.00122147798538208, -0.0010480880737304688, -0.0008746981620788574, -0.0007013082504272461, -0.0005279183387756348, -0.00035452842712402344, -0.0001811385154724121, -7.748603820800781e-06, 0.00016564130783081055, 0.0003390312194824219, 0.0005124211311340332, 0.0006858110427856445, 0.0008592009544372559, 0.0010325908660888672, 0.0012059807777404785, 0.0013793706893920898, 0.0015527606010437012, 0.0017261505126953125, 0.0018995404243469238, 0.002072930335998535, 0.0022463202476501465, 0.002419710159301758, 0.002593100070953369, 0.0027664899826049805, 0.002939879894256592, 0.003113269805908203, 0.0032866597175598145, 0.0034600496292114258, 0.003633439540863037, 0.0038068294525146484, 0.00398021936416626, 0.004153609275817871, 0.004326999187469482, 0.004500389099121094, 0.004673779010772705, 0.004847168922424316, 0.005020558834075928, 0.005193948745727539, 0.00536733865737915, 0.005540728569030762, 0.005714118480682373, 0.005887508392333984, 0.006060898303985596, 0.006234288215637207, 0.006407678127288818, 0.00658106803894043, 0.006754457950592041, 0.006927847862243652, 0.007101237773895264, 0.007274627685546875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 9.0, 9.0, 15.0, 22.0, 14.0, 26.0, 33.0, 48.0, 68.0, 79.0, 109.0, 141.0, 202.0, 285.0, 351.0, 554.0, 762.0, 1205.0, 2069.0, 4180.0, 10280.0, 42085.0, 820140.0, 132864.0, 18954.0, 6311.0, 2891.0, 1588.0, 961.0, 630.0, 466.0, 317.0, 219.0, 177.0, 118.0, 84.0, 66.0, 44.0, 43.0, 38.0, 24.0, 11.0, 12.0, 8.0, 16.0, 12.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-98.1875, -94.994140625, -91.80078125, -88.607421875, -85.4140625, -82.220703125, -79.02734375, -75.833984375, -72.640625, -69.447265625, -66.25390625, -63.060546875, -59.8671875, -56.673828125, -53.48046875, -50.287109375, -47.09375, -43.900390625, -40.70703125, -37.513671875, -34.3203125, -31.126953125, -27.93359375, -24.740234375, -21.546875, -18.353515625, -15.16015625, -11.966796875, -8.7734375, -5.580078125, -2.38671875, 0.806640625, 4.0, 7.193359375, 10.38671875, 13.580078125, 16.7734375, 19.966796875, 23.16015625, 26.353515625, 29.546875, 32.740234375, 35.93359375, 39.126953125, 42.3203125, 45.513671875, 48.70703125, 51.900390625, 55.09375, 58.287109375, 61.48046875, 64.673828125, 67.8671875, 71.060546875, 74.25390625, 77.447265625, 80.640625, 83.833984375, 87.02734375, 90.220703125, 93.4140625, 96.607421875, 99.80078125, 102.994140625, 106.1875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 13.0, 15.0, 17.0, 42.0, 70.0, 114.0, 352.0, 141.0, 64.0, 40.0, 35.0, 27.0, 8.0, 6.0, 8.0, 3.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.078125, -23.40234375, -22.7265625, -22.05078125, -21.375, -20.69921875, -20.0234375, -19.34765625, -18.671875, -17.99609375, -17.3203125, -16.64453125, -15.96875, -15.29296875, -14.6171875, -13.94140625, -13.265625, -12.58984375, -11.9140625, -11.23828125, -10.5625, -9.88671875, -9.2109375, -8.53515625, -7.859375, -7.18359375, -6.5078125, -5.83203125, -5.15625, -4.48046875, -3.8046875, -3.12890625, -2.453125, -1.77734375, -1.1015625, -0.42578125, 0.25, 0.92578125, 1.6015625, 2.27734375, 2.953125, 3.62890625, 4.3046875, 4.98046875, 5.65625, 6.33203125, 7.0078125, 7.68359375, 8.359375, 9.03515625, 9.7109375, 10.38671875, 11.0625, 11.73828125, 12.4140625, 13.08984375, 13.765625, 14.44140625, 15.1171875, 15.79296875, 16.46875, 17.14453125, 17.8203125, 18.49609375, 19.171875]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 6.0, 7.0, 22.0, 15.0, 16.0, 26.0, 55.0, 84.0, 124.0, 185.0, 154.0, 92.0, 53.0, 37.0, 23.0, 24.0, 19.0, 13.0, 9.0, 10.0, 5.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.8348388671875, -61.2921142578125, -59.7493896484375, -58.2066650390625, -56.6639404296875, -55.1212158203125, -53.5784912109375, -52.0357666015625, -50.4930419921875, -48.9503173828125, -47.4075927734375, -45.8648681640625, -44.3221435546875, -42.7794189453125, -41.2366943359375, -39.6939697265625, -38.151248931884766, -36.608524322509766, -35.065799713134766, -33.523075103759766, -31.980350494384766, -30.437625885009766, -28.8949031829834, -27.3521785736084, -25.8094539642334, -24.2667293548584, -22.7240047454834, -21.18128204345703, -19.63855743408203, -18.09583282470703, -16.55310821533203, -15.010383605957031, -13.467655181884766, -11.924930572509766, -10.382205963134766, -8.839482307434082, -7.296757698059082, -5.754033088684082, -4.211309432983398, -2.6685848236083984, -1.1258602142333984, 0.41686415672302246, 1.9595885276794434, 3.502312660217285, 5.045037269592285, 6.587761878967285, 8.130485534667969, 9.673210144042969, 11.215934753417969, 12.758659362792969, 14.301383972167969, 15.844107627868652, 17.38683319091797, 18.92955780029297, 20.472280502319336, 22.015005111694336, 23.557729721069336, 25.100454330444336, 26.643178939819336, 28.185901641845703, 29.728626251220703, 31.271350860595703, 32.8140754699707, 34.3568000793457, 35.8995246887207]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 10.0, 5.0, 6.0, 10.0, 14.0, 17.0, 14.0, 19.0, 23.0, 31.0, 31.0, 43.0, 35.0, 44.0, 38.0, 41.0, 42.0, 51.0, 42.0, 40.0, 35.0, 46.0, 23.0, 40.0, 43.0, 37.0, 25.0, 32.0, 27.0, 18.0, 19.0, 11.0, 11.0, 12.0, 8.0, 6.0, 7.0, 8.0, 4.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-29.94864273071289, -29.023019790649414, -28.097396850585938, -27.17177391052246, -26.246150970458984, -25.320528030395508, -24.39490509033203, -23.469282150268555, -22.543659210205078, -21.6180362701416, -20.692413330078125, -19.76679039001465, -18.841167449951172, -17.915544509887695, -16.98992156982422, -16.064298629760742, -15.138675689697266, -14.213052749633789, -13.287429809570312, -12.361806869506836, -11.43618392944336, -10.510560989379883, -9.584938049316406, -8.65931510925293, -7.733692169189453, -6.808069229125977, -5.8824462890625, -4.956823348999023, -4.031200408935547, -3.1055774688720703, -2.1799545288085938, -1.2543315887451172, -0.32871055603027344, 0.5969123840332031, 1.5225353240966797, 2.4481582641601562, 3.373781204223633, 4.299404144287109, 5.225027084350586, 6.1506500244140625, 7.076272964477539, 8.001895904541016, 8.927518844604492, 9.853141784667969, 10.778764724731445, 11.704387664794922, 12.630010604858398, 13.555633544921875, 14.481256484985352, 15.406879425048828, 16.332502365112305, 17.25812530517578, 18.183748245239258, 19.109371185302734, 20.03499412536621, 20.960617065429688, 21.886240005493164, 22.81186294555664, 23.737485885620117, 24.663108825683594, 25.58873176574707, 26.514354705810547, 27.439977645874023, 28.3656005859375, 29.291223526000977]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 7.0, 15.0, 17.0, 35.0, 34.0, 41.0, 81.0, 100.0, 128.0, 190.0, 280.0, 407.0, 597.0, 888.0, 1301.0, 2073.0, 3336.0, 5607.0, 9410.0, 17388.0, 34843.0, 97454.0, 993415.0, 2673438.0, 246290.0, 53482.0, 23930.0, 12440.0, 6866.0, 3856.0, 2288.0, 1419.0, 850.0, 589.0, 351.0, 281.0, 166.0, 102.0, 89.0, 59.0, 39.0, 27.0, 17.0, 20.0, 11.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.03125, -49.3974609375, -47.763671875, -46.1298828125, -44.49609375, -42.8623046875, -41.228515625, -39.5947265625, -37.9609375, -36.3271484375, -34.693359375, -33.0595703125, -31.42578125, -29.7919921875, -28.158203125, -26.5244140625, -24.890625, -23.2568359375, -21.623046875, -19.9892578125, -18.35546875, -16.7216796875, -15.087890625, -13.4541015625, -11.8203125, -10.1865234375, -8.552734375, -6.9189453125, -5.28515625, -3.6513671875, -2.017578125, -0.3837890625, 1.25, 2.8837890625, 4.517578125, 6.1513671875, 7.78515625, 9.4189453125, 11.052734375, 12.6865234375, 14.3203125, 15.9541015625, 17.587890625, 19.2216796875, 20.85546875, 22.4892578125, 24.123046875, 25.7568359375, 27.390625, 29.0244140625, 30.658203125, 32.2919921875, 33.92578125, 35.5595703125, 37.193359375, 38.8271484375, 40.4609375, 42.0947265625, 43.728515625, 45.3623046875, 46.99609375, 48.6298828125, 50.263671875, 51.8974609375, 53.53125]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 6.0, 8.0, 4.0, 8.0, 6.0, 6.0, 12.0, 10.0, 13.0, 13.0, 17.0, 23.0, 22.0, 30.0, 33.0, 27.0, 33.0, 40.0, 48.0, 36.0, 37.0, 49.0, 33.0, 43.0, 50.0, 41.0, 30.0, 41.0, 25.0, 46.0, 27.0, 34.0, 32.0, 21.0, 19.0, 17.0, 9.0, 12.0, 9.0, 8.0, 3.0, 5.0, 4.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.0859375, -14.620361328125, -14.15478515625, -13.689208984375, -13.2236328125, -12.758056640625, -12.29248046875, -11.826904296875, -11.361328125, -10.895751953125, -10.43017578125, -9.964599609375, -9.4990234375, -9.033447265625, -8.56787109375, -8.102294921875, -7.63671875, -7.171142578125, -6.70556640625, -6.239990234375, -5.7744140625, -5.308837890625, -4.84326171875, -4.377685546875, -3.912109375, -3.446533203125, -2.98095703125, -2.515380859375, -2.0498046875, -1.584228515625, -1.11865234375, -0.653076171875, -0.1875, 0.278076171875, 0.74365234375, 1.209228515625, 1.6748046875, 2.140380859375, 2.60595703125, 3.071533203125, 3.537109375, 4.002685546875, 4.46826171875, 4.933837890625, 5.3994140625, 5.864990234375, 6.33056640625, 6.796142578125, 7.26171875, 7.727294921875, 8.19287109375, 8.658447265625, 9.1240234375, 9.589599609375, 10.05517578125, 10.520751953125, 10.986328125, 11.451904296875, 11.91748046875, 12.383056640625, 12.8486328125, 13.314208984375, 13.77978515625, 14.245361328125, 14.7109375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 8.0, 3.0, 10.0, 7.0, 17.0, 14.0, 23.0, 30.0, 50.0, 71.0, 75.0, 113.0, 124.0, 155.0, 252.0, 319.0, 460.0, 637.0, 914.0, 1501.0, 2581.0, 4747.0, 9958.0, 25004.0, 113280.0, 3603013.0, 360517.0, 41511.0, 13941.0, 6234.0, 3121.0, 1808.0, 1069.0, 722.0, 510.0, 395.0, 259.0, 182.0, 133.0, 128.0, 94.0, 69.0, 67.0, 56.0, 23.0, 16.0, 10.0, 9.0, 9.0, 9.0, 6.0, 6.0, 5.0, 7.0, 1.0, 2.0, 2.0], "bins": [-141.5, -137.173828125, -132.84765625, -128.521484375, -124.1953125, -119.869140625, -115.54296875, -111.216796875, -106.890625, -102.564453125, -98.23828125, -93.912109375, -89.5859375, -85.259765625, -80.93359375, -76.607421875, -72.28125, -67.955078125, -63.62890625, -59.302734375, -54.9765625, -50.650390625, -46.32421875, -41.998046875, -37.671875, -33.345703125, -29.01953125, -24.693359375, -20.3671875, -16.041015625, -11.71484375, -7.388671875, -3.0625, 1.263671875, 5.58984375, 9.916015625, 14.2421875, 18.568359375, 22.89453125, 27.220703125, 31.546875, 35.873046875, 40.19921875, 44.525390625, 48.8515625, 53.177734375, 57.50390625, 61.830078125, 66.15625, 70.482421875, 74.80859375, 79.134765625, 83.4609375, 87.787109375, 92.11328125, 96.439453125, 100.765625, 105.091796875, 109.41796875, 113.744140625, 118.0703125, 122.396484375, 126.72265625, 131.048828125, 135.375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 8.0, 1.0, 7.0, 6.0, 2.0, 5.0, 12.0, 12.0, 14.0, 16.0, 17.0, 14.0, 27.0, 34.0, 43.0, 95.0, 149.0, 552.0, 1239.0, 867.0, 360.0, 180.0, 111.0, 95.0, 49.0, 40.0, 30.0, 13.0, 11.0, 14.0, 7.0, 7.0, 6.0, 6.0, 7.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.203125, -24.40869140625, -23.6142578125, -22.81982421875, -22.025390625, -21.23095703125, -20.4365234375, -19.64208984375, -18.84765625, -18.05322265625, -17.2587890625, -16.46435546875, -15.669921875, -14.87548828125, -14.0810546875, -13.28662109375, -12.4921875, -11.69775390625, -10.9033203125, -10.10888671875, -9.314453125, -8.52001953125, -7.7255859375, -6.93115234375, -6.13671875, -5.34228515625, -4.5478515625, -3.75341796875, -2.958984375, -2.16455078125, -1.3701171875, -0.57568359375, 0.21875, 1.01318359375, 1.8076171875, 2.60205078125, 3.396484375, 4.19091796875, 4.9853515625, 5.77978515625, 6.57421875, 7.36865234375, 8.1630859375, 8.95751953125, 9.751953125, 10.54638671875, 11.3408203125, 12.13525390625, 12.9296875, 13.72412109375, 14.5185546875, 15.31298828125, 16.107421875, 16.90185546875, 17.6962890625, 18.49072265625, 19.28515625, 20.07958984375, 20.8740234375, 21.66845703125, 22.462890625, 23.25732421875, 24.0517578125, 24.84619140625, 25.640625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 1.0, 13.0, 18.0, 9.0, 25.0, 117.0, 441.0, 145.0, 71.0, 53.0, 36.0, 19.0, 13.0, 11.0, 7.0, 1.0, 3.0, 0.0, 2.0], "bins": [-211.0430908203125, -206.93154907226562, -202.82000732421875, -198.70846557617188, -194.59690856933594, -190.48536682128906, -186.3738250732422, -182.2622833251953, -178.15074157714844, -174.03919982910156, -169.9276580810547, -165.81610107421875, -161.70455932617188, -157.593017578125, -153.48147583007812, -149.36993408203125, -145.25839233398438, -141.1468505859375, -137.03530883789062, -132.92376708984375, -128.8122100830078, -124.70066833496094, -120.58912658691406, -116.47758483886719, -112.36602783203125, -108.25448608398438, -104.14293670654297, -100.0313949584961, -95.91985321044922, -91.80830383300781, -87.69676208496094, -83.58522033691406, -79.47367095947266, -75.36212921142578, -71.25057983398438, -67.1390380859375, -63.027496337890625, -58.915950775146484, -54.804405212402344, -50.69286346435547, -46.58131790161133, -42.46977233886719, -38.35823059082031, -34.24668502807617, -30.135141372680664, -26.023597717285156, -21.912052154541016, -17.800508499145508, -13.68896484375, -9.577421188354492, -5.465876579284668, -1.3543319702148438, 2.757211685180664, 6.868755340576172, 10.980300903320312, 15.09184455871582, 19.203388214111328, 23.314931869506836, 27.426475524902344, 31.538021087646484, 35.649566650390625, 39.7611083984375, 43.87265396118164, 47.98419952392578, 52.095741271972656]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 7.0, 5.0, 9.0, 4.0, 8.0, 10.0, 13.0, 10.0, 13.0, 17.0, 13.0, 20.0, 17.0, 24.0, 28.0, 23.0, 25.0, 25.0, 47.0, 42.0, 44.0, 34.0, 55.0, 37.0, 42.0, 43.0, 23.0, 58.0, 37.0, 42.0, 33.0, 25.0, 13.0, 22.0, 16.0, 16.0, 15.0, 13.0, 11.0, 19.0, 7.0, 4.0, 7.0, 4.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-50.06481170654297, -48.45705032348633, -46.84928894042969, -45.24152755737305, -43.633766174316406, -42.02600860595703, -40.418243408203125, -38.81048583984375, -37.20272445678711, -35.59496307373047, -33.98720169067383, -32.37944030761719, -30.77168083190918, -29.16391944885254, -27.5561580657959, -25.94839859008789, -24.340635299682617, -22.732873916625977, -21.125112533569336, -19.517353057861328, -17.909591674804688, -16.301830291748047, -14.694068908691406, -13.086308479309082, -11.478547096252441, -9.8707857131958, -8.263025283813477, -6.655263900756836, -5.0475029945373535, -3.439742088317871, -1.8319807052612305, -0.22422027587890625, 1.3835411071777344, 2.991302013397217, 4.599062919616699, 6.20682430267334, 7.814585208892822, 9.422346115112305, 11.030107498168945, 12.63786792755127, 14.24562931060791, 15.85339069366455, 17.461151123046875, 19.068912506103516, 20.676673889160156, 22.284435272216797, 23.892196655273438, 25.499956130981445, 27.107717514038086, 28.715478897094727, 30.323240280151367, 31.930999755859375, 33.538761138916016, 35.146522521972656, 36.7542839050293, 38.36204528808594, 39.96980667114258, 41.57756805419922, 43.18532943725586, 44.7930908203125, 46.40085220336914, 48.00861358642578, 49.616371154785156, 51.2241325378418, 52.83189392089844]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 9.0, 11.0, 17.0, 29.0, 32.0, 51.0, 76.0, 89.0, 148.0, 212.0, 294.0, 430.0, 656.0, 984.0, 1683.0, 2737.0, 4685.0, 8943.0, 17755.0, 42029.0, 128166.0, 512651.0, 217387.0, 59875.0, 23561.0, 11304.0, 5895.0, 3207.0, 2075.0, 1164.0, 764.0, 536.0, 343.0, 227.0, 162.0, 110.0, 78.0, 47.0, 46.0, 19.0, 21.0, 14.0, 9.0, 14.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-78.3125, -75.759765625, -73.20703125, -70.654296875, -68.1015625, -65.548828125, -62.99609375, -60.443359375, -57.890625, -55.337890625, -52.78515625, -50.232421875, -47.6796875, -45.126953125, -42.57421875, -40.021484375, -37.46875, -34.916015625, -32.36328125, -29.810546875, -27.2578125, -24.705078125, -22.15234375, -19.599609375, -17.046875, -14.494140625, -11.94140625, -9.388671875, -6.8359375, -4.283203125, -1.73046875, 0.822265625, 3.375, 5.927734375, 8.48046875, 11.033203125, 13.5859375, 16.138671875, 18.69140625, 21.244140625, 23.796875, 26.349609375, 28.90234375, 31.455078125, 34.0078125, 36.560546875, 39.11328125, 41.666015625, 44.21875, 46.771484375, 49.32421875, 51.876953125, 54.4296875, 56.982421875, 59.53515625, 62.087890625, 64.640625, 67.193359375, 69.74609375, 72.298828125, 74.8515625, 77.404296875, 79.95703125, 82.509765625, 85.0625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 9.0, 0.0, 6.0, 7.0, 6.0, 5.0, 8.0, 10.0, 6.0, 9.0, 16.0, 14.0, 14.0, 15.0, 23.0, 23.0, 26.0, 30.0, 16.0, 22.0, 35.0, 51.0, 42.0, 38.0, 50.0, 42.0, 38.0, 38.0, 35.0, 44.0, 47.0, 33.0, 31.0, 29.0, 30.0, 17.0, 15.0, 20.0, 11.0, 20.0, 7.0, 15.0, 10.0, 8.0, 7.0, 4.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 8.0, 1.0, 3.0, 1.0], "bins": [-52.3125, -50.75341796875, -49.1943359375, -47.63525390625, -46.076171875, -44.51708984375, -42.9580078125, -41.39892578125, -39.83984375, -38.28076171875, -36.7216796875, -35.16259765625, -33.603515625, -32.04443359375, -30.4853515625, -28.92626953125, -27.3671875, -25.80810546875, -24.2490234375, -22.68994140625, -21.130859375, -19.57177734375, -18.0126953125, -16.45361328125, -14.89453125, -13.33544921875, -11.7763671875, -10.21728515625, -8.658203125, -7.09912109375, -5.5400390625, -3.98095703125, -2.421875, -0.86279296875, 0.6962890625, 2.25537109375, 3.814453125, 5.37353515625, 6.9326171875, 8.49169921875, 10.05078125, 11.60986328125, 13.1689453125, 14.72802734375, 16.287109375, 17.84619140625, 19.4052734375, 20.96435546875, 22.5234375, 24.08251953125, 25.6416015625, 27.20068359375, 28.759765625, 30.31884765625, 31.8779296875, 33.43701171875, 34.99609375, 36.55517578125, 38.1142578125, 39.67333984375, 41.232421875, 42.79150390625, 44.3505859375, 45.90966796875, 47.46875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 7.0, 23.0, 17.0, 21.0, 25.0, 60.0, 71.0, 127.0, 204.0, 326.0, 541.0, 949.0, 1833.0, 3793.0, 9842.0, 35695.0, 509547.0, 434051.0, 34168.0, 9368.0, 3774.0, 1715.0, 991.0, 528.0, 314.0, 198.0, 108.0, 91.0, 52.0, 40.0, 21.0, 12.0, 12.0, 9.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.25, -165.72265625, -160.1953125, -154.66796875, -149.140625, -143.61328125, -138.0859375, -132.55859375, -127.03125, -121.50390625, -115.9765625, -110.44921875, -104.921875, -99.39453125, -93.8671875, -88.33984375, -82.8125, -77.28515625, -71.7578125, -66.23046875, -60.703125, -55.17578125, -49.6484375, -44.12109375, -38.59375, -33.06640625, -27.5390625, -22.01171875, -16.484375, -10.95703125, -5.4296875, 0.09765625, 5.625, 11.15234375, 16.6796875, 22.20703125, 27.734375, 33.26171875, 38.7890625, 44.31640625, 49.84375, 55.37109375, 60.8984375, 66.42578125, 71.953125, 77.48046875, 83.0078125, 88.53515625, 94.0625, 99.58984375, 105.1171875, 110.64453125, 116.171875, 121.69921875, 127.2265625, 132.75390625, 138.28125, 143.80859375, 149.3359375, 154.86328125, 160.390625, 165.91796875, 171.4453125, 176.97265625, 182.5]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 7.0, 10.0, 5.0, 7.0, 12.0, 5.0, 19.0, 17.0, 32.0, 31.0, 61.0, 72.0, 77.0, 93.0, 111.0, 91.0, 64.0, 61.0, 44.0, 27.0, 27.0, 30.0, 12.0, 16.0, 9.0, 8.0, 10.0, 10.0, 5.0, 2.0, 5.0, 4.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.25, -52.3330078125, -50.416015625, -48.4990234375, -46.58203125, -44.6650390625, -42.748046875, -40.8310546875, -38.9140625, -36.9970703125, -35.080078125, -33.1630859375, -31.24609375, -29.3291015625, -27.412109375, -25.4951171875, -23.578125, -21.6611328125, -19.744140625, -17.8271484375, -15.91015625, -13.9931640625, -12.076171875, -10.1591796875, -8.2421875, -6.3251953125, -4.408203125, -2.4912109375, -0.57421875, 1.3427734375, 3.259765625, 5.1767578125, 7.09375, 9.0107421875, 10.927734375, 12.8447265625, 14.76171875, 16.6787109375, 18.595703125, 20.5126953125, 22.4296875, 24.3466796875, 26.263671875, 28.1806640625, 30.09765625, 32.0146484375, 33.931640625, 35.8486328125, 37.765625, 39.6826171875, 41.599609375, 43.5166015625, 45.43359375, 47.3505859375, 49.267578125, 51.1845703125, 53.1015625, 55.0185546875, 56.935546875, 58.8525390625, 60.76953125, 62.6865234375, 64.603515625, 66.5205078125, 68.4375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 4.0, 9.0, 5.0, 15.0, 4.0, 13.0, 13.0, 20.0, 27.0, 19.0, 45.0, 57.0, 110.0, 215.0, 416.0, 1044.0, 3062.0, 17382.0, 979756.0, 39489.0, 4321.0, 1361.0, 520.0, 256.0, 123.0, 83.0, 39.0, 29.0, 22.0, 20.0, 18.0, 10.0, 7.0, 11.0, 10.0, 6.0, 7.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-280.25, -271.390625, -262.53125, -253.671875, -244.8125, -235.953125, -227.09375, -218.234375, -209.375, -200.515625, -191.65625, -182.796875, -173.9375, -165.078125, -156.21875, -147.359375, -138.5, -129.640625, -120.78125, -111.921875, -103.0625, -94.203125, -85.34375, -76.484375, -67.625, -58.765625, -49.90625, -41.046875, -32.1875, -23.328125, -14.46875, -5.609375, 3.25, 12.109375, 20.96875, 29.828125, 38.6875, 47.546875, 56.40625, 65.265625, 74.125, 82.984375, 91.84375, 100.703125, 109.5625, 118.421875, 127.28125, 136.140625, 145.0, 153.859375, 162.71875, 171.578125, 180.4375, 189.296875, 198.15625, 207.015625, 215.875, 224.734375, 233.59375, 242.453125, 251.3125, 260.171875, 269.03125, 277.890625, 286.75]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 4.0, 6.0, 9.0, 8.0, 14.0, 8.0, 10.0, 23.0, 28.0, 67.0, 70.0, 148.0, 209.0, 119.0, 90.0, 55.0, 32.0, 24.0, 15.0, 14.0, 8.0, 9.0, 10.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0020923614501953125, -0.0020365864038467407, -0.001980811357498169, -0.0019250363111495972, -0.0018692612648010254, -0.0018134862184524536, -0.0017577111721038818, -0.00170193612575531, -0.0016461610794067383, -0.0015903860330581665, -0.0015346109867095947, -0.001478835940361023, -0.0014230608940124512, -0.0013672858476638794, -0.0013115108013153076, -0.0012557357549667358, -0.001199960708618164, -0.0011441856622695923, -0.0010884106159210205, -0.0010326355695724487, -0.000976860523223877, -0.0009210854768753052, -0.0008653104305267334, -0.0008095353841781616, -0.0007537603378295898, -0.0006979852914810181, -0.0006422102451324463, -0.0005864351987838745, -0.0005306601524353027, -0.00047488510608673096, -0.0004191100597381592, -0.0003633350133895874, -0.0003075599670410156, -0.00025178492069244385, -0.00019600987434387207, -0.0001402348279953003, -8.445978164672852e-05, -2.8684735298156738e-05, 2.709031105041504e-05, 8.286535739898682e-05, 0.0001386404037475586, 0.00019441545009613037, 0.00025019049644470215, 0.0003059655427932739, 0.0003617405891418457, 0.0004175156354904175, 0.00047329068183898926, 0.000529065728187561, 0.0005848407745361328, 0.0006406158208847046, 0.0006963908672332764, 0.0007521659135818481, 0.0008079409599304199, 0.0008637160062789917, 0.0009194910526275635, 0.0009752660989761353, 0.001031041145324707, 0.0010868161916732788, 0.0011425912380218506, 0.0011983662843704224, 0.0012541413307189941, 0.001309916377067566, 0.0013656914234161377, 0.0014214664697647095, 0.0014772415161132812]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 4.0, 5.0, 6.0, 4.0, 4.0, 7.0, 9.0, 7.0, 6.0, 13.0, 19.0, 26.0, 43.0, 58.0, 94.0, 164.0, 331.0, 817.0, 2449.0, 28474.0, 1004118.0, 9060.0, 1608.0, 549.0, 276.0, 134.0, 77.0, 55.0, 33.0, 21.0, 24.0, 16.0, 8.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-447.0, -432.73046875, -418.4609375, -404.19140625, -389.921875, -375.65234375, -361.3828125, -347.11328125, -332.84375, -318.57421875, -304.3046875, -290.03515625, -275.765625, -261.49609375, -247.2265625, -232.95703125, -218.6875, -204.41796875, -190.1484375, -175.87890625, -161.609375, -147.33984375, -133.0703125, -118.80078125, -104.53125, -90.26171875, -75.9921875, -61.72265625, -47.453125, -33.18359375, -18.9140625, -4.64453125, 9.625, 23.89453125, 38.1640625, 52.43359375, 66.703125, 80.97265625, 95.2421875, 109.51171875, 123.78125, 138.05078125, 152.3203125, 166.58984375, 180.859375, 195.12890625, 209.3984375, 223.66796875, 237.9375, 252.20703125, 266.4765625, 280.74609375, 295.015625, 309.28515625, 323.5546875, 337.82421875, 352.09375, 366.36328125, 380.6328125, 394.90234375, 409.171875, 423.44140625, 437.7109375, 451.98046875, 466.25]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 19.0, 54.0, 208.0, 550.0, 103.0, 26.0, 18.0, 11.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.4375, -83.0849609375, -80.732421875, -78.3798828125, -76.02734375, -73.6748046875, -71.322265625, -68.9697265625, -66.6171875, -64.2646484375, -61.912109375, -59.5595703125, -57.20703125, -54.8544921875, -52.501953125, -50.1494140625, -47.796875, -45.4443359375, -43.091796875, -40.7392578125, -38.38671875, -36.0341796875, -33.681640625, -31.3291015625, -28.9765625, -26.6240234375, -24.271484375, -21.9189453125, -19.56640625, -17.2138671875, -14.861328125, -12.5087890625, -10.15625, -7.8037109375, -5.451171875, -3.0986328125, -0.74609375, 1.6064453125, 3.958984375, 6.3115234375, 8.6640625, 11.0166015625, 13.369140625, 15.7216796875, 18.07421875, 20.4267578125, 22.779296875, 25.1318359375, 27.484375, 29.8369140625, 32.189453125, 34.5419921875, 36.89453125, 39.2470703125, 41.599609375, 43.9521484375, 46.3046875, 48.6572265625, 51.009765625, 53.3623046875, 55.71484375, 58.0673828125, 60.419921875, 62.7724609375, 65.125]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 15.0, 13.0, 23.0, 35.0, 152.0, 422.0, 139.0, 60.0, 44.0, 34.0, 15.0, 11.0, 3.0, 4.0, 1.0, 2.0], "bins": [-265.3590393066406, -260.35589599609375, -255.3527374267578, -250.34957885742188, -245.34642028808594, -240.34326171875, -235.34011840820312, -230.3369598388672, -225.33380126953125, -220.3306427001953, -215.32749938964844, -210.3243408203125, -205.32118225097656, -200.31802368164062, -195.31488037109375, -190.3117218017578, -185.30856323242188, -180.30540466308594, -175.30226135253906, -170.29910278320312, -165.2959442138672, -160.29278564453125, -155.28964233398438, -150.28648376464844, -145.28334045410156, -140.28018188476562, -135.27703857421875, -130.2738800048828, -125.27072143554688, -120.26757049560547, -115.26441955566406, -110.26126098632812, -105.25810241699219, -100.25495147705078, -95.25179290771484, -90.24864196777344, -85.2454833984375, -80.2423324584961, -75.23918151855469, -70.23602294921875, -65.23286437988281, -60.22970962524414, -55.22655487060547, -50.22340393066406, -45.220245361328125, -40.21709442138672, -35.21393966674805, -30.210784912109375, -25.20763397216797, -20.204479217529297, -15.201325416564941, -10.198171615600586, -5.195016860961914, -0.1918621063232422, 4.811290740966797, 9.814445495605469, 14.81760025024414, 19.820755004882812, 24.823909759521484, 29.827062606811523, 34.83021545410156, 39.8333740234375, 44.836524963378906, 49.83967971801758, 54.84283447265625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 2.0, 4.0, 5.0, 3.0, 8.0, 11.0, 6.0, 8.0, 14.0, 11.0, 15.0, 20.0, 14.0, 22.0, 19.0, 22.0, 29.0, 27.0, 24.0, 39.0, 43.0, 43.0, 40.0, 50.0, 46.0, 39.0, 39.0, 41.0, 36.0, 30.0, 33.0, 39.0, 30.0, 31.0, 18.0, 17.0, 20.0, 19.0, 19.0, 8.0, 10.0, 12.0, 4.0, 5.0, 10.0, 6.0, 5.0, 2.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-55.125999450683594, -53.378211975097656, -51.63042449951172, -49.88263702392578, -48.134849548339844, -46.387062072753906, -44.63927459716797, -42.89148712158203, -41.143699645996094, -39.395912170410156, -37.64812469482422, -35.90033721923828, -34.152549743652344, -32.404762268066406, -30.656972885131836, -28.9091854095459, -27.161396026611328, -25.41360855102539, -23.665821075439453, -21.918033599853516, -20.170246124267578, -18.42245864868164, -16.67466926574707, -14.926881790161133, -13.179094314575195, -11.431306838989258, -9.68351936340332, -7.935730934143066, -6.187943458557129, -4.440155982971191, -2.6923675537109375, -0.944580078125, 0.8032035827636719, 2.5509912967681885, 4.298779010772705, 6.046566963195801, 7.794354438781738, 9.542141914367676, 11.28993034362793, 13.037717819213867, 14.785505294799805, 16.533292770385742, 18.28108024597168, 20.02886962890625, 21.776657104492188, 23.524444580078125, 25.272232055664062, 27.02001953125, 28.767807006835938, 30.515594482421875, 32.26338195800781, 34.01116943359375, 35.75895690917969, 37.506744384765625, 39.25453186035156, 41.0023193359375, 42.75010681152344, 44.497894287109375, 46.24568176269531, 47.99346923828125, 49.74125671386719, 51.489044189453125, 53.23683166503906, 54.984619140625, 56.7324104309082]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 11.0, 13.0, 28.0, 23.0, 36.0, 58.0, 79.0, 108.0, 165.0, 201.0, 286.0, 364.0, 557.0, 840.0, 1057.0, 1533.0, 2329.0, 3323.0, 5006.0, 7520.0, 12141.0, 20156.0, 36265.0, 80159.0, 319645.0, 373543.0, 86841.0, 38214.0, 20895.0, 12649.0, 7948.0, 5105.0, 3496.0, 2376.0, 1583.0, 1148.0, 781.0, 606.0, 413.0, 293.0, 215.0, 159.0, 115.0, 79.0, 51.0, 44.0, 30.0, 28.0, 12.0, 10.0, 3.0, 8.0, 2.0, 1.0, 0.0, 2.0], "bins": [-69.4375, -67.3359375, -65.234375, -63.1328125, -61.03125, -58.9296875, -56.828125, -54.7265625, -52.625, -50.5234375, -48.421875, -46.3203125, -44.21875, -42.1171875, -40.015625, -37.9140625, -35.8125, -33.7109375, -31.609375, -29.5078125, -27.40625, -25.3046875, -23.203125, -21.1015625, -19.0, -16.8984375, -14.796875, -12.6953125, -10.59375, -8.4921875, -6.390625, -4.2890625, -2.1875, -0.0859375, 2.015625, 4.1171875, 6.21875, 8.3203125, 10.421875, 12.5234375, 14.625, 16.7265625, 18.828125, 20.9296875, 23.03125, 25.1328125, 27.234375, 29.3359375, 31.4375, 33.5390625, 35.640625, 37.7421875, 39.84375, 41.9453125, 44.046875, 46.1484375, 48.25, 50.3515625, 52.453125, 54.5546875, 56.65625, 58.7578125, 60.859375, 62.9609375, 65.0625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 6.0, 4.0, 4.0, 11.0, 8.0, 10.0, 21.0, 16.0, 17.0, 9.0, 20.0, 29.0, 27.0, 28.0, 26.0, 31.0, 36.0, 46.0, 54.0, 47.0, 41.0, 49.0, 46.0, 41.0, 41.0, 37.0, 35.0, 31.0, 34.0, 28.0, 28.0, 16.0, 21.0, 13.0, 17.0, 12.0, 12.0, 6.0, 5.0, 5.0, 5.0, 6.0, 8.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-49.65625, -48.1015625, -46.546875, -44.9921875, -43.4375, -41.8828125, -40.328125, -38.7734375, -37.21875, -35.6640625, -34.109375, -32.5546875, -31.0, -29.4453125, -27.890625, -26.3359375, -24.78125, -23.2265625, -21.671875, -20.1171875, -18.5625, -17.0078125, -15.453125, -13.8984375, -12.34375, -10.7890625, -9.234375, -7.6796875, -6.125, -4.5703125, -3.015625, -1.4609375, 0.09375, 1.6484375, 3.203125, 4.7578125, 6.3125, 7.8671875, 9.421875, 10.9765625, 12.53125, 14.0859375, 15.640625, 17.1953125, 18.75, 20.3046875, 21.859375, 23.4140625, 24.96875, 26.5234375, 28.078125, 29.6328125, 31.1875, 32.7421875, 34.296875, 35.8515625, 37.40625, 38.9609375, 40.515625, 42.0703125, 43.625, 45.1796875, 46.734375, 48.2890625, 49.84375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 3.0, 5.0, 9.0, 14.0, 35.0, 28.0, 31.0, 44.0, 67.0, 74.0, 103.0, 144.0, 169.0, 233.0, 349.0, 391.0, 548.0, 734.0, 1101.0, 1527.0, 2257.0, 3790.0, 6729.0, 14596.0, 50394.0, 775509.0, 140797.0, 25136.0, 9535.0, 4821.0, 2856.0, 1767.0, 1229.0, 849.0, 649.0, 502.0, 322.0, 257.0, 237.0, 153.0, 142.0, 91.0, 84.0, 54.0, 48.0, 34.0, 24.0, 13.0, 21.0, 14.0, 14.0, 6.0, 3.0, 4.0, 5.0, 0.0, 1.0, 3.0], "bins": [-470.0, -455.1953125, -440.390625, -425.5859375, -410.78125, -395.9765625, -381.171875, -366.3671875, -351.5625, -336.7578125, -321.953125, -307.1484375, -292.34375, -277.5390625, -262.734375, -247.9296875, -233.125, -218.3203125, -203.515625, -188.7109375, -173.90625, -159.1015625, -144.296875, -129.4921875, -114.6875, -99.8828125, -85.078125, -70.2734375, -55.46875, -40.6640625, -25.859375, -11.0546875, 3.75, 18.5546875, 33.359375, 48.1640625, 62.96875, 77.7734375, 92.578125, 107.3828125, 122.1875, 136.9921875, 151.796875, 166.6015625, 181.40625, 196.2109375, 211.015625, 225.8203125, 240.625, 255.4296875, 270.234375, 285.0390625, 299.84375, 314.6484375, 329.453125, 344.2578125, 359.0625, 373.8671875, 388.671875, 403.4765625, 418.28125, 433.0859375, 447.890625, 462.6953125, 477.5]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 7.0, 4.0, 1.0, 5.0, 6.0, 13.0, 15.0, 13.0, 12.0, 8.0, 12.0, 16.0, 12.0, 19.0, 23.0, 11.0, 19.0, 25.0, 37.0, 37.0, 62.0, 114.0, 115.0, 69.0, 53.0, 37.0, 18.0, 30.0, 25.0, 24.0, 19.0, 23.0, 18.0, 15.0, 19.0, 9.0, 11.0, 9.0, 8.0, 5.0, 7.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-97.1875, -94.171875, -91.15625, -88.140625, -85.125, -82.109375, -79.09375, -76.078125, -73.0625, -70.046875, -67.03125, -64.015625, -61.0, -57.984375, -54.96875, -51.953125, -48.9375, -45.921875, -42.90625, -39.890625, -36.875, -33.859375, -30.84375, -27.828125, -24.8125, -21.796875, -18.78125, -15.765625, -12.75, -9.734375, -6.71875, -3.703125, -0.6875, 2.328125, 5.34375, 8.359375, 11.375, 14.390625, 17.40625, 20.421875, 23.4375, 26.453125, 29.46875, 32.484375, 35.5, 38.515625, 41.53125, 44.546875, 47.5625, 50.578125, 53.59375, 56.609375, 59.625, 62.640625, 65.65625, 68.671875, 71.6875, 74.703125, 77.71875, 80.734375, 83.75, 86.765625, 89.78125, 92.796875, 95.8125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 11.0, 7.0, 11.0, 10.0, 11.0, 22.0, 18.0, 31.0, 47.0, 48.0, 81.0, 94.0, 134.0, 174.0, 280.0, 387.0, 570.0, 944.0, 1631.0, 3429.0, 11686.0, 956621.0, 59789.0, 6277.0, 2476.0, 1300.0, 745.0, 484.0, 335.0, 226.0, 163.0, 124.0, 83.0, 62.0, 56.0, 31.0, 32.0, 30.0, 14.0, 22.0, 16.0, 8.0, 5.0, 6.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2070.0, -2008.75, -1947.5, -1886.25, -1825.0, -1763.75, -1702.5, -1641.25, -1580.0, -1518.75, -1457.5, -1396.25, -1335.0, -1273.75, -1212.5, -1151.25, -1090.0, -1028.75, -967.5, -906.25, -845.0, -783.75, -722.5, -661.25, -600.0, -538.75, -477.5, -416.25, -355.0, -293.75, -232.5, -171.25, -110.0, -48.75, 12.5, 73.75, 135.0, 196.25, 257.5, 318.75, 380.0, 441.25, 502.5, 563.75, 625.0, 686.25, 747.5, 808.75, 870.0, 931.25, 992.5, 1053.75, 1115.0, 1176.25, 1237.5, 1298.75, 1360.0, 1421.25, 1482.5, 1543.75, 1605.0, 1666.25, 1727.5, 1788.75, 1850.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 7.0, 8.0, 13.0, 44.0, 140.0, 378.0, 276.0, 82.0, 23.0, 9.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03228759765625, -0.030731201171875, -0.0291748046875, -0.027618408203125, -0.02606201171875, -0.024505615234375, -0.02294921875, -0.021392822265625, -0.01983642578125, -0.018280029296875, -0.0167236328125, -0.015167236328125, -0.01361083984375, -0.012054443359375, -0.010498046875, -0.008941650390625, -0.00738525390625, -0.005828857421875, -0.0042724609375, -0.002716064453125, -0.00115966796875, 0.000396728515625, 0.001953125, 0.003509521484375, 0.00506591796875, 0.006622314453125, 0.0081787109375, 0.009735107421875, 0.01129150390625, 0.012847900390625, 0.014404296875, 0.015960693359375, 0.01751708984375, 0.019073486328125, 0.0206298828125, 0.022186279296875, 0.02374267578125, 0.025299072265625, 0.02685546875, 0.028411865234375, 0.02996826171875, 0.031524658203125, 0.0330810546875, 0.034637451171875, 0.03619384765625, 0.037750244140625, 0.039306640625, 0.040863037109375, 0.04241943359375, 0.043975830078125, 0.0455322265625, 0.047088623046875, 0.04864501953125, 0.050201416015625, 0.0517578125, 0.053314208984375, 0.05487060546875, 0.056427001953125, 0.0579833984375, 0.059539794921875, 0.06109619140625, 0.062652587890625, 0.064208984375, 0.065765380859375, 0.06732177734375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 11.0, 6.0, 19.0, 9.0, 28.0, 26.0, 52.0, 48.0, 65.0, 102.0, 116.0, 174.0, 221.0, 352.0, 482.0, 857.0, 1719.0, 4787.0, 35775.0, 985387.0, 12057.0, 2817.0, 1262.0, 722.0, 415.0, 279.0, 186.0, 155.0, 91.0, 77.0, 63.0, 36.0, 24.0, 33.0, 14.0, 19.0, 16.0, 9.0, 9.0, 6.0, 6.0, 3.0, 1.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2246.0, -2174.21875, -2102.4375, -2030.65625, -1958.875, -1887.09375, -1815.3125, -1743.53125, -1671.75, -1599.96875, -1528.1875, -1456.40625, -1384.625, -1312.84375, -1241.0625, -1169.28125, -1097.5, -1025.71875, -953.9375, -882.15625, -810.375, -738.59375, -666.8125, -595.03125, -523.25, -451.46875, -379.6875, -307.90625, -236.125, -164.34375, -92.5625, -20.78125, 51.0, 122.78125, 194.5625, 266.34375, 338.125, 409.90625, 481.6875, 553.46875, 625.25, 697.03125, 768.8125, 840.59375, 912.375, 984.15625, 1055.9375, 1127.71875, 1199.5, 1271.28125, 1343.0625, 1414.84375, 1486.625, 1558.40625, 1630.1875, 1701.96875, 1773.75, 1845.53125, 1917.3125, 1989.09375, 2060.875, 2132.65625, 2204.4375, 2276.21875, 2348.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 8.0, 10.0, 10.0, 11.0, 49.0, 166.0, 321.0, 233.0, 85.0, 37.0, 7.0, 6.0, 9.0, 5.0, 3.0, 3.0, 6.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-299.75, -289.6328125, -279.515625, -269.3984375, -259.28125, -249.1640625, -239.046875, -228.9296875, -218.8125, -208.6953125, -198.578125, -188.4609375, -178.34375, -168.2265625, -158.109375, -147.9921875, -137.875, -127.7578125, -117.640625, -107.5234375, -97.40625, -87.2890625, -77.171875, -67.0546875, -56.9375, -46.8203125, -36.703125, -26.5859375, -16.46875, -6.3515625, 3.765625, 13.8828125, 24.0, 34.1171875, 44.234375, 54.3515625, 64.46875, 74.5859375, 84.703125, 94.8203125, 104.9375, 115.0546875, 125.171875, 135.2890625, 145.40625, 155.5234375, 165.640625, 175.7578125, 185.875, 195.9921875, 206.109375, 216.2265625, 226.34375, 236.4609375, 246.578125, 256.6953125, 266.8125, 276.9296875, 287.046875, 297.1640625, 307.28125, 317.3984375, 327.515625, 337.6328125, 347.75]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 6.0, 5.0, 9.0, 8.0, 8.0, 3.0, 7.0, 10.0, 13.0, 14.0, 20.0, 27.0, 31.0, 38.0, 45.0, 49.0, 100.0, 138.0, 417.0, 31.0, 3.0], "bins": [-487.7496643066406, -479.8569641113281, -471.96429443359375, -464.07159423828125, -456.17889404296875, -448.2862243652344, -440.3935241699219, -432.5008544921875, -424.608154296875, -416.7154541015625, -408.8227844238281, -400.9300842285156, -393.03741455078125, -385.14471435546875, -377.25201416015625, -369.3593444824219, -361.4666442871094, -353.5739440917969, -345.6812744140625, -337.78857421875, -329.8958740234375, -322.0032043457031, -314.1105041503906, -306.21783447265625, -298.32513427734375, -290.43243408203125, -282.5397644042969, -274.6470642089844, -266.75439453125, -258.8616943359375, -250.968994140625, -243.07630920410156, -235.18360900878906, -227.29092407226562, -219.39822387695312, -211.5055389404297, -203.61285400390625, -195.7201690673828, -187.82748413085938, -179.93478393554688, -172.04209899902344, -164.1494140625, -156.2567138671875, -148.36402893066406, -140.47134399414062, -132.5786590576172, -124.68596649169922, -116.79327392578125, -108.90058898925781, -101.00790405273438, -93.1152114868164, -85.22251892089844, -77.329833984375, -69.43714904785156, -61.544456481933594, -53.65176773071289, -45.75907897949219, -37.866390228271484, -29.97370147705078, -22.081012725830078, -14.188323974609375, -6.295635223388672, 1.5970535278320312, 9.489742279052734, 17.382431030273438]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 6.0, 4.0, 4.0, 9.0, 8.0, 11.0, 12.0, 14.0, 16.0, 14.0, 15.0, 26.0, 22.0, 29.0, 30.0, 41.0, 33.0, 53.0, 57.0, 46.0, 52.0, 51.0, 47.0, 51.0, 52.0, 34.0, 40.0, 35.0, 28.0, 21.0, 19.0, 19.0, 21.0, 13.0, 14.0, 12.0, 11.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-113.3019027709961, -109.62720489501953, -105.95250701904297, -102.2778091430664, -98.60311126708984, -94.92840576171875, -91.25370788574219, -87.57901000976562, -83.90431213378906, -80.2296142578125, -76.55491638183594, -72.88021850585938, -69.20552062988281, -65.53082275390625, -61.85612106323242, -58.181419372558594, -54.5067253112793, -50.832027435302734, -47.15732955932617, -43.482627868652344, -39.80792999267578, -36.13323211669922, -32.458534240722656, -28.78383445739746, -25.1091365814209, -21.434438705444336, -17.75973892211914, -14.085041046142578, -10.4103422164917, -6.73564338684082, -3.060945510864258, 0.6137542724609375, 4.2884521484375, 7.963150978088379, 11.637849807739258, 15.31254768371582, 18.987247467041016, 22.661945343017578, 26.33664321899414, 30.011343002319336, 33.68604278564453, 37.360740661621094, 41.035438537597656, 44.71013641357422, 48.38483810424805, 52.05953598022461, 55.73423385620117, 59.408935546875, 63.0836296081543, 66.75833129882812, 70.43302917480469, 74.10772705078125, 77.78242492675781, 81.45712280273438, 85.13182067871094, 88.8065185546875, 92.48121643066406, 96.15591430664062, 99.83061218261719, 103.50531005859375, 107.18000793457031, 110.85470581054688, 114.52940368652344, 118.20410919189453, 121.8788070678711]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 10.0, 11.0, 11.0, 18.0, 31.0, 39.0, 49.0, 78.0, 132.0, 163.0, 216.0, 321.0, 461.0, 656.0, 966.0, 1310.0, 2040.0, 3047.0, 4903.0, 8224.0, 14585.0, 26989.0, 55106.0, 127880.0, 1066675.0, 2565366.0, 172143.0, 67401.0, 32774.0, 16997.0, 9475.0, 5613.0, 3384.0, 2170.0, 1411.0, 986.0, 670.0, 472.0, 347.0, 266.0, 200.0, 138.0, 123.0, 98.0, 69.0, 64.0, 57.0, 34.0, 28.0, 23.0, 20.0, 8.0, 9.0, 10.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0], "bins": [-70.75, -68.322265625, -65.89453125, -63.466796875, -61.0390625, -58.611328125, -56.18359375, -53.755859375, -51.328125, -48.900390625, -46.47265625, -44.044921875, -41.6171875, -39.189453125, -36.76171875, -34.333984375, -31.90625, -29.478515625, -27.05078125, -24.623046875, -22.1953125, -19.767578125, -17.33984375, -14.912109375, -12.484375, -10.056640625, -7.62890625, -5.201171875, -2.7734375, -0.345703125, 2.08203125, 4.509765625, 6.9375, 9.365234375, 11.79296875, 14.220703125, 16.6484375, 19.076171875, 21.50390625, 23.931640625, 26.359375, 28.787109375, 31.21484375, 33.642578125, 36.0703125, 38.498046875, 40.92578125, 43.353515625, 45.78125, 48.208984375, 50.63671875, 53.064453125, 55.4921875, 57.919921875, 60.34765625, 62.775390625, 65.203125, 67.630859375, 70.05859375, 72.486328125, 74.9140625, 77.341796875, 79.76953125, 82.197265625, 84.625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 7.0, 6.0, 8.0, 7.0, 12.0, 13.0, 11.0, 19.0, 25.0, 34.0, 25.0, 37.0, 42.0, 41.0, 42.0, 49.0, 57.0, 51.0, 45.0, 60.0, 44.0, 44.0, 41.0, 35.0, 40.0, 23.0, 27.0, 14.0, 19.0, 21.0, 23.0, 13.0, 5.0, 8.0, 7.0, 7.0, 3.0, 6.0, 1.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-15.3828125, -14.8883056640625, -14.393798828125, -13.8992919921875, -13.40478515625, -12.9102783203125, -12.415771484375, -11.9212646484375, -11.4267578125, -10.9322509765625, -10.437744140625, -9.9432373046875, -9.44873046875, -8.9542236328125, -8.459716796875, -7.9652099609375, -7.470703125, -6.9761962890625, -6.481689453125, -5.9871826171875, -5.49267578125, -4.9981689453125, -4.503662109375, -4.0091552734375, -3.5146484375, -3.0201416015625, -2.525634765625, -2.0311279296875, -1.53662109375, -1.0421142578125, -0.547607421875, -0.0531005859375, 0.44140625, 0.9359130859375, 1.430419921875, 1.9249267578125, 2.41943359375, 2.9139404296875, 3.408447265625, 3.9029541015625, 4.3974609375, 4.8919677734375, 5.386474609375, 5.8809814453125, 6.37548828125, 6.8699951171875, 7.364501953125, 7.8590087890625, 8.353515625, 8.8480224609375, 9.342529296875, 9.8370361328125, 10.33154296875, 10.8260498046875, 11.320556640625, 11.8150634765625, 12.3095703125, 12.8040771484375, 13.298583984375, 13.7930908203125, 14.28759765625, 14.7821044921875, 15.276611328125, 15.7711181640625, 16.265625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 8.0, 13.0, 29.0, 16.0, 47.0, 42.0, 68.0, 117.0, 141.0, 216.0, 292.0, 440.0, 607.0, 1075.0, 1630.0, 2727.0, 4952.0, 10132.0, 24595.0, 78437.0, 520568.0, 3247898.0, 217339.0, 47956.0, 17087.0, 7632.0, 4085.0, 2117.0, 1373.0, 811.0, 549.0, 394.0, 228.0, 185.0, 132.0, 96.0, 68.0, 58.0, 40.0, 26.0, 17.0, 10.0, 5.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-55.125, -53.4189453125, -51.712890625, -50.0068359375, -48.30078125, -46.5947265625, -44.888671875, -43.1826171875, -41.4765625, -39.7705078125, -38.064453125, -36.3583984375, -34.65234375, -32.9462890625, -31.240234375, -29.5341796875, -27.828125, -26.1220703125, -24.416015625, -22.7099609375, -21.00390625, -19.2978515625, -17.591796875, -15.8857421875, -14.1796875, -12.4736328125, -10.767578125, -9.0615234375, -7.35546875, -5.6494140625, -3.943359375, -2.2373046875, -0.53125, 1.1748046875, 2.880859375, 4.5869140625, 6.29296875, 7.9990234375, 9.705078125, 11.4111328125, 13.1171875, 14.8232421875, 16.529296875, 18.2353515625, 19.94140625, 21.6474609375, 23.353515625, 25.0595703125, 26.765625, 28.4716796875, 30.177734375, 31.8837890625, 33.58984375, 35.2958984375, 37.001953125, 38.7080078125, 40.4140625, 42.1201171875, 43.826171875, 45.5322265625, 47.23828125, 48.9443359375, 50.650390625, 52.3564453125, 54.0625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 10.0, 4.0, 9.0, 10.0, 18.0, 7.0, 14.0, 19.0, 14.0, 17.0, 24.0, 36.0, 45.0, 58.0, 62.0, 85.0, 112.0, 184.0, 260.0, 467.0, 714.0, 541.0, 354.0, 232.0, 163.0, 123.0, 113.0, 84.0, 66.0, 41.0, 34.0, 25.0, 33.0, 30.0, 18.0, 16.0, 7.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5703125, -10.29046630859375, -10.0106201171875, -9.73077392578125, -9.450927734375, -9.17108154296875, -8.8912353515625, -8.61138916015625, -8.33154296875, -8.05169677734375, -7.7718505859375, -7.49200439453125, -7.212158203125, -6.93231201171875, -6.6524658203125, -6.37261962890625, -6.0927734375, -5.81292724609375, -5.5330810546875, -5.25323486328125, -4.973388671875, -4.69354248046875, -4.4136962890625, -4.13385009765625, -3.85400390625, -3.57415771484375, -3.2943115234375, -3.01446533203125, -2.734619140625, -2.45477294921875, -2.1749267578125, -1.89508056640625, -1.615234375, -1.33538818359375, -1.0555419921875, -0.77569580078125, -0.495849609375, -0.21600341796875, 0.0638427734375, 0.34368896484375, 0.62353515625, 0.90338134765625, 1.1832275390625, 1.46307373046875, 1.742919921875, 2.02276611328125, 2.3026123046875, 2.58245849609375, 2.8623046875, 3.14215087890625, 3.4219970703125, 3.70184326171875, 3.981689453125, 4.26153564453125, 4.5413818359375, 4.82122802734375, 5.10107421875, 5.38092041015625, 5.6607666015625, 5.94061279296875, 6.220458984375, 6.50030517578125, 6.7801513671875, 7.05999755859375, 7.33984375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 11.0, 10.0, 16.0, 12.0, 31.0, 71.0, 130.0, 338.0, 274.0, 44.0, 24.0, 14.0, 2.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.86091995239258, -32.923831939697266, -30.98674201965332, -29.049652099609375, -27.112564086914062, -25.175474166870117, -23.238384246826172, -21.30129623413086, -19.364206314086914, -17.42711639404297, -15.490028381347656, -13.552938461303711, -11.615849494934082, -9.678760528564453, -7.741670608520508, -5.804581642150879, -3.86749267578125, -1.930403470993042, 0.006685733795166016, 1.9437751770019531, 3.880864143371582, 5.817953109741211, 7.755043029785156, 9.692131996154785, 11.629220962524414, 13.566309928894043, 15.503398895263672, 17.440488815307617, 19.377578735351562, 21.314666748046875, 23.25175666809082, 25.188846588134766, 27.125930786132812, 29.063020706176758, 31.00010871887207, 32.937198638916016, 34.87428665161133, 36.811378479003906, 38.74846649169922, 40.68555450439453, 42.622642517089844, 44.559730529785156, 46.496822357177734, 48.43391036987305, 50.37099838256836, 52.30809020996094, 54.24517822265625, 56.18226623535156, 58.11935806274414, 60.05644607543945, 61.99353790283203, 63.930625915527344, 65.86771392822266, 67.80480194091797, 69.74189758300781, 71.67898559570312, 73.61607360839844, 75.55316162109375, 77.49024963378906, 79.42733764648438, 81.36443328857422, 83.30152130126953, 85.23860931396484, 87.17569732666016, 89.11278533935547]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 4.0, 4.0, 9.0, 5.0, 5.0, 7.0, 11.0, 16.0, 12.0, 25.0, 29.0, 31.0, 36.0, 55.0, 44.0, 47.0, 39.0, 59.0, 54.0, 50.0, 59.0, 56.0, 39.0, 44.0, 46.0, 31.0, 36.0, 25.0, 19.0, 17.0, 22.0, 9.0, 12.0, 5.0, 6.0, 9.0, 9.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0], "bins": [-26.071685791015625, -25.326156616210938, -24.580629348754883, -23.835102081298828, -23.08957290649414, -22.344043731689453, -21.5985164642334, -20.852989196777344, -20.107460021972656, -19.36193084716797, -18.616403579711914, -17.87087631225586, -17.125347137451172, -16.379817962646484, -15.63429069519043, -14.888762474060059, -14.143234252929688, -13.397706031799316, -12.652177810668945, -11.906649589538574, -11.161121368408203, -10.415593147277832, -9.670064926147461, -8.92453670501709, -8.179008483886719, -7.433480262756348, -6.687952041625977, -5.9424238204956055, -5.196895599365234, -4.451367378234863, -3.705839157104492, -2.960310935974121, -2.214784622192383, -1.4692564010620117, -0.7237281799316406, 0.02180004119873047, 0.7673282623291016, 1.5128564834594727, 2.2583847045898438, 3.003912925720215, 3.749441146850586, 4.494969367980957, 5.240497589111328, 5.986025810241699, 6.73155403137207, 7.477082252502441, 8.222610473632812, 8.968138694763184, 9.713666915893555, 10.459195137023926, 11.204723358154297, 11.950251579284668, 12.695779800415039, 13.44130802154541, 14.186836242675781, 14.932364463806152, 15.677892684936523, 16.423419952392578, 17.168949127197266, 17.914478302001953, 18.660005569458008, 19.405532836914062, 20.15106201171875, 20.896591186523438, 21.642118453979492]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 7.0, 6.0, 10.0, 12.0, 16.0, 24.0, 37.0, 37.0, 52.0, 79.0, 102.0, 131.0, 188.0, 288.0, 412.0, 673.0, 1062.0, 1868.0, 3581.0, 7576.0, 19508.0, 67208.0, 356637.0, 462640.0, 85232.0, 23299.0, 8473.0, 3977.0, 2003.0, 1146.0, 709.0, 450.0, 298.0, 201.0, 157.0, 120.0, 83.0, 53.0, 51.0, 41.0, 24.0, 20.0, 18.0, 13.0, 9.0, 5.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-37.4375, -36.23291015625, -35.0283203125, -33.82373046875, -32.619140625, -31.41455078125, -30.2099609375, -29.00537109375, -27.80078125, -26.59619140625, -25.3916015625, -24.18701171875, -22.982421875, -21.77783203125, -20.5732421875, -19.36865234375, -18.1640625, -16.95947265625, -15.7548828125, -14.55029296875, -13.345703125, -12.14111328125, -10.9365234375, -9.73193359375, -8.52734375, -7.32275390625, -6.1181640625, -4.91357421875, -3.708984375, -2.50439453125, -1.2998046875, -0.09521484375, 1.109375, 2.31396484375, 3.5185546875, 4.72314453125, 5.927734375, 7.13232421875, 8.3369140625, 9.54150390625, 10.74609375, 11.95068359375, 13.1552734375, 14.35986328125, 15.564453125, 16.76904296875, 17.9736328125, 19.17822265625, 20.3828125, 21.58740234375, 22.7919921875, 23.99658203125, 25.201171875, 26.40576171875, 27.6103515625, 28.81494140625, 30.01953125, 31.22412109375, 32.4287109375, 33.63330078125, 34.837890625, 36.04248046875, 37.2470703125, 38.45166015625, 39.65625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 0.0, 7.0, 7.0, 11.0, 14.0, 9.0, 15.0, 22.0, 31.0, 27.0, 50.0, 39.0, 36.0, 46.0, 52.0, 43.0, 43.0, 48.0, 50.0, 47.0, 55.0, 51.0, 33.0, 38.0, 21.0, 28.0, 24.0, 17.0, 29.0, 18.0, 13.0, 12.0, 9.0, 5.0, 5.0, 5.0, 7.0, 5.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.78125, -17.200439453125, -16.61962890625, -16.038818359375, -15.4580078125, -14.877197265625, -14.29638671875, -13.715576171875, -13.134765625, -12.553955078125, -11.97314453125, -11.392333984375, -10.8115234375, -10.230712890625, -9.64990234375, -9.069091796875, -8.48828125, -7.907470703125, -7.32666015625, -6.745849609375, -6.1650390625, -5.584228515625, -5.00341796875, -4.422607421875, -3.841796875, -3.260986328125, -2.68017578125, -2.099365234375, -1.5185546875, -0.937744140625, -0.35693359375, 0.223876953125, 0.8046875, 1.385498046875, 1.96630859375, 2.547119140625, 3.1279296875, 3.708740234375, 4.28955078125, 4.870361328125, 5.451171875, 6.031982421875, 6.61279296875, 7.193603515625, 7.7744140625, 8.355224609375, 8.93603515625, 9.516845703125, 10.09765625, 10.678466796875, 11.25927734375, 11.840087890625, 12.4208984375, 13.001708984375, 13.58251953125, 14.163330078125, 14.744140625, 15.324951171875, 15.90576171875, 16.486572265625, 17.0673828125, 17.648193359375, 18.22900390625, 18.809814453125, 19.390625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 9.0, 14.0, 20.0, 27.0, 41.0, 76.0, 74.0, 104.0, 177.0, 214.0, 281.0, 411.0, 602.0, 796.0, 1211.0, 1723.0, 2640.0, 4296.0, 7580.0, 15995.0, 42290.0, 210479.0, 620713.0, 86153.0, 25387.0, 11006.0, 5715.0, 3429.0, 2214.0, 1473.0, 954.0, 713.0, 495.0, 379.0, 238.0, 199.0, 129.0, 81.0, 65.0, 44.0, 31.0, 23.0, 22.0, 10.0, 7.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.5625, -46.041015625, -44.51953125, -42.998046875, -41.4765625, -39.955078125, -38.43359375, -36.912109375, -35.390625, -33.869140625, -32.34765625, -30.826171875, -29.3046875, -27.783203125, -26.26171875, -24.740234375, -23.21875, -21.697265625, -20.17578125, -18.654296875, -17.1328125, -15.611328125, -14.08984375, -12.568359375, -11.046875, -9.525390625, -8.00390625, -6.482421875, -4.9609375, -3.439453125, -1.91796875, -0.396484375, 1.125, 2.646484375, 4.16796875, 5.689453125, 7.2109375, 8.732421875, 10.25390625, 11.775390625, 13.296875, 14.818359375, 16.33984375, 17.861328125, 19.3828125, 20.904296875, 22.42578125, 23.947265625, 25.46875, 26.990234375, 28.51171875, 30.033203125, 31.5546875, 33.076171875, 34.59765625, 36.119140625, 37.640625, 39.162109375, 40.68359375, 42.205078125, 43.7265625, 45.248046875, 46.76953125, 48.291015625, 49.8125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 6.0, 7.0, 7.0, 9.0, 9.0, 4.0, 11.0, 17.0, 23.0, 19.0, 23.0, 27.0, 23.0, 40.0, 36.0, 60.0, 79.0, 91.0, 77.0, 59.0, 60.0, 50.0, 42.0, 33.0, 29.0, 34.0, 21.0, 20.0, 14.0, 7.0, 12.0, 11.0, 11.0, 6.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.75, -25.970703125, -25.19140625, -24.412109375, -23.6328125, -22.853515625, -22.07421875, -21.294921875, -20.515625, -19.736328125, -18.95703125, -18.177734375, -17.3984375, -16.619140625, -15.83984375, -15.060546875, -14.28125, -13.501953125, -12.72265625, -11.943359375, -11.1640625, -10.384765625, -9.60546875, -8.826171875, -8.046875, -7.267578125, -6.48828125, -5.708984375, -4.9296875, -4.150390625, -3.37109375, -2.591796875, -1.8125, -1.033203125, -0.25390625, 0.525390625, 1.3046875, 2.083984375, 2.86328125, 3.642578125, 4.421875, 5.201171875, 5.98046875, 6.759765625, 7.5390625, 8.318359375, 9.09765625, 9.876953125, 10.65625, 11.435546875, 12.21484375, 12.994140625, 13.7734375, 14.552734375, 15.33203125, 16.111328125, 16.890625, 17.669921875, 18.44921875, 19.228515625, 20.0078125, 20.787109375, 21.56640625, 22.345703125, 23.125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 7.0, 15.0, 14.0, 14.0, 27.0, 30.0, 46.0, 86.0, 108.0, 152.0, 230.0, 327.0, 540.0, 938.0, 1568.0, 2893.0, 5905.0, 15428.0, 82126.0, 833286.0, 76935.0, 15205.0, 5815.0, 2777.0, 1594.0, 899.0, 534.0, 339.0, 216.0, 144.0, 105.0, 69.0, 58.0, 43.0, 18.0, 13.0, 16.0, 14.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-62.96875, -61.1943359375, -59.419921875, -57.6455078125, -55.87109375, -54.0966796875, -52.322265625, -50.5478515625, -48.7734375, -46.9990234375, -45.224609375, -43.4501953125, -41.67578125, -39.9013671875, -38.126953125, -36.3525390625, -34.578125, -32.8037109375, -31.029296875, -29.2548828125, -27.48046875, -25.7060546875, -23.931640625, -22.1572265625, -20.3828125, -18.6083984375, -16.833984375, -15.0595703125, -13.28515625, -11.5107421875, -9.736328125, -7.9619140625, -6.1875, -4.4130859375, -2.638671875, -0.8642578125, 0.91015625, 2.6845703125, 4.458984375, 6.2333984375, 8.0078125, 9.7822265625, 11.556640625, 13.3310546875, 15.10546875, 16.8798828125, 18.654296875, 20.4287109375, 22.203125, 23.9775390625, 25.751953125, 27.5263671875, 29.30078125, 31.0751953125, 32.849609375, 34.6240234375, 36.3984375, 38.1728515625, 39.947265625, 41.7216796875, 43.49609375, 45.2705078125, 47.044921875, 48.8193359375, 50.59375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 5.0, 4.0, 16.0, 9.0, 25.0, 31.0, 36.0, 62.0, 115.0, 207.0, 213.0, 89.0, 48.0, 42.0, 19.0, 24.0, 9.0, 11.0, 8.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0011777877807617188, -0.0011466816067695618, -0.0011155754327774048, -0.0010844692587852478, -0.0010533630847930908, -0.0010222569108009338, -0.0009911507368087769, -0.0009600445628166199, -0.0009289383888244629, -0.0008978322148323059, -0.0008667260408401489, -0.0008356198668479919, -0.000804513692855835, -0.000773407518863678, -0.000742301344871521, -0.000711195170879364, -0.000680088996887207, -0.00064898282289505, -0.0006178766489028931, -0.0005867704749107361, -0.0005556643009185791, -0.0005245581269264221, -0.0004934519529342651, -0.00046234577894210815, -0.00043123960494995117, -0.0004001334309577942, -0.0003690272569656372, -0.0003379210829734802, -0.00030681490898132324, -0.00027570873498916626, -0.0002446025609970093, -0.0002134963870048523, -0.0001823902130126953, -0.00015128403902053833, -0.00012017786502838135, -8.907169103622437e-05, -5.796551704406738e-05, -2.68593430519104e-05, 4.246830940246582e-06, 3.5353004932403564e-05, 6.645917892456055e-05, 9.756535291671753e-05, 0.0001286715269088745, 0.0001597777009010315, 0.00019088387489318848, 0.00022199004888534546, 0.00025309622287750244, 0.0002842023968696594, 0.0003153085708618164, 0.0003464147448539734, 0.00037752091884613037, 0.00040862709283828735, 0.00043973326683044434, 0.0004708394408226013, 0.0005019456148147583, 0.0005330517888069153, 0.0005641579627990723, 0.0005952641367912292, 0.0006263703107833862, 0.0006574764847755432, 0.0006885826587677002, 0.0007196888327598572, 0.0007507950067520142, 0.0007819011807441711, 0.0008130073547363281]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 4.0, 10.0, 11.0, 7.0, 16.0, 17.0, 19.0, 40.0, 48.0, 57.0, 86.0, 121.0, 168.0, 258.0, 402.0, 528.0, 928.0, 1625.0, 2857.0, 6357.0, 18209.0, 104595.0, 828471.0, 59046.0, 13377.0, 5041.0, 2385.0, 1357.0, 864.0, 513.0, 347.0, 247.0, 151.0, 121.0, 78.0, 46.0, 35.0, 38.0, 15.0, 21.0, 15.0, 6.0, 5.0, 4.0, 1.0, 8.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.84375, -52.12744140625, -50.4111328125, -48.69482421875, -46.978515625, -45.26220703125, -43.5458984375, -41.82958984375, -40.11328125, -38.39697265625, -36.6806640625, -34.96435546875, -33.248046875, -31.53173828125, -29.8154296875, -28.09912109375, -26.3828125, -24.66650390625, -22.9501953125, -21.23388671875, -19.517578125, -17.80126953125, -16.0849609375, -14.36865234375, -12.65234375, -10.93603515625, -9.2197265625, -7.50341796875, -5.787109375, -4.07080078125, -2.3544921875, -0.63818359375, 1.078125, 2.79443359375, 4.5107421875, 6.22705078125, 7.943359375, 9.65966796875, 11.3759765625, 13.09228515625, 14.80859375, 16.52490234375, 18.2412109375, 19.95751953125, 21.673828125, 23.39013671875, 25.1064453125, 26.82275390625, 28.5390625, 30.25537109375, 31.9716796875, 33.68798828125, 35.404296875, 37.12060546875, 38.8369140625, 40.55322265625, 42.26953125, 43.98583984375, 45.7021484375, 47.41845703125, 49.134765625, 50.85107421875, 52.5673828125, 54.28369140625, 56.0]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 5.0, 14.0, 9.0, 17.0, 23.0, 19.0, 22.0, 18.0, 41.0, 47.0, 68.0, 155.0, 211.0, 95.0, 53.0, 34.0, 30.0, 29.0, 20.0, 14.0, 17.0, 15.0, 4.0, 8.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.109375, -23.443359375, -22.77734375, -22.111328125, -21.4453125, -20.779296875, -20.11328125, -19.447265625, -18.78125, -18.115234375, -17.44921875, -16.783203125, -16.1171875, -15.451171875, -14.78515625, -14.119140625, -13.453125, -12.787109375, -12.12109375, -11.455078125, -10.7890625, -10.123046875, -9.45703125, -8.791015625, -8.125, -7.458984375, -6.79296875, -6.126953125, -5.4609375, -4.794921875, -4.12890625, -3.462890625, -2.796875, -2.130859375, -1.46484375, -0.798828125, -0.1328125, 0.533203125, 1.19921875, 1.865234375, 2.53125, 3.197265625, 3.86328125, 4.529296875, 5.1953125, 5.861328125, 6.52734375, 7.193359375, 7.859375, 8.525390625, 9.19140625, 9.857421875, 10.5234375, 11.189453125, 11.85546875, 12.521484375, 13.1875, 13.853515625, 14.51953125, 15.185546875, 15.8515625, 16.517578125, 17.18359375, 17.849609375, 18.515625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 9.0, 8.0, 18.0, 33.0, 72.0, 214.0, 508.0, 77.0, 24.0, 9.0, 8.0, 5.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.509647369384766, -23.459304809570312, -21.40896224975586, -19.358617782592773, -17.30827522277832, -15.257932662963867, -13.207589149475098, -11.157245635986328, -9.106903076171875, -7.056560039520264, -5.006217002868652, -2.955873966217041, -0.9055309295654297, 1.1448116302490234, 3.195155143737793, 5.2454986572265625, 7.295841217041016, 9.346183776855469, 11.396527290344238, 13.446870803833008, 15.497213363647461, 17.547555923461914, 19.597900390625, 21.648242950439453, 23.698585510253906, 25.74892807006836, 27.799270629882812, 29.8496150970459, 31.89995765686035, 33.95030212402344, 36.00064468383789, 38.050987243652344, 40.10133361816406, 42.151676177978516, 44.20201873779297, 46.25236129760742, 48.302703857421875, 50.353050231933594, 52.40339279174805, 54.4537353515625, 56.50407791137695, 58.554420471191406, 60.60476303100586, 62.65510559082031, 64.70545196533203, 66.75579071044922, 68.80613708496094, 70.85647583007812, 72.90682220458984, 74.95716857910156, 77.00750732421875, 79.05785369873047, 81.10819244384766, 83.15853881835938, 85.20887756347656, 87.25922393798828, 89.3095703125, 91.35991668701172, 93.4102554321289, 95.46060180664062, 97.51094055175781, 99.56128692626953, 101.61162567138672, 103.66197204589844, 105.71231079101562]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 10.0, 5.0, 6.0, 12.0, 10.0, 26.0, 21.0, 20.0, 36.0, 39.0, 58.0, 58.0, 56.0, 68.0, 72.0, 69.0, 58.0, 68.0, 62.0, 41.0, 40.0, 41.0, 25.0, 17.0, 21.0, 13.0, 8.0, 10.0, 6.0, 6.0, 2.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-29.521896362304688, -28.74603843688965, -27.97018051147461, -27.19432258605957, -26.41846466064453, -25.642606735229492, -24.866748809814453, -24.090892791748047, -23.315032958984375, -22.539175033569336, -21.763317108154297, -20.987459182739258, -20.21160125732422, -19.43574333190918, -18.65988540649414, -17.884029388427734, -17.108171463012695, -16.332313537597656, -15.556455612182617, -14.780597686767578, -14.004739761352539, -13.2288818359375, -12.453024864196777, -11.677166938781738, -10.9013090133667, -10.12545108795166, -9.349593162536621, -8.573736190795898, -7.797877788543701, -7.022019863128662, -6.246162414550781, -5.470304489135742, -4.694446563720703, -3.918588638305664, -3.142730951309204, -2.366873264312744, -1.591015338897705, -0.815157413482666, -0.039299964904785156, 0.7365579605102539, 1.512415885925293, 2.288273811340332, 3.064131498336792, 3.839989185333252, 4.615847110748291, 5.39170503616333, 6.167562484741211, 6.94342041015625, 7.719278335571289, 8.495136260986328, 9.270994186401367, 10.046852111816406, 10.822710037231445, 11.598567962646484, 12.374424934387207, 13.150282859802246, 13.926140785217285, 14.701998710632324, 15.477856636047363, 16.253713607788086, 17.029571533203125, 17.805429458618164, 18.581287384033203, 19.357145309448242, 20.13300323486328]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 10.0, 12.0, 12.0, 25.0, 19.0, 21.0, 54.0, 75.0, 94.0, 165.0, 307.0, 492.0, 940.0, 2062.0, 5258.0, 14508.0, 49145.0, 222098.0, 567363.0, 134302.0, 33546.0, 10583.0, 3889.0, 1637.0, 804.0, 432.0, 216.0, 158.0, 97.0, 56.0, 45.0, 28.0, 19.0, 21.0, 11.0, 12.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.65625, -45.16796875, -43.6796875, -42.19140625, -40.703125, -39.21484375, -37.7265625, -36.23828125, -34.75, -33.26171875, -31.7734375, -30.28515625, -28.796875, -27.30859375, -25.8203125, -24.33203125, -22.84375, -21.35546875, -19.8671875, -18.37890625, -16.890625, -15.40234375, -13.9140625, -12.42578125, -10.9375, -9.44921875, -7.9609375, -6.47265625, -4.984375, -3.49609375, -2.0078125, -0.51953125, 0.96875, 2.45703125, 3.9453125, 5.43359375, 6.921875, 8.41015625, 9.8984375, 11.38671875, 12.875, 14.36328125, 15.8515625, 17.33984375, 18.828125, 20.31640625, 21.8046875, 23.29296875, 24.78125, 26.26953125, 27.7578125, 29.24609375, 30.734375, 32.22265625, 33.7109375, 35.19921875, 36.6875, 38.17578125, 39.6640625, 41.15234375, 42.640625, 44.12890625, 45.6171875, 47.10546875, 48.59375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 13.0, 16.0, 22.0, 18.0, 35.0, 34.0, 54.0, 70.0, 76.0, 73.0, 100.0, 67.0, 72.0, 74.0, 62.0, 46.0, 28.0, 36.0, 27.0, 7.0, 14.0, 11.0, 8.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.515625, -17.0528564453125, -16.590087890625, -16.1273193359375, -15.66455078125, -15.2017822265625, -14.739013671875, -14.2762451171875, -13.8134765625, -13.3507080078125, -12.887939453125, -12.4251708984375, -11.96240234375, -11.4996337890625, -11.036865234375, -10.5740966796875, -10.111328125, -9.6485595703125, -9.185791015625, -8.7230224609375, -8.26025390625, -7.7974853515625, -7.334716796875, -6.8719482421875, -6.4091796875, -5.9464111328125, -5.483642578125, -5.0208740234375, -4.55810546875, -4.0953369140625, -3.632568359375, -3.1697998046875, -2.70703125, -2.2442626953125, -1.781494140625, -1.3187255859375, -0.85595703125, -0.3931884765625, 0.069580078125, 0.5323486328125, 0.9951171875, 1.4578857421875, 1.920654296875, 2.3834228515625, 2.84619140625, 3.3089599609375, 3.771728515625, 4.2344970703125, 4.697265625, 5.1600341796875, 5.622802734375, 6.0855712890625, 6.54833984375, 7.0111083984375, 7.473876953125, 7.9366455078125, 8.3994140625, 8.8621826171875, 9.324951171875, 9.7877197265625, 10.25048828125, 10.7132568359375, 11.176025390625, 11.6387939453125, 12.1015625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 5.0, 10.0, 20.0, 27.0, 30.0, 43.0, 66.0, 70.0, 105.0, 148.0, 228.0, 289.0, 406.0, 626.0, 854.0, 1271.0, 1913.0, 3042.0, 5189.0, 9080.0, 16776.0, 36337.0, 97883.0, 515457.0, 238181.0, 62466.0, 25995.0, 12946.0, 7071.0, 4190.0, 2529.0, 1667.0, 1125.0, 732.0, 505.0, 330.0, 272.0, 185.0, 147.0, 71.0, 72.0, 50.0, 42.0, 30.0, 21.0, 15.0, 12.0, 9.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-33.46875, -32.4482421875, -31.427734375, -30.4072265625, -29.38671875, -28.3662109375, -27.345703125, -26.3251953125, -25.3046875, -24.2841796875, -23.263671875, -22.2431640625, -21.22265625, -20.2021484375, -19.181640625, -18.1611328125, -17.140625, -16.1201171875, -15.099609375, -14.0791015625, -13.05859375, -12.0380859375, -11.017578125, -9.9970703125, -8.9765625, -7.9560546875, -6.935546875, -5.9150390625, -4.89453125, -3.8740234375, -2.853515625, -1.8330078125, -0.8125, 0.2080078125, 1.228515625, 2.2490234375, 3.26953125, 4.2900390625, 5.310546875, 6.3310546875, 7.3515625, 8.3720703125, 9.392578125, 10.4130859375, 11.43359375, 12.4541015625, 13.474609375, 14.4951171875, 15.515625, 16.5361328125, 17.556640625, 18.5771484375, 19.59765625, 20.6181640625, 21.638671875, 22.6591796875, 23.6796875, 24.7001953125, 25.720703125, 26.7412109375, 27.76171875, 28.7822265625, 29.802734375, 30.8232421875, 31.84375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 9.0, 4.0, 6.0, 7.0, 5.0, 5.0, 15.0, 9.0, 21.0, 17.0, 18.0, 21.0, 23.0, 22.0, 35.0, 30.0, 36.0, 45.0, 42.0, 50.0, 55.0, 51.0, 36.0, 45.0, 39.0, 46.0, 32.0, 29.0, 31.0, 17.0, 21.0, 25.0, 27.0, 21.0, 12.0, 15.0, 10.0, 12.0, 10.0, 10.0, 9.0, 6.0, 2.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.21875, -9.8831787109375, -9.547607421875, -9.2120361328125, -8.87646484375, -8.5408935546875, -8.205322265625, -7.8697509765625, -7.5341796875, -7.1986083984375, -6.863037109375, -6.5274658203125, -6.19189453125, -5.8563232421875, -5.520751953125, -5.1851806640625, -4.849609375, -4.5140380859375, -4.178466796875, -3.8428955078125, -3.50732421875, -3.1717529296875, -2.836181640625, -2.5006103515625, -2.1650390625, -1.8294677734375, -1.493896484375, -1.1583251953125, -0.82275390625, -0.4871826171875, -0.151611328125, 0.1839599609375, 0.51953125, 0.8551025390625, 1.190673828125, 1.5262451171875, 1.86181640625, 2.1973876953125, 2.532958984375, 2.8685302734375, 3.2041015625, 3.5396728515625, 3.875244140625, 4.2108154296875, 4.54638671875, 4.8819580078125, 5.217529296875, 5.5531005859375, 5.888671875, 6.2242431640625, 6.559814453125, 6.8953857421875, 7.23095703125, 7.5665283203125, 7.902099609375, 8.2376708984375, 8.5732421875, 8.9088134765625, 9.244384765625, 9.5799560546875, 9.91552734375, 10.2510986328125, 10.586669921875, 10.9222412109375, 11.2578125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 11.0, 10.0, 20.0, 17.0, 21.0, 29.0, 30.0, 46.0, 62.0, 76.0, 121.0, 198.0, 233.0, 346.0, 588.0, 1133.0, 2506.0, 10685.0, 973460.0, 50257.0, 4739.0, 1639.0, 751.0, 476.0, 330.0, 207.0, 143.0, 100.0, 76.0, 49.0, 43.0, 33.0, 21.0, 13.0, 16.0, 12.0, 11.0, 7.0, 10.0, 3.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-315.5, -306.15625, -296.8125, -287.46875, -278.125, -268.78125, -259.4375, -250.09375, -240.75, -231.40625, -222.0625, -212.71875, -203.375, -194.03125, -184.6875, -175.34375, -166.0, -156.65625, -147.3125, -137.96875, -128.625, -119.28125, -109.9375, -100.59375, -91.25, -81.90625, -72.5625, -63.21875, -53.875, -44.53125, -35.1875, -25.84375, -16.5, -7.15625, 2.1875, 11.53125, 20.875, 30.21875, 39.5625, 48.90625, 58.25, 67.59375, 76.9375, 86.28125, 95.625, 104.96875, 114.3125, 123.65625, 133.0, 142.34375, 151.6875, 161.03125, 170.375, 179.71875, 189.0625, 198.40625, 207.75, 217.09375, 226.4375, 235.78125, 245.125, 254.46875, 263.8125, 273.15625, 282.5]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 12.0, 23.0, 56.0, 238.0, 469.0, 144.0, 38.0, 14.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006443023681640625, -0.006222784519195557, -0.006002545356750488, -0.00578230619430542, -0.0055620670318603516, -0.005341827869415283, -0.005121588706970215, -0.0049013495445251465, -0.004681110382080078, -0.00446087121963501, -0.004240632057189941, -0.004020392894744873, -0.0038001537322998047, -0.0035799145698547363, -0.003359675407409668, -0.0031394362449645996, -0.0029191970825195312, -0.002698957920074463, -0.0024787187576293945, -0.002258479595184326, -0.002038240432739258, -0.0018180012702941895, -0.001597762107849121, -0.0013775229454040527, -0.0011572837829589844, -0.000937044620513916, -0.0007168054580688477, -0.0004965662956237793, -0.00027632713317871094, -5.608797073364258e-05, 0.00016415119171142578, 0.00038439035415649414, 0.0006046295166015625, 0.0008248686790466309, 0.0010451078414916992, 0.0012653470039367676, 0.001485586166381836, 0.0017058253288269043, 0.0019260644912719727, 0.002146303653717041, 0.0023665428161621094, 0.0025867819786071777, 0.002807021141052246, 0.0030272603034973145, 0.003247499465942383, 0.003467738628387451, 0.0036879777908325195, 0.003908216953277588, 0.004128456115722656, 0.004348695278167725, 0.004568934440612793, 0.004789173603057861, 0.00500941276550293, 0.005229651927947998, 0.005449891090393066, 0.005670130252838135, 0.005890369415283203, 0.0061106085777282715, 0.00633084774017334, 0.006551086902618408, 0.0067713260650634766, 0.006991565227508545, 0.007211804389953613, 0.007432043552398682, 0.00765228271484375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 6.0, 14.0, 13.0, 15.0, 22.0, 18.0, 33.0, 37.0, 52.0, 92.0, 128.0, 193.0, 285.0, 432.0, 908.0, 2325.0, 11223.0, 987276.0, 38403.0, 4034.0, 1382.0, 582.0, 340.0, 220.0, 148.0, 107.0, 69.0, 48.0, 31.0, 24.0, 23.0, 17.0, 8.0, 7.0, 8.0, 6.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-329.75, -318.65234375, -307.5546875, -296.45703125, -285.359375, -274.26171875, -263.1640625, -252.06640625, -240.96875, -229.87109375, -218.7734375, -207.67578125, -196.578125, -185.48046875, -174.3828125, -163.28515625, -152.1875, -141.08984375, -129.9921875, -118.89453125, -107.796875, -96.69921875, -85.6015625, -74.50390625, -63.40625, -52.30859375, -41.2109375, -30.11328125, -19.015625, -7.91796875, 3.1796875, 14.27734375, 25.375, 36.47265625, 47.5703125, 58.66796875, 69.765625, 80.86328125, 91.9609375, 103.05859375, 114.15625, 125.25390625, 136.3515625, 147.44921875, 158.546875, 169.64453125, 180.7421875, 191.83984375, 202.9375, 214.03515625, 225.1328125, 236.23046875, 247.328125, 258.42578125, 269.5234375, 280.62109375, 291.71875, 302.81640625, 313.9140625, 325.01171875, 336.109375, 347.20703125, 358.3046875, 369.40234375, 380.5]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 3.0, 14.0, 36.0, 85.0, 186.0, 345.0, 173.0, 80.0, 28.0, 10.0, 8.0, 5.0, 2.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-53.34375, -51.7939453125, -50.244140625, -48.6943359375, -47.14453125, -45.5947265625, -44.044921875, -42.4951171875, -40.9453125, -39.3955078125, -37.845703125, -36.2958984375, -34.74609375, -33.1962890625, -31.646484375, -30.0966796875, -28.546875, -26.9970703125, -25.447265625, -23.8974609375, -22.34765625, -20.7978515625, -19.248046875, -17.6982421875, -16.1484375, -14.5986328125, -13.048828125, -11.4990234375, -9.94921875, -8.3994140625, -6.849609375, -5.2998046875, -3.75, -2.2001953125, -0.650390625, 0.8994140625, 2.44921875, 3.9990234375, 5.548828125, 7.0986328125, 8.6484375, 10.1982421875, 11.748046875, 13.2978515625, 14.84765625, 16.3974609375, 17.947265625, 19.4970703125, 21.046875, 22.5966796875, 24.146484375, 25.6962890625, 27.24609375, 28.7958984375, 30.345703125, 31.8955078125, 33.4453125, 34.9951171875, 36.544921875, 38.0947265625, 39.64453125, 41.1943359375, 42.744140625, 44.2939453125, 45.84375]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 7.0, 4.0, 2.0, 5.0, 7.0, 9.0, 3.0, 7.0, 7.0, 7.0, 15.0, 22.0, 13.0, 15.0, 32.0, 31.0, 73.0, 106.0, 208.0, 343.0, 51.0, 10.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.80369567871094, -41.900936126708984, -40.9981803894043, -40.095420837402344, -39.192665100097656, -38.2899055480957, -37.38714599609375, -36.48439025878906, -35.58163070678711, -34.678871154785156, -33.77611541748047, -32.873355865478516, -31.970598220825195, -31.067840576171875, -30.165082931518555, -29.262325286865234, -28.359567642211914, -27.456809997558594, -26.554052352905273, -25.651294708251953, -24.74853515625, -23.84577751159668, -22.94301986694336, -22.04026222229004, -21.13750457763672, -20.2347469329834, -19.331989288330078, -18.429229736328125, -17.526472091674805, -16.623714447021484, -15.720956802368164, -14.818199157714844, -13.915441513061523, -13.012683868408203, -12.109925270080566, -11.207167625427246, -10.30440902709961, -9.401651382446289, -8.498893737792969, -7.59613561630249, -6.693377494812012, -5.790619373321533, -4.887861251831055, -3.9851036071777344, -3.082345485687256, -2.1795873641967773, -1.276829719543457, -0.3740715980529785, 0.5286865234375, 1.431444525718689, 2.334202527999878, 3.2369604110717773, 4.139718532562256, 5.042476654052734, 5.945234298706055, 6.847992420196533, 7.750750541687012, 8.653508186340332, 9.556266784667969, 10.459024429321289, 11.36178207397461, 12.264540672302246, 13.167298316955566, 14.070056915283203, 14.972814559936523]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 7.0, 5.0, 4.0, 7.0, 12.0, 11.0, 10.0, 14.0, 31.0, 22.0, 39.0, 42.0, 55.0, 48.0, 63.0, 81.0, 86.0, 67.0, 74.0, 67.0, 49.0, 47.0, 37.0, 24.0, 21.0, 23.0, 13.0, 10.0, 6.0, 9.0, 4.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.38955307006836, -16.737333297729492, -16.085115432739258, -15.43289566040039, -14.780675888061523, -14.128457069396973, -13.476238250732422, -12.824018478393555, -12.171798706054688, -11.519579887390137, -10.86736011505127, -10.215141296386719, -9.562921524047852, -8.9107027053833, -8.25848388671875, -7.606264114379883, -6.954045295715332, -6.301826000213623, -5.649606704711914, -4.997387886047363, -4.345168113708496, -3.692949056625366, -3.0407299995422363, -2.3885107040405273, -1.7362914085388184, -1.0840721130371094, -0.43185293674468994, 0.2203662395477295, 0.8725855350494385, 1.5248048305511475, 2.1770238876342773, 2.8292431831359863, 3.4814624786376953, 4.133681774139404, 4.785901069641113, 5.438119888305664, 6.090339660644531, 6.742558479309082, 7.394777774810791, 8.0469970703125, 8.699216842651367, 9.351435661315918, 10.003655433654785, 10.655874252319336, 11.308094024658203, 11.960312843322754, 12.612531661987305, 13.264751434326172, 13.916970252990723, 14.569189071655273, 15.22140884399414, 15.873627662658691, 16.525846481323242, 17.17806625366211, 17.830286026000977, 18.482505798339844, 19.134723663330078, 19.786943435668945, 20.43916130065918, 21.091381072998047, 21.743600845336914, 22.39582061767578, 23.048038482666016, 23.700258255004883, 24.35247802734375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 9.0, 12.0, 17.0, 28.0, 41.0, 50.0, 84.0, 115.0, 140.0, 208.0, 285.0, 386.0, 603.0, 872.0, 1307.0, 2076.0, 3076.0, 4962.0, 8097.0, 13095.0, 23229.0, 43873.0, 91683.0, 234814.0, 2168860.0, 1246298.0, 185771.0, 76904.0, 37351.0, 19941.0, 11166.0, 6656.0, 4310.0, 2753.0, 1670.0, 1138.0, 769.0, 500.0, 351.0, 240.0, 173.0, 120.0, 86.0, 49.0, 36.0, 20.0, 15.0, 14.0, 12.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.4375, -10.1102294921875, -9.782958984375, -9.4556884765625, -9.12841796875, -8.8011474609375, -8.473876953125, -8.1466064453125, -7.8193359375, -7.4920654296875, -7.164794921875, -6.8375244140625, -6.51025390625, -6.1829833984375, -5.855712890625, -5.5284423828125, -5.201171875, -4.8739013671875, -4.546630859375, -4.2193603515625, -3.89208984375, -3.5648193359375, -3.237548828125, -2.9102783203125, -2.5830078125, -2.2557373046875, -1.928466796875, -1.6011962890625, -1.27392578125, -0.9466552734375, -0.619384765625, -0.2921142578125, 0.03515625, 0.3624267578125, 0.689697265625, 1.0169677734375, 1.34423828125, 1.6715087890625, 1.998779296875, 2.3260498046875, 2.6533203125, 2.9805908203125, 3.307861328125, 3.6351318359375, 3.96240234375, 4.2896728515625, 4.616943359375, 4.9442138671875, 5.271484375, 5.5987548828125, 5.926025390625, 6.2532958984375, 6.58056640625, 6.9078369140625, 7.235107421875, 7.5623779296875, 7.8896484375, 8.2169189453125, 8.544189453125, 8.8714599609375, 9.19873046875, 9.5260009765625, 9.853271484375, 10.1805419921875, 10.5078125]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 7.0, 6.0, 10.0, 11.0, 11.0, 19.0, 15.0, 26.0, 33.0, 26.0, 41.0, 44.0, 42.0, 47.0, 51.0, 52.0, 62.0, 59.0, 70.0, 53.0, 58.0, 41.0, 43.0, 29.0, 35.0, 24.0, 21.0, 17.0, 9.0, 6.0, 12.0, 8.0, 4.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462890625, -2.379730224609375, -2.29656982421875, -2.213409423828125, -2.1302490234375, -2.047088623046875, -1.96392822265625, -1.880767822265625, -1.797607421875, -1.714447021484375, -1.63128662109375, -1.548126220703125, -1.4649658203125, -1.381805419921875, -1.29864501953125, -1.215484619140625, -1.13232421875, -1.049163818359375, -0.96600341796875, -0.882843017578125, -0.7996826171875, -0.716522216796875, -0.63336181640625, -0.550201416015625, -0.467041015625, -0.383880615234375, -0.30072021484375, -0.217559814453125, -0.1343994140625, -0.051239013671875, 0.03192138671875, 0.115081787109375, 0.1982421875, 0.281402587890625, 0.36456298828125, 0.447723388671875, 0.5308837890625, 0.614044189453125, 0.69720458984375, 0.780364990234375, 0.863525390625, 0.946685791015625, 1.02984619140625, 1.113006591796875, 1.1961669921875, 1.279327392578125, 1.36248779296875, 1.445648193359375, 1.52880859375, 1.611968994140625, 1.69512939453125, 1.778289794921875, 1.8614501953125, 1.944610595703125, 2.02777099609375, 2.110931396484375, 2.194091796875, 2.277252197265625, 2.36041259765625, 2.443572998046875, 2.5267333984375, 2.609893798828125, 2.69305419921875, 2.776214599609375, 2.859375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 12.0, 14.0, 17.0, 26.0, 34.0, 49.0, 83.0, 128.0, 177.0, 260.0, 384.0, 681.0, 1088.0, 1848.0, 3540.0, 7318.0, 16981.0, 49304.0, 216789.0, 2578011.0, 1123768.0, 132321.0, 35140.0, 13109.0, 6093.0, 2930.0, 1605.0, 922.0, 585.0, 336.0, 218.0, 170.0, 88.0, 73.0, 43.0, 39.0, 28.0, 16.0, 14.0, 8.0, 8.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.31640625, -7.07928466796875, -6.8421630859375, -6.60504150390625, -6.367919921875, -6.13079833984375, -5.8936767578125, -5.65655517578125, -5.41943359375, -5.18231201171875, -4.9451904296875, -4.70806884765625, -4.470947265625, -4.23382568359375, -3.9967041015625, -3.75958251953125, -3.5224609375, -3.28533935546875, -3.0482177734375, -2.81109619140625, -2.573974609375, -2.33685302734375, -2.0997314453125, -1.86260986328125, -1.62548828125, -1.38836669921875, -1.1512451171875, -0.91412353515625, -0.677001953125, -0.43988037109375, -0.2027587890625, 0.03436279296875, 0.271484375, 0.50860595703125, 0.7457275390625, 0.98284912109375, 1.219970703125, 1.45709228515625, 1.6942138671875, 1.93133544921875, 2.16845703125, 2.40557861328125, 2.6427001953125, 2.87982177734375, 3.116943359375, 3.35406494140625, 3.5911865234375, 3.82830810546875, 4.0654296875, 4.30255126953125, 4.5396728515625, 4.77679443359375, 5.013916015625, 5.25103759765625, 5.4881591796875, 5.72528076171875, 5.96240234375, 6.19952392578125, 6.4366455078125, 6.67376708984375, 6.910888671875, 7.14801025390625, 7.3851318359375, 7.62225341796875, 7.859375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 5.0, 6.0, 3.0, 6.0, 10.0, 12.0, 8.0, 22.0, 31.0, 28.0, 51.0, 48.0, 56.0, 60.0, 86.0, 84.0, 143.0, 176.0, 247.0, 304.0, 356.0, 402.0, 374.0, 337.0, 238.0, 227.0, 186.0, 125.0, 110.0, 87.0, 68.0, 47.0, 35.0, 30.0, 21.0, 9.0, 13.0, 7.0, 4.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.3291015625, -1.2925567626953125, -1.256011962890625, -1.2194671630859375, -1.18292236328125, -1.1463775634765625, -1.109832763671875, -1.0732879638671875, -1.0367431640625, -1.0001983642578125, -0.963653564453125, -0.9271087646484375, -0.89056396484375, -0.8540191650390625, -0.817474365234375, -0.7809295654296875, -0.744384765625, -0.7078399658203125, -0.671295166015625, -0.6347503662109375, -0.59820556640625, -0.5616607666015625, -0.525115966796875, -0.4885711669921875, -0.4520263671875, -0.4154815673828125, -0.378936767578125, -0.3423919677734375, -0.30584716796875, -0.2693023681640625, -0.232757568359375, -0.1962127685546875, -0.15966796875, -0.1231231689453125, -0.086578369140625, -0.0500335693359375, -0.01348876953125, 0.0230560302734375, 0.059600830078125, 0.0961456298828125, 0.1326904296875, 0.1692352294921875, 0.205780029296875, 0.2423248291015625, 0.27886962890625, 0.3154144287109375, 0.351959228515625, 0.3885040283203125, 0.425048828125, 0.4615936279296875, 0.498138427734375, 0.5346832275390625, 0.57122802734375, 0.6077728271484375, 0.644317626953125, 0.6808624267578125, 0.7174072265625, 0.7539520263671875, 0.790496826171875, 0.8270416259765625, 0.86358642578125, 0.9001312255859375, 0.936676025390625, 0.9732208251953125, 1.009765625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 8.0, 11.0, 16.0, 20.0, 66.0, 192.0, 457.0, 151.0, 40.0, 16.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.987723350524902, -8.636414527893066, -8.28510570526123, -7.933796405792236, -7.582487106323242, -7.231178283691406, -6.87986946105957, -6.528560638427734, -6.17725133895874, -5.825942516326904, -5.47463321685791, -5.123324394226074, -4.772015571594238, -4.420706272125244, -4.069397449493408, -3.718088388442993, -3.366779327392578, -3.015470266342163, -2.664161205291748, -2.312852382659912, -1.961543321609497, -1.610234260559082, -1.258925437927246, -0.907616376876831, -0.556307315826416, -0.20499831438064575, 0.1463106870651245, 0.49761962890625, 0.848928689956665, 1.20023775100708, 1.551546573638916, 1.902855634689331, 2.2541656494140625, 2.6054747104644775, 2.9567837715148926, 3.3080925941467285, 3.6594016551971436, 4.010710716247559, 4.3620195388793945, 4.7133283615112305, 5.064637660980225, 5.4159464836120605, 5.767255783081055, 6.118564605712891, 6.469873428344727, 6.821182727813721, 7.172491550445557, 7.523800849914551, 7.875109672546387, 8.226418495178223, 8.577727317810059, 8.929037094116211, 9.280345916748047, 9.631654739379883, 9.982963562011719, 10.334272384643555, 10.68558120727539, 11.036890029907227, 11.388198852539062, 11.739507675170898, 12.09081745147705, 12.442126274108887, 12.793435096740723, 13.144743919372559, 13.496053695678711]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 9.0, 8.0, 12.0, 8.0, 14.0, 13.0, 22.0, 18.0, 36.0, 37.0, 31.0, 39.0, 40.0, 54.0, 51.0, 55.0, 39.0, 75.0, 55.0, 44.0, 50.0, 39.0, 45.0, 33.0, 23.0, 28.0, 13.0, 16.0, 18.0, 15.0, 12.0, 5.0, 13.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8062503337860107, -2.7200124263763428, -2.6337742805480957, -2.5475363731384277, -2.4612984657287598, -2.375060558319092, -2.2888224124908447, -2.2025845050811768, -2.1163463592529297, -2.0301084518432617, -1.9438704252243042, -1.8576323986053467, -1.7713944911956787, -1.6851564645767212, -1.5989184379577637, -1.5126805305480957, -1.4264426231384277, -1.3402045965194702, -1.2539666891098022, -1.1677286624908447, -1.0814907550811768, -0.9952527284622192, -0.9090147018432617, -0.822776734828949, -0.7365387678146362, -0.6503008008003235, -0.5640628337860107, -0.4778248071670532, -0.3915868401527405, -0.30534887313842773, -0.21911084651947021, -0.13287287950515747, -0.04663515090942383, 0.03960283100605011, 0.12584081292152405, 0.21207880973815918, 0.2983167767524719, 0.38455474376678467, 0.4707927703857422, 0.5570307374000549, 0.6432687044143677, 0.7295066714286804, 0.8157446384429932, 0.9019826650619507, 0.9882206320762634, 1.0744585990905762, 1.1606966257095337, 1.2469346523284912, 1.3331725597381592, 1.4194105863571167, 1.5056484937667847, 1.5918865203857422, 1.6781244277954102, 1.7643624544143677, 1.8506004810333252, 1.9368383884429932, 2.0230765342712402, 2.109314441680908, 2.1955525875091553, 2.2817904949188232, 2.368028402328491, 2.4542665481567383, 2.5405044555664062, 2.626742362976074, 2.712980270385742]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 14.0, 18.0, 21.0, 27.0, 38.0, 62.0, 88.0, 104.0, 156.0, 260.0, 413.0, 675.0, 1051.0, 1678.0, 2942.0, 5701.0, 12958.0, 37895.0, 204951.0, 627763.0, 105593.0, 25570.0, 9709.0, 4504.0, 2468.0, 1414.0, 854.0, 564.0, 323.0, 230.0, 155.0, 93.0, 56.0, 50.0, 33.0, 31.0, 19.0, 13.0, 9.0, 4.0, 9.0, 6.0, 7.0, 1.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0], "bins": [-4.87890625, -4.7325439453125, -4.586181640625, -4.4398193359375, -4.29345703125, -4.1470947265625, -4.000732421875, -3.8543701171875, -3.7080078125, -3.5616455078125, -3.415283203125, -3.2689208984375, -3.12255859375, -2.9761962890625, -2.829833984375, -2.6834716796875, -2.537109375, -2.3907470703125, -2.244384765625, -2.0980224609375, -1.95166015625, -1.8052978515625, -1.658935546875, -1.5125732421875, -1.3662109375, -1.2198486328125, -1.073486328125, -0.9271240234375, -0.78076171875, -0.6343994140625, -0.488037109375, -0.3416748046875, -0.1953125, -0.0489501953125, 0.097412109375, 0.2437744140625, 0.39013671875, 0.5364990234375, 0.682861328125, 0.8292236328125, 0.9755859375, 1.1219482421875, 1.268310546875, 1.4146728515625, 1.56103515625, 1.7073974609375, 1.853759765625, 2.0001220703125, 2.146484375, 2.2928466796875, 2.439208984375, 2.5855712890625, 2.73193359375, 2.8782958984375, 3.024658203125, 3.1710205078125, 3.3173828125, 3.4637451171875, 3.610107421875, 3.7564697265625, 3.90283203125, 4.0491943359375, 4.195556640625, 4.3419189453125, 4.48828125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 7.0, 6.0, 7.0, 7.0, 18.0, 11.0, 20.0, 31.0, 24.0, 26.0, 40.0, 28.0, 54.0, 51.0, 40.0, 44.0, 52.0, 56.0, 60.0, 57.0, 45.0, 55.0, 34.0, 33.0, 28.0, 24.0, 22.0, 16.0, 17.0, 12.0, 11.0, 14.0, 12.0, 9.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.330078125, -2.257171630859375, -2.18426513671875, -2.111358642578125, -2.0384521484375, -1.965545654296875, -1.89263916015625, -1.819732666015625, -1.746826171875, -1.673919677734375, -1.60101318359375, -1.528106689453125, -1.4552001953125, -1.382293701171875, -1.30938720703125, -1.236480712890625, -1.16357421875, -1.090667724609375, -1.01776123046875, -0.944854736328125, -0.8719482421875, -0.799041748046875, -0.72613525390625, -0.653228759765625, -0.580322265625, -0.507415771484375, -0.43450927734375, -0.361602783203125, -0.2886962890625, -0.215789794921875, -0.14288330078125, -0.069976806640625, 0.0029296875, 0.075836181640625, 0.14874267578125, 0.221649169921875, 0.2945556640625, 0.367462158203125, 0.44036865234375, 0.513275146484375, 0.586181640625, 0.659088134765625, 0.73199462890625, 0.804901123046875, 0.8778076171875, 0.950714111328125, 1.02362060546875, 1.096527099609375, 1.16943359375, 1.242340087890625, 1.31524658203125, 1.388153076171875, 1.4610595703125, 1.533966064453125, 1.60687255859375, 1.679779052734375, 1.752685546875, 1.825592041015625, 1.89849853515625, 1.971405029296875, 2.0443115234375, 2.117218017578125, 2.19012451171875, 2.263031005859375, 2.3359375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 9.0, 4.0, 5.0, 10.0, 10.0, 21.0, 24.0, 46.0, 76.0, 75.0, 134.0, 206.0, 268.0, 401.0, 648.0, 996.0, 1829.0, 3116.0, 6301.0, 16181.0, 70663.0, 704999.0, 195628.0, 27907.0, 9163.0, 4094.0, 2168.0, 1239.0, 804.0, 513.0, 330.0, 207.0, 128.0, 111.0, 79.0, 44.0, 38.0, 23.0, 21.0, 12.0, 13.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3671875, -5.1802978515625, -4.993408203125, -4.8065185546875, -4.61962890625, -4.4327392578125, -4.245849609375, -4.0589599609375, -3.8720703125, -3.6851806640625, -3.498291015625, -3.3114013671875, -3.12451171875, -2.9376220703125, -2.750732421875, -2.5638427734375, -2.376953125, -2.1900634765625, -2.003173828125, -1.8162841796875, -1.62939453125, -1.4425048828125, -1.255615234375, -1.0687255859375, -0.8818359375, -0.6949462890625, -0.508056640625, -0.3211669921875, -0.13427734375, 0.0526123046875, 0.239501953125, 0.4263916015625, 0.61328125, 0.8001708984375, 0.987060546875, 1.1739501953125, 1.36083984375, 1.5477294921875, 1.734619140625, 1.9215087890625, 2.1083984375, 2.2952880859375, 2.482177734375, 2.6690673828125, 2.85595703125, 3.0428466796875, 3.229736328125, 3.4166259765625, 3.603515625, 3.7904052734375, 3.977294921875, 4.1641845703125, 4.35107421875, 4.5379638671875, 4.724853515625, 4.9117431640625, 5.0986328125, 5.2855224609375, 5.472412109375, 5.6593017578125, 5.84619140625, 6.0330810546875, 6.219970703125, 6.4068603515625, 6.59375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 6.0, 9.0, 12.0, 7.0, 12.0, 7.0, 30.0, 32.0, 22.0, 41.0, 34.0, 49.0, 41.0, 41.0, 32.0, 46.0, 52.0, 56.0, 53.0, 53.0, 43.0, 51.0, 45.0, 31.0, 26.0, 28.0, 23.0, 15.0, 11.0, 15.0, 13.0, 15.0, 10.0, 4.0, 9.0, 5.0, 2.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-1.7587890625, -1.708892822265625, -1.65899658203125, -1.609100341796875, -1.5592041015625, -1.509307861328125, -1.45941162109375, -1.409515380859375, -1.359619140625, -1.309722900390625, -1.25982666015625, -1.209930419921875, -1.1600341796875, -1.110137939453125, -1.06024169921875, -1.010345458984375, -0.96044921875, -0.910552978515625, -0.86065673828125, -0.810760498046875, -0.7608642578125, -0.710968017578125, -0.66107177734375, -0.611175537109375, -0.561279296875, -0.511383056640625, -0.46148681640625, -0.411590576171875, -0.3616943359375, -0.311798095703125, -0.26190185546875, -0.212005615234375, -0.162109375, -0.112213134765625, -0.06231689453125, -0.012420654296875, 0.0374755859375, 0.087371826171875, 0.13726806640625, 0.187164306640625, 0.237060546875, 0.286956787109375, 0.33685302734375, 0.386749267578125, 0.4366455078125, 0.486541748046875, 0.53643798828125, 0.586334228515625, 0.63623046875, 0.686126708984375, 0.73602294921875, 0.785919189453125, 0.8358154296875, 0.885711669921875, 0.93560791015625, 0.985504150390625, 1.035400390625, 1.085296630859375, 1.13519287109375, 1.185089111328125, 1.2349853515625, 1.284881591796875, 1.33477783203125, 1.384674072265625, 1.4345703125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 4.0, 8.0, 11.0, 22.0, 15.0, 42.0, 34.0, 63.0, 101.0, 156.0, 223.0, 366.0, 740.0, 1513.0, 3917.0, 12537.0, 83806.0, 864943.0, 62656.0, 10850.0, 3468.0, 1387.0, 690.0, 333.0, 209.0, 145.0, 81.0, 62.0, 36.0, 28.0, 22.0, 14.0, 15.0, 9.0, 12.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.671875, -2.5841064453125, -2.496337890625, -2.4085693359375, -2.32080078125, -2.2330322265625, -2.145263671875, -2.0574951171875, -1.9697265625, -1.8819580078125, -1.794189453125, -1.7064208984375, -1.61865234375, -1.5308837890625, -1.443115234375, -1.3553466796875, -1.267578125, -1.1798095703125, -1.092041015625, -1.0042724609375, -0.91650390625, -0.8287353515625, -0.740966796875, -0.6531982421875, -0.5654296875, -0.4776611328125, -0.389892578125, -0.3021240234375, -0.21435546875, -0.1265869140625, -0.038818359375, 0.0489501953125, 0.13671875, 0.2244873046875, 0.312255859375, 0.4000244140625, 0.48779296875, 0.5755615234375, 0.663330078125, 0.7510986328125, 0.8388671875, 0.9266357421875, 1.014404296875, 1.1021728515625, 1.18994140625, 1.2777099609375, 1.365478515625, 1.4532470703125, 1.541015625, 1.6287841796875, 1.716552734375, 1.8043212890625, 1.89208984375, 1.9798583984375, 2.067626953125, 2.1553955078125, 2.2431640625, 2.3309326171875, 2.418701171875, 2.5064697265625, 2.59423828125, 2.6820068359375, 2.769775390625, 2.8575439453125, 2.9453125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 2.0, 2.0, 8.0, 10.0, 12.0, 17.0, 64.0, 231.0, 456.0, 94.0, 38.0, 17.0, 9.0, 4.0, 6.0, 3.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013494491577148438, -0.00013033486902713776, -0.00012572482228279114, -0.00012111477553844452, -0.0001165047287940979, -0.00011189468204975128, -0.00010728463530540466, -0.00010267458856105804, -9.806454181671143e-05, -9.345449507236481e-05, -8.884444832801819e-05, -8.423440158367157e-05, -7.962435483932495e-05, -7.501430809497833e-05, -7.040426135063171e-05, -6.57942146062851e-05, -6.118416786193848e-05, -5.657412111759186e-05, -5.196407437324524e-05, -4.735402762889862e-05, -4.2743980884552e-05, -3.813393414020538e-05, -3.3523887395858765e-05, -2.8913840651512146e-05, -2.4303793907165527e-05, -1.969374716281891e-05, -1.508370041847229e-05, -1.0473653674125671e-05, -5.863606929779053e-06, -1.253560185432434e-06, 3.3564865589141846e-06, 7.966533303260803e-06, 1.2576580047607422e-05, 1.718662679195404e-05, 2.179667353630066e-05, 2.6406720280647278e-05, 3.1016767024993896e-05, 3.5626813769340515e-05, 4.0236860513687134e-05, 4.484690725803375e-05, 4.945695400238037e-05, 5.406700074672699e-05, 5.867704749107361e-05, 6.328709423542023e-05, 6.789714097976685e-05, 7.250718772411346e-05, 7.711723446846008e-05, 8.17272812128067e-05, 8.633732795715332e-05, 9.094737470149994e-05, 9.555742144584656e-05, 0.00010016746819019318, 0.0001047775149345398, 0.00010938756167888641, 0.00011399760842323303, 0.00011860765516757965, 0.00012321770191192627, 0.0001278277486562729, 0.0001324377954006195, 0.00013704784214496613, 0.00014165788888931274, 0.00014626793563365936, 0.00015087798237800598, 0.0001554880291223526, 0.00016009807586669922]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 9.0, 7.0, 7.0, 7.0, 14.0, 23.0, 20.0, 39.0, 37.0, 80.0, 130.0, 178.0, 307.0, 540.0, 1098.0, 2580.0, 8799.0, 54963.0, 891288.0, 72697.0, 10012.0, 2985.0, 1220.0, 589.0, 292.0, 199.0, 135.0, 92.0, 47.0, 48.0, 31.0, 19.0, 12.0, 13.0, 8.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8359375, -1.771636962890625, -1.70733642578125, -1.643035888671875, -1.5787353515625, -1.514434814453125, -1.45013427734375, -1.385833740234375, -1.321533203125, -1.257232666015625, -1.19293212890625, -1.128631591796875, -1.0643310546875, -1.000030517578125, -0.93572998046875, -0.871429443359375, -0.80712890625, -0.742828369140625, -0.67852783203125, -0.614227294921875, -0.5499267578125, -0.485626220703125, -0.42132568359375, -0.357025146484375, -0.292724609375, -0.228424072265625, -0.16412353515625, -0.099822998046875, -0.0355224609375, 0.028778076171875, 0.09307861328125, 0.157379150390625, 0.2216796875, 0.285980224609375, 0.35028076171875, 0.414581298828125, 0.4788818359375, 0.543182373046875, 0.60748291015625, 0.671783447265625, 0.736083984375, 0.800384521484375, 0.86468505859375, 0.928985595703125, 0.9932861328125, 1.057586669921875, 1.12188720703125, 1.186187744140625, 1.25048828125, 1.314788818359375, 1.37908935546875, 1.443389892578125, 1.5076904296875, 1.571990966796875, 1.63629150390625, 1.700592041015625, 1.764892578125, 1.829193115234375, 1.89349365234375, 1.957794189453125, 2.0220947265625, 2.086395263671875, 2.15069580078125, 2.214996337890625, 2.279296875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 12.0, 12.0, 24.0, 67.0, 166.0, 343.0, 212.0, 70.0, 47.0, 19.0, 9.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7060546875, -0.6749114990234375, -0.643768310546875, -0.6126251220703125, -0.58148193359375, -0.5503387451171875, -0.519195556640625, -0.4880523681640625, -0.4569091796875, -0.4257659912109375, -0.394622802734375, -0.3634796142578125, -0.33233642578125, -0.3011932373046875, -0.270050048828125, -0.2389068603515625, -0.207763671875, -0.1766204833984375, -0.145477294921875, -0.1143341064453125, -0.08319091796875, -0.0520477294921875, -0.020904541015625, 0.0102386474609375, 0.0413818359375, 0.0725250244140625, 0.103668212890625, 0.1348114013671875, 0.16595458984375, 0.1970977783203125, 0.228240966796875, 0.2593841552734375, 0.29052734375, 0.3216705322265625, 0.352813720703125, 0.3839569091796875, 0.41510009765625, 0.4462432861328125, 0.477386474609375, 0.5085296630859375, 0.5396728515625, 0.5708160400390625, 0.601959228515625, 0.6331024169921875, 0.66424560546875, 0.6953887939453125, 0.726531982421875, 0.7576751708984375, 0.788818359375, 0.8199615478515625, 0.851104736328125, 0.8822479248046875, 0.91339111328125, 0.9445343017578125, 0.975677490234375, 1.0068206787109375, 1.0379638671875, 1.0691070556640625, 1.100250244140625, 1.1313934326171875, 1.16253662109375, 1.1936798095703125, 1.224822998046875, 1.2559661865234375, 1.287109375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 15.0, 23.0, 24.0, 116.0, 426.0, 264.0, 63.0, 30.0, 11.0, 7.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.598084449768066, -5.284798622131348, -4.971512794494629, -4.658227443695068, -4.34494161605835, -4.031655788421631, -3.718370199203491, -3.4050846099853516, -3.091798782348633, -2.778512954711914, -2.4652273654937744, -2.1519417762756348, -1.838655948638916, -1.5253702402114868, -1.2120845317840576, -0.898798942565918, -0.5855131149291992, -0.27222740650177, 0.04105830192565918, 0.3543440103530884, 0.6676297187805176, 0.9809154272079468, 1.294201135635376, 1.6074867248535156, 1.9207725524902344, 2.234058380126953, 2.5473439693450928, 2.8606295585632324, 3.173915386199951, 3.48720121383667, 3.8004868030548096, 4.113772392272949, 4.427057266235352, 4.74034309387207, 5.053628921508789, 5.36691427230835, 5.680200099945068, 5.993485927581787, 6.306771278381348, 6.620057106018066, 6.933342933654785, 7.246628761291504, 7.559914588928223, 7.873199939727783, 8.186485290527344, 8.499771118164062, 8.813056945800781, 9.1263427734375, 9.439628601074219, 9.752914428710938, 10.066200256347656, 10.379486083984375, 10.692771911621094, 11.006056785583496, 11.319342613220215, 11.632628440856934, 11.945914268493652, 12.259200096130371, 12.57248592376709, 12.885771751403809, 13.199056625366211, 13.51234245300293, 13.825628280639648, 14.138914108276367, 14.452199935913086]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 6.0, 9.0, 10.0, 12.0, 9.0, 11.0, 16.0, 23.0, 28.0, 35.0, 39.0, 33.0, 30.0, 48.0, 41.0, 51.0, 54.0, 60.0, 62.0, 51.0, 45.0, 41.0, 50.0, 34.0, 30.0, 24.0, 28.0, 17.0, 14.0, 15.0, 15.0, 12.0, 8.0, 10.0, 10.0, 5.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.364989995956421, -2.291995048522949, -2.2190001010894775, -2.146005153656006, -2.073010206222534, -2.0000152587890625, -1.9270203113555908, -1.8540253639221191, -1.7810304164886475, -1.7080354690551758, -1.635040521621704, -1.5620455741882324, -1.4890506267547607, -1.416055679321289, -1.3430607318878174, -1.2700657844543457, -1.197070837020874, -1.1240758895874023, -1.0510809421539307, -0.978085994720459, -0.9050910472869873, -0.8320960998535156, -0.759101152420044, -0.6861062049865723, -0.6131112575531006, -0.5401163101196289, -0.4671213626861572, -0.39412641525268555, -0.32113146781921387, -0.2481365203857422, -0.1751415729522705, -0.10214662551879883, -0.02915191650390625, 0.04384303092956543, 0.11683797836303711, 0.1898329257965088, 0.26282787322998047, 0.33582282066345215, 0.40881776809692383, 0.4818127155303955, 0.5548076629638672, 0.6278026103973389, 0.7007975578308105, 0.7737925052642822, 0.8467874526977539, 0.9197824001312256, 0.9927773475646973, 1.065772294998169, 1.1387672424316406, 1.2117621898651123, 1.284757137298584, 1.3577520847320557, 1.4307470321655273, 1.503741979598999, 1.5767369270324707, 1.6497318744659424, 1.722726821899414, 1.7957217693328857, 1.8687167167663574, 1.941711664199829, 2.014706611633301, 2.0877015590667725, 2.160696506500244, 2.233691453933716, 2.3066864013671875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 2.0, 9.0, 12.0, 8.0, 23.0, 31.0, 44.0, 45.0, 71.0, 107.0, 144.0, 250.0, 397.0, 712.0, 1299.0, 2384.0, 4733.0, 9652.0, 21086.0, 48355.0, 122887.0, 347408.0, 302472.0, 106997.0, 42501.0, 18814.0, 8692.0, 4370.0, 2083.0, 1185.0, 641.0, 381.0, 269.0, 142.0, 105.0, 81.0, 51.0, 31.0, 23.0, 21.0, 8.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32421875, -4.18878173828125, -4.0533447265625, -3.91790771484375, -3.782470703125, -3.64703369140625, -3.5115966796875, -3.37615966796875, -3.24072265625, -3.10528564453125, -2.9698486328125, -2.83441162109375, -2.698974609375, -2.56353759765625, -2.4281005859375, -2.29266357421875, -2.1572265625, -2.02178955078125, -1.8863525390625, -1.75091552734375, -1.615478515625, -1.48004150390625, -1.3446044921875, -1.20916748046875, -1.07373046875, -0.93829345703125, -0.8028564453125, -0.66741943359375, -0.531982421875, -0.39654541015625, -0.2611083984375, -0.12567138671875, 0.009765625, 0.14520263671875, 0.2806396484375, 0.41607666015625, 0.551513671875, 0.68695068359375, 0.8223876953125, 0.95782470703125, 1.09326171875, 1.22869873046875, 1.3641357421875, 1.49957275390625, 1.635009765625, 1.77044677734375, 1.9058837890625, 2.04132080078125, 2.1767578125, 2.31219482421875, 2.4476318359375, 2.58306884765625, 2.718505859375, 2.85394287109375, 2.9893798828125, 3.12481689453125, 3.26025390625, 3.39569091796875, 3.5311279296875, 3.66656494140625, 3.802001953125, 3.93743896484375, 4.0728759765625, 4.20831298828125, 4.34375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 8.0, 6.0, 10.0, 18.0, 15.0, 9.0, 9.0, 24.0, 26.0, 26.0, 40.0, 31.0, 48.0, 43.0, 45.0, 55.0, 58.0, 61.0, 46.0, 54.0, 48.0, 33.0, 43.0, 40.0, 29.0, 29.0, 23.0, 15.0, 15.0, 14.0, 16.0, 8.0, 7.0, 11.0, 5.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.416015625, -1.3734130859375, -1.330810546875, -1.2882080078125, -1.24560546875, -1.2030029296875, -1.160400390625, -1.1177978515625, -1.0751953125, -1.0325927734375, -0.989990234375, -0.9473876953125, -0.90478515625, -0.8621826171875, -0.819580078125, -0.7769775390625, -0.734375, -0.6917724609375, -0.649169921875, -0.6065673828125, -0.56396484375, -0.5213623046875, -0.478759765625, -0.4361572265625, -0.3935546875, -0.3509521484375, -0.308349609375, -0.2657470703125, -0.22314453125, -0.1805419921875, -0.137939453125, -0.0953369140625, -0.052734375, -0.0101318359375, 0.032470703125, 0.0750732421875, 0.11767578125, 0.1602783203125, 0.202880859375, 0.2454833984375, 0.2880859375, 0.3306884765625, 0.373291015625, 0.4158935546875, 0.45849609375, 0.5010986328125, 0.543701171875, 0.5863037109375, 0.62890625, 0.6715087890625, 0.714111328125, 0.7567138671875, 0.79931640625, 0.8419189453125, 0.884521484375, 0.9271240234375, 0.9697265625, 1.0123291015625, 1.054931640625, 1.0975341796875, 1.14013671875, 1.1827392578125, 1.225341796875, 1.2679443359375, 1.310546875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 4.0, 11.0, 10.0, 20.0, 25.0, 39.0, 47.0, 74.0, 133.0, 210.0, 263.0, 461.0, 672.0, 1084.0, 1929.0, 3360.0, 6395.0, 13184.0, 29153.0, 78095.0, 319410.0, 430293.0, 97096.0, 34878.0, 15049.0, 7371.0, 3813.0, 2164.0, 1193.0, 765.0, 477.0, 286.0, 199.0, 125.0, 83.0, 72.0, 44.0, 21.0, 15.0, 10.0, 11.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.4296875, -4.303466796875, -4.17724609375, -4.051025390625, -3.9248046875, -3.798583984375, -3.67236328125, -3.546142578125, -3.419921875, -3.293701171875, -3.16748046875, -3.041259765625, -2.9150390625, -2.788818359375, -2.66259765625, -2.536376953125, -2.41015625, -2.283935546875, -2.15771484375, -2.031494140625, -1.9052734375, -1.779052734375, -1.65283203125, -1.526611328125, -1.400390625, -1.274169921875, -1.14794921875, -1.021728515625, -0.8955078125, -0.769287109375, -0.64306640625, -0.516845703125, -0.390625, -0.264404296875, -0.13818359375, -0.011962890625, 0.1142578125, 0.240478515625, 0.36669921875, 0.492919921875, 0.619140625, 0.745361328125, 0.87158203125, 0.997802734375, 1.1240234375, 1.250244140625, 1.37646484375, 1.502685546875, 1.62890625, 1.755126953125, 1.88134765625, 2.007568359375, 2.1337890625, 2.260009765625, 2.38623046875, 2.512451171875, 2.638671875, 2.764892578125, 2.89111328125, 3.017333984375, 3.1435546875, 3.269775390625, 3.39599609375, 3.522216796875, 3.6484375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 9.0, 6.0, 7.0, 8.0, 8.0, 15.0, 14.0, 14.0, 25.0, 24.0, 27.0, 28.0, 29.0, 33.0, 38.0, 40.0, 34.0, 42.0, 41.0, 39.0, 45.0, 52.0, 39.0, 49.0, 39.0, 32.0, 36.0, 30.0, 27.0, 24.0, 18.0, 24.0, 13.0, 10.0, 13.0, 14.0, 7.0, 9.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.009765625, -0.9783477783203125, -0.946929931640625, -0.9155120849609375, -0.88409423828125, -0.8526763916015625, -0.821258544921875, -0.7898406982421875, -0.7584228515625, -0.7270050048828125, -0.695587158203125, -0.6641693115234375, -0.63275146484375, -0.6013336181640625, -0.569915771484375, -0.5384979248046875, -0.507080078125, -0.4756622314453125, -0.444244384765625, -0.4128265380859375, -0.38140869140625, -0.3499908447265625, -0.318572998046875, -0.2871551513671875, -0.2557373046875, -0.2243194580078125, -0.192901611328125, -0.1614837646484375, -0.13006591796875, -0.0986480712890625, -0.067230224609375, -0.0358123779296875, -0.00439453125, 0.0270233154296875, 0.058441162109375, 0.0898590087890625, 0.12127685546875, 0.1526947021484375, 0.184112548828125, 0.2155303955078125, 0.2469482421875, 0.2783660888671875, 0.309783935546875, 0.3412017822265625, 0.37261962890625, 0.4040374755859375, 0.435455322265625, 0.4668731689453125, 0.498291015625, 0.5297088623046875, 0.561126708984375, 0.5925445556640625, 0.62396240234375, 0.6553802490234375, 0.686798095703125, 0.7182159423828125, 0.7496337890625, 0.7810516357421875, 0.812469482421875, 0.8438873291015625, 0.87530517578125, 0.9067230224609375, 0.938140869140625, 0.9695587158203125, 1.0009765625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 7.0, 17.0, 17.0, 26.0, 20.0, 18.0, 52.0, 85.0, 116.0, 180.0, 240.0, 433.0, 1040.0, 2792.0, 14009.0, 944225.0, 75271.0, 6628.0, 1632.0, 714.0, 399.0, 208.0, 125.0, 82.0, 75.0, 52.0, 30.0, 22.0, 8.0, 7.0, 5.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -15.0643310546875, -14.480224609375, -13.8961181640625, -13.31201171875, -12.7279052734375, -12.143798828125, -11.5596923828125, -10.9755859375, -10.3914794921875, -9.807373046875, -9.2232666015625, -8.63916015625, -8.0550537109375, -7.470947265625, -6.8868408203125, -6.302734375, -5.7186279296875, -5.134521484375, -4.5504150390625, -3.96630859375, -3.3822021484375, -2.798095703125, -2.2139892578125, -1.6298828125, -1.0457763671875, -0.461669921875, 0.1224365234375, 0.70654296875, 1.2906494140625, 1.874755859375, 2.4588623046875, 3.04296875, 3.6270751953125, 4.211181640625, 4.7952880859375, 5.37939453125, 5.9635009765625, 6.547607421875, 7.1317138671875, 7.7158203125, 8.2999267578125, 8.884033203125, 9.4681396484375, 10.05224609375, 10.6363525390625, 11.220458984375, 11.8045654296875, 12.388671875, 12.9727783203125, 13.556884765625, 14.1409912109375, 14.72509765625, 15.3092041015625, 15.893310546875, 16.4774169921875, 17.0615234375, 17.6456298828125, 18.229736328125, 18.8138427734375, 19.39794921875, 19.9820556640625, 20.566162109375, 21.1502685546875, 21.734375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 8.0, 10.0, 19.0, 27.0, 29.0, 53.0, 77.0, 122.0, 290.0, 124.0, 66.0, 62.0, 40.0, 20.0, 14.0, 10.0, 6.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017023086547851562, -0.00016425922513008118, -0.00015828758478164673, -0.00015231594443321228, -0.00014634430408477783, -0.00014037266373634338, -0.00013440102338790894, -0.0001284293830394745, -0.00012245774269104004, -0.00011648610234260559, -0.00011051446199417114, -0.0001045428216457367, -9.857118129730225e-05, -9.25995409488678e-05, -8.662790060043335e-05, -8.06562602519989e-05, -7.468461990356445e-05, -6.871297955513e-05, -6.274133920669556e-05, -5.676969885826111e-05, -5.079805850982666e-05, -4.482641816139221e-05, -3.8854777812957764e-05, -3.2883137464523315e-05, -2.6911497116088867e-05, -2.093985676765442e-05, -1.496821641921997e-05, -8.996576070785522e-06, -3.0249357223510742e-06, 2.946704626083374e-06, 8.918344974517822e-06, 1.488998532295227e-05, 2.086162567138672e-05, 2.6833266019821167e-05, 3.2804906368255615e-05, 3.8776546716690063e-05, 4.474818706512451e-05, 5.071982741355896e-05, 5.669146776199341e-05, 6.266310811042786e-05, 6.86347484588623e-05, 7.460638880729675e-05, 8.05780291557312e-05, 8.654966950416565e-05, 9.25213098526001e-05, 9.849295020103455e-05, 0.000104464590549469, 0.00011043623089790344, 0.00011640787124633789, 0.00012237951159477234, 0.0001283511519432068, 0.00013432279229164124, 0.00014029443264007568, 0.00014626607298851013, 0.00015223771333694458, 0.00015820935368537903, 0.00016418099403381348, 0.00017015263438224792, 0.00017612427473068237, 0.00018209591507911682, 0.00018806755542755127, 0.00019403919577598572, 0.00020001083612442017, 0.00020598247647285461, 0.00021195411682128906]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 5.0, 12.0, 9.0, 15.0, 17.0, 26.0, 31.0, 42.0, 61.0, 88.0, 120.0, 164.0, 236.0, 367.0, 724.0, 1529.0, 3875.0, 18154.0, 936072.0, 74263.0, 7820.0, 2331.0, 1016.0, 538.0, 316.0, 210.0, 136.0, 79.0, 74.0, 48.0, 31.0, 33.0, 20.0, 14.0, 17.0, 13.0, 6.0, 8.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -14.072509765625, -13.62939453125, -13.186279296875, -12.7431640625, -12.300048828125, -11.85693359375, -11.413818359375, -10.970703125, -10.527587890625, -10.08447265625, -9.641357421875, -9.1982421875, -8.755126953125, -8.31201171875, -7.868896484375, -7.42578125, -6.982666015625, -6.53955078125, -6.096435546875, -5.6533203125, -5.210205078125, -4.76708984375, -4.323974609375, -3.880859375, -3.437744140625, -2.99462890625, -2.551513671875, -2.1083984375, -1.665283203125, -1.22216796875, -0.779052734375, -0.3359375, 0.107177734375, 0.55029296875, 0.993408203125, 1.4365234375, 1.879638671875, 2.32275390625, 2.765869140625, 3.208984375, 3.652099609375, 4.09521484375, 4.538330078125, 4.9814453125, 5.424560546875, 5.86767578125, 6.310791015625, 6.75390625, 7.197021484375, 7.64013671875, 8.083251953125, 8.5263671875, 8.969482421875, 9.41259765625, 9.855712890625, 10.298828125, 10.741943359375, 11.18505859375, 11.628173828125, 12.0712890625, 12.514404296875, 12.95751953125, 13.400634765625, 13.84375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 13.0, 18.0, 40.0, 63.0, 120.0, 394.0, 155.0, 78.0, 41.0, 26.0, 16.0, 12.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9072265625, -1.8359222412109375, -1.764617919921875, -1.6933135986328125, -1.62200927734375, -1.5507049560546875, -1.479400634765625, -1.4080963134765625, -1.3367919921875, -1.2654876708984375, -1.194183349609375, -1.1228790283203125, -1.05157470703125, -0.9802703857421875, -0.908966064453125, -0.8376617431640625, -0.766357421875, -0.6950531005859375, -0.623748779296875, -0.5524444580078125, -0.48114013671875, -0.4098358154296875, -0.338531494140625, -0.2672271728515625, -0.1959228515625, -0.1246185302734375, -0.053314208984375, 0.0179901123046875, 0.08929443359375, 0.1605987548828125, 0.231903076171875, 0.3032073974609375, 0.37451171875, 0.4458160400390625, 0.517120361328125, 0.5884246826171875, 0.65972900390625, 0.7310333251953125, 0.802337646484375, 0.8736419677734375, 0.9449462890625, 1.0162506103515625, 1.087554931640625, 1.1588592529296875, 1.23016357421875, 1.3014678955078125, 1.372772216796875, 1.4440765380859375, 1.515380859375, 1.5866851806640625, 1.657989501953125, 1.7292938232421875, 1.80059814453125, 1.8719024658203125, 1.943206787109375, 2.0145111083984375, 2.0858154296875, 2.1571197509765625, 2.228424072265625, 2.2997283935546875, 2.37103271484375, 2.4423370361328125, 2.513641357421875, 2.5849456787109375, 2.65625]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 3.0, 3.0, 8.0, 10.0, 17.0, 25.0, 33.0, 67.0, 110.0, 254.0, 306.0, 85.0, 34.0, 15.0, 7.0, 10.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.084416389465332, -4.951287269592285, -4.818158149719238, -4.685028553009033, -4.551899433135986, -4.4187703132629395, -4.285640716552734, -4.1525115966796875, -4.019382476806641, -3.8862533569335938, -3.7531239986419678, -3.619994640350342, -3.486865520477295, -3.353736400604248, -3.220607042312622, -3.087477684020996, -2.954348564147949, -2.8212194442749023, -2.6880900859832764, -2.5549607276916504, -2.4218316078186035, -2.2887024879455566, -2.1555731296539307, -2.0224437713623047, -1.8893146514892578, -1.7561854124069214, -1.623056173324585, -1.4899269342422485, -1.356797695159912, -1.2236684560775757, -1.0905392169952393, -0.9574099779129028, -0.8242802619934082, -0.6911510229110718, -0.5580217838287354, -0.4248925447463989, -0.2917633056640625, -0.15863406658172607, -0.02550482749938965, 0.10762441158294678, 0.2407536506652832, 0.37388288974761963, 0.507012128829956, 0.6401413679122925, 0.7732706069946289, 0.9063998460769653, 1.0395290851593018, 1.1726583242416382, 1.3057875633239746, 1.438916802406311, 1.5720460414886475, 1.7051752805709839, 1.8383045196533203, 1.9714337587356567, 2.104562997817993, 2.237692356109619, 2.370821475982666, 2.503950595855713, 2.637079954147339, 2.770209312438965, 2.9033384323120117, 3.0364675521850586, 3.1695969104766846, 3.3027262687683105, 3.4358553886413574]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 4.0, 7.0, 3.0, 4.0, 13.0, 13.0, 15.0, 19.0, 20.0, 23.0, 36.0, 39.0, 43.0, 37.0, 38.0, 39.0, 52.0, 61.0, 53.0, 60.0, 39.0, 43.0, 46.0, 48.0, 33.0, 32.0, 21.0, 24.0, 25.0, 17.0, 13.0, 16.0, 14.0, 9.0, 9.0, 7.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6580816507339478, -1.609861969947815, -1.5616422891616821, -1.5134227275848389, -1.465203046798706, -1.4169833660125732, -1.3687636852264404, -1.3205440044403076, -1.2723243236541748, -1.224104642868042, -1.1758849620819092, -1.1276652812957764, -1.079445719718933, -1.0312260389328003, -0.9830063581466675, -0.9347866773605347, -0.8865671157836914, -0.8383474349975586, -0.7901278138160706, -0.7419081330299377, -0.6936885118484497, -0.6454688310623169, -0.5972491502761841, -0.5490294694900513, -0.5008098483085632, -0.4525901973247528, -0.4043705463409424, -0.35615086555480957, -0.30793121457099915, -0.2597115635871887, -0.2114918828010559, -0.16327223181724548, -0.11505258083343506, -0.06683292239904404, -0.018613263964653015, 0.029606401920318604, 0.07782605290412903, 0.12604570388793945, 0.17426538467407227, 0.2224850356578827, 0.2707046866416931, 0.31892433762550354, 0.36714398860931396, 0.4153636693954468, 0.4635833203792572, 0.5118029713630676, 0.5600226521492004, 0.6082422733306885, 0.6564619541168213, 0.7046816349029541, 0.7529012560844421, 0.801120936870575, 0.849340558052063, 0.8975602388381958, 0.9457799196243286, 0.9939996004104614, 1.0422191619873047, 1.0904388427734375, 1.1386585235595703, 1.1868782043457031, 1.2350977659225464, 1.2833174467086792, 1.331537127494812, 1.3797568082809448, 1.4279764890670776]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 5.0, 9.0, 13.0, 25.0, 30.0, 54.0, 63.0, 89.0, 122.0, 166.0, 211.0, 314.0, 439.0, 693.0, 1022.0, 1447.0, 2225.0, 3210.0, 4610.0, 7269.0, 11258.0, 18586.0, 32066.0, 57810.0, 117948.0, 320073.0, 1978831.0, 1198185.0, 226102.0, 93254.0, 47908.0, 27166.0, 16045.0, 9762.0, 6184.0, 3957.0, 2593.0, 1634.0, 977.0, 664.0, 413.0, 275.0, 204.0, 133.0, 89.0, 62.0, 37.0, 26.0, 12.0, 9.0, 8.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.580078125, -1.5347442626953125, -1.489410400390625, -1.4440765380859375, -1.39874267578125, -1.3534088134765625, -1.308074951171875, -1.2627410888671875, -1.2174072265625, -1.1720733642578125, -1.126739501953125, -1.0814056396484375, -1.03607177734375, -0.9907379150390625, -0.945404052734375, -0.9000701904296875, -0.854736328125, -0.8094024658203125, -0.764068603515625, -0.7187347412109375, -0.67340087890625, -0.6280670166015625, -0.582733154296875, -0.5373992919921875, -0.4920654296875, -0.4467315673828125, -0.401397705078125, -0.3560638427734375, -0.31072998046875, -0.2653961181640625, -0.220062255859375, -0.1747283935546875, -0.12939453125, -0.0840606689453125, -0.038726806640625, 0.0066070556640625, 0.05194091796875, 0.0972747802734375, 0.142608642578125, 0.1879425048828125, 0.2332763671875, 0.2786102294921875, 0.323944091796875, 0.3692779541015625, 0.41461181640625, 0.4599456787109375, 0.505279541015625, 0.5506134033203125, 0.595947265625, 0.6412811279296875, 0.686614990234375, 0.7319488525390625, 0.77728271484375, 0.8226165771484375, 0.867950439453125, 0.9132843017578125, 0.9586181640625, 1.0039520263671875, 1.049285888671875, 1.0946197509765625, 1.13995361328125, 1.1852874755859375, 1.230621337890625, 1.2759552001953125, 1.3212890625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 6.0, 9.0, 4.0, 5.0, 8.0, 9.0, 11.0, 14.0, 14.0, 19.0, 32.0, 38.0, 27.0, 29.0, 39.0, 42.0, 38.0, 45.0, 50.0, 44.0, 56.0, 49.0, 43.0, 45.0, 44.0, 41.0, 30.0, 36.0, 23.0, 15.0, 20.0, 18.0, 13.0, 16.0, 15.0, 17.0, 6.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.482666015625, -0.46929168701171875, -0.4559173583984375, -0.44254302978515625, -0.429168701171875, -0.41579437255859375, -0.4024200439453125, -0.38904571533203125, -0.37567138671875, -0.36229705810546875, -0.3489227294921875, -0.33554840087890625, -0.322174072265625, -0.30879974365234375, -0.2954254150390625, -0.28205108642578125, -0.2686767578125, -0.25530242919921875, -0.2419281005859375, -0.22855377197265625, -0.215179443359375, -0.20180511474609375, -0.1884307861328125, -0.17505645751953125, -0.16168212890625, -0.14830780029296875, -0.1349334716796875, -0.12155914306640625, -0.108184814453125, -0.09481048583984375, -0.0814361572265625, -0.06806182861328125, -0.0546875, -0.04131317138671875, -0.0279388427734375, -0.01456451416015625, -0.001190185546875, 0.01218414306640625, 0.0255584716796875, 0.03893280029296875, 0.05230712890625, 0.06568145751953125, 0.0790557861328125, 0.09243011474609375, 0.105804443359375, 0.11917877197265625, 0.1325531005859375, 0.14592742919921875, 0.1593017578125, 0.17267608642578125, 0.1860504150390625, 0.19942474365234375, 0.212799072265625, 0.22617340087890625, 0.2395477294921875, 0.25292205810546875, 0.26629638671875, 0.27967071533203125, 0.2930450439453125, 0.30641937255859375, 0.319793701171875, 0.33316802978515625, 0.3465423583984375, 0.35991668701171875, 0.373291015625]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 13.0, 12.0, 20.0, 27.0, 45.0, 50.0, 101.0, 142.0, 210.0, 301.0, 464.0, 764.0, 1239.0, 2088.0, 4015.0, 7823.0, 15954.0, 38019.0, 114528.0, 529882.0, 2720487.0, 564383.0, 120221.0, 39331.0, 16455.0, 7779.0, 4155.0, 2248.0, 1329.0, 795.0, 472.0, 327.0, 205.0, 129.0, 92.0, 54.0, 36.0, 25.0, 17.0, 15.0, 9.0, 3.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2861328125, -1.243988037109375, -1.20184326171875, -1.159698486328125, -1.1175537109375, -1.075408935546875, -1.03326416015625, -0.991119384765625, -0.948974609375, -0.906829833984375, -0.86468505859375, -0.822540283203125, -0.7803955078125, -0.738250732421875, -0.69610595703125, -0.653961181640625, -0.61181640625, -0.569671630859375, -0.52752685546875, -0.485382080078125, -0.4432373046875, -0.401092529296875, -0.35894775390625, -0.316802978515625, -0.274658203125, -0.232513427734375, -0.19036865234375, -0.148223876953125, -0.1060791015625, -0.063934326171875, -0.02178955078125, 0.020355224609375, 0.0625, 0.104644775390625, 0.14678955078125, 0.188934326171875, 0.2310791015625, 0.273223876953125, 0.31536865234375, 0.357513427734375, 0.399658203125, 0.441802978515625, 0.48394775390625, 0.526092529296875, 0.5682373046875, 0.610382080078125, 0.65252685546875, 0.694671630859375, 0.73681640625, 0.778961181640625, 0.82110595703125, 0.863250732421875, 0.9053955078125, 0.947540283203125, 0.98968505859375, 1.031829833984375, 1.073974609375, 1.116119384765625, 1.15826416015625, 1.200408935546875, 1.2425537109375, 1.284698486328125, 1.32684326171875, 1.368988037109375, 1.4111328125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 3.0, 4.0, 7.0, 8.0, 11.0, 18.0, 13.0, 19.0, 19.0, 33.0, 33.0, 34.0, 46.0, 47.0, 62.0, 72.0, 111.0, 143.0, 186.0, 237.0, 281.0, 339.0, 423.0, 393.0, 297.0, 285.0, 193.0, 158.0, 140.0, 102.0, 81.0, 68.0, 48.0, 37.0, 37.0, 18.0, 23.0, 10.0, 10.0, 9.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.275634765625, -0.26827239990234375, -0.2609100341796875, -0.25354766845703125, -0.246185302734375, -0.23882293701171875, -0.2314605712890625, -0.22409820556640625, -0.21673583984375, -0.20937347412109375, -0.2020111083984375, -0.19464874267578125, -0.187286376953125, -0.17992401123046875, -0.1725616455078125, -0.16519927978515625, -0.1578369140625, -0.15047454833984375, -0.1431121826171875, -0.13574981689453125, -0.128387451171875, -0.12102508544921875, -0.1136627197265625, -0.10630035400390625, -0.09893798828125, -0.09157562255859375, -0.0842132568359375, -0.07685089111328125, -0.069488525390625, -0.06212615966796875, -0.0547637939453125, -0.04740142822265625, -0.0400390625, -0.03267669677734375, -0.0253143310546875, -0.01795196533203125, -0.010589599609375, -0.00322723388671875, 0.0041351318359375, 0.01149749755859375, 0.01885986328125, 0.02622222900390625, 0.0335845947265625, 0.04094696044921875, 0.048309326171875, 0.05567169189453125, 0.0630340576171875, 0.07039642333984375, 0.0777587890625, 0.08512115478515625, 0.0924835205078125, 0.09984588623046875, 0.107208251953125, 0.11457061767578125, 0.1219329833984375, 0.12929534912109375, 0.13665771484375, 0.14402008056640625, 0.1513824462890625, 0.15874481201171875, 0.166107177734375, 0.17346954345703125, 0.1808319091796875, 0.18819427490234375, 0.195556640625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 20.0, 21.0, 24.0, 37.0, 73.0, 136.0, 228.0, 233.0, 101.0, 41.0, 17.0, 18.0, 10.0, 6.0, 7.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3627512454986572, -1.3213934898376465, -1.2800357341766357, -1.238677978515625, -1.1973202228546143, -1.1559624671936035, -1.1146047115325928, -1.073246955871582, -1.0318892002105713, -0.9905314445495605, -0.9491736888885498, -0.9078159332275391, -0.8664581775665283, -0.8251004219055176, -0.7837427258491516, -0.7423849701881409, -0.7010272741317749, -0.6596695184707642, -0.6183117628097534, -0.5769540071487427, -0.5355962514877319, -0.4942385256290436, -0.4528807997703552, -0.4115230441093445, -0.37016528844833374, -0.328807532787323, -0.28744977712631226, -0.2460920512676239, -0.20473429560661316, -0.16337653994560242, -0.12201879918575287, -0.08066105842590332, -0.03930318355560303, 0.002054564654827118, 0.04341231286525726, 0.08477006107568741, 0.12612780928611755, 0.1674855649471283, 0.20884330570697784, 0.2502010464668274, 0.29155880212783813, 0.3329165577888489, 0.3742743134498596, 0.415632039308548, 0.4569897949695587, 0.49834755063056946, 0.5397052764892578, 0.5810630321502686, 0.6224207878112793, 0.66377854347229, 0.7051362991333008, 0.7464940547943115, 0.7878518104553223, 0.829209566116333, 0.870567262172699, 0.9119250178337097, 0.9532827734947205, 0.9946405291557312, 1.0359982252120972, 1.077355980873108, 1.1187137365341187, 1.1600714921951294, 1.2014292478561401, 1.2427870035171509, 1.2841447591781616]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 5.0, 3.0, 6.0, 5.0, 4.0, 8.0, 15.0, 11.0, 16.0, 11.0, 18.0, 17.0, 35.0, 27.0, 32.0, 37.0, 42.0, 45.0, 49.0, 43.0, 34.0, 48.0, 42.0, 48.0, 43.0, 52.0, 38.0, 29.0, 38.0, 26.0, 30.0, 17.0, 19.0, 21.0, 17.0, 15.0, 10.0, 12.0, 5.0, 10.0, 9.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47232919931411743, -0.45789918303489685, -0.44346919655799866, -0.4290391802787781, -0.4146091639995575, -0.4001791477203369, -0.3857491612434387, -0.37131914496421814, -0.35688912868499756, -0.342459112405777, -0.3280291259288788, -0.3135991096496582, -0.2991690933704376, -0.28473907709121704, -0.27030909061431885, -0.25587907433509827, -0.24144907295703888, -0.2270190715789795, -0.2125890552997589, -0.19815905392169952, -0.18372903764247894, -0.16929903626441956, -0.15486901998519897, -0.1404390186071396, -0.1260090172290802, -0.11157900840044022, -0.09714899957180023, -0.08271899819374084, -0.06828898191452026, -0.053858980536460876, -0.03942897170782089, -0.024998962879180908, -0.010568946599960327, 0.0038610612973570824, 0.018291069194674492, 0.03272107616066933, 0.04715108498930931, 0.061581090092659, 0.07601109892129898, 0.09044110774993896, 0.10487111657857895, 0.11930112540721893, 0.13373112678527832, 0.1481611430644989, 0.1625911444425583, 0.17702114582061768, 0.19145116209983826, 0.20588117837905884, 0.22031117975711823, 0.2347411811351776, 0.2491711974143982, 0.2636012136936188, 0.27803120017051697, 0.29246121644973755, 0.30689123272895813, 0.3213212490081787, 0.3357512354850769, 0.3501812517642975, 0.3646112382411957, 0.37904125452041626, 0.39347127079963684, 0.4079012870788574, 0.4223312735557556, 0.4367612898349762, 0.4511913061141968]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 0.0, 5.0, 6.0, 4.0, 7.0, 13.0, 15.0, 22.0, 29.0, 57.0, 75.0, 106.0, 155.0, 243.0, 362.0, 556.0, 768.0, 1356.0, 1973.0, 3069.0, 5074.0, 8739.0, 17036.0, 42510.0, 155481.0, 538423.0, 182697.0, 47338.0, 18752.0, 9313.0, 5248.0, 3213.0, 2022.0, 1298.0, 834.0, 602.0, 397.0, 258.0, 159.0, 105.0, 86.0, 49.0, 35.0, 21.0, 17.0, 10.0, 10.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68310546875, -0.6599884033203125, -0.636871337890625, -0.6137542724609375, -0.59063720703125, -0.5675201416015625, -0.544403076171875, -0.5212860107421875, -0.4981689453125, -0.4750518798828125, -0.451934814453125, -0.4288177490234375, -0.40570068359375, -0.3825836181640625, -0.359466552734375, -0.3363494873046875, -0.313232421875, -0.2901153564453125, -0.266998291015625, -0.2438812255859375, -0.22076416015625, -0.1976470947265625, -0.174530029296875, -0.1514129638671875, -0.1282958984375, -0.1051788330078125, -0.082061767578125, -0.0589447021484375, -0.03582763671875, -0.0127105712890625, 0.010406494140625, 0.0335235595703125, 0.056640625, 0.0797576904296875, 0.102874755859375, 0.1259918212890625, 0.14910888671875, 0.1722259521484375, 0.195343017578125, 0.2184600830078125, 0.2415771484375, 0.2646942138671875, 0.287811279296875, 0.3109283447265625, 0.33404541015625, 0.3571624755859375, 0.380279541015625, 0.4033966064453125, 0.426513671875, 0.4496307373046875, 0.472747802734375, 0.4958648681640625, 0.51898193359375, 0.5420989990234375, 0.565216064453125, 0.5883331298828125, 0.6114501953125, 0.6345672607421875, 0.657684326171875, 0.6808013916015625, 0.70391845703125, 0.7270355224609375, 0.750152587890625, 0.7732696533203125, 0.79638671875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 8.0, 8.0, 12.0, 8.0, 13.0, 14.0, 17.0, 19.0, 23.0, 18.0, 39.0, 25.0, 38.0, 41.0, 35.0, 46.0, 42.0, 37.0, 49.0, 43.0, 30.0, 46.0, 36.0, 38.0, 45.0, 42.0, 29.0, 32.0, 20.0, 20.0, 17.0, 18.0, 13.0, 14.0, 9.0, 12.0, 10.0, 7.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.388916015625, -0.37705230712890625, -0.3651885986328125, -0.35332489013671875, -0.341461181640625, -0.32959747314453125, -0.3177337646484375, -0.30587005615234375, -0.29400634765625, -0.28214263916015625, -0.2702789306640625, -0.25841522216796875, -0.246551513671875, -0.23468780517578125, -0.2228240966796875, -0.21096038818359375, -0.1990966796875, -0.18723297119140625, -0.1753692626953125, -0.16350555419921875, -0.151641845703125, -0.13977813720703125, -0.1279144287109375, -0.11605072021484375, -0.10418701171875, -0.09232330322265625, -0.0804595947265625, -0.06859588623046875, -0.056732177734375, -0.04486846923828125, -0.0330047607421875, -0.02114105224609375, -0.00927734375, 0.00258636474609375, 0.0144500732421875, 0.02631378173828125, 0.038177490234375, 0.05004119873046875, 0.0619049072265625, 0.07376861572265625, 0.08563232421875, 0.09749603271484375, 0.1093597412109375, 0.12122344970703125, 0.133087158203125, 0.14495086669921875, 0.1568145751953125, 0.16867828369140625, 0.1805419921875, 0.19240570068359375, 0.2042694091796875, 0.21613311767578125, 0.227996826171875, 0.23986053466796875, 0.2517242431640625, 0.26358795166015625, 0.27545166015625, 0.28731536865234375, 0.2991790771484375, 0.31104278564453125, 0.322906494140625, 0.33477020263671875, 0.3466339111328125, 0.35849761962890625, 0.370361328125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 9.0, 8.0, 12.0, 24.0, 34.0, 38.0, 62.0, 157.0, 244.0, 473.0, 1092.0, 2652.0, 8359.0, 48749.0, 894044.0, 76728.0, 10278.0, 3115.0, 1281.0, 538.0, 267.0, 138.0, 87.0, 58.0, 32.0, 17.0, 15.0, 8.0, 7.0, 6.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9921875, -1.919952392578125, -1.84771728515625, -1.775482177734375, -1.7032470703125, -1.631011962890625, -1.55877685546875, -1.486541748046875, -1.414306640625, -1.342071533203125, -1.26983642578125, -1.197601318359375, -1.1253662109375, -1.053131103515625, -0.98089599609375, -0.908660888671875, -0.83642578125, -0.764190673828125, -0.69195556640625, -0.619720458984375, -0.5474853515625, -0.475250244140625, -0.40301513671875, -0.330780029296875, -0.258544921875, -0.186309814453125, -0.11407470703125, -0.041839599609375, 0.0303955078125, 0.102630615234375, 0.17486572265625, 0.247100830078125, 0.3193359375, 0.391571044921875, 0.46380615234375, 0.536041259765625, 0.6082763671875, 0.680511474609375, 0.75274658203125, 0.824981689453125, 0.897216796875, 0.969451904296875, 1.04168701171875, 1.113922119140625, 1.1861572265625, 1.258392333984375, 1.33062744140625, 1.402862548828125, 1.47509765625, 1.547332763671875, 1.61956787109375, 1.691802978515625, 1.7640380859375, 1.836273193359375, 1.90850830078125, 1.980743408203125, 2.052978515625, 2.125213623046875, 2.19744873046875, 2.269683837890625, 2.3419189453125, 2.414154052734375, 2.48638916015625, 2.558624267578125, 2.630859375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 6.0, 9.0, 11.0, 11.0, 19.0, 27.0, 26.0, 29.0, 31.0, 37.0, 37.0, 48.0, 42.0, 50.0, 52.0, 49.0, 41.0, 30.0, 48.0, 41.0, 44.0, 41.0, 31.0, 43.0, 33.0, 37.0, 24.0, 17.0, 17.0, 16.0, 12.0, 7.0, 8.0, 6.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.304443359375, -0.29537200927734375, -0.2863006591796875, -0.27722930908203125, -0.268157958984375, -0.25908660888671875, -0.2500152587890625, -0.24094390869140625, -0.23187255859375, -0.22280120849609375, -0.2137298583984375, -0.20465850830078125, -0.195587158203125, -0.18651580810546875, -0.1774444580078125, -0.16837310791015625, -0.1593017578125, -0.15023040771484375, -0.1411590576171875, -0.13208770751953125, -0.123016357421875, -0.11394500732421875, -0.1048736572265625, -0.09580230712890625, -0.08673095703125, -0.07765960693359375, -0.0685882568359375, -0.05951690673828125, -0.050445556640625, -0.04137420654296875, -0.0323028564453125, -0.02323150634765625, -0.01416015625, -0.00508880615234375, 0.0039825439453125, 0.01305389404296875, 0.022125244140625, 0.03119659423828125, 0.0402679443359375, 0.04933929443359375, 0.05841064453125, 0.06748199462890625, 0.0765533447265625, 0.08562469482421875, 0.094696044921875, 0.10376739501953125, 0.1128387451171875, 0.12191009521484375, 0.1309814453125, 0.14005279541015625, 0.1491241455078125, 0.15819549560546875, 0.167266845703125, 0.17633819580078125, 0.1854095458984375, 0.19448089599609375, 0.20355224609375, 0.21262359619140625, 0.2216949462890625, 0.23076629638671875, 0.239837646484375, 0.24890899658203125, 0.2579803466796875, 0.26705169677734375, 0.276123046875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 3.0, 5.0, 10.0, 20.0, 22.0, 41.0, 37.0, 51.0, 66.0, 91.0, 126.0, 221.0, 338.0, 512.0, 799.0, 1313.0, 2403.0, 4999.0, 11120.0, 31322.0, 137046.0, 671395.0, 133589.0, 30926.0, 11099.0, 4884.0, 2453.0, 1307.0, 803.0, 482.0, 318.0, 229.0, 160.0, 101.0, 69.0, 43.0, 35.0, 21.0, 27.0, 21.0, 7.0, 10.0, 5.0, 2.0, 4.0, 5.0, 3.0, 4.0], "bins": [-0.28076171875, -0.2732734680175781, -0.26578521728515625, -0.2582969665527344, -0.2508087158203125, -0.24332046508789062, -0.23583221435546875, -0.22834396362304688, -0.220855712890625, -0.21336746215820312, -0.20587921142578125, -0.19839096069335938, -0.1909027099609375, -0.18341445922851562, -0.17592620849609375, -0.16843795776367188, -0.16094970703125, -0.15346145629882812, -0.14597320556640625, -0.13848495483398438, -0.1309967041015625, -0.12350845336914062, -0.11602020263671875, -0.10853195190429688, -0.101043701171875, -0.09355545043945312, -0.08606719970703125, -0.07857894897460938, -0.0710906982421875, -0.06360244750976562, -0.05611419677734375, -0.048625946044921875, -0.0411376953125, -0.033649444580078125, -0.02616119384765625, -0.018672943115234375, -0.0111846923828125, -0.003696441650390625, 0.00379180908203125, 0.011280059814453125, 0.018768310546875, 0.026256561279296875, 0.03374481201171875, 0.041233062744140625, 0.0487213134765625, 0.056209564208984375, 0.06369781494140625, 0.07118606567382812, 0.07867431640625, 0.08616256713867188, 0.09365081787109375, 0.10113906860351562, 0.1086273193359375, 0.11611557006835938, 0.12360382080078125, 0.13109207153320312, 0.138580322265625, 0.14606857299804688, 0.15355682373046875, 0.16104507446289062, 0.1685333251953125, 0.17602157592773438, 0.18350982666015625, 0.19099807739257812, 0.198486328125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 8.0, 14.0, 21.0, 30.0, 44.0, 75.0, 104.0, 196.0, 195.0, 114.0, 48.0, 42.0, 15.0, 17.0, 13.0, 7.0, 9.0, 11.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2292137145996094e-05, -2.1548941731452942e-05, -2.080574631690979e-05, -2.0062550902366638e-05, -1.9319355487823486e-05, -1.8576160073280334e-05, -1.7832964658737183e-05, -1.708976924419403e-05, -1.634657382965088e-05, -1.5603378415107727e-05, -1.4860183000564575e-05, -1.4116987586021423e-05, -1.3373792171478271e-05, -1.263059675693512e-05, -1.1887401342391968e-05, -1.1144205927848816e-05, -1.0401010513305664e-05, -9.657815098762512e-06, -8.91461968421936e-06, -8.171424269676208e-06, -7.428228855133057e-06, -6.685033440589905e-06, -5.941838026046753e-06, -5.198642611503601e-06, -4.455447196960449e-06, -3.7122517824172974e-06, -2.9690563678741455e-06, -2.2258609533309937e-06, -1.4826655387878418e-06, -7.394701242446899e-07, 3.725290298461914e-09, 7.469207048416138e-07, 1.4901161193847656e-06, 2.2333115339279175e-06, 2.9765069484710693e-06, 3.719702363014221e-06, 4.462897777557373e-06, 5.206093192100525e-06, 5.949288606643677e-06, 6.692484021186829e-06, 7.4356794357299805e-06, 8.178874850273132e-06, 8.922070264816284e-06, 9.665265679359436e-06, 1.0408461093902588e-05, 1.115165650844574e-05, 1.1894851922988892e-05, 1.2638047337532043e-05, 1.3381242752075195e-05, 1.4124438166618347e-05, 1.4867633581161499e-05, 1.561082899570465e-05, 1.6354024410247803e-05, 1.7097219824790955e-05, 1.7840415239334106e-05, 1.8583610653877258e-05, 1.932680606842041e-05, 2.0070001482963562e-05, 2.0813196897506714e-05, 2.1556392312049866e-05, 2.2299587726593018e-05, 2.304278314113617e-05, 2.378597855567932e-05, 2.4529173970222473e-05, 2.5272369384765625e-05]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 10.0, 10.0, 7.0, 19.0, 30.0, 47.0, 49.0, 74.0, 116.0, 173.0, 300.0, 439.0, 732.0, 1343.0, 2502.0, 5189.0, 12308.0, 36116.0, 158768.0, 652617.0, 125659.0, 31061.0, 10872.0, 4724.0, 2222.0, 1223.0, 712.0, 422.0, 260.0, 176.0, 112.0, 69.0, 52.0, 38.0, 32.0, 20.0, 8.0, 11.0, 6.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1846923828125, -0.17932891845703125, -0.1739654541015625, -0.16860198974609375, -0.163238525390625, -0.15787506103515625, -0.1525115966796875, -0.14714813232421875, -0.14178466796875, -0.13642120361328125, -0.1310577392578125, -0.12569427490234375, -0.120330810546875, -0.11496734619140625, -0.1096038818359375, -0.10424041748046875, -0.098876953125, -0.09351348876953125, -0.0881500244140625, -0.08278656005859375, -0.077423095703125, -0.07205963134765625, -0.0666961669921875, -0.06133270263671875, -0.05596923828125, -0.05060577392578125, -0.0452423095703125, -0.03987884521484375, -0.034515380859375, -0.02915191650390625, -0.0237884521484375, -0.01842498779296875, -0.0130615234375, -0.00769805908203125, -0.0023345947265625, 0.00302886962890625, 0.008392333984375, 0.01375579833984375, 0.0191192626953125, 0.02448272705078125, 0.02984619140625, 0.03520965576171875, 0.0405731201171875, 0.04593658447265625, 0.051300048828125, 0.05666351318359375, 0.0620269775390625, 0.06739044189453125, 0.07275390625, 0.07811737060546875, 0.0834808349609375, 0.08884429931640625, 0.094207763671875, 0.09957122802734375, 0.1049346923828125, 0.11029815673828125, 0.11566162109375, 0.12102508544921875, 0.1263885498046875, 0.13175201416015625, 0.137115478515625, 0.14247894287109375, 0.1478424072265625, 0.15320587158203125, 0.1585693359375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 6.0, 11.0, 6.0, 15.0, 26.0, 25.0, 24.0, 30.0, 62.0, 47.0, 73.0, 84.0, 94.0, 86.0, 105.0, 61.0, 62.0, 34.0, 34.0, 27.0, 31.0, 15.0, 12.0, 12.0, 5.0, 6.0, 3.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05218505859375, -0.0507659912109375, -0.049346923828125, -0.0479278564453125, -0.0465087890625, -0.0450897216796875, -0.043670654296875, -0.0422515869140625, -0.04083251953125, -0.0394134521484375, -0.037994384765625, -0.0365753173828125, -0.03515625, -0.0337371826171875, -0.032318115234375, -0.0308990478515625, -0.02947998046875, -0.0280609130859375, -0.026641845703125, -0.0252227783203125, -0.0238037109375, -0.0223846435546875, -0.020965576171875, -0.0195465087890625, -0.01812744140625, -0.0167083740234375, -0.015289306640625, -0.0138702392578125, -0.012451171875, -0.0110321044921875, -0.009613037109375, -0.0081939697265625, -0.00677490234375, -0.0053558349609375, -0.003936767578125, -0.0025177001953125, -0.0010986328125, 0.0003204345703125, 0.001739501953125, 0.0031585693359375, 0.00457763671875, 0.0059967041015625, 0.007415771484375, 0.0088348388671875, 0.01025390625, 0.0116729736328125, 0.013092041015625, 0.0145111083984375, 0.01593017578125, 0.0173492431640625, 0.018768310546875, 0.0201873779296875, 0.0216064453125, 0.0230255126953125, 0.024444580078125, 0.0258636474609375, 0.02728271484375, 0.0287017822265625, 0.030120849609375, 0.0315399169921875, 0.032958984375, 0.0343780517578125, 0.035797119140625, 0.0372161865234375, 0.03863525390625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 6.0, 13.0, 24.0, 19.0, 31.0, 60.0, 113.0, 210.0, 221.0, 124.0, 67.0, 33.0, 17.0, 9.0, 12.0, 5.0, 7.0, 6.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.934408962726593, -0.9022752046585083, -0.8701415061950684, -0.8380078077316284, -0.8058740496635437, -0.773740291595459, -0.741606593132019, -0.7094728946685791, -0.6773391366004944, -0.6452053785324097, -0.6130716800689697, -0.5809379816055298, -0.5488042235374451, -0.5166704654693604, -0.4845367670059204, -0.4524030387401581, -0.42026931047439575, -0.3881355822086334, -0.3560018539428711, -0.32386812567710876, -0.29173439741134644, -0.2596006691455841, -0.22746694087982178, -0.19533321261405945, -0.16319948434829712, -0.1310657560825348, -0.09893202781677246, -0.06679829955101013, -0.0346645712852478, -0.0025308430194854736, 0.029602885246276855, 0.061736613512039185, 0.09387028217315674, 0.12600401043891907, 0.1581377387046814, 0.19027146697044373, 0.22240519523620605, 0.2545389235019684, 0.2866726517677307, 0.31880638003349304, 0.35094010829925537, 0.3830738365650177, 0.41520756483078003, 0.44734129309654236, 0.4794750213623047, 0.5116087198257446, 0.5437424778938293, 0.5758762359619141, 0.608009934425354, 0.640143632888794, 0.6722773909568787, 0.7044111490249634, 0.7365448474884033, 0.7686785459518433, 0.800812304019928, 0.8329460620880127, 0.8650797605514526, 0.8972134590148926, 0.9293472170829773, 0.961480975151062, 0.993614673614502, 1.025748372077942, 1.0578820705413818, 1.0900158882141113, 1.1221495866775513]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 4.0, 3.0, 10.0, 14.0, 8.0, 15.0, 13.0, 16.0, 18.0, 27.0, 35.0, 32.0, 38.0, 33.0, 43.0, 55.0, 40.0, 49.0, 48.0, 38.0, 41.0, 47.0, 59.0, 29.0, 41.0, 35.0, 29.0, 25.0, 19.0, 17.0, 26.0, 16.0, 12.0, 14.0, 6.0, 6.0, 11.0, 11.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4165615141391754, -0.4038724899291992, -0.3911834955215454, -0.3784944713115692, -0.365805447101593, -0.3531164228916168, -0.3404273986816406, -0.3277384042739868, -0.3150493800640106, -0.3023603558540344, -0.2896713614463806, -0.2769823372364044, -0.2642933130264282, -0.251604288816452, -0.23891527950763702, -0.22622627019882202, -0.21353724598884583, -0.20084822177886963, -0.18815921247005463, -0.17547020316123962, -0.16278117895126343, -0.15009215474128723, -0.13740314543247223, -0.12471412867307663, -0.11202511191368103, -0.09933609515428543, -0.08664707839488983, -0.07395806163549423, -0.06126904487609863, -0.04858002811670303, -0.035891011357307434, -0.023201994597911835, -0.010512977838516235, 0.002176038920879364, 0.014865055680274963, 0.027554072439670563, 0.04024308919906616, 0.05293210595846176, 0.06562112271785736, 0.07831013947725296, 0.09099915623664856, 0.10368817299604416, 0.11637718975543976, 0.12906619906425476, 0.14175522327423096, 0.15444424748420715, 0.16713325679302216, 0.17982226610183716, 0.19251129031181335, 0.20520031452178955, 0.21788932383060455, 0.23057833313941956, 0.24326735734939575, 0.25595638155937195, 0.26864540576934814, 0.28133440017700195, 0.29402342438697815, 0.30671244859695435, 0.31940144300460815, 0.33209046721458435, 0.34477949142456055, 0.35746851563453674, 0.37015753984451294, 0.38284653425216675, 0.39553555846214294]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 9.0, 15.0, 28.0, 30.0, 50.0, 79.0, 109.0, 202.0, 314.0, 486.0, 896.0, 1694.0, 3402.0, 7193.0, 15394.0, 33385.0, 78188.0, 196161.0, 376150.0, 194369.0, 77436.0, 33265.0, 15181.0, 7108.0, 3471.0, 1670.0, 928.0, 500.0, 289.0, 194.0, 117.0, 81.0, 42.0, 40.0, 26.0, 20.0, 5.0, 8.0, 6.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9462890625, -0.9180374145507812, -0.8897857666015625, -0.8615341186523438, -0.833282470703125, -0.8050308227539062, -0.7767791748046875, -0.7485275268554688, -0.72027587890625, -0.6920242309570312, -0.6637725830078125, -0.6355209350585938, -0.607269287109375, -0.5790176391601562, -0.5507659912109375, -0.5225143432617188, -0.4942626953125, -0.46601104736328125, -0.4377593994140625, -0.40950775146484375, -0.381256103515625, -0.35300445556640625, -0.3247528076171875, -0.29650115966796875, -0.26824951171875, -0.23999786376953125, -0.2117462158203125, -0.18349456787109375, -0.155242919921875, -0.12699127197265625, -0.0987396240234375, -0.07048797607421875, -0.042236328125, -0.01398468017578125, 0.0142669677734375, 0.04251861572265625, 0.070770263671875, 0.09902191162109375, 0.1272735595703125, 0.15552520751953125, 0.18377685546875, 0.21202850341796875, 0.2402801513671875, 0.26853179931640625, 0.296783447265625, 0.32503509521484375, 0.3532867431640625, 0.38153839111328125, 0.4097900390625, 0.43804168701171875, 0.4662933349609375, 0.49454498291015625, 0.522796630859375, 0.5510482788085938, 0.5792999267578125, 0.6075515747070312, 0.63580322265625, 0.6640548706054688, 0.6923065185546875, 0.7205581665039062, 0.748809814453125, 0.7770614624023438, 0.8053131103515625, 0.8335647583007812, 0.86181640625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 6.0, 9.0, 6.0, 8.0, 12.0, 17.0, 5.0, 13.0, 15.0, 18.0, 30.0, 26.0, 38.0, 32.0, 31.0, 42.0, 41.0, 40.0, 34.0, 45.0, 40.0, 42.0, 34.0, 37.0, 40.0, 41.0, 35.0, 25.0, 27.0, 28.0, 22.0, 16.0, 13.0, 24.0, 14.0, 20.0, 8.0, 10.0, 5.0, 6.0, 6.0, 9.0, 7.0, 5.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.2802734375, -0.2721080780029297, -0.2639427185058594, -0.25577735900878906, -0.24761199951171875, -0.23944664001464844, -0.23128128051757812, -0.2231159210205078, -0.2149505615234375, -0.2067852020263672, -0.19861984252929688, -0.19045448303222656, -0.18228912353515625, -0.17412376403808594, -0.16595840454101562, -0.1577930450439453, -0.149627685546875, -0.1414623260498047, -0.13329696655273438, -0.12513160705566406, -0.11696624755859375, -0.10880088806152344, -0.10063552856445312, -0.09247016906738281, -0.0843048095703125, -0.07613945007324219, -0.06797409057617188, -0.05980873107910156, -0.05164337158203125, -0.04347801208496094, -0.035312652587890625, -0.027147293090820312, -0.01898193359375, -0.010816574096679688, -0.002651214599609375, 0.0055141448974609375, 0.01367950439453125, 0.021844863891601562, 0.030010223388671875, 0.03817558288574219, 0.0463409423828125, 0.05450630187988281, 0.06267166137695312, 0.07083702087402344, 0.07900238037109375, 0.08716773986816406, 0.09533309936523438, 0.10349845886230469, 0.111663818359375, 0.11982917785644531, 0.12799453735351562, 0.13615989685058594, 0.14432525634765625, 0.15249061584472656, 0.16065597534179688, 0.1688213348388672, 0.1769866943359375, 0.1851520538330078, 0.19331741333007812, 0.20148277282714844, 0.20964813232421875, 0.21781349182128906, 0.22597885131835938, 0.2341442108154297, 0.2423095703125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 8.0, 4.0, 14.0, 11.0, 23.0, 27.0, 44.0, 67.0, 87.0, 141.0, 199.0, 368.0, 641.0, 1194.0, 2292.0, 4688.0, 10266.0, 24455.0, 68467.0, 254179.0, 482491.0, 128419.0, 40806.0, 15541.0, 7062.0, 3264.0, 1635.0, 889.0, 475.0, 284.0, 177.0, 95.0, 70.0, 53.0, 38.0, 22.0, 24.0, 10.0, 10.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.0087890625, -0.9775161743164062, -0.9462432861328125, -0.9149703979492188, -0.883697509765625, -0.8524246215820312, -0.8211517333984375, -0.7898788452148438, -0.75860595703125, -0.7273330688476562, -0.6960601806640625, -0.6647872924804688, -0.633514404296875, -0.6022415161132812, -0.5709686279296875, -0.5396957397460938, -0.5084228515625, -0.47714996337890625, -0.4458770751953125, -0.41460418701171875, -0.383331298828125, -0.35205841064453125, -0.3207855224609375, -0.28951263427734375, -0.25823974609375, -0.22696685791015625, -0.1956939697265625, -0.16442108154296875, -0.133148193359375, -0.10187530517578125, -0.0706024169921875, -0.03932952880859375, -0.008056640625, 0.02321624755859375, 0.0544891357421875, 0.08576202392578125, 0.117034912109375, 0.14830780029296875, 0.1795806884765625, 0.21085357666015625, 0.24212646484375, 0.27339935302734375, 0.3046722412109375, 0.33594512939453125, 0.367218017578125, 0.39849090576171875, 0.4297637939453125, 0.46103668212890625, 0.4923095703125, 0.5235824584960938, 0.5548553466796875, 0.5861282348632812, 0.617401123046875, 0.6486740112304688, 0.6799468994140625, 0.7112197875976562, 0.74249267578125, 0.7737655639648438, 0.8050384521484375, 0.8363113403320312, 0.867584228515625, 0.8988571166992188, 0.9301300048828125, 0.9614028930664062, 0.99267578125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 7.0, 6.0, 7.0, 9.0, 13.0, 17.0, 21.0, 14.0, 18.0, 24.0, 25.0, 21.0, 20.0, 36.0, 34.0, 34.0, 34.0, 39.0, 31.0, 35.0, 35.0, 37.0, 40.0, 44.0, 41.0, 42.0, 29.0, 26.0, 28.0, 28.0, 25.0, 33.0, 21.0, 18.0, 17.0, 9.0, 9.0, 12.0, 10.0, 7.0, 8.0, 5.0, 5.0, 1.0, 5.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1759033203125, -0.17000389099121094, -0.16410446166992188, -0.1582050323486328, -0.15230560302734375, -0.1464061737060547, -0.14050674438476562, -0.13460731506347656, -0.1287078857421875, -0.12280845642089844, -0.11690902709960938, -0.11100959777832031, -0.10511016845703125, -0.09921073913574219, -0.09331130981445312, -0.08741188049316406, -0.081512451171875, -0.07561302185058594, -0.06971359252929688, -0.06381416320800781, -0.05791473388671875, -0.05201530456542969, -0.046115875244140625, -0.04021644592285156, -0.0343170166015625, -0.028417587280273438, -0.022518157958984375, -0.016618728637695312, -0.01071929931640625, -0.0048198699951171875, 0.001079559326171875, 0.0069789886474609375, 0.01287841796875, 0.018777847290039062, 0.024677276611328125, 0.030576705932617188, 0.03647613525390625, 0.04237556457519531, 0.048274993896484375, 0.05417442321777344, 0.0600738525390625, 0.06597328186035156, 0.07187271118164062, 0.07777214050292969, 0.08367156982421875, 0.08957099914550781, 0.09547042846679688, 0.10136985778808594, 0.107269287109375, 0.11316871643066406, 0.11906814575195312, 0.12496757507324219, 0.13086700439453125, 0.1367664337158203, 0.14266586303710938, 0.14856529235839844, 0.1544647216796875, 0.16036415100097656, 0.16626358032226562, 0.1721630096435547, 0.17806243896484375, 0.1839618682861328, 0.18986129760742188, 0.19576072692871094, 0.20166015625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 13.0, 10.0, 18.0, 26.0, 42.0, 46.0, 66.0, 102.0, 150.0, 246.0, 390.0, 718.0, 1421.0, 3278.0, 10085.0, 57480.0, 914423.0, 45147.0, 8858.0, 2964.0, 1315.0, 677.0, 387.0, 230.0, 152.0, 108.0, 57.0, 47.0, 28.0, 18.0, 16.0, 16.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.3984375, -2.330780029296875, -2.26312255859375, -2.195465087890625, -2.1278076171875, -2.060150146484375, -1.99249267578125, -1.924835205078125, -1.857177734375, -1.789520263671875, -1.72186279296875, -1.654205322265625, -1.5865478515625, -1.518890380859375, -1.45123291015625, -1.383575439453125, -1.31591796875, -1.248260498046875, -1.18060302734375, -1.112945556640625, -1.0452880859375, -0.977630615234375, -0.90997314453125, -0.842315673828125, -0.774658203125, -0.707000732421875, -0.63934326171875, -0.571685791015625, -0.5040283203125, -0.436370849609375, -0.36871337890625, -0.301055908203125, -0.2333984375, -0.165740966796875, -0.09808349609375, -0.030426025390625, 0.0372314453125, 0.104888916015625, 0.17254638671875, 0.240203857421875, 0.307861328125, 0.375518798828125, 0.44317626953125, 0.510833740234375, 0.5784912109375, 0.646148681640625, 0.71380615234375, 0.781463623046875, 0.84912109375, 0.916778564453125, 0.98443603515625, 1.052093505859375, 1.1197509765625, 1.187408447265625, 1.25506591796875, 1.322723388671875, 1.390380859375, 1.458038330078125, 1.52569580078125, 1.593353271484375, 1.6610107421875, 1.728668212890625, 1.79632568359375, 1.863983154296875, 1.931640625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 8.0, 9.0, 7.0, 25.0, 54.0, 112.0, 278.0, 310.0, 105.0, 49.0, 21.0, 7.0, 11.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.301568984985352e-05, -7.123500108718872e-05, -6.945431232452393e-05, -6.767362356185913e-05, -6.589293479919434e-05, -6.411224603652954e-05, -6.233155727386475e-05, -6.055086851119995e-05, -5.8770179748535156e-05, -5.698949098587036e-05, -5.5208802223205566e-05, -5.342811346054077e-05, -5.1647424697875977e-05, -4.986673593521118e-05, -4.808604717254639e-05, -4.630535840988159e-05, -4.45246696472168e-05, -4.2743980884552e-05, -4.096329212188721e-05, -3.918260335922241e-05, -3.740191459655762e-05, -3.562122583389282e-05, -3.384053707122803e-05, -3.205984830856323e-05, -3.0279159545898438e-05, -2.8498470783233643e-05, -2.6717782020568848e-05, -2.4937093257904053e-05, -2.3156404495239258e-05, -2.1375715732574463e-05, -1.9595026969909668e-05, -1.7814338207244873e-05, -1.6033649444580078e-05, -1.4252960681915283e-05, -1.2472271919250488e-05, -1.0691583156585693e-05, -8.910894393920898e-06, -7.1302056312561035e-06, -5.349516868591309e-06, -3.5688281059265137e-06, -1.7881393432617188e-06, -7.450580596923828e-09, 1.773238182067871e-06, 3.553926944732666e-06, 5.334615707397461e-06, 7.115304470062256e-06, 8.89599323272705e-06, 1.0676681995391846e-05, 1.245737075805664e-05, 1.4238059520721436e-05, 1.601874828338623e-05, 1.7799437046051025e-05, 1.958012580871582e-05, 2.1360814571380615e-05, 2.314150333404541e-05, 2.4922192096710205e-05, 2.6702880859375e-05, 2.8483569622039795e-05, 3.026425838470459e-05, 3.2044947147369385e-05, 3.382563591003418e-05, 3.5606324672698975e-05, 3.738701343536377e-05, 3.9167702198028564e-05, 4.094839096069336e-05]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 9.0, 10.0, 8.0, 15.0, 20.0, 27.0, 28.0, 49.0, 73.0, 85.0, 118.0, 192.0, 236.0, 423.0, 676.0, 1164.0, 2273.0, 5248.0, 16051.0, 92265.0, 864301.0, 46121.0, 10706.0, 3970.0, 1810.0, 971.0, 573.0, 334.0, 219.0, 153.0, 103.0, 76.0, 53.0, 50.0, 28.0, 24.0, 24.0, 17.0, 10.0, 9.0, 6.0, 9.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6669921875, -1.613800048828125, -1.56060791015625, -1.507415771484375, -1.4542236328125, -1.401031494140625, -1.34783935546875, -1.294647216796875, -1.241455078125, -1.188262939453125, -1.13507080078125, -1.081878662109375, -1.0286865234375, -0.975494384765625, -0.92230224609375, -0.869110107421875, -0.81591796875, -0.762725830078125, -0.70953369140625, -0.656341552734375, -0.6031494140625, -0.549957275390625, -0.49676513671875, -0.443572998046875, -0.390380859375, -0.337188720703125, -0.28399658203125, -0.230804443359375, -0.1776123046875, -0.124420166015625, -0.07122802734375, -0.018035888671875, 0.03515625, 0.088348388671875, 0.14154052734375, 0.194732666015625, 0.2479248046875, 0.301116943359375, 0.35430908203125, 0.407501220703125, 0.460693359375, 0.513885498046875, 0.56707763671875, 0.620269775390625, 0.6734619140625, 0.726654052734375, 0.77984619140625, 0.833038330078125, 0.88623046875, 0.939422607421875, 0.99261474609375, 1.045806884765625, 1.0989990234375, 1.152191162109375, 1.20538330078125, 1.258575439453125, 1.311767578125, 1.364959716796875, 1.41815185546875, 1.471343994140625, 1.5245361328125, 1.577728271484375, 1.63092041015625, 1.684112548828125, 1.7373046875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 8.0, 4.0, 10.0, 16.0, 23.0, 39.0, 61.0, 90.0, 117.0, 368.0, 82.0, 56.0, 43.0, 33.0, 15.0, 8.0, 8.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36865234375, -0.35753631591796875, -0.3464202880859375, -0.33530426025390625, -0.324188232421875, -0.31307220458984375, -0.3019561767578125, -0.29084014892578125, -0.27972412109375, -0.26860809326171875, -0.2574920654296875, -0.24637603759765625, -0.235260009765625, -0.22414398193359375, -0.2130279541015625, -0.20191192626953125, -0.1907958984375, -0.17967987060546875, -0.1685638427734375, -0.15744781494140625, -0.146331787109375, -0.13521575927734375, -0.1240997314453125, -0.11298370361328125, -0.10186767578125, -0.09075164794921875, -0.0796356201171875, -0.06851959228515625, -0.057403564453125, -0.04628753662109375, -0.0351715087890625, -0.02405548095703125, -0.012939453125, -0.00182342529296875, 0.0092926025390625, 0.02040863037109375, 0.031524658203125, 0.04264068603515625, 0.0537567138671875, 0.06487274169921875, 0.07598876953125, 0.08710479736328125, 0.0982208251953125, 0.10933685302734375, 0.120452880859375, 0.13156890869140625, 0.1426849365234375, 0.15380096435546875, 0.1649169921875, 0.17603302001953125, 0.1871490478515625, 0.19826507568359375, 0.209381103515625, 0.22049713134765625, 0.2316131591796875, 0.24272918701171875, 0.25384521484375, 0.26496124267578125, 0.2760772705078125, 0.28719329833984375, 0.298309326171875, 0.30942535400390625, 0.3205413818359375, 0.33165740966796875, 0.3427734375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 7.0, 8.0, 13.0, 32.0, 44.0, 64.0, 111.0, 222.0, 271.0, 104.0, 44.0, 17.0, 11.0, 13.0, 6.0, 5.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.845899760723114, -0.8180158138275146, -0.7901318669319153, -0.7622479796409607, -0.7343640327453613, -0.706480085849762, -0.6785961389541626, -0.650712251663208, -0.6228283047676086, -0.5949443578720093, -0.5670604109764099, -0.5391765236854553, -0.511292576789856, -0.4834086298942566, -0.4555246829986572, -0.42764076590538025, -0.3997568190097809, -0.3718728721141815, -0.34398895502090454, -0.3161050081253052, -0.2882210910320282, -0.26033714413642883, -0.23245321214199066, -0.2045692801475525, -0.17668534815311432, -0.14880141615867615, -0.12091748416423798, -0.09303354471921921, -0.06514961272478104, -0.03726567327976227, -0.009381741285324097, 0.018502190709114075, 0.046386122703552246, 0.07427005469799042, 0.10215398669242859, 0.13003793358802795, 0.15792185068130493, 0.1858057975769043, 0.21368972957134247, 0.24157366156578064, 0.2694575786590576, 0.297341525554657, 0.32522544264793396, 0.3531093895435333, 0.3809933066368103, 0.40887725353240967, 0.43676120042800903, 0.464645117521286, 0.4925290644168854, 0.5204129815101624, 0.5482969284057617, 0.5761808753013611, 0.6040648221969604, 0.631948709487915, 0.6598326563835144, 0.6877166032791138, 0.7156005501747131, 0.7434844970703125, 0.7713684439659119, 0.7992523312568665, 0.8271362781524658, 0.8550202250480652, 0.8829041719436646, 0.9107880592346191, 0.9386720061302185]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 2.0, 5.0, 3.0, 3.0, 6.0, 13.0, 12.0, 12.0, 14.0, 19.0, 22.0, 21.0, 31.0, 29.0, 37.0, 32.0, 38.0, 45.0, 50.0, 46.0, 47.0, 57.0, 64.0, 40.0, 37.0, 28.0, 37.0, 34.0, 36.0, 25.0, 24.0, 23.0, 21.0, 17.0, 9.0, 10.0, 15.0, 17.0, 9.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3324841856956482, -0.3221283555030823, -0.31177252531051636, -0.30141669511795044, -0.2910608649253845, -0.2807050347328186, -0.2703492045402527, -0.25999337434768677, -0.24963755905628204, -0.23928172886371613, -0.2289258986711502, -0.2185700684785843, -0.20821425318717957, -0.19785842299461365, -0.18750259280204773, -0.1771467626094818, -0.1667909324169159, -0.15643510222434998, -0.14607927203178406, -0.13572344183921814, -0.12536761164665222, -0.1150117889046669, -0.10465596616268158, -0.09430013597011566, -0.08394430577754974, -0.07358847558498383, -0.06323264539241791, -0.05287682265043259, -0.04252099245786667, -0.03216516226530075, -0.02180933579802513, -0.011453509330749512, -0.0010976791381835938, 0.009258149191737175, 0.019613977521657944, 0.029969805851578712, 0.04032563418149948, 0.0506814643740654, 0.06103729084134102, 0.07139311730861664, 0.08174894750118256, 0.09210477769374847, 0.10246060788631439, 0.11281643062829971, 0.12317226082086563, 0.13352808356285095, 0.14388391375541687, 0.1542397439479828, 0.1645955741405487, 0.17495140433311462, 0.18530723452568054, 0.19566306471824646, 0.20601889491081238, 0.2163747251033783, 0.22673054039478302, 0.23708637058734894, 0.24744220077991486, 0.2577980160713196, 0.2681538462638855, 0.2785096764564514, 0.28886550664901733, 0.29922133684158325, 0.30957716703414917, 0.3199329972267151, 0.330288827419281]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 7.0, 7.0, 10.0, 11.0, 22.0, 23.0, 43.0, 61.0, 87.0, 97.0, 165.0, 200.0, 308.0, 377.0, 577.0, 724.0, 1011.0, 1473.0, 2130.0, 3100.0, 4318.0, 6486.0, 9655.0, 14627.0, 23541.0, 38180.0, 65992.0, 126241.0, 312031.0, 1324007.0, 1576523.0, 360394.0, 136828.0, 71103.0, 40975.0, 25044.0, 15561.0, 10318.0, 6706.0, 4502.0, 3186.0, 2160.0, 1598.0, 1106.0, 793.0, 534.0, 379.0, 273.0, 212.0, 157.0, 128.0, 87.0, 74.0, 52.0, 35.0, 26.0, 16.0, 11.0, 3.0, 2.0], "bins": [-0.35205078125, -0.3417167663574219, -0.33138275146484375, -0.3210487365722656, -0.3107147216796875, -0.3003807067871094, -0.29004669189453125, -0.2797126770019531, -0.269378662109375, -0.2590446472167969, -0.24871063232421875, -0.23837661743164062, -0.2280426025390625, -0.21770858764648438, -0.20737457275390625, -0.19704055786132812, -0.18670654296875, -0.17637252807617188, -0.16603851318359375, -0.15570449829101562, -0.1453704833984375, -0.13503646850585938, -0.12470245361328125, -0.11436843872070312, -0.104034423828125, -0.09370040893554688, -0.08336639404296875, -0.07303237915039062, -0.0626983642578125, -0.052364349365234375, -0.04203033447265625, -0.031696319580078125, -0.0213623046875, -0.011028289794921875, -0.00069427490234375, 0.009639739990234375, 0.0199737548828125, 0.030307769775390625, 0.04064178466796875, 0.050975799560546875, 0.061309814453125, 0.07164382934570312, 0.08197784423828125, 0.09231185913085938, 0.1026458740234375, 0.11297988891601562, 0.12331390380859375, 0.13364791870117188, 0.14398193359375, 0.15431594848632812, 0.16464996337890625, 0.17498397827148438, 0.1853179931640625, 0.19565200805664062, 0.20598602294921875, 0.21632003784179688, 0.226654052734375, 0.23698806762695312, 0.24732208251953125, 0.2576560974121094, 0.2679901123046875, 0.2783241271972656, 0.28865814208984375, 0.2989921569824219, 0.309326171875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 5.0, 12.0, 13.0, 6.0, 17.0, 19.0, 22.0, 25.0, 27.0, 35.0, 43.0, 27.0, 48.0, 40.0, 51.0, 65.0, 41.0, 46.0, 45.0, 42.0, 37.0, 40.0, 34.0, 41.0, 37.0, 26.0, 23.0, 17.0, 24.0, 18.0, 8.0, 13.0, 12.0, 5.0, 6.0, 7.0, 7.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14501953125, -0.14050865173339844, -0.13599777221679688, -0.1314868927001953, -0.12697601318359375, -0.12246513366699219, -0.11795425415039062, -0.11344337463378906, -0.1089324951171875, -0.10442161560058594, -0.09991073608398438, -0.09539985656738281, -0.09088897705078125, -0.08637809753417969, -0.08186721801757812, -0.07735633850097656, -0.072845458984375, -0.06833457946777344, -0.06382369995117188, -0.05931282043457031, -0.05480194091796875, -0.05029106140136719, -0.045780181884765625, -0.04126930236816406, -0.0367584228515625, -0.03224754333496094, -0.027736663818359375, -0.023225784301757812, -0.01871490478515625, -0.014204025268554688, -0.009693145751953125, -0.0051822662353515625, -0.00067138671875, 0.0038394927978515625, 0.008350372314453125, 0.012861251831054688, 0.01737213134765625, 0.021883010864257812, 0.026393890380859375, 0.030904769897460938, 0.0354156494140625, 0.03992652893066406, 0.044437408447265625, 0.04894828796386719, 0.05345916748046875, 0.05797004699707031, 0.062480926513671875, 0.06699180603027344, 0.071502685546875, 0.07601356506347656, 0.08052444458007812, 0.08503532409667969, 0.08954620361328125, 0.09405708312988281, 0.09856796264648438, 0.10307884216308594, 0.1075897216796875, 0.11210060119628906, 0.11661148071289062, 0.12112236022949219, 0.12563323974609375, 0.1301441192626953, 0.13465499877929688, 0.13916587829589844, 0.1436767578125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 11.0, 4.0, 10.0, 14.0, 24.0, 36.0, 52.0, 72.0, 150.0, 226.0, 364.0, 544.0, 924.0, 1522.0, 2680.0, 4795.0, 9276.0, 18576.0, 43364.0, 118259.0, 445689.0, 2439100.0, 819276.0, 179185.0, 59932.0, 24723.0, 11555.0, 5914.0, 3225.0, 1913.0, 1138.0, 649.0, 396.0, 261.0, 162.0, 87.0, 58.0, 28.0, 33.0, 23.0, 12.0, 4.0, 10.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.42724609375, -0.41455841064453125, -0.4018707275390625, -0.38918304443359375, -0.376495361328125, -0.36380767822265625, -0.3511199951171875, -0.33843231201171875, -0.32574462890625, -0.31305694580078125, -0.3003692626953125, -0.28768157958984375, -0.274993896484375, -0.26230621337890625, -0.2496185302734375, -0.23693084716796875, -0.2242431640625, -0.21155548095703125, -0.1988677978515625, -0.18618011474609375, -0.173492431640625, -0.16080474853515625, -0.1481170654296875, -0.13542938232421875, -0.12274169921875, -0.11005401611328125, -0.0973663330078125, -0.08467864990234375, -0.071990966796875, -0.05930328369140625, -0.0466156005859375, -0.03392791748046875, -0.021240234375, -0.00855255126953125, 0.0041351318359375, 0.01682281494140625, 0.029510498046875, 0.04219818115234375, 0.0548858642578125, 0.06757354736328125, 0.08026123046875, 0.09294891357421875, 0.1056365966796875, 0.11832427978515625, 0.131011962890625, 0.14369964599609375, 0.1563873291015625, 0.16907501220703125, 0.1817626953125, 0.19445037841796875, 0.2071380615234375, 0.21982574462890625, 0.232513427734375, 0.24520111083984375, 0.2578887939453125, 0.27057647705078125, 0.28326416015625, 0.29595184326171875, 0.3086395263671875, 0.32132720947265625, 0.334014892578125, 0.34670257568359375, 0.3593902587890625, 0.37207794189453125, 0.384765625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 6.0, 7.0, 14.0, 24.0, 19.0, 36.0, 31.0, 48.0, 64.0, 83.0, 103.0, 124.0, 176.0, 230.0, 272.0, 359.0, 484.0, 427.0, 348.0, 305.0, 224.0, 160.0, 136.0, 108.0, 82.0, 45.0, 39.0, 41.0, 23.0, 15.0, 7.0, 8.0, 6.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097412109375, -0.0945281982421875, -0.091644287109375, -0.0887603759765625, -0.08587646484375, -0.0829925537109375, -0.080108642578125, -0.0772247314453125, -0.0743408203125, -0.0714569091796875, -0.068572998046875, -0.0656890869140625, -0.06280517578125, -0.0599212646484375, -0.057037353515625, -0.0541534423828125, -0.05126953125, -0.0483856201171875, -0.045501708984375, -0.0426177978515625, -0.03973388671875, -0.0368499755859375, -0.033966064453125, -0.0310821533203125, -0.0281982421875, -0.0253143310546875, -0.022430419921875, -0.0195465087890625, -0.01666259765625, -0.0137786865234375, -0.010894775390625, -0.0080108642578125, -0.005126953125, -0.0022430419921875, 0.000640869140625, 0.0035247802734375, 0.00640869140625, 0.0092926025390625, 0.012176513671875, 0.0150604248046875, 0.0179443359375, 0.0208282470703125, 0.023712158203125, 0.0265960693359375, 0.02947998046875, 0.0323638916015625, 0.035247802734375, 0.0381317138671875, 0.041015625, 0.0438995361328125, 0.046783447265625, 0.0496673583984375, 0.05255126953125, 0.0554351806640625, 0.058319091796875, 0.0612030029296875, 0.0640869140625, 0.0669708251953125, 0.069854736328125, 0.0727386474609375, 0.07562255859375, 0.0785064697265625, 0.081390380859375, 0.0842742919921875, 0.087158203125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 4.0, 4.0, 13.0, 15.0, 27.0, 27.0, 45.0, 74.0, 136.0, 199.0, 194.0, 95.0, 56.0, 34.0, 23.0, 7.0, 6.0, 8.0, 6.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22267018258571625, -0.21153748035430908, -0.20040477812290192, -0.18927207589149475, -0.1781393587589264, -0.16700665652751923, -0.15587395429611206, -0.1447412371635437, -0.13360854983329773, -0.12247584760189056, -0.1113431379199028, -0.10021043568849564, -0.08907772600650787, -0.07794502377510071, -0.06681232154369354, -0.05567961186170578, -0.04454690217971802, -0.033414196223020554, -0.02228149212896824, -0.011148788034915924, -1.6082078218460083e-05, 0.011116623878479004, 0.02224932610988617, 0.03338203579187393, 0.0445147380232811, 0.05564744397997856, 0.06678014993667603, 0.07791285216808319, 0.08904555439949036, 0.10017826408147812, 0.11131096631288528, 0.12244367599487305, 0.1335763931274414, 0.14470909535884857, 0.15584179759025574, 0.1669745147228241, 0.17810721695423126, 0.18923991918563843, 0.2003726214170456, 0.21150532364845276, 0.22263804078102112, 0.23377074301242828, 0.24490344524383545, 0.2560361623764038, 0.2671688497066498, 0.27830156683921814, 0.2894342541694641, 0.30056697130203247, 0.31169968843460083, 0.3228324055671692, 0.33396509289741516, 0.3450978100299835, 0.3562304973602295, 0.36736321449279785, 0.3784959316253662, 0.3896286189556122, 0.40076130628585815, 0.4118940234184265, 0.4230267107486725, 0.43415942788124084, 0.4452921152114868, 0.4564248323440552, 0.46755754947662354, 0.4786902368068695, 0.48982295393943787]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 2.0, 9.0, 13.0, 11.0, 15.0, 11.0, 15.0, 23.0, 19.0, 20.0, 41.0, 30.0, 38.0, 44.0, 47.0, 39.0, 49.0, 40.0, 50.0, 53.0, 52.0, 40.0, 40.0, 26.0, 35.0, 35.0, 29.0, 23.0, 24.0, 19.0, 16.0, 14.0, 13.0, 18.0, 11.0, 6.0, 6.0, 6.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.15669216215610504, -0.1520506590604782, -0.14740917086601257, -0.14276766777038574, -0.1381261646747589, -0.13348466157913208, -0.12884317338466644, -0.12420167028903961, -0.11956017464399338, -0.11491867899894714, -0.11027717590332031, -0.10563568025827408, -0.10099418461322784, -0.09635268151760101, -0.09171118587255478, -0.08706969022750854, -0.08242818713188171, -0.07778669148683548, -0.07314518839120865, -0.06850369274616241, -0.06386218965053558, -0.05922069400548935, -0.054579198360443115, -0.04993769899010658, -0.04529619961977005, -0.04065470024943352, -0.036013200879096985, -0.03137170523405075, -0.026730205863714218, -0.022088706493377686, -0.017447208985686302, -0.012805711477994919, -0.008164197206497192, -0.0035226987674832344, 0.0011187996715307236, 0.0057602981105446815, 0.01040179654955864, 0.015043295919895172, 0.019684793427586555, 0.02432629093527794, 0.02896779030561447, 0.033609289675951004, 0.03825078904628754, 0.04289228469133377, 0.0475337840616703, 0.052175283432006836, 0.05681677907705307, 0.0614582784473896, 0.06609977781772614, 0.07074127346277237, 0.0753827765583992, 0.08002427220344543, 0.08466577529907227, 0.0893072709441185, 0.09394876658916473, 0.09859026968479156, 0.1032317653298378, 0.10787326097488403, 0.11251476407051086, 0.1171562597155571, 0.12179775536060333, 0.12643925845623016, 0.131080761551857, 0.13572224974632263, 0.14036375284194946]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 9.0, 11.0, 14.0, 17.0, 23.0, 42.0, 60.0, 84.0, 136.0, 189.0, 293.0, 485.0, 734.0, 1183.0, 1781.0, 3072.0, 5108.0, 9979.0, 22804.0, 74360.0, 485625.0, 345537.0, 57012.0, 19056.0, 8745.0, 4754.0, 2732.0, 1632.0, 1043.0, 704.0, 444.0, 282.0, 205.0, 119.0, 98.0, 58.0, 38.0, 29.0, 28.0, 14.0, 6.0, 3.0, 3.0, 6.0, 2.0, 1.0], "bins": [-0.42626953125, -0.415313720703125, -0.40435791015625, -0.393402099609375, -0.3824462890625, -0.371490478515625, -0.36053466796875, -0.349578857421875, -0.338623046875, -0.327667236328125, -0.31671142578125, -0.305755615234375, -0.2947998046875, -0.283843994140625, -0.27288818359375, -0.261932373046875, -0.2509765625, -0.240020751953125, -0.22906494140625, -0.218109130859375, -0.2071533203125, -0.196197509765625, -0.18524169921875, -0.174285888671875, -0.163330078125, -0.152374267578125, -0.14141845703125, -0.130462646484375, -0.1195068359375, -0.108551025390625, -0.09759521484375, -0.086639404296875, -0.07568359375, -0.064727783203125, -0.05377197265625, -0.042816162109375, -0.0318603515625, -0.020904541015625, -0.00994873046875, 0.001007080078125, 0.011962890625, 0.022918701171875, 0.03387451171875, 0.044830322265625, 0.0557861328125, 0.066741943359375, 0.07769775390625, 0.088653564453125, 0.099609375, 0.110565185546875, 0.12152099609375, 0.132476806640625, 0.1434326171875, 0.154388427734375, 0.16534423828125, 0.176300048828125, 0.187255859375, 0.198211669921875, 0.20916748046875, 0.220123291015625, 0.2310791015625, 0.242034912109375, 0.25299072265625, 0.263946533203125, 0.27490234375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 3.0, 10.0, 9.0, 9.0, 10.0, 23.0, 21.0, 22.0, 23.0, 27.0, 35.0, 38.0, 36.0, 50.0, 50.0, 43.0, 44.0, 57.0, 48.0, 55.0, 47.0, 46.0, 29.0, 31.0, 35.0, 29.0, 21.0, 22.0, 30.0, 16.0, 7.0, 11.0, 15.0, 9.0, 6.0, 8.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1365966796875, -0.13245201110839844, -0.12830734252929688, -0.12416267395019531, -0.12001800537109375, -0.11587333679199219, -0.11172866821289062, -0.10758399963378906, -0.1034393310546875, -0.09929466247558594, -0.09514999389648438, -0.09100532531738281, -0.08686065673828125, -0.08271598815917969, -0.07857131958007812, -0.07442665100097656, -0.070281982421875, -0.06613731384277344, -0.061992645263671875, -0.05784797668457031, -0.05370330810546875, -0.04955863952636719, -0.045413970947265625, -0.04126930236816406, -0.0371246337890625, -0.03297996520996094, -0.028835296630859375, -0.024690628051757812, -0.02054595947265625, -0.016401290893554688, -0.012256622314453125, -0.008111953735351562, -0.00396728515625, 0.0001773834228515625, 0.004322052001953125, 0.008466720581054688, 0.01261138916015625, 0.016756057739257812, 0.020900726318359375, 0.025045394897460938, 0.0291900634765625, 0.03333473205566406, 0.037479400634765625, 0.04162406921386719, 0.04576873779296875, 0.04991340637207031, 0.054058074951171875, 0.05820274353027344, 0.062347412109375, 0.06649208068847656, 0.07063674926757812, 0.07478141784667969, 0.07892608642578125, 0.08307075500488281, 0.08721542358398438, 0.09136009216308594, 0.0955047607421875, 0.09964942932128906, 0.10379409790039062, 0.10793876647949219, 0.11208343505859375, 0.11622810363769531, 0.12037277221679688, 0.12451744079589844, 0.128662109375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 1.0, 4.0, 8.0, 14.0, 21.0, 22.0, 38.0, 49.0, 80.0, 132.0, 209.0, 318.0, 569.0, 1117.0, 2186.0, 4988.0, 17172.0, 545860.0, 449965.0, 16170.0, 4945.0, 2152.0, 1069.0, 581.0, 298.0, 225.0, 114.0, 80.0, 45.0, 37.0, 32.0, 20.0, 15.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0166015625, -0.989837646484375, -0.96307373046875, -0.936309814453125, -0.9095458984375, -0.882781982421875, -0.85601806640625, -0.829254150390625, -0.802490234375, -0.775726318359375, -0.74896240234375, -0.722198486328125, -0.6954345703125, -0.668670654296875, -0.64190673828125, -0.615142822265625, -0.58837890625, -0.561614990234375, -0.53485107421875, -0.508087158203125, -0.4813232421875, -0.454559326171875, -0.42779541015625, -0.401031494140625, -0.374267578125, -0.347503662109375, -0.32073974609375, -0.293975830078125, -0.2672119140625, -0.240447998046875, -0.21368408203125, -0.186920166015625, -0.16015625, -0.133392333984375, -0.10662841796875, -0.079864501953125, -0.0531005859375, -0.026336669921875, 0.00042724609375, 0.027191162109375, 0.053955078125, 0.080718994140625, 0.10748291015625, 0.134246826171875, 0.1610107421875, 0.187774658203125, 0.21453857421875, 0.241302490234375, 0.26806640625, 0.294830322265625, 0.32159423828125, 0.348358154296875, 0.3751220703125, 0.401885986328125, 0.42864990234375, 0.455413818359375, 0.482177734375, 0.508941650390625, 0.53570556640625, 0.562469482421875, 0.5892333984375, 0.615997314453125, 0.64276123046875, 0.669525146484375, 0.6962890625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 3.0, 8.0, 4.0, 4.0, 10.0, 9.0, 14.0, 19.0, 15.0, 18.0, 29.0, 32.0, 26.0, 35.0, 36.0, 41.0, 40.0, 61.0, 52.0, 54.0, 41.0, 50.0, 48.0, 47.0, 42.0, 42.0, 27.0, 33.0, 23.0, 25.0, 23.0, 19.0, 9.0, 13.0, 9.0, 10.0, 9.0, 6.0, 5.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0848388671875, -0.08195018768310547, -0.07906150817871094, -0.0761728286743164, -0.07328414916992188, -0.07039546966552734, -0.06750679016113281, -0.06461811065673828, -0.06172943115234375, -0.05884075164794922, -0.05595207214355469, -0.053063392639160156, -0.050174713134765625, -0.047286033630371094, -0.04439735412597656, -0.04150867462158203, -0.0386199951171875, -0.03573131561279297, -0.03284263610839844, -0.029953956604003906, -0.027065277099609375, -0.024176597595214844, -0.021287918090820312, -0.01839923858642578, -0.01551055908203125, -0.012621879577636719, -0.009733200073242188, -0.006844520568847656, -0.003955841064453125, -0.0010671615600585938, 0.0018215179443359375, 0.004710197448730469, 0.007598876953125, 0.010487556457519531, 0.013376235961914062, 0.016264915466308594, 0.019153594970703125, 0.022042274475097656, 0.024930953979492188, 0.02781963348388672, 0.03070831298828125, 0.03359699249267578, 0.03648567199707031, 0.039374351501464844, 0.042263031005859375, 0.045151710510253906, 0.04804039001464844, 0.05092906951904297, 0.0538177490234375, 0.05670642852783203, 0.05959510803222656, 0.062483787536621094, 0.06537246704101562, 0.06826114654541016, 0.07114982604980469, 0.07403850555419922, 0.07692718505859375, 0.07981586456298828, 0.08270454406738281, 0.08559322357177734, 0.08848190307617188, 0.0913705825805664, 0.09425926208496094, 0.09714794158935547, 0.10003662109375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 9.0, 7.0, 17.0, 24.0, 26.0, 61.0, 82.0, 123.0, 180.0, 253.0, 394.0, 691.0, 1264.0, 2041.0, 3815.0, 7703.0, 17788.0, 50344.0, 208627.0, 576238.0, 118838.0, 33717.0, 13001.0, 5987.0, 3079.0, 1585.0, 992.0, 603.0, 355.0, 244.0, 159.0, 97.0, 64.0, 56.0, 27.0, 23.0, 17.0, 5.0, 8.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046356201171875, -0.04477548599243164, -0.04319477081298828, -0.04161405563354492, -0.04003334045410156, -0.0384526252746582, -0.036871910095214844, -0.035291194915771484, -0.033710479736328125, -0.032129764556884766, -0.030549049377441406, -0.028968334197998047, -0.027387619018554688, -0.025806903839111328, -0.02422618865966797, -0.02264547348022461, -0.02106475830078125, -0.01948404312133789, -0.01790332794189453, -0.016322612762451172, -0.014741897583007812, -0.013161182403564453, -0.011580467224121094, -0.009999752044677734, -0.008419036865234375, -0.006838321685791016, -0.005257606506347656, -0.003676891326904297, -0.0020961761474609375, -0.0005154609680175781, 0.0010652542114257812, 0.0026459693908691406, 0.0042266845703125, 0.005807399749755859, 0.007388114929199219, 0.008968830108642578, 0.010549545288085938, 0.012130260467529297, 0.013710975646972656, 0.015291690826416016, 0.016872406005859375, 0.018453121185302734, 0.020033836364746094, 0.021614551544189453, 0.023195266723632812, 0.024775981903076172, 0.02635669708251953, 0.02793741226196289, 0.02951812744140625, 0.03109884262084961, 0.03267955780029297, 0.03426027297973633, 0.03584098815917969, 0.03742170333862305, 0.039002418518066406, 0.040583133697509766, 0.042163848876953125, 0.043744564056396484, 0.045325279235839844, 0.0469059944152832, 0.04848670959472656, 0.05006742477416992, 0.05164813995361328, 0.05322885513305664, 0.0548095703125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 1.0, 7.0, 9.0, 14.0, 16.0, 25.0, 25.0, 41.0, 42.0, 61.0, 83.0, 100.0, 102.0, 77.0, 71.0, 108.0, 54.0, 41.0, 28.0, 28.0, 15.0, 15.0, 10.0, 9.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1861324310302734e-05, -1.1548399925231934e-05, -1.1235475540161133e-05, -1.0922551155090332e-05, -1.0609626770019531e-05, -1.029670238494873e-05, -9.98377799987793e-06, -9.670853614807129e-06, -9.357929229736328e-06, -9.045004844665527e-06, -8.732080459594727e-06, -8.419156074523926e-06, -8.106231689453125e-06, -7.793307304382324e-06, -7.4803829193115234e-06, -7.167458534240723e-06, -6.854534149169922e-06, -6.541609764099121e-06, -6.22868537902832e-06, -5.9157609939575195e-06, -5.602836608886719e-06, -5.289912223815918e-06, -4.976987838745117e-06, -4.664063453674316e-06, -4.351139068603516e-06, -4.038214683532715e-06, -3.725290298461914e-06, -3.4123659133911133e-06, -3.0994415283203125e-06, -2.7865171432495117e-06, -2.473592758178711e-06, -2.16066837310791e-06, -1.8477439880371094e-06, -1.5348196029663086e-06, -1.2218952178955078e-06, -9.08970832824707e-07, -5.960464477539062e-07, -2.8312206268310547e-07, 2.9802322387695312e-08, 3.427267074584961e-07, 6.556510925292969e-07, 9.685754776000977e-07, 1.2814998626708984e-06, 1.5944242477416992e-06, 1.9073486328125e-06, 2.2202730178833008e-06, 2.5331974029541016e-06, 2.8461217880249023e-06, 3.159046173095703e-06, 3.471970558166504e-06, 3.7848949432373047e-06, 4.0978193283081055e-06, 4.410743713378906e-06, 4.723668098449707e-06, 5.036592483520508e-06, 5.349516868591309e-06, 5.662441253662109e-06, 5.97536563873291e-06, 6.288290023803711e-06, 6.601214408874512e-06, 6.9141387939453125e-06, 7.227063179016113e-06, 7.539987564086914e-06, 7.852911949157715e-06, 8.165836334228516e-06]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 10.0, 12.0, 19.0, 21.0, 29.0, 35.0, 52.0, 70.0, 122.0, 154.0, 233.0, 332.0, 545.0, 948.0, 1875.0, 4261.0, 11263.0, 42002.0, 325894.0, 574396.0, 61509.0, 14534.0, 5094.0, 2154.0, 1135.0, 608.0, 406.0, 233.0, 187.0, 131.0, 83.0, 58.0, 46.0, 22.0, 16.0, 15.0, 16.0, 10.0, 4.0, 7.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0560302734375, -0.054285526275634766, -0.05254077911376953, -0.0507960319519043, -0.04905128479003906, -0.04730653762817383, -0.045561790466308594, -0.04381704330444336, -0.042072296142578125, -0.04032754898071289, -0.038582801818847656, -0.03683805465698242, -0.03509330749511719, -0.03334856033325195, -0.03160381317138672, -0.029859066009521484, -0.02811431884765625, -0.026369571685791016, -0.02462482452392578, -0.022880077362060547, -0.021135330200195312, -0.019390583038330078, -0.017645835876464844, -0.01590108871459961, -0.014156341552734375, -0.01241159439086914, -0.010666847229003906, -0.008922100067138672, -0.0071773529052734375, -0.005432605743408203, -0.0036878585815429688, -0.0019431114196777344, -0.0001983642578125, 0.0015463829040527344, 0.0032911300659179688, 0.005035877227783203, 0.0067806243896484375, 0.008525371551513672, 0.010270118713378906, 0.01201486587524414, 0.013759613037109375, 0.01550436019897461, 0.017249107360839844, 0.018993854522705078, 0.020738601684570312, 0.022483348846435547, 0.02422809600830078, 0.025972843170166016, 0.02771759033203125, 0.029462337493896484, 0.03120708465576172, 0.03295183181762695, 0.03469657897949219, 0.03644132614135742, 0.038186073303222656, 0.03993082046508789, 0.041675567626953125, 0.04342031478881836, 0.045165061950683594, 0.04690980911254883, 0.04865455627441406, 0.0503993034362793, 0.05214405059814453, 0.053888797760009766, 0.055633544921875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 1.0, 4.0, 9.0, 4.0, 13.0, 24.0, 29.0, 34.0, 47.0, 63.0, 84.0, 103.0, 121.0, 103.0, 82.0, 68.0, 52.0, 45.0, 25.0, 17.0, 12.0, 14.0, 12.0, 9.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01035308837890625, -0.010013818740844727, -0.009674549102783203, -0.00933527946472168, -0.008996009826660156, -0.008656740188598633, -0.00831747055053711, -0.007978200912475586, -0.0076389312744140625, -0.007299661636352539, -0.006960391998291016, -0.006621122360229492, -0.006281852722167969, -0.005942583084106445, -0.005603313446044922, -0.0052640438079833984, -0.004924774169921875, -0.0045855045318603516, -0.004246234893798828, -0.003906965255737305, -0.0035676956176757812, -0.003228425979614258, -0.0028891563415527344, -0.002549886703491211, -0.0022106170654296875, -0.001871347427368164, -0.0015320777893066406, -0.0011928081512451172, -0.0008535385131835938, -0.0005142688751220703, -0.00017499923706054688, 0.00016427040100097656, 0.0005035400390625, 0.0008428096771240234, 0.0011820793151855469, 0.0015213489532470703, 0.0018606185913085938, 0.002199888229370117, 0.0025391578674316406, 0.002878427505493164, 0.0032176971435546875, 0.003556966781616211, 0.0038962364196777344, 0.004235506057739258, 0.004574775695800781, 0.004914045333862305, 0.005253314971923828, 0.0055925846099853516, 0.005931854248046875, 0.0062711238861083984, 0.006610393524169922, 0.006949663162231445, 0.007288932800292969, 0.007628202438354492, 0.007967472076416016, 0.008306741714477539, 0.008646011352539062, 0.008985280990600586, 0.00932455062866211, 0.009663820266723633, 0.010003089904785156, 0.01034235954284668, 0.010681629180908203, 0.011020898818969727, 0.01136016845703125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 5.0, 8.0, 9.0, 16.0, 23.0, 38.0, 65.0, 99.0, 178.0, 217.0, 128.0, 86.0, 36.0, 27.0, 10.0, 14.0, 11.0, 3.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1730543076992035, -0.16308629512786865, -0.15311826765537262, -0.1431502401828766, -0.13318222761154175, -0.12321420758962631, -0.11324618756771088, -0.10327816754579544, -0.09331014752388, -0.08334212750196457, -0.07337410748004913, -0.0634060874581337, -0.05343806743621826, -0.043470047414302826, -0.03350202739238739, -0.023534007370471954, -0.013565987348556519, -0.0035979673266410828, 0.006370052695274353, 0.01633807271718979, 0.026306092739105225, 0.03627411276102066, 0.046242132782936096, 0.05621015280485153, 0.06617817282676697, 0.0761461928486824, 0.08611421287059784, 0.09608223289251328, 0.10605025291442871, 0.11601827293634415, 0.12598629295825958, 0.13595432043075562, 0.14592236280441284, 0.15589037537574768, 0.1658584028482437, 0.17582643032073975, 0.18579444289207458, 0.19576245546340942, 0.20573048293590546, 0.2156985104084015, 0.22566652297973633, 0.23563453555107117, 0.2456025630235672, 0.25557059049606323, 0.26553860306739807, 0.2755066156387329, 0.28547465801239014, 0.295442670583725, 0.3054106831550598, 0.31537869572639465, 0.3253467082977295, 0.3353147506713867, 0.34528276324272156, 0.3552507758140564, 0.3652188181877136, 0.37518683075904846, 0.3851548433303833, 0.39512285590171814, 0.405090868473053, 0.4150589108467102, 0.42502692341804504, 0.4349949359893799, 0.4449629783630371, 0.45493099093437195, 0.4648990035057068]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 6.0, 3.0, 6.0, 11.0, 10.0, 13.0, 13.0, 10.0, 24.0, 15.0, 23.0, 27.0, 35.0, 36.0, 42.0, 41.0, 40.0, 44.0, 50.0, 38.0, 56.0, 48.0, 47.0, 45.0, 37.0, 30.0, 35.0, 30.0, 27.0, 22.0, 26.0, 16.0, 14.0, 10.0, 18.0, 14.0, 13.0, 8.0, 4.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.13098222017288208, -0.12706336379051208, -0.1231444925069809, -0.1192256286740303, -0.11530676484107971, -0.11138790100812912, -0.10746903717517853, -0.10355018079280853, -0.09963130950927734, -0.09571244567632675, -0.09179358184337616, -0.08787471801042557, -0.08395585417747498, -0.08003699034452438, -0.07611812651157379, -0.0721992701292038, -0.0682804062962532, -0.06436154246330261, -0.06044267863035202, -0.05652381479740143, -0.052604950964450836, -0.048686087131500244, -0.04476722702383995, -0.04084836319088936, -0.036929499357938766, -0.033010635524988174, -0.029091771692037582, -0.02517290972173214, -0.021254045888781548, -0.017335182055830956, -0.013416320085525513, -0.00949745625257492, -0.005578592419624329, -0.0016597290523350239, 0.002259134314954281, 0.006177997216582298, 0.01009686104953289, 0.014015724882483482, 0.017934586852788925, 0.021853450685739517, 0.02577231451869011, 0.0296911783516407, 0.03361004218459129, 0.03752890229225159, 0.04144776612520218, 0.04536662995815277, 0.04928549379110336, 0.053204357624053955, 0.05712322145700455, 0.06104208528995514, 0.06496094912290573, 0.06887981295585632, 0.07279867678880692, 0.07671754062175751, 0.0806363970041275, 0.08455526828765869, 0.08847412467002869, 0.09239298850297928, 0.09631185233592987, 0.10023071616888046, 0.10414958000183105, 0.10806844383478165, 0.11198730766773224, 0.11590616405010223, 0.11982503533363342]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 14.0, 6.0, 18.0, 24.0, 26.0, 50.0, 83.0, 130.0, 223.0, 368.0, 571.0, 960.0, 1541.0, 2632.0, 4196.0, 7303.0, 12561.0, 22610.0, 41752.0, 80500.0, 165379.0, 296533.0, 201864.0, 97094.0, 49723.0, 26827.0, 14816.0, 8307.0, 4919.0, 2937.0, 1779.0, 1089.0, 661.0, 394.0, 222.0, 141.0, 102.0, 74.0, 45.0, 20.0, 19.0, 13.0, 3.0, 10.0, 3.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.2435302734375, -0.23583221435546875, -0.2281341552734375, -0.22043609619140625, -0.212738037109375, -0.20503997802734375, -0.1973419189453125, -0.18964385986328125, -0.18194580078125, -0.17424774169921875, -0.1665496826171875, -0.15885162353515625, -0.151153564453125, -0.14345550537109375, -0.1357574462890625, -0.12805938720703125, -0.120361328125, -0.11266326904296875, -0.1049652099609375, -0.09726715087890625, -0.089569091796875, -0.08187103271484375, -0.0741729736328125, -0.06647491455078125, -0.05877685546875, -0.05107879638671875, -0.0433807373046875, -0.03568267822265625, -0.027984619140625, -0.02028656005859375, -0.0125885009765625, -0.00489044189453125, 0.0028076171875, 0.01050567626953125, 0.0182037353515625, 0.02590179443359375, 0.033599853515625, 0.04129791259765625, 0.0489959716796875, 0.05669403076171875, 0.06439208984375, 0.07209014892578125, 0.0797882080078125, 0.08748626708984375, 0.095184326171875, 0.10288238525390625, 0.1105804443359375, 0.11827850341796875, 0.1259765625, 0.13367462158203125, 0.1413726806640625, 0.14907073974609375, 0.156768798828125, 0.16446685791015625, 0.1721649169921875, 0.17986297607421875, 0.18756103515625, 0.19525909423828125, 0.2029571533203125, 0.21065521240234375, 0.218353271484375, 0.22605133056640625, 0.2337493896484375, 0.24144744873046875, 0.2491455078125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 5.0, 9.0, 7.0, 12.0, 17.0, 14.0, 12.0, 21.0, 25.0, 25.0, 22.0, 22.0, 26.0, 35.0, 45.0, 43.0, 41.0, 44.0, 41.0, 45.0, 43.0, 45.0, 44.0, 35.0, 37.0, 26.0, 33.0, 32.0, 18.0, 26.0, 21.0, 20.0, 16.0, 12.0, 7.0, 12.0, 15.0, 8.0, 7.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.09686279296875, -0.09391307830810547, -0.09096336364746094, -0.0880136489868164, -0.08506393432617188, -0.08211421966552734, -0.07916450500488281, -0.07621479034423828, -0.07326507568359375, -0.07031536102294922, -0.06736564636230469, -0.06441593170166016, -0.061466217041015625, -0.058516502380371094, -0.05556678771972656, -0.05261707305908203, -0.0496673583984375, -0.04671764373779297, -0.04376792907714844, -0.040818214416503906, -0.037868499755859375, -0.034918785095214844, -0.03196907043457031, -0.02901935577392578, -0.02606964111328125, -0.02311992645263672, -0.020170211791992188, -0.017220497131347656, -0.014270782470703125, -0.011321067810058594, -0.008371353149414062, -0.005421638488769531, -0.002471923828125, 0.00047779083251953125, 0.0034275054931640625, 0.006377220153808594, 0.009326934814453125, 0.012276649475097656, 0.015226364135742188, 0.01817607879638672, 0.02112579345703125, 0.02407550811767578, 0.027025222778320312, 0.029974937438964844, 0.032924652099609375, 0.035874366760253906, 0.03882408142089844, 0.04177379608154297, 0.0447235107421875, 0.04767322540283203, 0.05062294006347656, 0.053572654724121094, 0.056522369384765625, 0.059472084045410156, 0.06242179870605469, 0.06537151336669922, 0.06832122802734375, 0.07127094268798828, 0.07422065734863281, 0.07717037200927734, 0.08012008666992188, 0.0830698013305664, 0.08601951599121094, 0.08896923065185547, 0.0919189453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 9.0, 9.0, 12.0, 15.0, 24.0, 29.0, 49.0, 92.0, 143.0, 187.0, 316.0, 522.0, 840.0, 1445.0, 2428.0, 4561.0, 8738.0, 18649.0, 42881.0, 111277.0, 352946.0, 324110.0, 102963.0, 40277.0, 17521.0, 8406.0, 4149.0, 2444.0, 1366.0, 803.0, 504.0, 284.0, 200.0, 129.0, 77.0, 50.0, 36.0, 27.0, 13.0, 10.0, 5.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.297119140625, -0.2881050109863281, -0.27909088134765625, -0.2700767517089844, -0.2610626220703125, -0.2520484924316406, -0.24303436279296875, -0.23402023315429688, -0.225006103515625, -0.21599197387695312, -0.20697784423828125, -0.19796371459960938, -0.1889495849609375, -0.17993545532226562, -0.17092132568359375, -0.16190719604492188, -0.15289306640625, -0.14387893676757812, -0.13486480712890625, -0.12585067749023438, -0.1168365478515625, -0.10782241821289062, -0.09880828857421875, -0.08979415893554688, -0.080780029296875, -0.07176589965820312, -0.06275177001953125, -0.053737640380859375, -0.0447235107421875, -0.035709381103515625, -0.02669525146484375, -0.017681121826171875, -0.0086669921875, 0.000347137451171875, 0.00936126708984375, 0.018375396728515625, 0.0273895263671875, 0.036403656005859375, 0.04541778564453125, 0.054431915283203125, 0.063446044921875, 0.07246017456054688, 0.08147430419921875, 0.09048843383789062, 0.0995025634765625, 0.10851669311523438, 0.11753082275390625, 0.12654495239257812, 0.13555908203125, 0.14457321166992188, 0.15358734130859375, 0.16260147094726562, 0.1716156005859375, 0.18062973022460938, 0.18964385986328125, 0.19865798950195312, 0.207672119140625, 0.21668624877929688, 0.22570037841796875, 0.23471450805664062, 0.2437286376953125, 0.2527427673339844, 0.26175689697265625, 0.2707710266113281, 0.27978515625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 10.0, 9.0, 6.0, 4.0, 17.0, 13.0, 12.0, 20.0, 33.0, 22.0, 22.0, 21.0, 26.0, 35.0, 31.0, 38.0, 42.0, 33.0, 46.0, 52.0, 32.0, 44.0, 36.0, 34.0, 33.0, 48.0, 27.0, 39.0, 30.0, 33.0, 20.0, 24.0, 20.0, 20.0, 19.0, 9.0, 9.0, 7.0, 4.0, 3.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05987548828125, -0.057913780212402344, -0.05595207214355469, -0.05399036407470703, -0.052028656005859375, -0.05006694793701172, -0.04810523986816406, -0.046143531799316406, -0.04418182373046875, -0.042220115661621094, -0.04025840759277344, -0.03829669952392578, -0.036334991455078125, -0.03437328338623047, -0.03241157531738281, -0.030449867248535156, -0.0284881591796875, -0.026526451110839844, -0.024564743041992188, -0.02260303497314453, -0.020641326904296875, -0.01867961883544922, -0.016717910766601562, -0.014756202697753906, -0.01279449462890625, -0.010832786560058594, -0.008871078491210938, -0.006909370422363281, -0.004947662353515625, -0.0029859542846679688, -0.0010242462158203125, 0.0009374618530273438, 0.002899169921875, 0.004860877990722656, 0.0068225860595703125, 0.008784294128417969, 0.010746002197265625, 0.012707710266113281, 0.014669418334960938, 0.016631126403808594, 0.01859283447265625, 0.020554542541503906, 0.022516250610351562, 0.02447795867919922, 0.026439666748046875, 0.02840137481689453, 0.030363082885742188, 0.032324790954589844, 0.0342864990234375, 0.036248207092285156, 0.03820991516113281, 0.04017162322998047, 0.042133331298828125, 0.04409503936767578, 0.04605674743652344, 0.048018455505371094, 0.04998016357421875, 0.051941871643066406, 0.05390357971191406, 0.05586528778076172, 0.057826995849609375, 0.05978870391845703, 0.06175041198730469, 0.06371212005615234, 0.065673828125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 9.0, 17.0, 20.0, 33.0, 35.0, 56.0, 75.0, 98.0, 158.0, 239.0, 381.0, 550.0, 842.0, 1358.0, 2416.0, 4253.0, 8059.0, 17861.0, 51322.0, 729134.0, 167121.0, 35246.0, 13820.0, 6548.0, 3475.0, 2014.0, 1188.0, 763.0, 459.0, 328.0, 210.0, 154.0, 97.0, 56.0, 45.0, 31.0, 13.0, 19.0, 12.0, 13.0, 8.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.259033203125, -0.2511463165283203, -0.24325942993164062, -0.23537254333496094, -0.22748565673828125, -0.21959877014160156, -0.21171188354492188, -0.2038249969482422, -0.1959381103515625, -0.1880512237548828, -0.18016433715820312, -0.17227745056152344, -0.16439056396484375, -0.15650367736816406, -0.14861679077148438, -0.1407299041748047, -0.132843017578125, -0.12495613098144531, -0.11706924438476562, -0.10918235778808594, -0.10129547119140625, -0.09340858459472656, -0.08552169799804688, -0.07763481140136719, -0.0697479248046875, -0.06186103820800781, -0.053974151611328125, -0.04608726501464844, -0.03820037841796875, -0.030313491821289062, -0.022426605224609375, -0.014539718627929688, -0.00665283203125, 0.0012340545654296875, 0.009120941162109375, 0.017007827758789062, 0.02489471435546875, 0.03278160095214844, 0.040668487548828125, 0.04855537414550781, 0.0564422607421875, 0.06432914733886719, 0.07221603393554688, 0.08010292053222656, 0.08798980712890625, 0.09587669372558594, 0.10376358032226562, 0.11165046691894531, 0.119537353515625, 0.1274242401123047, 0.13531112670898438, 0.14319801330566406, 0.15108489990234375, 0.15897178649902344, 0.16685867309570312, 0.1747455596923828, 0.1826324462890625, 0.1905193328857422, 0.19840621948242188, 0.20629310607910156, 0.21417999267578125, 0.22206687927246094, 0.22995376586914062, 0.2378406524658203, 0.2457275390625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 8.0, 9.0, 7.0, 11.0, 7.0, 20.0, 32.0, 44.0, 47.0, 97.0, 138.0, 155.0, 125.0, 76.0, 57.0, 31.0, 24.0, 18.0, 13.0, 11.0, 9.0, 10.0, 7.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-7.748603820800781e-06, -7.5232237577438354e-06, -7.29784369468689e-06, -7.072463631629944e-06, -6.847083568572998e-06, -6.621703505516052e-06, -6.3963234424591064e-06, -6.170943379402161e-06, -5.945563316345215e-06, -5.720183253288269e-06, -5.494803190231323e-06, -5.2694231271743774e-06, -5.044043064117432e-06, -4.818663001060486e-06, -4.59328293800354e-06, -4.367902874946594e-06, -4.1425228118896484e-06, -3.917142748832703e-06, -3.691762685775757e-06, -3.466382622718811e-06, -3.2410025596618652e-06, -3.0156224966049194e-06, -2.7902424335479736e-06, -2.564862370491028e-06, -2.339482307434082e-06, -2.1141022443771362e-06, -1.8887221813201904e-06, -1.6633421182632446e-06, -1.4379620552062988e-06, -1.212581992149353e-06, -9.872019290924072e-07, -7.618218660354614e-07, -5.364418029785156e-07, -3.110617399215698e-07, -8.568167686462402e-08, 1.3969838619232178e-07, 3.650784492492676e-07, 5.904585123062134e-07, 8.158385753631592e-07, 1.041218638420105e-06, 1.2665987014770508e-06, 1.4919787645339966e-06, 1.7173588275909424e-06, 1.942738890647888e-06, 2.168118953704834e-06, 2.3934990167617798e-06, 2.6188790798187256e-06, 2.8442591428756714e-06, 3.069639205932617e-06, 3.295019268989563e-06, 3.520399332046509e-06, 3.7457793951034546e-06, 3.9711594581604e-06, 4.196539521217346e-06, 4.421919584274292e-06, 4.647299647331238e-06, 4.872679710388184e-06, 5.098059773445129e-06, 5.323439836502075e-06, 5.548819899559021e-06, 5.774199962615967e-06, 5.999580025672913e-06, 6.224960088729858e-06, 6.450340151786804e-06, 6.67572021484375e-06]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 5.0, 7.0, 10.0, 12.0, 17.0, 27.0, 31.0, 48.0, 73.0, 114.0, 161.0, 224.0, 341.0, 547.0, 830.0, 1294.0, 2114.0, 3743.0, 7037.0, 14653.0, 37403.0, 169565.0, 718598.0, 52923.0, 18928.0, 8538.0, 4616.0, 2522.0, 1500.0, 885.0, 563.0, 420.0, 242.0, 195.0, 97.0, 83.0, 60.0, 38.0, 36.0, 16.0, 14.0, 10.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.242919921875, -0.23559188842773438, -0.22826385498046875, -0.22093582153320312, -0.2136077880859375, -0.20627975463867188, -0.19895172119140625, -0.19162368774414062, -0.184295654296875, -0.17696762084960938, -0.16963958740234375, -0.16231155395507812, -0.1549835205078125, -0.14765548706054688, -0.14032745361328125, -0.13299942016601562, -0.12567138671875, -0.11834335327148438, -0.11101531982421875, -0.10368728637695312, -0.0963592529296875, -0.08903121948242188, -0.08170318603515625, -0.07437515258789062, -0.067047119140625, -0.059719085693359375, -0.05239105224609375, -0.045063018798828125, -0.0377349853515625, -0.030406951904296875, -0.02307891845703125, -0.015750885009765625, -0.0084228515625, -0.001094818115234375, 0.00623321533203125, 0.013561248779296875, 0.0208892822265625, 0.028217315673828125, 0.03554534912109375, 0.042873382568359375, 0.050201416015625, 0.057529449462890625, 0.06485748291015625, 0.07218551635742188, 0.0795135498046875, 0.08684158325195312, 0.09416961669921875, 0.10149765014648438, 0.10882568359375, 0.11615371704101562, 0.12348175048828125, 0.13080978393554688, 0.1381378173828125, 0.14546585083007812, 0.15279388427734375, 0.16012191772460938, 0.167449951171875, 0.17477798461914062, 0.18210601806640625, 0.18943405151367188, 0.1967620849609375, 0.20409011840820312, 0.21141815185546875, 0.21874618530273438, 0.22607421875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 2.0, 7.0, 8.0, 12.0, 19.0, 9.0, 22.0, 28.0, 24.0, 33.0, 34.0, 47.0, 86.0, 353.0, 55.0, 34.0, 41.0, 41.0, 25.0, 21.0, 16.0, 17.0, 4.0, 7.0, 9.0, 7.0, 4.0, 4.0, 1.0, 6.0, 7.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.04931640625, -0.04783058166503906, -0.046344757080078125, -0.04485893249511719, -0.04337310791015625, -0.04188728332519531, -0.040401458740234375, -0.03891563415527344, -0.0374298095703125, -0.03594398498535156, -0.034458160400390625, -0.03297233581542969, -0.03148651123046875, -0.030000686645507812, -0.028514862060546875, -0.027029037475585938, -0.025543212890625, -0.024057388305664062, -0.022571563720703125, -0.021085739135742188, -0.01959991455078125, -0.018114089965820312, -0.016628265380859375, -0.015142440795898438, -0.0136566162109375, -0.012170791625976562, -0.010684967041015625, -0.009199142456054688, -0.00771331787109375, -0.0062274932861328125, -0.004741668701171875, -0.0032558441162109375, -0.00177001953125, -0.0002841949462890625, 0.001201629638671875, 0.0026874542236328125, 0.00417327880859375, 0.0056591033935546875, 0.007144927978515625, 0.008630752563476562, 0.0101165771484375, 0.011602401733398438, 0.013088226318359375, 0.014574050903320312, 0.01605987548828125, 0.017545700073242188, 0.019031524658203125, 0.020517349243164062, 0.022003173828125, 0.023488998413085938, 0.024974822998046875, 0.026460647583007812, 0.02794647216796875, 0.029432296752929688, 0.030918121337890625, 0.03240394592285156, 0.0338897705078125, 0.03537559509277344, 0.036861419677734375, 0.03834724426269531, 0.03983306884765625, 0.04131889343261719, 0.042804718017578125, 0.04429054260253906, 0.0457763671875]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 9.0, 10.0, 15.0, 27.0, 39.0, 49.0, 93.0, 129.0, 210.0, 195.0, 89.0, 51.0, 16.0, 15.0, 12.0, 4.0, 14.0, 1.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17663122713565826, -0.16863369941711426, -0.16063618659973145, -0.15263865888118744, -0.14464113116264343, -0.13664360344409943, -0.12864607572555542, -0.12064856290817261, -0.1126510351896286, -0.1046535074710846, -0.09665598720312119, -0.08865846693515778, -0.08066093921661377, -0.07266341149806976, -0.06466589123010635, -0.056668367236852646, -0.04867084324359894, -0.04067331925034523, -0.03267579525709152, -0.024678271263837814, -0.016680747270584106, -0.008683223277330399, -0.0006856992840766907, 0.007311824709177017, 0.015309348702430725, 0.023306872695684433, 0.03130439668893814, 0.03930192068219185, 0.04729944467544556, 0.055296968668699265, 0.06329449266195297, 0.07129201292991638, 0.07928955554962158, 0.08728708326816559, 0.095284603536129, 0.10328212380409241, 0.11127965152263641, 0.11927717924118042, 0.12727469205856323, 0.13527221977710724, 0.14326974749565125, 0.15126727521419525, 0.15926480293273926, 0.16726231575012207, 0.17525984346866608, 0.18325737118721008, 0.1912548840045929, 0.1992524117231369, 0.2072499394416809, 0.21524746716022491, 0.22324499487876892, 0.23124250769615173, 0.23924003541469574, 0.24723756313323975, 0.25523507595062256, 0.26323261857032776, 0.27123013138771057, 0.2792276442050934, 0.2872251868247986, 0.2952226996421814, 0.3032202124595642, 0.3112177550792694, 0.3192152678966522, 0.3272128105163574, 0.33521032333374023]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 9.0, 6.0, 10.0, 8.0, 14.0, 11.0, 14.0, 21.0, 22.0, 31.0, 33.0, 35.0, 41.0, 32.0, 43.0, 50.0, 41.0, 45.0, 53.0, 49.0, 41.0, 40.0, 50.0, 28.0, 37.0, 41.0, 26.0, 22.0, 25.0, 16.0, 24.0, 20.0, 18.0, 9.0, 10.0, 6.0, 8.0, 5.0, 1.0, 2.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11947879195213318, -0.11584986001253128, -0.11222092807292938, -0.10859199613332748, -0.10496306419372559, -0.10133413225412369, -0.09770520031452179, -0.09407627582550049, -0.090447336435318, -0.0868184044957161, -0.0831894725561142, -0.0795605406165123, -0.0759316086769104, -0.0723026767373085, -0.0686737447977066, -0.0650448203086853, -0.061415888369083405, -0.057786956429481506, -0.05415802448987961, -0.05052909255027771, -0.04690016061067581, -0.043271228671073914, -0.039642300456762314, -0.036013368517160416, -0.03238443657755852, -0.02875550463795662, -0.02512657269835472, -0.021497642621397972, -0.017868710681796074, -0.014239778742194176, -0.010610848665237427, -0.0069819167256355286, -0.0033529847860336304, 0.0002759466879069805, 0.0039048781618475914, 0.007533809170126915, 0.011162741109728813, 0.014791673049330711, 0.01842060312628746, 0.02204953506588936, 0.025678467005491257, 0.029307398945093155, 0.03293633088469505, 0.03656525909900665, 0.04019419103860855, 0.04382312297821045, 0.04745205491781235, 0.051080986857414246, 0.054709918797016144, 0.05833885073661804, 0.06196778267621994, 0.06559671461582184, 0.06922564655542374, 0.07285457849502563, 0.07648350298404694, 0.08011244237422943, 0.08374136686325073, 0.08737029880285263, 0.09099923074245453, 0.09462816268205643, 0.09825709462165833, 0.10188602656126022, 0.10551495850086212, 0.10914388298988342, 0.11277282238006592]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 14.0, 12.0, 14.0, 36.0, 43.0, 65.0, 92.0, 130.0, 202.0, 300.0, 436.0, 695.0, 1043.0, 1699.0, 2616.0, 4143.0, 6931.0, 11076.0, 18364.0, 31367.0, 55396.0, 107569.0, 243939.0, 963414.0, 1920040.0, 475295.0, 162214.0, 78347.0, 43018.0, 24729.0, 14786.0, 9139.0, 5754.0, 3760.0, 2500.0, 1644.0, 1110.0, 799.0, 524.0, 342.0, 233.0, 152.0, 97.0, 74.0, 37.0, 36.0, 17.0, 17.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.1474609375, -0.1431598663330078, -0.13885879516601562, -0.13455772399902344, -0.13025665283203125, -0.12595558166503906, -0.12165451049804688, -0.11735343933105469, -0.1130523681640625, -0.10875129699707031, -0.10445022583007812, -0.10014915466308594, -0.09584808349609375, -0.09154701232910156, -0.08724594116210938, -0.08294486999511719, -0.078643798828125, -0.07434272766113281, -0.07004165649414062, -0.06574058532714844, -0.06143951416015625, -0.05713844299316406, -0.052837371826171875, -0.04853630065917969, -0.0442352294921875, -0.03993415832519531, -0.035633087158203125, -0.03133201599121094, -0.02703094482421875, -0.022729873657226562, -0.018428802490234375, -0.014127731323242188, -0.00982666015625, -0.0055255889892578125, -0.001224517822265625, 0.0030765533447265625, 0.00737762451171875, 0.011678695678710938, 0.015979766845703125, 0.020280838012695312, 0.0245819091796875, 0.028882980346679688, 0.033184051513671875, 0.03748512268066406, 0.04178619384765625, 0.04608726501464844, 0.050388336181640625, 0.05468940734863281, 0.058990478515625, 0.06329154968261719, 0.06759262084960938, 0.07189369201660156, 0.07619476318359375, 0.08049583435058594, 0.08479690551757812, 0.08909797668457031, 0.0933990478515625, 0.09770011901855469, 0.10200119018554688, 0.10630226135253906, 0.11060333251953125, 0.11490440368652344, 0.11920547485351562, 0.12350654602050781, 0.1278076171875]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 8.0, 8.0, 7.0, 6.0, 12.0, 11.0, 26.0, 26.0, 22.0, 38.0, 43.0, 35.0, 36.0, 46.0, 50.0, 48.0, 32.0, 43.0, 62.0, 38.0, 37.0, 37.0, 41.0, 39.0, 39.0, 23.0, 24.0, 26.0, 21.0, 20.0, 24.0, 14.0, 21.0, 4.0, 4.0, 8.0, 6.0, 2.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05633544921875, -0.05450773239135742, -0.052680015563964844, -0.050852298736572266, -0.04902458190917969, -0.04719686508178711, -0.04536914825439453, -0.04354143142700195, -0.041713714599609375, -0.0398859977722168, -0.03805828094482422, -0.03623056411743164, -0.03440284729003906, -0.032575130462646484, -0.030747413635253906, -0.028919696807861328, -0.02709197998046875, -0.025264263153076172, -0.023436546325683594, -0.021608829498291016, -0.019781112670898438, -0.01795339584350586, -0.01612567901611328, -0.014297962188720703, -0.012470245361328125, -0.010642528533935547, -0.008814811706542969, -0.006987094879150391, -0.0051593780517578125, -0.0033316612243652344, -0.0015039443969726562, 0.0003237724304199219, 0.0021514892578125, 0.003979206085205078, 0.005806922912597656, 0.007634639739990234, 0.009462356567382812, 0.01129007339477539, 0.013117790222167969, 0.014945507049560547, 0.016773223876953125, 0.018600940704345703, 0.02042865753173828, 0.02225637435913086, 0.024084091186523438, 0.025911808013916016, 0.027739524841308594, 0.029567241668701172, 0.03139495849609375, 0.03322267532348633, 0.035050392150878906, 0.036878108978271484, 0.03870582580566406, 0.04053354263305664, 0.04236125946044922, 0.0441889762878418, 0.046016693115234375, 0.04784440994262695, 0.04967212677001953, 0.05149984359741211, 0.05332756042480469, 0.055155277252197266, 0.056982994079589844, 0.05881071090698242, 0.060638427734375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 14.0, 18.0, 17.0, 31.0, 59.0, 67.0, 99.0, 139.0, 207.0, 331.0, 504.0, 816.0, 1217.0, 2023.0, 3215.0, 5612.0, 10077.0, 18008.0, 35167.0, 75651.0, 190772.0, 640347.0, 2169339.0, 682941.0, 199842.0, 78750.0, 35966.0, 18515.0, 9838.0, 5578.0, 3400.0, 2015.0, 1276.0, 807.0, 545.0, 350.0, 247.0, 160.0, 99.0, 84.0, 57.0, 19.0, 18.0, 9.0, 10.0, 9.0, 5.0, 7.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.1385498046875, -0.1344165802001953, -0.13028335571289062, -0.12615013122558594, -0.12201690673828125, -0.11788368225097656, -0.11375045776367188, -0.10961723327636719, -0.1054840087890625, -0.10135078430175781, -0.09721755981445312, -0.09308433532714844, -0.08895111083984375, -0.08481788635253906, -0.08068466186523438, -0.07655143737792969, -0.072418212890625, -0.06828498840332031, -0.06415176391601562, -0.06001853942871094, -0.05588531494140625, -0.05175209045410156, -0.047618865966796875, -0.04348564147949219, -0.0393524169921875, -0.03521919250488281, -0.031085968017578125, -0.026952743530273438, -0.02281951904296875, -0.018686294555664062, -0.014553070068359375, -0.010419845581054688, -0.00628662109375, -0.0021533966064453125, 0.001979827880859375, 0.0061130523681640625, 0.01024627685546875, 0.014379501342773438, 0.018512725830078125, 0.022645950317382812, 0.0267791748046875, 0.030912399291992188, 0.035045623779296875, 0.03917884826660156, 0.04331207275390625, 0.04744529724121094, 0.051578521728515625, 0.05571174621582031, 0.059844970703125, 0.06397819519042969, 0.06811141967773438, 0.07224464416503906, 0.07637786865234375, 0.08051109313964844, 0.08464431762695312, 0.08877754211425781, 0.0929107666015625, 0.09704399108886719, 0.10117721557617188, 0.10531044006347656, 0.10944366455078125, 0.11357688903808594, 0.11771011352539062, 0.12184333801269531, 0.1259765625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 4.0, 5.0, 4.0, 11.0, 8.0, 12.0, 14.0, 24.0, 30.0, 30.0, 37.0, 58.0, 77.0, 74.0, 99.0, 123.0, 141.0, 190.0, 230.0, 258.0, 366.0, 372.0, 337.0, 293.0, 267.0, 190.0, 194.0, 120.0, 118.0, 98.0, 55.0, 53.0, 43.0, 35.0, 27.0, 24.0, 16.0, 10.0, 7.0, 3.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0316162109375, -0.030617237091064453, -0.029618263244628906, -0.02861928939819336, -0.027620315551757812, -0.026621341705322266, -0.02562236785888672, -0.024623394012451172, -0.023624420166015625, -0.022625446319580078, -0.02162647247314453, -0.020627498626708984, -0.019628524780273438, -0.01862955093383789, -0.017630577087402344, -0.016631603240966797, -0.01563262939453125, -0.014633655548095703, -0.013634681701660156, -0.01263570785522461, -0.011636734008789062, -0.010637760162353516, -0.009638786315917969, -0.008639812469482422, -0.007640838623046875, -0.006641864776611328, -0.005642890930175781, -0.004643917083740234, -0.0036449432373046875, -0.0026459693908691406, -0.0016469955444335938, -0.0006480216979980469, 0.0003509521484375, 0.0013499259948730469, 0.0023488998413085938, 0.0033478736877441406, 0.0043468475341796875, 0.005345821380615234, 0.006344795227050781, 0.007343769073486328, 0.008342742919921875, 0.009341716766357422, 0.010340690612792969, 0.011339664459228516, 0.012338638305664062, 0.01333761215209961, 0.014336585998535156, 0.015335559844970703, 0.01633453369140625, 0.017333507537841797, 0.018332481384277344, 0.01933145523071289, 0.020330429077148438, 0.021329402923583984, 0.02232837677001953, 0.023327350616455078, 0.024326324462890625, 0.025325298309326172, 0.02632427215576172, 0.027323246002197266, 0.028322219848632812, 0.02932119369506836, 0.030320167541503906, 0.03131914138793945, 0.032318115234375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 11.0, 17.0, 13.0, 17.0, 32.0, 45.0, 68.0, 103.0, 162.0, 169.0, 136.0, 80.0, 48.0, 25.0, 12.0, 13.0, 8.0, 6.0, 6.0, 5.0, 1.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09861345589160919, -0.09456570446491241, -0.09051796048879623, -0.08647021651268005, -0.08242246508598328, -0.0783747136592865, -0.07432696968317032, -0.07027922570705414, -0.06623147428035736, -0.06218372657895088, -0.0581359788775444, -0.054088231176137924, -0.050040483474731445, -0.045992735773324966, -0.04194498807191849, -0.03789724037051201, -0.03384949266910553, -0.02980174496769905, -0.025753997266292572, -0.021706249564886093, -0.017658501863479614, -0.013610754162073135, -0.009563006460666656, -0.005515258759260178, -0.0014675110578536987, 0.00258023664355278, 0.006627984344959259, 0.010675732046365738, 0.014723479747772217, 0.018771227449178696, 0.022818975150585175, 0.026866722851991653, 0.030914485454559326, 0.034962233155965805, 0.039009980857372284, 0.04305772855877876, 0.04710547626018524, 0.05115322396159172, 0.0552009716629982, 0.05924871936440468, 0.06329646706581116, 0.06734421849250793, 0.07139196246862411, 0.0754397064447403, 0.07948745787143707, 0.08353520929813385, 0.08758295327425003, 0.09163069725036621, 0.09567844867706299, 0.09972620010375977, 0.10377394407987595, 0.10782168805599213, 0.1118694394826889, 0.11591719090938568, 0.11996493488550186, 0.12401267886161804, 0.12806043028831482, 0.1321081817150116, 0.13615593314170837, 0.14020366966724396, 0.14425142109394073, 0.1482991725206375, 0.1523469090461731, 0.15639466047286987, 0.16044241189956665]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 12.0, 16.0, 6.0, 23.0, 14.0, 26.0, 29.0, 28.0, 44.0, 46.0, 42.0, 42.0, 57.0, 51.0, 50.0, 52.0, 58.0, 37.0, 34.0, 51.0, 39.0, 41.0, 28.0, 27.0, 26.0, 22.0, 17.0, 17.0, 10.0, 7.0, 9.0, 6.0, 9.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07376483827829361, -0.07160855829715729, -0.06945228576660156, -0.06729600578546524, -0.06513972580432892, -0.0629834532737732, -0.06082717329263687, -0.05867089331150055, -0.056514617055654526, -0.0543583407998085, -0.05220206081867218, -0.05004578456282616, -0.04788950830698013, -0.04573322832584381, -0.04357695206999779, -0.041420675814151764, -0.03926439583301544, -0.03710811957716942, -0.034951839596033096, -0.03279556334018707, -0.0306392852216959, -0.028483007103204727, -0.026326730847358704, -0.02417045272886753, -0.022014174610376358, -0.019857896491885185, -0.017701618373394012, -0.015545342117547989, -0.013389063999056816, -0.011232785880565643, -0.009076508693397045, -0.006920231506228447, -0.004763945937156677, -0.0026076682843267918, -0.0004513906314969063, 0.0017048870213329792, 0.0038611646741628647, 0.0060174427926540375, 0.008173719979822636, 0.010329997166991234, 0.012486275285482407, 0.01464255340397358, 0.016798831522464752, 0.018955107778310776, 0.02111138589680195, 0.02326766401529312, 0.025423940271139145, 0.027580218389630318, 0.02973649650812149, 0.031892772763967514, 0.034049052745103836, 0.03620532900094986, 0.03836160898208618, 0.040517885237932205, 0.04267416149377823, 0.04483044147491455, 0.046986717730760574, 0.0491429939866066, 0.05129927396774292, 0.053455550223588943, 0.05561182647943497, 0.05776810646057129, 0.05992438271641731, 0.062080658972263336, 0.06423693895339966]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 9.0, 12.0, 17.0, 26.0, 28.0, 41.0, 91.0, 99.0, 132.0, 213.0, 289.0, 437.0, 648.0, 977.0, 1581.0, 2402.0, 3912.0, 6948.0, 13210.0, 27688.0, 68403.0, 201170.0, 411462.0, 187838.0, 64630.0, 26261.0, 12596.0, 6765.0, 3968.0, 2221.0, 1498.0, 956.0, 652.0, 396.0, 296.0, 201.0, 156.0, 96.0, 64.0, 50.0, 33.0, 29.0, 19.0, 11.0, 4.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0760498046875, -0.07363319396972656, -0.07121658325195312, -0.06879997253417969, -0.06638336181640625, -0.06396675109863281, -0.061550140380859375, -0.05913352966308594, -0.0567169189453125, -0.05430030822753906, -0.051883697509765625, -0.04946708679199219, -0.04705047607421875, -0.04463386535644531, -0.042217254638671875, -0.03980064392089844, -0.037384033203125, -0.03496742248535156, -0.032550811767578125, -0.030134201049804688, -0.02771759033203125, -0.025300979614257812, -0.022884368896484375, -0.020467758178710938, -0.0180511474609375, -0.015634536743164062, -0.013217926025390625, -0.010801315307617188, -0.00838470458984375, -0.0059680938720703125, -0.003551483154296875, -0.0011348724365234375, 0.00128173828125, 0.0036983489990234375, 0.006114959716796875, 0.008531570434570312, 0.01094818115234375, 0.013364791870117188, 0.015781402587890625, 0.018198013305664062, 0.0206146240234375, 0.023031234741210938, 0.025447845458984375, 0.027864456176757812, 0.03028106689453125, 0.03269767761230469, 0.035114288330078125, 0.03753089904785156, 0.039947509765625, 0.04236412048339844, 0.044780731201171875, 0.04719734191894531, 0.04961395263671875, 0.05203056335449219, 0.054447174072265625, 0.05686378479003906, 0.0592803955078125, 0.06169700622558594, 0.06411361694335938, 0.06653022766113281, 0.06894683837890625, 0.07136344909667969, 0.07378005981445312, 0.07619667053222656, 0.07861328125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 13.0, 10.0, 9.0, 10.0, 17.0, 27.0, 21.0, 25.0, 32.0, 20.0, 45.0, 26.0, 29.0, 46.0, 39.0, 49.0, 51.0, 48.0, 42.0, 51.0, 38.0, 29.0, 41.0, 44.0, 34.0, 30.0, 23.0, 22.0, 22.0, 22.0, 13.0, 5.0, 14.0, 9.0, 5.0, 9.0, 9.0, 6.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0640869140625, -0.062285423278808594, -0.06048393249511719, -0.05868244171142578, -0.056880950927734375, -0.05507946014404297, -0.05327796936035156, -0.051476478576660156, -0.04967498779296875, -0.047873497009277344, -0.04607200622558594, -0.04427051544189453, -0.042469024658203125, -0.04066753387451172, -0.03886604309082031, -0.037064552307128906, -0.0352630615234375, -0.033461570739746094, -0.03166007995605469, -0.02985858917236328, -0.028057098388671875, -0.02625560760498047, -0.024454116821289062, -0.022652626037597656, -0.02085113525390625, -0.019049644470214844, -0.017248153686523438, -0.015446662902832031, -0.013645172119140625, -0.011843681335449219, -0.010042190551757812, -0.008240699768066406, -0.006439208984375, -0.004637718200683594, -0.0028362274169921875, -0.0010347366333007812, 0.000766754150390625, 0.0025682449340820312, 0.0043697357177734375, 0.006171226501464844, 0.00797271728515625, 0.009774208068847656, 0.011575698852539062, 0.013377189636230469, 0.015178680419921875, 0.01698017120361328, 0.018781661987304688, 0.020583152770996094, 0.0223846435546875, 0.024186134338378906, 0.025987625122070312, 0.02778911590576172, 0.029590606689453125, 0.03139209747314453, 0.03319358825683594, 0.034995079040527344, 0.03679656982421875, 0.038598060607910156, 0.04039955139160156, 0.04220104217529297, 0.044002532958984375, 0.04580402374267578, 0.04760551452636719, 0.049407005310058594, 0.05120849609375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 9.0, 13.0, 19.0, 24.0, 36.0, 48.0, 126.0, 193.0, 350.0, 648.0, 1406.0, 3153.0, 8142.0, 28161.0, 159129.0, 695851.0, 116334.0, 22665.0, 6887.0, 2764.0, 1246.0, 572.0, 327.0, 173.0, 119.0, 51.0, 25.0, 25.0, 17.0, 13.0, 8.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.112548828125, -0.10812187194824219, -0.10369491577148438, -0.09926795959472656, -0.09484100341796875, -0.09041404724121094, -0.08598709106445312, -0.08156013488769531, -0.0771331787109375, -0.07270622253417969, -0.06827926635742188, -0.06385231018066406, -0.05942535400390625, -0.05499839782714844, -0.050571441650390625, -0.04614448547363281, -0.041717529296875, -0.03729057312011719, -0.032863616943359375, -0.028436660766601562, -0.02400970458984375, -0.019582748413085938, -0.015155792236328125, -0.010728836059570312, -0.0063018798828125, -0.0018749237060546875, 0.002552032470703125, 0.0069789886474609375, 0.01140594482421875, 0.015832901000976562, 0.020259857177734375, 0.024686813354492188, 0.02911376953125, 0.03354072570800781, 0.037967681884765625, 0.04239463806152344, 0.04682159423828125, 0.05124855041503906, 0.055675506591796875, 0.06010246276855469, 0.0645294189453125, 0.06895637512207031, 0.07338333129882812, 0.07781028747558594, 0.08223724365234375, 0.08666419982910156, 0.09109115600585938, 0.09551811218261719, 0.099945068359375, 0.10437202453613281, 0.10879898071289062, 0.11322593688964844, 0.11765289306640625, 0.12207984924316406, 0.12650680541992188, 0.1309337615966797, 0.1353607177734375, 0.1397876739501953, 0.14421463012695312, 0.14864158630371094, 0.15306854248046875, 0.15749549865722656, 0.16192245483398438, 0.1663494110107422, 0.1707763671875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 4.0, 8.0, 9.0, 8.0, 12.0, 16.0, 17.0, 20.0, 25.0, 12.0, 23.0, 40.0, 32.0, 40.0, 35.0, 39.0, 36.0, 53.0, 41.0, 46.0, 49.0, 39.0, 37.0, 39.0, 39.0, 31.0, 37.0, 15.0, 36.0, 29.0, 24.0, 20.0, 15.0, 11.0, 11.0, 8.0, 15.0, 4.0, 2.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033111572265625, -0.03195333480834961, -0.03079509735107422, -0.029636859893798828, -0.028478622436523438, -0.027320384979248047, -0.026162147521972656, -0.025003910064697266, -0.023845672607421875, -0.022687435150146484, -0.021529197692871094, -0.020370960235595703, -0.019212722778320312, -0.018054485321044922, -0.01689624786376953, -0.01573801040649414, -0.01457977294921875, -0.01342153549194336, -0.012263298034667969, -0.011105060577392578, -0.009946823120117188, -0.008788585662841797, -0.007630348205566406, -0.006472110748291016, -0.005313873291015625, -0.004155635833740234, -0.0029973983764648438, -0.0018391609191894531, -0.0006809234619140625, 0.0004773139953613281, 0.0016355514526367188, 0.0027937889099121094, 0.0039520263671875, 0.005110263824462891, 0.006268501281738281, 0.007426738739013672, 0.008584976196289062, 0.009743213653564453, 0.010901451110839844, 0.012059688568115234, 0.013217926025390625, 0.014376163482666016, 0.015534400939941406, 0.016692638397216797, 0.017850875854492188, 0.019009113311767578, 0.02016735076904297, 0.02132558822631836, 0.02248382568359375, 0.02364206314086914, 0.02480030059814453, 0.025958538055419922, 0.027116775512695312, 0.028275012969970703, 0.029433250427246094, 0.030591487884521484, 0.031749725341796875, 0.032907962799072266, 0.034066200256347656, 0.03522443771362305, 0.03638267517089844, 0.03754091262817383, 0.03869915008544922, 0.03985738754272461, 0.041015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 12.0, 16.0, 17.0, 32.0, 53.0, 66.0, 107.0, 150.0, 185.0, 305.0, 428.0, 675.0, 1048.0, 1541.0, 2378.0, 3739.0, 6614.0, 11445.0, 23100.0, 56916.0, 228253.0, 532147.0, 105162.0, 35431.0, 16308.0, 8654.0, 5035.0, 3059.0, 1919.0, 1226.0, 819.0, 532.0, 339.0, 270.0, 179.0, 132.0, 91.0, 58.0, 30.0, 23.0, 18.0, 14.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01934814453125, -0.01870870590209961, -0.01806926727294922, -0.017429828643798828, -0.016790390014648438, -0.016150951385498047, -0.015511512756347656, -0.014872074127197266, -0.014232635498046875, -0.013593196868896484, -0.012953758239746094, -0.012314319610595703, -0.011674880981445312, -0.011035442352294922, -0.010396003723144531, -0.00975656509399414, -0.00911712646484375, -0.00847768783569336, -0.007838249206542969, -0.007198810577392578, -0.0065593719482421875, -0.005919933319091797, -0.005280494689941406, -0.004641056060791016, -0.004001617431640625, -0.0033621788024902344, -0.0027227401733398438, -0.002083301544189453, -0.0014438629150390625, -0.0008044242858886719, -0.00016498565673828125, 0.0004744529724121094, 0.0011138916015625, 0.0017533302307128906, 0.0023927688598632812, 0.003032207489013672, 0.0036716461181640625, 0.004311084747314453, 0.004950523376464844, 0.005589962005615234, 0.006229400634765625, 0.006868839263916016, 0.007508277893066406, 0.008147716522216797, 0.008787155151367188, 0.009426593780517578, 0.010066032409667969, 0.01070547103881836, 0.01134490966796875, 0.01198434829711914, 0.012623786926269531, 0.013263225555419922, 0.013902664184570312, 0.014542102813720703, 0.015181541442871094, 0.015820980072021484, 0.016460418701171875, 0.017099857330322266, 0.017739295959472656, 0.018378734588623047, 0.019018173217773438, 0.019657611846923828, 0.02029705047607422, 0.02093648910522461, 0.021575927734375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 8.0, 2.0, 2.0, 2.0, 9.0, 8.0, 6.0, 11.0, 17.0, 10.0, 19.0, 27.0, 43.0, 99.0, 176.0, 212.0, 135.0, 52.0, 28.0, 23.0, 15.0, 12.0, 12.0, 9.0, 6.0, 10.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0], "bins": [-2.0742416381835938e-05, -2.0137056708335876e-05, -1.9531697034835815e-05, -1.8926337361335754e-05, -1.8320977687835693e-05, -1.7715618014335632e-05, -1.711025834083557e-05, -1.650489866733551e-05, -1.589953899383545e-05, -1.5294179320335388e-05, -1.4688819646835327e-05, -1.4083459973335266e-05, -1.3478100299835205e-05, -1.2872740626335144e-05, -1.2267380952835083e-05, -1.1662021279335022e-05, -1.1056661605834961e-05, -1.04513019323349e-05, -9.845942258834839e-06, -9.240582585334778e-06, -8.635222911834717e-06, -8.029863238334656e-06, -7.424503564834595e-06, -6.819143891334534e-06, -6.213784217834473e-06, -5.608424544334412e-06, -5.003064870834351e-06, -4.3977051973342896e-06, -3.7923455238342285e-06, -3.1869858503341675e-06, -2.5816261768341064e-06, -1.9762665033340454e-06, -1.3709068298339844e-06, -7.655471563339233e-07, -1.601874828338623e-07, 4.4517219066619873e-07, 1.0505318641662598e-06, 1.6558915376663208e-06, 2.261251211166382e-06, 2.866610884666443e-06, 3.471970558166504e-06, 4.077330231666565e-06, 4.682689905166626e-06, 5.288049578666687e-06, 5.893409252166748e-06, 6.498768925666809e-06, 7.10412859916687e-06, 7.709488272666931e-06, 8.314847946166992e-06, 8.920207619667053e-06, 9.525567293167114e-06, 1.0130926966667175e-05, 1.0736286640167236e-05, 1.1341646313667297e-05, 1.1947005987167358e-05, 1.255236566066742e-05, 1.315772533416748e-05, 1.3763085007667542e-05, 1.4368444681167603e-05, 1.4973804354667664e-05, 1.5579164028167725e-05, 1.6184523701667786e-05, 1.6789883375167847e-05, 1.7395243048667908e-05, 1.800060272216797e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 7.0, 9.0, 18.0, 17.0, 27.0, 24.0, 38.0, 56.0, 77.0, 113.0, 173.0, 249.0, 399.0, 651.0, 1088.0, 1965.0, 3753.0, 7522.0, 17010.0, 42900.0, 144181.0, 543333.0, 193294.0, 52994.0, 20022.0, 8930.0, 4243.0, 2139.0, 1249.0, 683.0, 428.0, 269.0, 215.0, 123.0, 104.0, 58.0, 51.0, 33.0, 30.0, 24.0, 10.0, 12.0, 8.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01415252685546875, -0.013674378395080566, -0.013196229934692383, -0.0127180814743042, -0.012239933013916016, -0.011761784553527832, -0.011283636093139648, -0.010805487632751465, -0.010327339172363281, -0.009849190711975098, -0.009371042251586914, -0.00889289379119873, -0.008414745330810547, -0.007936596870422363, -0.00745844841003418, -0.006980299949645996, -0.0065021514892578125, -0.006024003028869629, -0.005545854568481445, -0.005067706108093262, -0.004589557647705078, -0.0041114091873168945, -0.003633260726928711, -0.0031551122665405273, -0.0026769638061523438, -0.00219881534576416, -0.0017206668853759766, -0.001242518424987793, -0.0007643699645996094, -0.0002862215042114258, 0.0001919269561767578, 0.0006700754165649414, 0.001148223876953125, 0.0016263723373413086, 0.002104520797729492, 0.0025826692581176758, 0.0030608177185058594, 0.003538966178894043, 0.0040171146392822266, 0.00449526309967041, 0.004973411560058594, 0.005451560020446777, 0.005929708480834961, 0.0064078569412231445, 0.006886005401611328, 0.007364153861999512, 0.007842302322387695, 0.008320450782775879, 0.008798599243164062, 0.009276747703552246, 0.00975489616394043, 0.010233044624328613, 0.010711193084716797, 0.01118934154510498, 0.011667490005493164, 0.012145638465881348, 0.012623786926269531, 0.013101935386657715, 0.013580083847045898, 0.014058232307434082, 0.014536380767822266, 0.01501452922821045, 0.015492677688598633, 0.015970826148986816, 0.016448974609375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 7.0, 0.0, 6.0, 11.0, 10.0, 9.0, 13.0, 10.0, 20.0, 24.0, 29.0, 28.0, 49.0, 43.0, 69.0, 78.0, 78.0, 67.0, 71.0, 75.0, 50.0, 46.0, 31.0, 37.0, 26.0, 14.0, 22.0, 14.0, 16.0, 8.0, 8.0, 7.0, 9.0, 8.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.003814697265625, -0.003693819046020508, -0.0035729408264160156, -0.0034520626068115234, -0.0033311843872070312, -0.003210306167602539, -0.003089427947998047, -0.0029685497283935547, -0.0028476715087890625, -0.0027267932891845703, -0.002605915069580078, -0.002485036849975586, -0.0023641586303710938, -0.0022432804107666016, -0.0021224021911621094, -0.002001523971557617, -0.001880645751953125, -0.0017597675323486328, -0.0016388893127441406, -0.0015180110931396484, -0.0013971328735351562, -0.001276254653930664, -0.0011553764343261719, -0.0010344982147216797, -0.0009136199951171875, -0.0007927417755126953, -0.0006718635559082031, -0.0005509853363037109, -0.00043010711669921875, -0.00030922889709472656, -0.00018835067749023438, -6.747245788574219e-05, 5.340576171875e-05, 0.0001742839813232422, 0.0002951622009277344, 0.00041604042053222656, 0.0005369186401367188, 0.0006577968597412109, 0.0007786750793457031, 0.0008995532989501953, 0.0010204315185546875, 0.0011413097381591797, 0.0012621879577636719, 0.001383066177368164, 0.0015039443969726562, 0.0016248226165771484, 0.0017457008361816406, 0.0018665790557861328, 0.001987457275390625, 0.002108335494995117, 0.0022292137145996094, 0.0023500919342041016, 0.0024709701538085938, 0.002591848373413086, 0.002712726593017578, 0.0028336048126220703, 0.0029544830322265625, 0.0030753612518310547, 0.003196239471435547, 0.003317117691040039, 0.0034379959106445312, 0.0035588741302490234, 0.0036797523498535156, 0.003800630569458008, 0.0039215087890625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 3.0, 18.0, 24.0, 23.0, 35.0, 48.0, 82.0, 149.0, 185.0, 157.0, 89.0, 66.0, 35.0, 22.0, 14.0, 9.0, 6.0, 7.0, 4.0, 7.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08575208485126495, -0.0818125531077385, -0.07787302881479263, -0.07393349707126617, -0.06999396532773972, -0.06605443358421326, -0.062114909291267395, -0.058175377547740936, -0.054235849529504776, -0.050296321511268616, -0.04635678976774216, -0.042417261749506, -0.038477733731269836, -0.03453820198774338, -0.030598673969507217, -0.026659144088625908, -0.0227196142077446, -0.01878008432686329, -0.014840555377304554, -0.010901026427745819, -0.00696149654686451, -0.0030219666659832, 0.0009175613522529602, 0.00485709123313427, 0.00879662111401558, 0.012736150994896889, 0.016675680875778198, 0.02061520889401436, 0.024554738774895668, 0.028494268655776978, 0.03243379667401314, 0.0363733246922493, 0.04031285643577576, 0.04425238445401192, 0.048191916197538376, 0.052131444215774536, 0.056070975959300995, 0.060010503977537155, 0.06395003199577332, 0.06788956373929977, 0.07182909548282623, 0.07576862722635269, 0.07970815151929855, 0.08364768326282501, 0.08758721500635147, 0.09152674674987793, 0.09546627104282379, 0.09940580278635025, 0.10334532707929611, 0.10728485882282257, 0.11122438311576843, 0.11516391485929489, 0.11910344660282135, 0.12304297089576721, 0.12698251008987427, 0.13092203438282013, 0.134861558675766, 0.13880108296871185, 0.1427406221628189, 0.14668014645576477, 0.15061967074871063, 0.1545592099428177, 0.15849873423576355, 0.1624382585287094, 0.16637779772281647]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 8.0, 8.0, 15.0, 11.0, 18.0, 15.0, 27.0, 25.0, 34.0, 42.0, 43.0, 42.0, 42.0, 53.0, 54.0, 45.0, 58.0, 47.0, 49.0, 38.0, 50.0, 33.0, 39.0, 29.0, 30.0, 23.0, 24.0, 20.0, 12.0, 13.0, 11.0, 6.0, 8.0, 5.0, 8.0, 8.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06840439885854721, -0.06641142070293427, -0.06441844254732132, -0.062425464391708374, -0.06043248623609543, -0.05843950808048248, -0.05644652992486954, -0.05445355176925659, -0.052460573613643646, -0.0504675954580307, -0.048474617302417755, -0.04648163914680481, -0.044488660991191864, -0.04249568283557892, -0.04050270467996597, -0.03850972652435303, -0.03651674464344978, -0.03452376648783684, -0.03253078833222389, -0.030537810176610947, -0.028544832020998, -0.026551853865385056, -0.02455887384712696, -0.022565895691514015, -0.02057291753590107, -0.018579939380288124, -0.01658696122467518, -0.014593982137739658, -0.012601003982126713, -0.010608025826513767, -0.008615046739578247, -0.0066220685839653015, -0.0046290867030620575, -0.0026361083146184683, -0.0006431299261748791, 0.0013498486950993538, 0.0033428268507122993, 0.005335805006325245, 0.007328784093260765, 0.00932176224887371, 0.011314740404486656, 0.013307718560099602, 0.015300696715712547, 0.017293676733970642, 0.019286654889583588, 0.021279633045196533, 0.02327261120080948, 0.025265589356422424, 0.02725856751203537, 0.029251545667648315, 0.03124452382326126, 0.03323750197887421, 0.03523048013448715, 0.0372234582901001, 0.03921643644571304, 0.04120941460132599, 0.043202392756938934, 0.04519537091255188, 0.047188349068164825, 0.04918132722377777, 0.05117430537939072, 0.05316728353500366, 0.05516026169061661, 0.05715323984622955, 0.0591462217271328]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 5.0, 8.0, 11.0, 21.0, 27.0, 30.0, 59.0, 70.0, 103.0, 155.0, 228.0, 316.0, 415.0, 645.0, 870.0, 1393.0, 1911.0, 2788.0, 4272.0, 6325.0, 9388.0, 14001.0, 21975.0, 34797.0, 55906.0, 93017.0, 158534.0, 221935.0, 163605.0, 96167.0, 57601.0, 35423.0, 22736.0, 14444.0, 9470.0, 6381.0, 4282.0, 2816.0, 1970.0, 1381.0, 930.0, 647.0, 442.0, 296.0, 226.0, 175.0, 107.0, 76.0, 66.0, 39.0, 29.0, 11.0, 12.0, 11.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.0836181640625, -0.08096599578857422, -0.07831382751464844, -0.07566165924072266, -0.07300949096679688, -0.0703573226928711, -0.06770515441894531, -0.06505298614501953, -0.06240081787109375, -0.05974864959716797, -0.05709648132324219, -0.054444313049316406, -0.051792144775390625, -0.049139976501464844, -0.04648780822753906, -0.04383563995361328, -0.0411834716796875, -0.03853130340576172, -0.03587913513183594, -0.033226966857910156, -0.030574798583984375, -0.027922630310058594, -0.025270462036132812, -0.02261829376220703, -0.01996612548828125, -0.01731395721435547, -0.014661788940429688, -0.012009620666503906, -0.009357452392578125, -0.006705284118652344, -0.0040531158447265625, -0.0014009475708007812, 0.001251220703125, 0.0039033889770507812, 0.0065555572509765625, 0.009207725524902344, 0.011859893798828125, 0.014512062072753906, 0.017164230346679688, 0.01981639862060547, 0.02246856689453125, 0.02512073516845703, 0.027772903442382812, 0.030425071716308594, 0.033077239990234375, 0.035729408264160156, 0.03838157653808594, 0.04103374481201172, 0.0436859130859375, 0.04633808135986328, 0.04899024963378906, 0.051642417907714844, 0.054294586181640625, 0.056946754455566406, 0.05959892272949219, 0.06225109100341797, 0.06490325927734375, 0.06755542755126953, 0.07020759582519531, 0.0728597640991211, 0.07551193237304688, 0.07816410064697266, 0.08081626892089844, 0.08346843719482422, 0.08612060546875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 12.0, 9.0, 15.0, 13.0, 13.0, 25.0, 28.0, 38.0, 31.0, 45.0, 47.0, 45.0, 41.0, 52.0, 50.0, 55.0, 61.0, 51.0, 41.0, 40.0, 35.0, 44.0, 24.0, 33.0, 22.0, 23.0, 25.0, 15.0, 12.0, 5.0, 8.0, 10.0, 6.0, 7.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05157470703125, -0.05003643035888672, -0.04849815368652344, -0.046959877014160156, -0.045421600341796875, -0.043883323669433594, -0.04234504699707031, -0.04080677032470703, -0.03926849365234375, -0.03773021697998047, -0.03619194030761719, -0.034653663635253906, -0.033115386962890625, -0.031577110290527344, -0.030038833618164062, -0.02850055694580078, -0.0269622802734375, -0.02542400360107422, -0.023885726928710938, -0.022347450256347656, -0.020809173583984375, -0.019270896911621094, -0.017732620239257812, -0.01619434356689453, -0.01465606689453125, -0.013117790222167969, -0.011579513549804688, -0.010041236877441406, -0.008502960205078125, -0.006964683532714844, -0.0054264068603515625, -0.0038881301879882812, -0.002349853515625, -0.0008115768432617188, 0.0007266998291015625, 0.0022649765014648438, 0.003803253173828125, 0.005341529846191406, 0.0068798065185546875, 0.008418083190917969, 0.00995635986328125, 0.011494636535644531, 0.013032913208007812, 0.014571189880371094, 0.016109466552734375, 0.017647743225097656, 0.019186019897460938, 0.02072429656982422, 0.0222625732421875, 0.02380084991455078, 0.025339126586914062, 0.026877403259277344, 0.028415679931640625, 0.029953956604003906, 0.03149223327636719, 0.03303050994873047, 0.03456878662109375, 0.03610706329345703, 0.03764533996582031, 0.039183616638183594, 0.040721893310546875, 0.042260169982910156, 0.04379844665527344, 0.04533672332763672, 0.046875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 10.0, 10.0, 13.0, 26.0, 41.0, 64.0, 69.0, 108.0, 146.0, 237.0, 339.0, 454.0, 677.0, 950.0, 1356.0, 1968.0, 2932.0, 4289.0, 6811.0, 10448.0, 16964.0, 29049.0, 51176.0, 95896.0, 190554.0, 276080.0, 162244.0, 82198.0, 44737.0, 25369.0, 15267.0, 9479.0, 5971.0, 3957.0, 2672.0, 1864.0, 1206.0, 919.0, 598.0, 450.0, 294.0, 213.0, 143.0, 96.0, 80.0, 51.0, 33.0, 19.0, 13.0, 8.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.08502197265625, -0.0823965072631836, -0.07977104187011719, -0.07714557647705078, -0.07452011108398438, -0.07189464569091797, -0.06926918029785156, -0.06664371490478516, -0.06401824951171875, -0.061392784118652344, -0.05876731872558594, -0.05614185333251953, -0.053516387939453125, -0.05089092254638672, -0.04826545715332031, -0.045639991760253906, -0.0430145263671875, -0.040389060974121094, -0.03776359558105469, -0.03513813018798828, -0.032512664794921875, -0.02988719940185547, -0.027261734008789062, -0.024636268615722656, -0.02201080322265625, -0.019385337829589844, -0.016759872436523438, -0.014134407043457031, -0.011508941650390625, -0.008883476257324219, -0.0062580108642578125, -0.0036325454711914062, -0.001007080078125, 0.0016183853149414062, 0.0042438507080078125, 0.006869316101074219, 0.009494781494140625, 0.012120246887207031, 0.014745712280273438, 0.017371177673339844, 0.01999664306640625, 0.022622108459472656, 0.025247573852539062, 0.02787303924560547, 0.030498504638671875, 0.03312397003173828, 0.03574943542480469, 0.038374900817871094, 0.0410003662109375, 0.043625831604003906, 0.04625129699707031, 0.04887676239013672, 0.051502227783203125, 0.05412769317626953, 0.05675315856933594, 0.059378623962402344, 0.06200408935546875, 0.06462955474853516, 0.06725502014160156, 0.06988048553466797, 0.07250595092773438, 0.07513141632080078, 0.07775688171386719, 0.0803823471069336, 0.0830078125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 9.0, 10.0, 9.0, 14.0, 15.0, 13.0, 22.0, 21.0, 20.0, 30.0, 30.0, 35.0, 28.0, 30.0, 31.0, 48.0, 35.0, 35.0, 40.0, 40.0, 33.0, 34.0, 38.0, 37.0, 34.0, 31.0, 25.0, 33.0, 24.0, 24.0, 22.0, 20.0, 17.0, 21.0, 11.0, 15.0, 11.0, 8.0, 9.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.021484375, -0.020735502243041992, -0.019986629486083984, -0.019237756729125977, -0.01848888397216797, -0.01774001121520996, -0.016991138458251953, -0.016242265701293945, -0.015493392944335938, -0.01474452018737793, -0.013995647430419922, -0.013246774673461914, -0.012497901916503906, -0.011749029159545898, -0.01100015640258789, -0.010251283645629883, -0.009502410888671875, -0.008753538131713867, -0.00800466537475586, -0.0072557926177978516, -0.006506919860839844, -0.005758047103881836, -0.005009174346923828, -0.00426030158996582, -0.0035114288330078125, -0.0027625560760498047, -0.002013683319091797, -0.001264810562133789, -0.0005159378051757812, 0.00023293495178222656, 0.0009818077087402344, 0.0017306804656982422, 0.00247955322265625, 0.003228425979614258, 0.003977298736572266, 0.0047261714935302734, 0.005475044250488281, 0.006223917007446289, 0.006972789764404297, 0.007721662521362305, 0.008470535278320312, 0.00921940803527832, 0.009968280792236328, 0.010717153549194336, 0.011466026306152344, 0.012214899063110352, 0.01296377182006836, 0.013712644577026367, 0.014461517333984375, 0.015210390090942383, 0.01595926284790039, 0.0167081356048584, 0.017457008361816406, 0.018205881118774414, 0.018954753875732422, 0.01970362663269043, 0.020452499389648438, 0.021201372146606445, 0.021950244903564453, 0.02269911766052246, 0.02344799041748047, 0.024196863174438477, 0.024945735931396484, 0.025694608688354492, 0.0264434814453125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 9.0, 9.0, 10.0, 15.0, 30.0, 42.0, 44.0, 70.0, 111.0, 192.0, 274.0, 445.0, 672.0, 1161.0, 1999.0, 3697.0, 7488.0, 17779.0, 59196.0, 894889.0, 35133.0, 12594.0, 5572.0, 2920.0, 1621.0, 923.0, 577.0, 377.0, 228.0, 162.0, 99.0, 84.0, 42.0, 20.0, 20.0, 17.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.107421875, -0.10429096221923828, -0.10116004943847656, -0.09802913665771484, -0.09489822387695312, -0.0917673110961914, -0.08863639831542969, -0.08550548553466797, -0.08237457275390625, -0.07924365997314453, -0.07611274719238281, -0.0729818344116211, -0.06985092163085938, -0.06672000885009766, -0.06358909606933594, -0.06045818328857422, -0.0573272705078125, -0.05419635772705078, -0.05106544494628906, -0.047934532165527344, -0.044803619384765625, -0.041672706604003906, -0.03854179382324219, -0.03541088104248047, -0.03227996826171875, -0.02914905548095703, -0.026018142700195312, -0.022887229919433594, -0.019756317138671875, -0.016625404357910156, -0.013494491577148438, -0.010363578796386719, -0.007232666015625, -0.004101753234863281, -0.0009708404541015625, 0.0021600723266601562, 0.005290985107421875, 0.008421897888183594, 0.011552810668945312, 0.014683723449707031, 0.01781463623046875, 0.02094554901123047, 0.024076461791992188, 0.027207374572753906, 0.030338287353515625, 0.033469200134277344, 0.03660011291503906, 0.03973102569580078, 0.0428619384765625, 0.04599285125732422, 0.04912376403808594, 0.052254676818847656, 0.055385589599609375, 0.058516502380371094, 0.06164741516113281, 0.06477832794189453, 0.06790924072265625, 0.07104015350341797, 0.07417106628417969, 0.0773019790649414, 0.08043289184570312, 0.08356380462646484, 0.08669471740722656, 0.08982563018798828, 0.09295654296875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 9.0, 11.0, 6.0, 7.0, 19.0, 22.0, 33.0, 21.0, 25.0, 39.0, 40.0, 61.0, 93.0, 65.0, 73.0, 67.0, 60.0, 92.0, 43.0, 35.0, 34.0, 22.0, 26.0, 17.0, 12.0, 13.0, 7.0, 7.0, 7.0, 10.0, 3.0, 1.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.5299530029296875e-06, -4.3995678424835205e-06, -4.2691826820373535e-06, -4.1387975215911865e-06, -4.0084123611450195e-06, -3.8780272006988525e-06, -3.7476420402526855e-06, -3.6172568798065186e-06, -3.4868717193603516e-06, -3.3564865589141846e-06, -3.2261013984680176e-06, -3.0957162380218506e-06, -2.9653310775756836e-06, -2.8349459171295166e-06, -2.7045607566833496e-06, -2.5741755962371826e-06, -2.4437904357910156e-06, -2.3134052753448486e-06, -2.1830201148986816e-06, -2.0526349544525146e-06, -1.9222497940063477e-06, -1.7918646335601807e-06, -1.6614794731140137e-06, -1.5310943126678467e-06, -1.4007091522216797e-06, -1.2703239917755127e-06, -1.1399388313293457e-06, -1.0095536708831787e-06, -8.791685104370117e-07, -7.487833499908447e-07, -6.183981895446777e-07, -4.880130290985107e-07, -3.5762786865234375e-07, -2.2724270820617676e-07, -9.685754776000977e-08, 3.3527612686157227e-08, 1.6391277313232422e-07, 2.942979335784912e-07, 4.246830940246582e-07, 5.550682544708252e-07, 6.854534149169922e-07, 8.158385753631592e-07, 9.462237358093262e-07, 1.0766088962554932e-06, 1.2069940567016602e-06, 1.3373792171478271e-06, 1.4677643775939941e-06, 1.5981495380401611e-06, 1.7285346984863281e-06, 1.8589198589324951e-06, 1.989305019378662e-06, 2.119690179824829e-06, 2.250075340270996e-06, 2.380460500717163e-06, 2.51084566116333e-06, 2.641230821609497e-06, 2.771615982055664e-06, 2.902001142501831e-06, 3.032386302947998e-06, 3.162771463394165e-06, 3.293156623840332e-06, 3.423541784286499e-06, 3.553926944732666e-06, 3.684312105178833e-06, 3.814697265625e-06]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 14.0, 18.0, 21.0, 24.0, 50.0, 62.0, 78.0, 110.0, 176.0, 236.0, 343.0, 522.0, 734.0, 1086.0, 1713.0, 2709.0, 4652.0, 8694.0, 19425.0, 64658.0, 881145.0, 33017.0, 12611.0, 6432.0, 3672.0, 2162.0, 1311.0, 910.0, 584.0, 400.0, 302.0, 174.0, 145.0, 107.0, 69.0, 49.0, 35.0, 29.0, 17.0, 10.0, 17.0, 11.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080810546875, -0.07822513580322266, -0.07563972473144531, -0.07305431365966797, -0.07046890258789062, -0.06788349151611328, -0.06529808044433594, -0.0627126693725586, -0.06012725830078125, -0.057541847229003906, -0.05495643615722656, -0.05237102508544922, -0.049785614013671875, -0.04720020294189453, -0.04461479187011719, -0.042029380798339844, -0.0394439697265625, -0.036858558654785156, -0.03427314758300781, -0.03168773651123047, -0.029102325439453125, -0.02651691436767578, -0.023931503295898438, -0.021346092224121094, -0.01876068115234375, -0.016175270080566406, -0.013589859008789062, -0.011004447937011719, -0.008419036865234375, -0.005833625793457031, -0.0032482147216796875, -0.0006628036499023438, 0.001922607421875, 0.004508018493652344, 0.0070934295654296875, 0.009678840637207031, 0.012264251708984375, 0.014849662780761719, 0.017435073852539062, 0.020020484924316406, 0.02260589599609375, 0.025191307067871094, 0.027776718139648438, 0.03036212921142578, 0.032947540283203125, 0.03553295135498047, 0.03811836242675781, 0.040703773498535156, 0.0432891845703125, 0.045874595642089844, 0.04846000671386719, 0.05104541778564453, 0.053630828857421875, 0.05621623992919922, 0.05880165100097656, 0.061387062072753906, 0.06397247314453125, 0.0665578842163086, 0.06914329528808594, 0.07172870635986328, 0.07431411743164062, 0.07689952850341797, 0.07948493957519531, 0.08207035064697266, 0.08465576171875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 4.0, 6.0, 10.0, 8.0, 13.0, 14.0, 16.0, 19.0, 24.0, 721.0, 19.0, 29.0, 22.0, 16.0, 8.0, 8.0, 9.0, 3.0, 5.0, 5.0, 3.0, 0.0, 7.0, 3.0, 1.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01934814453125, -0.01872849464416504, -0.018108844757080078, -0.017489194869995117, -0.016869544982910156, -0.016249895095825195, -0.015630245208740234, -0.015010595321655273, -0.014390945434570312, -0.013771295547485352, -0.01315164566040039, -0.01253199577331543, -0.011912345886230469, -0.011292695999145508, -0.010673046112060547, -0.010053396224975586, -0.009433746337890625, -0.008814096450805664, -0.008194446563720703, -0.007574796676635742, -0.006955146789550781, -0.00633549690246582, -0.005715847015380859, -0.0050961971282958984, -0.0044765472412109375, -0.0038568973541259766, -0.0032372474670410156, -0.0026175975799560547, -0.0019979476928710938, -0.0013782978057861328, -0.0007586479187011719, -0.00013899803161621094, 0.00048065185546875, 0.001100301742553711, 0.0017199516296386719, 0.002339601516723633, 0.0029592514038085938, 0.0035789012908935547, 0.004198551177978516, 0.0048182010650634766, 0.0054378509521484375, 0.0060575008392333984, 0.006677150726318359, 0.00729680061340332, 0.007916450500488281, 0.008536100387573242, 0.009155750274658203, 0.009775400161743164, 0.010395050048828125, 0.011014699935913086, 0.011634349822998047, 0.012253999710083008, 0.012873649597167969, 0.01349329948425293, 0.01411294937133789, 0.014732599258422852, 0.015352249145507812, 0.015971899032592773, 0.016591548919677734, 0.017211198806762695, 0.017830848693847656, 0.018450498580932617, 0.019070148468017578, 0.01968979835510254, 0.0203094482421875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 10.0, 12.0, 16.0, 23.0, 46.0, 56.0, 94.0, 141.0, 234.0, 177.0, 76.0, 37.0, 22.0, 14.0, 14.0, 7.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09046808630228043, -0.08663983643054962, -0.08281158655881882, -0.07898333668708801, -0.07515507936477661, -0.0713268369436264, -0.067498579621315, -0.0636703297495842, -0.059842079877853394, -0.05601383000612259, -0.052185580134391785, -0.04835732653737068, -0.04452907666563988, -0.04070082679390907, -0.03687257319688797, -0.033044323325157166, -0.02921607345342636, -0.025387823581695557, -0.021559571847319603, -0.01773132011294365, -0.013903070241212845, -0.01007482036948204, -0.006246568635106087, -0.002418316900730133, 0.0014099329710006714, 0.0052381837740540504, 0.00906643457710743, 0.012894685380160809, 0.016722936183214188, 0.020551186054944992, 0.024379437789320946, 0.0282076895236969, 0.03203593194484711, 0.03586418181657791, 0.039692431688308716, 0.04352068528532982, 0.04734893515706062, 0.05117718502879143, 0.05500543862581253, 0.058833688497543335, 0.06266193836927414, 0.06649018824100494, 0.07031843811273575, 0.07414668798446655, 0.07797494530677795, 0.08180318772792816, 0.08563144505023956, 0.08945969492197037, 0.09328794479370117, 0.09711619466543198, 0.10094444453716278, 0.10477269440889359, 0.10860094428062439, 0.11242920160293579, 0.1162574514746666, 0.1200857013463974, 0.1239139512181282, 0.127742201089859, 0.1315704584121704, 0.13539870083332062, 0.13922695815563202, 0.14305520057678223, 0.14688345789909363, 0.15071171522140503, 0.15453995764255524]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 0.0, 5.0, 9.0, 5.0, 11.0, 16.0, 16.0, 18.0, 24.0, 22.0, 40.0, 36.0, 46.0, 39.0, 49.0, 56.0, 50.0, 60.0, 47.0, 55.0, 52.0, 49.0, 39.0, 38.0, 45.0, 23.0, 28.0, 20.0, 20.0, 15.0, 17.0, 13.0, 10.0, 10.0, 3.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0564868189394474, -0.05477957800030708, -0.05307233706116676, -0.051365096122026443, -0.049657855182886124, -0.047950614243745804, -0.046243373304605484, -0.044536132365465164, -0.042828891426324844, -0.041121650487184525, -0.039414409548044205, -0.037707168608903885, -0.035999927669763565, -0.034292686730623245, -0.032585445791482925, -0.030878204852342606, -0.029170963913202286, -0.027463722974061966, -0.025756482034921646, -0.024049241095781326, -0.022342000156641006, -0.020634759217500687, -0.018927518278360367, -0.017220277339220047, -0.015513036400079727, -0.013805795460939407, -0.012098554521799088, -0.010391313582658768, -0.008684072643518448, -0.006976831704378128, -0.005269590765237808, -0.0035623498260974884, -0.0018551051616668701, -0.0001478642225265503, 0.0015593767166137695, 0.0032666176557540894, 0.004973858594894409, 0.006681099534034729, 0.008388340473175049, 0.010095581412315369, 0.011802822351455688, 0.013510063290596008, 0.015217304229736328, 0.016924545168876648, 0.018631786108016968, 0.020339027047157288, 0.022046267986297607, 0.023753508925437927, 0.025460749864578247, 0.027167990803718567, 0.028875231742858887, 0.030582472681999207, 0.032289713621139526, 0.033996954560279846, 0.035704195499420166, 0.037411436438560486, 0.039118677377700806, 0.040825918316841125, 0.042533159255981445, 0.044240400195121765, 0.045947641134262085, 0.047654882073402405, 0.049362123012542725, 0.051069363951683044, 0.052776604890823364]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 12.0, 7.0, 8.0, 18.0, 13.0, 34.0, 24.0, 51.0, 57.0, 82.0, 131.0, 188.0, 264.0, 357.0, 555.0, 874.0, 1220.0, 1821.0, 2780.0, 4247.0, 6652.0, 10640.0, 17454.0, 29745.0, 53666.0, 104033.0, 238657.0, 825802.0, 1901176.0, 592968.0, 195740.0, 88783.0, 46040.0, 26008.0, 15915.0, 9870.0, 6474.0, 4186.0, 2773.0, 1851.0, 1136.0, 730.0, 473.0, 294.0, 153.0, 125.0, 76.0, 49.0, 29.0, 18.0, 9.0, 6.0, 2.0, 1.0], "bins": [-0.07354736328125, -0.07163143157958984, -0.06971549987792969, -0.06779956817626953, -0.06588363647460938, -0.06396770477294922, -0.06205177307128906, -0.060135841369628906, -0.05821990966796875, -0.056303977966308594, -0.05438804626464844, -0.05247211456298828, -0.050556182861328125, -0.04864025115966797, -0.04672431945800781, -0.044808387756347656, -0.0428924560546875, -0.040976524353027344, -0.03906059265136719, -0.03714466094970703, -0.035228729248046875, -0.03331279754638672, -0.03139686584472656, -0.029480934143066406, -0.02756500244140625, -0.025649070739746094, -0.023733139038085938, -0.02181720733642578, -0.019901275634765625, -0.01798534393310547, -0.016069412231445312, -0.014153480529785156, -0.012237548828125, -0.010321617126464844, -0.008405685424804688, -0.006489753723144531, -0.004573822021484375, -0.0026578903198242188, -0.0007419586181640625, 0.0011739730834960938, 0.00308990478515625, 0.005005836486816406, 0.0069217681884765625, 0.008837699890136719, 0.010753631591796875, 0.012669563293457031, 0.014585494995117188, 0.016501426696777344, 0.0184173583984375, 0.020333290100097656, 0.022249221801757812, 0.02416515350341797, 0.026081085205078125, 0.02799701690673828, 0.029912948608398438, 0.031828880310058594, 0.03374481201171875, 0.035660743713378906, 0.03757667541503906, 0.03949260711669922, 0.041408538818359375, 0.04332447052001953, 0.04524040222167969, 0.047156333923339844, 0.049072265625]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 4.0, 10.0, 7.0, 13.0, 17.0, 14.0, 14.0, 21.0, 30.0, 37.0, 28.0, 40.0, 49.0, 50.0, 50.0, 57.0, 45.0, 53.0, 62.0, 47.0, 54.0, 42.0, 46.0, 34.0, 28.0, 21.0, 25.0, 17.0, 16.0, 15.0, 12.0, 13.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.035736083984375, -0.03474855422973633, -0.033761024475097656, -0.032773494720458984, -0.03178596496582031, -0.03079843521118164, -0.02981090545654297, -0.028823375701904297, -0.027835845947265625, -0.026848316192626953, -0.02586078643798828, -0.02487325668334961, -0.023885726928710938, -0.022898197174072266, -0.021910667419433594, -0.020923137664794922, -0.01993560791015625, -0.018948078155517578, -0.017960548400878906, -0.016973018646240234, -0.015985488891601562, -0.01499795913696289, -0.014010429382324219, -0.013022899627685547, -0.012035369873046875, -0.011047840118408203, -0.010060310363769531, -0.00907278060913086, -0.008085250854492188, -0.007097721099853516, -0.006110191345214844, -0.005122661590576172, -0.0041351318359375, -0.003147602081298828, -0.0021600723266601562, -0.0011725425720214844, -0.0001850128173828125, 0.0008025169372558594, 0.0017900466918945312, 0.002777576446533203, 0.003765106201171875, 0.004752635955810547, 0.005740165710449219, 0.006727695465087891, 0.0077152252197265625, 0.008702754974365234, 0.009690284729003906, 0.010677814483642578, 0.01166534423828125, 0.012652873992919922, 0.013640403747558594, 0.014627933502197266, 0.015615463256835938, 0.01660299301147461, 0.01759052276611328, 0.018578052520751953, 0.019565582275390625, 0.020553112030029297, 0.02154064178466797, 0.02252817153930664, 0.023515701293945312, 0.024503231048583984, 0.025490760803222656, 0.026478290557861328, 0.0274658203125]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 8.0, 15.0, 17.0, 13.0, 31.0, 40.0, 57.0, 70.0, 115.0, 139.0, 239.0, 263.0, 421.0, 641.0, 932.0, 1338.0, 2134.0, 3190.0, 5177.0, 8273.0, 14068.0, 24780.0, 46221.0, 93407.0, 209784.0, 579303.0, 1752486.0, 900569.0, 294286.0, 122264.0, 58607.0, 30471.0, 17230.0, 9907.0, 6281.0, 3898.0, 2569.0, 1593.0, 1082.0, 729.0, 511.0, 340.0, 215.0, 175.0, 136.0, 83.0, 45.0, 42.0, 32.0, 15.0, 13.0, 11.0, 6.0, 7.0, 4.0, 4.0, 2.0, 2.0], "bins": [-0.0543212890625, -0.052659034729003906, -0.05099678039550781, -0.04933452606201172, -0.047672271728515625, -0.04601001739501953, -0.04434776306152344, -0.042685508728027344, -0.04102325439453125, -0.039361000061035156, -0.03769874572753906, -0.03603649139404297, -0.034374237060546875, -0.03271198272705078, -0.031049728393554688, -0.029387474060058594, -0.0277252197265625, -0.026062965393066406, -0.024400711059570312, -0.02273845672607422, -0.021076202392578125, -0.01941394805908203, -0.017751693725585938, -0.016089439392089844, -0.01442718505859375, -0.012764930725097656, -0.011102676391601562, -0.009440422058105469, -0.007778167724609375, -0.006115913391113281, -0.0044536590576171875, -0.0027914047241210938, -0.001129150390625, 0.0005331039428710938, 0.0021953582763671875, 0.0038576126098632812, 0.005519866943359375, 0.007182121276855469, 0.008844375610351562, 0.010506629943847656, 0.01216888427734375, 0.013831138610839844, 0.015493392944335938, 0.01715564727783203, 0.018817901611328125, 0.02048015594482422, 0.022142410278320312, 0.023804664611816406, 0.0254669189453125, 0.027129173278808594, 0.028791427612304688, 0.03045368194580078, 0.032115936279296875, 0.03377819061279297, 0.03544044494628906, 0.037102699279785156, 0.03876495361328125, 0.040427207946777344, 0.04208946228027344, 0.04375171661376953, 0.045413970947265625, 0.04707622528076172, 0.04873847961425781, 0.050400733947753906, 0.05206298828125]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 8.0, 8.0, 9.0, 22.0, 12.0, 29.0, 25.0, 33.0, 44.0, 67.0, 61.0, 98.0, 104.0, 124.0, 128.0, 149.0, 226.0, 271.0, 295.0, 294.0, 337.0, 313.0, 259.0, 210.0, 194.0, 159.0, 113.0, 113.0, 73.0, 69.0, 38.0, 38.0, 36.0, 19.0, 11.0, 17.0, 11.0, 7.0, 10.0, 5.0, 6.0, 4.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.01385498046875, -0.013395071029663086, -0.012935161590576172, -0.012475252151489258, -0.012015342712402344, -0.01155543327331543, -0.011095523834228516, -0.010635614395141602, -0.010175704956054688, -0.009715795516967773, -0.00925588607788086, -0.008795976638793945, -0.008336067199707031, -0.007876157760620117, -0.007416248321533203, -0.006956338882446289, -0.006496429443359375, -0.006036520004272461, -0.005576610565185547, -0.005116701126098633, -0.004656791687011719, -0.004196882247924805, -0.0037369728088378906, -0.0032770633697509766, -0.0028171539306640625, -0.0023572444915771484, -0.0018973350524902344, -0.0014374256134033203, -0.0009775161743164062, -0.0005176067352294922, -5.7697296142578125e-05, 0.00040221214294433594, 0.00086212158203125, 0.001322031021118164, 0.0017819404602050781, 0.002241849899291992, 0.0027017593383789062, 0.0031616687774658203, 0.0036215782165527344, 0.0040814876556396484, 0.0045413970947265625, 0.0050013065338134766, 0.005461215972900391, 0.005921125411987305, 0.006381034851074219, 0.006840944290161133, 0.007300853729248047, 0.007760763168334961, 0.008220672607421875, 0.008680582046508789, 0.009140491485595703, 0.009600400924682617, 0.010060310363769531, 0.010520219802856445, 0.01098012924194336, 0.011440038681030273, 0.011899948120117188, 0.012359857559204102, 0.012819766998291016, 0.01327967643737793, 0.013739585876464844, 0.014199495315551758, 0.014659404754638672, 0.015119314193725586, 0.0155792236328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 5.0, 7.0, 7.0, 13.0, 19.0, 39.0, 59.0, 86.0, 121.0, 190.0, 169.0, 110.0, 63.0, 28.0, 25.0, 19.0, 12.0, 8.0, 6.0, 5.0, 2.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06749097257852554, -0.06515972316265106, -0.06282848119735718, -0.0604972317814827, -0.058165982365608215, -0.05583473667502403, -0.05350349098443985, -0.05117224156856537, -0.048840995877981186, -0.046509750187397, -0.04417850077152252, -0.04184725508093834, -0.039516009390354156, -0.037184759974479675, -0.03485351428389549, -0.03252226859331131, -0.03019101917743683, -0.027859771624207497, -0.025528524070978165, -0.023197278380393982, -0.02086603082716465, -0.018534783273935318, -0.016203537583351135, -0.013872290030121803, -0.011541042476892471, -0.00920979492366314, -0.006878548301756382, -0.004547301214188337, -0.0022160541266202927, 0.0001151934266090393, 0.0024464400485157967, 0.004777686670422554, 0.007108934223651886, 0.009440181776881218, 0.011771428398787975, 0.014102675020694733, 0.016433922573924065, 0.018765170127153397, 0.02109641581773758, 0.02342766337096691, 0.025758910924196243, 0.028090158477425575, 0.030421406030654907, 0.03275265172123909, 0.03508389741182327, 0.037415146827697754, 0.03974639251828194, 0.04207763820886612, 0.0444088876247406, 0.04674013331532478, 0.049071382731199265, 0.05140262842178345, 0.05373387783765793, 0.05606512352824211, 0.058396369218826294, 0.060727618634700775, 0.06305886805057526, 0.06539011746644974, 0.06772135943174362, 0.0700526088476181, 0.07238385826349258, 0.07471510767936707, 0.07704634964466095, 0.07937759906053543, 0.08170884102582932]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 9.0, 10.0, 8.0, 13.0, 20.0, 22.0, 24.0, 23.0, 17.0, 22.0, 42.0, 37.0, 41.0, 41.0, 50.0, 40.0, 42.0, 53.0, 60.0, 54.0, 49.0, 38.0, 35.0, 38.0, 29.0, 25.0, 19.0, 25.0, 19.0, 19.0, 17.0, 10.0, 13.0, 8.0, 6.0, 6.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.03549375757575035, -0.03448797017335892, -0.033482182770967484, -0.03247639536857605, -0.031470607966184616, -0.03046482242643833, -0.029459035024046898, -0.028453247621655464, -0.02744746208190918, -0.026441674679517746, -0.025435887277126312, -0.02443009987473488, -0.023424314334988594, -0.02241852693259716, -0.021412739530205727, -0.020406952127814293, -0.01940116472542286, -0.018395377323031425, -0.017389589920639992, -0.016383804380893707, -0.015378016978502274, -0.01437222957611084, -0.013366442173719406, -0.012360654771327972, -0.011354868300259113, -0.01034908089786768, -0.00934329442679882, -0.008337507024407387, -0.00733172008767724, -0.006325933150947094, -0.00532014574855566, -0.004314358811825514, -0.0033085737377405167, -0.0023027868010103703, -0.0012969996314495802, -0.00029121246188879013, 0.0007145744748413563, 0.0017203614115715027, 0.0027261488139629364, 0.003731935750693083, 0.004737722687423229, 0.005743509624153376, 0.006749296560883522, 0.007755083963274956, 0.00876087136566639, 0.009766657836735249, 0.010772445239126682, 0.011778231710195541, 0.012784019112586975, 0.013789806514978409, 0.014795592986047268, 0.015801381319761276, 0.01680716685950756, 0.017812954261898994, 0.018818741664290428, 0.019824529066681862, 0.020830314606428146, 0.02183610200881958, 0.022841889411211014, 0.023847676813602448, 0.024853462353348732, 0.025859249755740166, 0.0268650371581316, 0.027870824560523033, 0.028876611962914467]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 2.0, 14.0, 12.0, 12.0, 13.0, 27.0, 37.0, 56.0, 77.0, 139.0, 167.0, 276.0, 404.0, 621.0, 980.0, 1618.0, 2678.0, 4647.0, 8804.0, 18962.0, 47298.0, 157159.0, 475914.0, 220664.0, 61139.0, 23054.0, 10179.0, 5376.0, 3162.0, 1823.0, 1154.0, 748.0, 461.0, 307.0, 173.0, 152.0, 82.0, 54.0, 36.0, 26.0, 18.0, 12.0, 11.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.04718017578125, -0.0457768440246582, -0.044373512268066406, -0.04297018051147461, -0.04156684875488281, -0.040163516998291016, -0.03876018524169922, -0.03735685348510742, -0.035953521728515625, -0.03455018997192383, -0.03314685821533203, -0.031743526458740234, -0.030340194702148438, -0.02893686294555664, -0.027533531188964844, -0.026130199432373047, -0.02472686767578125, -0.023323535919189453, -0.021920204162597656, -0.02051687240600586, -0.019113540649414062, -0.017710208892822266, -0.01630687713623047, -0.014903545379638672, -0.013500213623046875, -0.012096881866455078, -0.010693550109863281, -0.009290218353271484, -0.007886886596679688, -0.006483554840087891, -0.005080223083496094, -0.003676891326904297, -0.0022735595703125, -0.0008702278137207031, 0.0005331039428710938, 0.0019364356994628906, 0.0033397674560546875, 0.004743099212646484, 0.006146430969238281, 0.007549762725830078, 0.008953094482421875, 0.010356426239013672, 0.011759757995605469, 0.013163089752197266, 0.014566421508789062, 0.01596975326538086, 0.017373085021972656, 0.018776416778564453, 0.02017974853515625, 0.021583080291748047, 0.022986412048339844, 0.02438974380493164, 0.025793075561523438, 0.027196407318115234, 0.02859973907470703, 0.030003070831298828, 0.031406402587890625, 0.03280973434448242, 0.03421306610107422, 0.035616397857666016, 0.03701972961425781, 0.03842306137084961, 0.039826393127441406, 0.0412297248840332, 0.042633056640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 5.0, 6.0, 7.0, 9.0, 13.0, 14.0, 18.0, 27.0, 27.0, 25.0, 30.0, 32.0, 41.0, 39.0, 42.0, 49.0, 44.0, 42.0, 55.0, 47.0, 56.0, 46.0, 37.0, 43.0, 32.0, 30.0, 23.0, 25.0, 27.0, 23.0, 19.0, 12.0, 10.0, 10.0, 9.0, 9.0, 7.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.034454345703125, -0.03347444534301758, -0.032494544982910156, -0.031514644622802734, -0.030534744262695312, -0.02955484390258789, -0.02857494354248047, -0.027595043182373047, -0.026615142822265625, -0.025635242462158203, -0.02465534210205078, -0.02367544174194336, -0.022695541381835938, -0.021715641021728516, -0.020735740661621094, -0.019755840301513672, -0.01877593994140625, -0.017796039581298828, -0.016816139221191406, -0.015836238861083984, -0.014856338500976562, -0.01387643814086914, -0.012896537780761719, -0.011916637420654297, -0.010936737060546875, -0.009956836700439453, -0.008976936340332031, -0.00799703598022461, -0.0070171356201171875, -0.006037235260009766, -0.005057334899902344, -0.004077434539794922, -0.0030975341796875, -0.002117633819580078, -0.0011377334594726562, -0.00015783309936523438, 0.0008220672607421875, 0.0018019676208496094, 0.0027818679809570312, 0.003761768341064453, 0.004741668701171875, 0.005721569061279297, 0.006701469421386719, 0.007681369781494141, 0.008661270141601562, 0.009641170501708984, 0.010621070861816406, 0.011600971221923828, 0.01258087158203125, 0.013560771942138672, 0.014540672302246094, 0.015520572662353516, 0.016500473022460938, 0.01748037338256836, 0.01846027374267578, 0.019440174102783203, 0.020420074462890625, 0.021399974822998047, 0.02237987518310547, 0.02335977554321289, 0.024339675903320312, 0.025319576263427734, 0.026299476623535156, 0.027279376983642578, 0.02825927734375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 15.0, 19.0, 30.0, 35.0, 66.0, 85.0, 150.0, 220.0, 412.0, 633.0, 1070.0, 1862.0, 3538.0, 7158.0, 17434.0, 55626.0, 351097.0, 498897.0, 71771.0, 21067.0, 8380.0, 3978.0, 2072.0, 1131.0, 701.0, 415.0, 232.0, 157.0, 90.0, 63.0, 48.0, 36.0, 11.0, 11.0, 9.0, 8.0, 10.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053955078125, -0.052100181579589844, -0.05024528503417969, -0.04839038848876953, -0.046535491943359375, -0.04468059539794922, -0.04282569885253906, -0.040970802307128906, -0.03911590576171875, -0.037261009216308594, -0.03540611267089844, -0.03355121612548828, -0.031696319580078125, -0.02984142303466797, -0.027986526489257812, -0.026131629943847656, -0.0242767333984375, -0.022421836853027344, -0.020566940307617188, -0.01871204376220703, -0.016857147216796875, -0.015002250671386719, -0.013147354125976562, -0.011292457580566406, -0.00943756103515625, -0.007582664489746094, -0.0057277679443359375, -0.0038728713989257812, -0.002017974853515625, -0.00016307830810546875, 0.0016918182373046875, 0.0035467147827148438, 0.005401611328125, 0.007256507873535156, 0.009111404418945312, 0.010966300964355469, 0.012821197509765625, 0.014676094055175781, 0.016530990600585938, 0.018385887145996094, 0.02024078369140625, 0.022095680236816406, 0.023950576782226562, 0.02580547332763672, 0.027660369873046875, 0.02951526641845703, 0.03137016296386719, 0.033225059509277344, 0.0350799560546875, 0.036934852600097656, 0.03878974914550781, 0.04064464569091797, 0.042499542236328125, 0.04435443878173828, 0.04620933532714844, 0.048064231872558594, 0.04991912841796875, 0.051774024963378906, 0.05362892150878906, 0.05548381805419922, 0.057338714599609375, 0.05919361114501953, 0.06104850769042969, 0.06290340423583984, 0.06475830078125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 10.0, 10.0, 8.0, 13.0, 14.0, 14.0, 16.0, 27.0, 20.0, 33.0, 31.0, 34.0, 30.0, 43.0, 53.0, 40.0, 47.0, 36.0, 53.0, 37.0, 38.0, 41.0, 35.0, 39.0, 35.0, 28.0, 24.0, 23.0, 25.0, 28.0, 15.0, 19.0, 21.0, 8.0, 16.0, 6.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0189056396484375, -0.01831841468811035, -0.017731189727783203, -0.017143964767456055, -0.016556739807128906, -0.015969514846801758, -0.01538228988647461, -0.014795064926147461, -0.014207839965820312, -0.013620615005493164, -0.013033390045166016, -0.012446165084838867, -0.011858940124511719, -0.01127171516418457, -0.010684490203857422, -0.010097265243530273, -0.009510040283203125, -0.008922815322875977, -0.008335590362548828, -0.00774836540222168, -0.007161140441894531, -0.006573915481567383, -0.005986690521240234, -0.005399465560913086, -0.0048122406005859375, -0.004225015640258789, -0.0036377906799316406, -0.003050565719604492, -0.0024633407592773438, -0.0018761157989501953, -0.0012888908386230469, -0.0007016658782958984, -0.00011444091796875, 0.00047278404235839844, 0.0010600090026855469, 0.0016472339630126953, 0.0022344589233398438, 0.002821683883666992, 0.0034089088439941406, 0.003996133804321289, 0.0045833587646484375, 0.005170583724975586, 0.005757808685302734, 0.006345033645629883, 0.006932258605957031, 0.00751948356628418, 0.008106708526611328, 0.008693933486938477, 0.009281158447265625, 0.009868383407592773, 0.010455608367919922, 0.01104283332824707, 0.011630058288574219, 0.012217283248901367, 0.012804508209228516, 0.013391733169555664, 0.013978958129882812, 0.014566183090209961, 0.01515340805053711, 0.015740633010864258, 0.016327857971191406, 0.016915082931518555, 0.017502307891845703, 0.01808953285217285, 0.0186767578125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 2.0, 6.0, 8.0, 14.0, 29.0, 38.0, 66.0, 72.0, 105.0, 173.0, 252.0, 367.0, 514.0, 735.0, 1166.0, 1741.0, 2806.0, 4668.0, 7730.0, 14227.0, 28135.0, 63410.0, 184648.0, 457193.0, 163371.0, 57794.0, 26020.0, 13312.0, 7404.0, 4527.0, 2702.0, 1779.0, 1088.0, 741.0, 533.0, 346.0, 259.0, 191.0, 97.0, 87.0, 67.0, 39.0, 30.0, 18.0, 6.0, 10.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007537841796875, -0.007305562496185303, -0.0070732831954956055, -0.006841003894805908, -0.006608724594116211, -0.006376445293426514, -0.006144165992736816, -0.005911886692047119, -0.005679607391357422, -0.005447328090667725, -0.005215048789978027, -0.00498276948928833, -0.004750490188598633, -0.0045182108879089355, -0.004285931587219238, -0.004053652286529541, -0.0038213729858398438, -0.0035890936851501465, -0.0033568143844604492, -0.003124535083770752, -0.0028922557830810547, -0.0026599764823913574, -0.00242769718170166, -0.002195417881011963, -0.0019631385803222656, -0.0017308592796325684, -0.001498579978942871, -0.0012663006782531738, -0.0010340213775634766, -0.0008017420768737793, -0.000569462776184082, -0.00033718347549438477, -0.0001049041748046875, 0.00012737512588500977, 0.00035965442657470703, 0.0005919337272644043, 0.0008242130279541016, 0.0010564923286437988, 0.001288771629333496, 0.0015210509300231934, 0.0017533302307128906, 0.001985609531402588, 0.002217888832092285, 0.0024501681327819824, 0.0026824474334716797, 0.002914726734161377, 0.0031470060348510742, 0.0033792853355407715, 0.0036115646362304688, 0.003843843936920166, 0.004076123237609863, 0.0043084025382995605, 0.004540681838989258, 0.004772961139678955, 0.005005240440368652, 0.00523751974105835, 0.005469799041748047, 0.005702078342437744, 0.005934357643127441, 0.006166636943817139, 0.006398916244506836, 0.006631195545196533, 0.0068634748458862305, 0.007095754146575928, 0.007328033447265625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 2.0, 5.0, 9.0, 12.0, 14.0, 35.0, 56.0, 65.0, 148.0, 174.0, 164.0, 117.0, 60.0, 39.0, 18.0, 12.0, 16.0, 5.0, 4.0, 7.0, 0.0, 6.0, 5.0, 0.0, 4.0, 1.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7821788787841797e-05, -1.724250614643097e-05, -1.666322350502014e-05, -1.6083940863609314e-05, -1.5504658222198486e-05, -1.4925375580787659e-05, -1.4346092939376831e-05, -1.3766810297966003e-05, -1.3187527656555176e-05, -1.2608245015144348e-05, -1.202896237373352e-05, -1.1449679732322693e-05, -1.0870397090911865e-05, -1.0291114449501038e-05, -9.71183180809021e-06, -9.132549166679382e-06, -8.553266525268555e-06, -7.973983883857727e-06, -7.394701242446899e-06, -6.815418601036072e-06, -6.236135959625244e-06, -5.6568533182144165e-06, -5.077570676803589e-06, -4.498288035392761e-06, -3.919005393981934e-06, -3.339722752571106e-06, -2.7604401111602783e-06, -2.1811574697494507e-06, -1.601874828338623e-06, -1.0225921869277954e-06, -4.4330954551696777e-07, 1.3597309589385986e-07, 7.152557373046875e-07, 1.2945383787155151e-06, 1.8738210201263428e-06, 2.4531036615371704e-06, 3.032386302947998e-06, 3.6116689443588257e-06, 4.190951585769653e-06, 4.770234227180481e-06, 5.349516868591309e-06, 5.928799510002136e-06, 6.508082151412964e-06, 7.0873647928237915e-06, 7.666647434234619e-06, 8.245930075645447e-06, 8.825212717056274e-06, 9.404495358467102e-06, 9.98377799987793e-06, 1.0563060641288757e-05, 1.1142343282699585e-05, 1.1721625924110413e-05, 1.230090856552124e-05, 1.2880191206932068e-05, 1.3459473848342896e-05, 1.4038756489753723e-05, 1.461803913116455e-05, 1.5197321772575378e-05, 1.5776604413986206e-05, 1.6355887055397034e-05, 1.693516969680786e-05, 1.751445233821869e-05, 1.8093734979629517e-05, 1.8673017621040344e-05, 1.9252300262451172e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 4.0, 6.0, 9.0, 14.0, 19.0, 20.0, 40.0, 48.0, 74.0, 129.0, 195.0, 319.0, 512.0, 901.0, 1508.0, 2738.0, 5150.0, 10285.0, 22248.0, 53195.0, 150703.0, 454937.0, 218972.0, 70966.0, 28585.0, 12947.0, 6344.0, 3241.0, 1782.0, 1012.0, 660.0, 359.0, 235.0, 137.0, 91.0, 44.0, 44.0, 29.0, 12.0, 12.0, 11.0, 2.0, 2.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007762908935546875, -0.007525146007537842, -0.007287383079528809, -0.007049620151519775, -0.006811857223510742, -0.006574094295501709, -0.006336331367492676, -0.006098568439483643, -0.005860805511474609, -0.005623042583465576, -0.005385279655456543, -0.00514751672744751, -0.0049097537994384766, -0.004671990871429443, -0.00443422794342041, -0.004196465015411377, -0.003958702087402344, -0.0037209391593933105, -0.0034831762313842773, -0.003245413303375244, -0.003007650375366211, -0.0027698874473571777, -0.0025321245193481445, -0.0022943615913391113, -0.002056598663330078, -0.001818835735321045, -0.0015810728073120117, -0.0013433098793029785, -0.0011055469512939453, -0.0008677840232849121, -0.0006300210952758789, -0.0003922581672668457, -0.0001544952392578125, 8.32676887512207e-05, 0.0003210306167602539, 0.0005587935447692871, 0.0007965564727783203, 0.0010343194007873535, 0.0012720823287963867, 0.00150984525680542, 0.0017476081848144531, 0.0019853711128234863, 0.0022231340408325195, 0.0024608969688415527, 0.002698659896850586, 0.002936422824859619, 0.0031741857528686523, 0.0034119486808776855, 0.0036497116088867188, 0.003887474536895752, 0.004125237464904785, 0.004363000392913818, 0.0046007633209228516, 0.004838526248931885, 0.005076289176940918, 0.005314052104949951, 0.005551815032958984, 0.005789577960968018, 0.006027340888977051, 0.006265103816986084, 0.006502866744995117, 0.00674062967300415, 0.006978392601013184, 0.007216155529022217, 0.00745391845703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 5.0, 7.0, 10.0, 10.0, 11.0, 8.0, 12.0, 21.0, 24.0, 39.0, 37.0, 40.0, 55.0, 58.0, 71.0, 63.0, 78.0, 65.0, 70.0, 49.0, 44.0, 51.0, 25.0, 29.0, 24.0, 17.0, 13.0, 10.0, 7.0, 8.0, 7.0, 7.0, 8.0, 3.0, 4.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00147247314453125, -0.0014088153839111328, -0.0013451576232910156, -0.0012814998626708984, -0.0012178421020507812, -0.001154184341430664, -0.0010905265808105469, -0.0010268688201904297, -0.0009632110595703125, -0.0008995532989501953, -0.0008358955383300781, -0.0007722377777099609, -0.0007085800170898438, -0.0006449222564697266, -0.0005812644958496094, -0.0005176067352294922, -0.000453948974609375, -0.0003902912139892578, -0.0003266334533691406, -0.00026297569274902344, -0.00019931793212890625, -0.00013566017150878906, -7.200241088867188e-05, -8.344650268554688e-06, 5.53131103515625e-05, 0.00011897087097167969, 0.00018262863159179688, 0.00024628639221191406, 0.00030994415283203125, 0.00037360191345214844, 0.0004372596740722656, 0.0005009174346923828, 0.0005645751953125, 0.0006282329559326172, 0.0006918907165527344, 0.0007555484771728516, 0.0008192062377929688, 0.0008828639984130859, 0.0009465217590332031, 0.0010101795196533203, 0.0010738372802734375, 0.0011374950408935547, 0.0012011528015136719, 0.001264810562133789, 0.0013284683227539062, 0.0013921260833740234, 0.0014557838439941406, 0.0015194416046142578, 0.001583099365234375, 0.0016467571258544922, 0.0017104148864746094, 0.0017740726470947266, 0.0018377304077148438, 0.001901388168334961, 0.001965045928955078, 0.0020287036895751953, 0.0020923614501953125, 0.0021560192108154297, 0.002219676971435547, 0.002283334732055664, 0.0023469924926757812, 0.0024106502532958984, 0.0024743080139160156, 0.002537965774536133, 0.00260162353515625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 6.0, 14.0, 9.0, 25.0, 57.0, 71.0, 94.0, 178.0, 190.0, 129.0, 81.0, 39.0, 29.0, 18.0, 19.0, 8.0, 7.0, 8.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.05892157554626465, -0.056685153394937515, -0.05444873124361038, -0.05221230909228325, -0.049975886940956116, -0.04773946851491928, -0.04550304636359215, -0.043266624212265015, -0.04103020206093788, -0.03879377990961075, -0.036557357758283615, -0.03432093560695648, -0.03208451718091965, -0.029848093166947365, -0.02761167287826538, -0.025375250726938248, -0.023138828575611115, -0.02090240642428398, -0.018665984272956848, -0.016429563984274864, -0.014193141832947731, -0.011956719681620598, -0.00972029846161604, -0.007483877241611481, -0.0052474550902843475, -0.0030110334046185017, -0.0007746117189526558, 0.00146180996671319, 0.003698231652379036, 0.005934653803706169, 0.008171075023710728, 0.010407496243715286, 0.012643925845623016, 0.01488034799695015, 0.017116770148277283, 0.019353190436959267, 0.0215896125882864, 0.023826034739613533, 0.026062455028295517, 0.02829887717962265, 0.030535299330949783, 0.032771721482276917, 0.03500814363360405, 0.03724456578493118, 0.03948098421096802, 0.04171741008758545, 0.043953828513622284, 0.04619025066494942, 0.04842667281627655, 0.050663094967603683, 0.05289951711893082, 0.05513593927025795, 0.05737236142158508, 0.05960877984762192, 0.06184520199894905, 0.06408162415027618, 0.06631805002689362, 0.06855446845293045, 0.07079089432954788, 0.07302731275558472, 0.07526373863220215, 0.07750015705823898, 0.07973658293485641, 0.08197300136089325, 0.08420941978693008]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 6.0, 4.0, 12.0, 8.0, 18.0, 11.0, 29.0, 21.0, 22.0, 19.0, 25.0, 34.0, 46.0, 41.0, 44.0, 44.0, 38.0, 53.0, 51.0, 52.0, 56.0, 58.0, 33.0, 36.0, 34.0, 32.0, 21.0, 21.0, 22.0, 20.0, 16.0, 19.0, 9.0, 13.0, 9.0, 6.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.034080080687999725, -0.0331118069589138, -0.03214352950453758, -0.03117525391280651, -0.03020697832107544, -0.029238702729344368, -0.028270427137613297, -0.027302153408527374, -0.026333875954151154, -0.025365600362420082, -0.02439732477068901, -0.02342904917895794, -0.022460773587226868, -0.021492497995495796, -0.020524222403764725, -0.019555948674678802, -0.01858767308294773, -0.01761939749121666, -0.016651121899485588, -0.015682846307754517, -0.014714570716023445, -0.013746295124292374, -0.012778020463883877, -0.011809744872152805, -0.010841469280421734, -0.009873193688690662, -0.008904918096959591, -0.007936643436551094, -0.006968367379158735, -0.006000091787427664, -0.00503181666135788, -0.004063541069626808, -0.0030952654778957367, -0.0021269898861646652, -0.0011587145272642374, -0.00019043916836380959, 0.0007778364233672619, 0.0017461120150983334, 0.0027143871411681175, 0.003682662732899189, 0.0046509383246302605, 0.005619213916361332, 0.006587489508092403, 0.007555764634162188, 0.008524039760231972, 0.009492315351963043, 0.010460590943694115, 0.011428866535425186, 0.012397142127156258, 0.013365417718887329, 0.0143336933106184, 0.015301968902349472, 0.016270244494080544, 0.017238520085811615, 0.018206793814897537, 0.019175071269273758, 0.02014334499835968, 0.02111162059009075, 0.022079896181821823, 0.023048171773552895, 0.024016447365283966, 0.024984722957015038, 0.02595299854874611, 0.02692127227783203, 0.027889549732208252]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 15.0, 13.0, 24.0, 35.0, 51.0, 56.0, 116.0, 114.0, 216.0, 323.0, 446.0, 607.0, 901.0, 1305.0, 1846.0, 2775.0, 3919.0, 5704.0, 8519.0, 13037.0, 20056.0, 30560.0, 48700.0, 80007.0, 136084.0, 215990.0, 186112.0, 109541.0, 65209.0, 40033.0, 25548.0, 16398.0, 10962.0, 7407.0, 4950.0, 3388.0, 2347.0, 1578.0, 1114.0, 740.0, 526.0, 393.0, 263.0, 206.0, 143.0, 84.0, 53.0, 45.0, 31.0, 23.0, 16.0, 10.0, 6.0, 2.0, 5.0, 3.0, 1.0], "bins": [-0.043365478515625, -0.042043209075927734, -0.04072093963623047, -0.0393986701965332, -0.03807640075683594, -0.03675413131713867, -0.035431861877441406, -0.03410959243774414, -0.032787322998046875, -0.03146505355834961, -0.030142784118652344, -0.028820514678955078, -0.027498245239257812, -0.026175975799560547, -0.02485370635986328, -0.023531436920166016, -0.02220916748046875, -0.020886898040771484, -0.01956462860107422, -0.018242359161376953, -0.016920089721679688, -0.015597820281982422, -0.014275550842285156, -0.01295328140258789, -0.011631011962890625, -0.01030874252319336, -0.008986473083496094, -0.007664203643798828, -0.0063419342041015625, -0.005019664764404297, -0.0036973953247070312, -0.0023751258850097656, -0.0010528564453125, 0.0002694129943847656, 0.0015916824340820312, 0.002913951873779297, 0.0042362213134765625, 0.005558490753173828, 0.006880760192871094, 0.00820302963256836, 0.009525299072265625, 0.01084756851196289, 0.012169837951660156, 0.013492107391357422, 0.014814376831054688, 0.016136646270751953, 0.01745891571044922, 0.018781185150146484, 0.02010345458984375, 0.021425724029541016, 0.02274799346923828, 0.024070262908935547, 0.025392532348632812, 0.026714801788330078, 0.028037071228027344, 0.02935934066772461, 0.030681610107421875, 0.03200387954711914, 0.033326148986816406, 0.03464841842651367, 0.03597068786621094, 0.0372929573059082, 0.03861522674560547, 0.039937496185302734, 0.041259765625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 6.0, 7.0, 13.0, 9.0, 16.0, 25.0, 17.0, 13.0, 18.0, 28.0, 22.0, 33.0, 40.0, 45.0, 31.0, 38.0, 48.0, 43.0, 50.0, 37.0, 62.0, 54.0, 40.0, 31.0, 39.0, 30.0, 26.0, 25.0, 23.0, 27.0, 24.0, 18.0, 14.0, 10.0, 8.0, 11.0, 4.0, 3.0, 7.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0247650146484375, -0.024006366729736328, -0.023247718811035156, -0.022489070892333984, -0.021730422973632812, -0.02097177505493164, -0.02021312713623047, -0.019454479217529297, -0.018695831298828125, -0.017937183380126953, -0.01717853546142578, -0.01641988754272461, -0.015661239624023438, -0.014902591705322266, -0.014143943786621094, -0.013385295867919922, -0.01262664794921875, -0.011868000030517578, -0.011109352111816406, -0.010350704193115234, -0.009592056274414062, -0.00883340835571289, -0.008074760437011719, -0.007316112518310547, -0.006557464599609375, -0.005798816680908203, -0.005040168762207031, -0.004281520843505859, -0.0035228729248046875, -0.0027642250061035156, -0.0020055770874023438, -0.0012469291687011719, -0.00048828125, 0.0002703666687011719, 0.0010290145874023438, 0.0017876625061035156, 0.0025463104248046875, 0.0033049583435058594, 0.004063606262207031, 0.004822254180908203, 0.005580902099609375, 0.006339550018310547, 0.007098197937011719, 0.00785684585571289, 0.008615493774414062, 0.009374141693115234, 0.010132789611816406, 0.010891437530517578, 0.01165008544921875, 0.012408733367919922, 0.013167381286621094, 0.013926029205322266, 0.014684677124023438, 0.01544332504272461, 0.01620197296142578, 0.016960620880126953, 0.017719268798828125, 0.018477916717529297, 0.01923656463623047, 0.01999521255493164, 0.020753860473632812, 0.021512508392333984, 0.022271156311035156, 0.023029804229736328, 0.0237884521484375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 10.0, 6.0, 13.0, 26.0, 40.0, 52.0, 85.0, 104.0, 176.0, 210.0, 310.0, 397.0, 643.0, 860.0, 1277.0, 1833.0, 2668.0, 3827.0, 5841.0, 8717.0, 13667.0, 21964.0, 36824.0, 63799.0, 115084.0, 197668.0, 228053.0, 144350.0, 80063.0, 45203.0, 26676.0, 16426.0, 10357.0, 6811.0, 4588.0, 3046.0, 2069.0, 1439.0, 978.0, 720.0, 500.0, 358.0, 230.0, 174.0, 141.0, 91.0, 56.0, 46.0, 30.0, 22.0, 13.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.0406494140625, -0.039386749267578125, -0.03812408447265625, -0.036861419677734375, -0.0355987548828125, -0.034336090087890625, -0.03307342529296875, -0.031810760498046875, -0.030548095703125, -0.029285430908203125, -0.02802276611328125, -0.026760101318359375, -0.0254974365234375, -0.024234771728515625, -0.02297210693359375, -0.021709442138671875, -0.02044677734375, -0.019184112548828125, -0.01792144775390625, -0.016658782958984375, -0.0153961181640625, -0.014133453369140625, -0.01287078857421875, -0.011608123779296875, -0.010345458984375, -0.009082794189453125, -0.00782012939453125, -0.006557464599609375, -0.0052947998046875, -0.004032135009765625, -0.00276947021484375, -0.001506805419921875, -0.000244140625, 0.001018524169921875, 0.00228118896484375, 0.003543853759765625, 0.0048065185546875, 0.006069183349609375, 0.00733184814453125, 0.008594512939453125, 0.009857177734375, 0.011119842529296875, 0.01238250732421875, 0.013645172119140625, 0.0149078369140625, 0.016170501708984375, 0.01743316650390625, 0.018695831298828125, 0.01995849609375, 0.021221160888671875, 0.02248382568359375, 0.023746490478515625, 0.0250091552734375, 0.026271820068359375, 0.02753448486328125, 0.028797149658203125, 0.030059814453125, 0.031322479248046875, 0.03258514404296875, 0.033847808837890625, 0.0351104736328125, 0.036373138427734375, 0.03763580322265625, 0.038898468017578125, 0.0401611328125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 4.0, 3.0, 4.0, 7.0, 11.0, 5.0, 13.0, 11.0, 12.0, 23.0, 24.0, 26.0, 25.0, 27.0, 28.0, 27.0, 38.0, 37.0, 31.0, 38.0, 38.0, 40.0, 37.0, 37.0, 31.0, 41.0, 39.0, 45.0, 36.0, 39.0, 31.0, 18.0, 26.0, 22.0, 26.0, 16.0, 14.0, 12.0, 13.0, 5.0, 9.0, 10.0, 4.0, 7.0, 5.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0142364501953125, -0.013802409172058105, -0.013368368148803711, -0.012934327125549316, -0.012500286102294922, -0.012066245079040527, -0.011632204055786133, -0.011198163032531738, -0.010764122009277344, -0.01033008098602295, -0.009896039962768555, -0.00946199893951416, -0.009027957916259766, -0.008593916893005371, -0.008159875869750977, -0.007725834846496582, -0.0072917938232421875, -0.006857752799987793, -0.0064237117767333984, -0.005989670753479004, -0.005555629730224609, -0.005121588706970215, -0.00468754768371582, -0.004253506660461426, -0.0038194656372070312, -0.0033854246139526367, -0.002951383590698242, -0.0025173425674438477, -0.002083301544189453, -0.0016492605209350586, -0.001215219497680664, -0.0007811784744262695, -0.000347137451171875, 8.690357208251953e-05, 0.0005209445953369141, 0.0009549856185913086, 0.0013890266418457031, 0.0018230676651000977, 0.002257108688354492, 0.0026911497116088867, 0.0031251907348632812, 0.0035592317581176758, 0.00399327278137207, 0.004427313804626465, 0.004861354827880859, 0.005295395851135254, 0.0057294368743896484, 0.006163477897644043, 0.0065975189208984375, 0.007031559944152832, 0.0074656009674072266, 0.007899641990661621, 0.008333683013916016, 0.00876772403717041, 0.009201765060424805, 0.0096358060836792, 0.010069847106933594, 0.010503888130187988, 0.010937929153442383, 0.011371970176696777, 0.011806011199951172, 0.012240052223205566, 0.012674093246459961, 0.013108134269714355, 0.01354217529296875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 2.0, 4.0, 2.0, 8.0, 14.0, 10.0, 22.0, 24.0, 24.0, 37.0, 58.0, 62.0, 129.0, 184.0, 240.0, 332.0, 553.0, 793.0, 1228.0, 2025.0, 3257.0, 5573.0, 10106.0, 19671.0, 41896.0, 704168.0, 176964.0, 39270.0, 18281.0, 9610.0, 5395.0, 3121.0, 1894.0, 1168.0, 800.0, 523.0, 316.0, 241.0, 155.0, 113.0, 84.0, 58.0, 26.0, 29.0, 22.0, 19.0, 14.0, 9.0, 6.0, 3.0, 5.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.028472900390625, -0.02758193016052246, -0.026690959930419922, -0.025799989700317383, -0.024909019470214844, -0.024018049240112305, -0.023127079010009766, -0.022236108779907227, -0.021345138549804688, -0.02045416831970215, -0.01956319808959961, -0.01867222785949707, -0.01778125762939453, -0.016890287399291992, -0.015999317169189453, -0.015108346939086914, -0.014217376708984375, -0.013326406478881836, -0.012435436248779297, -0.011544466018676758, -0.010653495788574219, -0.00976252555847168, -0.00887155532836914, -0.007980585098266602, -0.0070896148681640625, -0.0061986446380615234, -0.005307674407958984, -0.004416704177856445, -0.0035257339477539062, -0.002634763717651367, -0.0017437934875488281, -0.0008528232574462891, 3.814697265625e-05, 0.0009291172027587891, 0.0018200874328613281, 0.002711057662963867, 0.0036020278930664062, 0.004492998123168945, 0.005383968353271484, 0.0062749385833740234, 0.0071659088134765625, 0.008056879043579102, 0.00894784927368164, 0.00983881950378418, 0.010729789733886719, 0.011620759963989258, 0.012511730194091797, 0.013402700424194336, 0.014293670654296875, 0.015184640884399414, 0.016075611114501953, 0.016966581344604492, 0.01785755157470703, 0.01874852180480957, 0.01963949203491211, 0.02053046226501465, 0.021421432495117188, 0.022312402725219727, 0.023203372955322266, 0.024094343185424805, 0.024985313415527344, 0.025876283645629883, 0.026767253875732422, 0.02765822410583496, 0.0285491943359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 9.0, 8.0, 17.0, 17.0, 14.0, 35.0, 30.0, 49.0, 48.0, 58.0, 80.0, 124.0, 89.0, 90.0, 61.0, 51.0, 77.0, 15.0, 25.0, 17.0, 9.0, 22.0, 8.0, 7.0, 4.0, 4.0, 2.0, 7.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.291534423828125e-06, -4.161149263381958e-06, -4.030764102935791e-06, -3.900378942489624e-06, -3.769993782043457e-06, -3.63960862159729e-06, -3.509223461151123e-06, -3.378838300704956e-06, -3.248453140258789e-06, -3.118067979812622e-06, -2.987682819366455e-06, -2.857297658920288e-06, -2.726912498474121e-06, -2.596527338027954e-06, -2.466142177581787e-06, -2.33575701713562e-06, -2.205371856689453e-06, -2.074986696243286e-06, -1.944601535797119e-06, -1.8142163753509521e-06, -1.6838312149047852e-06, -1.5534460544586182e-06, -1.4230608940124512e-06, -1.2926757335662842e-06, -1.1622905731201172e-06, -1.0319054126739502e-06, -9.015202522277832e-07, -7.711350917816162e-07, -6.407499313354492e-07, -5.103647708892822e-07, -3.7997961044311523e-07, -2.4959444999694824e-07, -1.1920928955078125e-07, 1.1175870895385742e-08, 1.4156103134155273e-07, 2.7194619178771973e-07, 4.023313522338867e-07, 5.327165126800537e-07, 6.631016731262207e-07, 7.934868335723877e-07, 9.238719940185547e-07, 1.0542571544647217e-06, 1.1846423149108887e-06, 1.3150274753570557e-06, 1.4454126358032227e-06, 1.5757977962493896e-06, 1.7061829566955566e-06, 1.8365681171417236e-06, 1.9669532775878906e-06, 2.0973384380340576e-06, 2.2277235984802246e-06, 2.3581087589263916e-06, 2.4884939193725586e-06, 2.6188790798187256e-06, 2.7492642402648926e-06, 2.8796494007110596e-06, 3.0100345611572266e-06, 3.1404197216033936e-06, 3.2708048820495605e-06, 3.4011900424957275e-06, 3.5315752029418945e-06, 3.6619603633880615e-06, 3.7923455238342285e-06, 3.9227306842803955e-06, 4.0531158447265625e-06]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 9.0, 13.0, 12.0, 16.0, 20.0, 30.0, 35.0, 43.0, 52.0, 66.0, 76.0, 132.0, 196.0, 267.0, 359.0, 480.0, 642.0, 1001.0, 1450.0, 2176.0, 3396.0, 5220.0, 8617.0, 14924.0, 28519.0, 72039.0, 800174.0, 51362.0, 23258.0, 12548.0, 7477.0, 4587.0, 2986.0, 1933.0, 1254.0, 901.0, 651.0, 433.0, 282.0, 229.0, 192.0, 102.0, 94.0, 70.0, 58.0, 42.0, 26.0, 19.0, 15.0, 12.0, 15.0, 16.0, 13.0, 4.0, 6.0, 2.0, 4.0], "bins": [-0.025726318359375, -0.024955034255981445, -0.02418375015258789, -0.023412466049194336, -0.02264118194580078, -0.021869897842407227, -0.021098613739013672, -0.020327329635620117, -0.019556045532226562, -0.018784761428833008, -0.018013477325439453, -0.0172421932220459, -0.016470909118652344, -0.01569962501525879, -0.014928340911865234, -0.01415705680847168, -0.013385772705078125, -0.01261448860168457, -0.011843204498291016, -0.011071920394897461, -0.010300636291503906, -0.009529352188110352, -0.008758068084716797, -0.007986783981323242, -0.0072154998779296875, -0.006444215774536133, -0.005672931671142578, -0.0049016475677490234, -0.004130363464355469, -0.003359079360961914, -0.0025877952575683594, -0.0018165111541748047, -0.00104522705078125, -0.0002739429473876953, 0.0004973411560058594, 0.001268625259399414, 0.0020399093627929688, 0.0028111934661865234, 0.003582477569580078, 0.004353761672973633, 0.0051250457763671875, 0.005896329879760742, 0.006667613983154297, 0.0074388980865478516, 0.008210182189941406, 0.008981466293334961, 0.009752750396728516, 0.01052403450012207, 0.011295318603515625, 0.01206660270690918, 0.012837886810302734, 0.013609170913696289, 0.014380455017089844, 0.015151739120483398, 0.015923023223876953, 0.016694307327270508, 0.017465591430664062, 0.018236875534057617, 0.019008159637451172, 0.019779443740844727, 0.02055072784423828, 0.021322011947631836, 0.02209329605102539, 0.022864580154418945, 0.0236358642578125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 4.0, 11.0, 5.0, 6.0, 14.0, 11.0, 17.0, 19.0, 12.0, 25.0, 24.0, 46.0, 611.0, 42.0, 25.0, 16.0, 15.0, 12.0, 9.0, 8.0, 13.0, 7.0, 11.0, 3.0, 6.0, 9.0, 0.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.007175445556640625, -0.0069383978843688965, -0.006701350212097168, -0.0064643025398254395, -0.006227254867553711, -0.005990207195281982, -0.005753159523010254, -0.005516111850738525, -0.005279064178466797, -0.005042016506195068, -0.00480496883392334, -0.004567921161651611, -0.004330873489379883, -0.004093825817108154, -0.0038567781448364258, -0.0036197304725646973, -0.0033826828002929688, -0.0031456351280212402, -0.0029085874557495117, -0.002671539783477783, -0.0024344921112060547, -0.002197444438934326, -0.0019603967666625977, -0.0017233490943908691, -0.0014863014221191406, -0.0012492537498474121, -0.0010122060775756836, -0.0007751584053039551, -0.0005381107330322266, -0.00030106306076049805, -6.401538848876953e-05, 0.00017303228378295898, 0.0004100799560546875, 0.000647127628326416, 0.0008841753005981445, 0.001121222972869873, 0.0013582706451416016, 0.00159531831741333, 0.0018323659896850586, 0.002069413661956787, 0.0023064613342285156, 0.002543509006500244, 0.0027805566787719727, 0.003017604351043701, 0.0032546520233154297, 0.003491699695587158, 0.0037287473678588867, 0.003965795040130615, 0.004202842712402344, 0.004439890384674072, 0.004676938056945801, 0.004913985729217529, 0.005151033401489258, 0.005388081073760986, 0.005625128746032715, 0.005862176418304443, 0.006099224090576172, 0.0063362717628479, 0.006573319435119629, 0.006810367107391357, 0.007047414779663086, 0.0072844624519348145, 0.007521510124206543, 0.0077585577964782715, 0.00799560546875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 8.0, 10.0, 19.0, 27.0, 22.0, 33.0, 43.0, 72.0, 107.0, 121.0, 167.0, 99.0, 75.0, 51.0, 36.0, 29.0, 13.0, 10.0, 11.0, 7.0, 3.0, 4.0, 10.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03716970235109329, -0.03571251779794693, -0.03425533324480057, -0.032798148691654205, -0.03134096413850784, -0.02988377958536148, -0.02842659316956997, -0.026969408616423607, -0.025512224063277245, -0.024055039510130882, -0.02259785495698452, -0.02114066854119301, -0.019683483988046646, -0.018226299434900284, -0.01676911488175392, -0.01531193032860756, -0.013854745775461197, -0.012397561222314835, -0.010940376669168472, -0.009483191184699535, -0.008026006631553173, -0.006568822078406811, -0.005111636593937874, -0.0036544520407915115, -0.0021972674876451492, -0.0007400827016681433, 0.0007171020843088627, 0.0021742871031165123, 0.0036314716562628746, 0.005088656209409237, 0.006545841693878174, 0.008003026247024536, 0.009460210800170898, 0.01091739535331726, 0.012374579906463623, 0.01383176539093256, 0.015288949944078922, 0.01674613356590271, 0.01820331998169422, 0.019660504534840584, 0.021117689087986946, 0.02257487364113331, 0.02403205819427967, 0.025489244610071182, 0.026946429163217545, 0.028403613716363907, 0.02986079826951027, 0.03131798282265663, 0.032775167375802994, 0.034232351928949356, 0.03568953648209572, 0.03714672103524208, 0.03860390558838844, 0.040061090141534805, 0.041518278419971466, 0.04297546297311783, 0.04443264752626419, 0.04588983207941055, 0.047347016632556915, 0.04880420118570328, 0.05026138573884964, 0.051718570291996, 0.053175754845142365, 0.05463293939828873, 0.05609012395143509]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 11.0, 10.0, 18.0, 18.0, 6.0, 15.0, 22.0, 28.0, 22.0, 31.0, 29.0, 25.0, 46.0, 35.0, 51.0, 44.0, 40.0, 48.0, 58.0, 53.0, 38.0, 40.0, 34.0, 31.0, 42.0, 26.0, 27.0, 19.0, 22.0, 17.0, 21.0, 15.0, 14.0, 8.0, 8.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02734782174229622, -0.026530755683779716, -0.025713687762618065, -0.024896621704101562, -0.02407955564558506, -0.02326248772442341, -0.022445421665906906, -0.021628353744745255, -0.020811287686228752, -0.01999422162771225, -0.019177153706550598, -0.018360087648034096, -0.017543021589517593, -0.016725953668355942, -0.01590888760983944, -0.015091820620000362, -0.01427475456148386, -0.013457687571644783, -0.01264062151312828, -0.011823554523289204, -0.011006487533450127, -0.010189421474933624, -0.009372354485094547, -0.00855528749525547, -0.007738220971077681, -0.006921154446899891, -0.006104087457060814, -0.005287020932883024, -0.0044699544087052345, -0.0036528874188661575, -0.002835820894688368, -0.002018753904849291, -0.0012016873806715012, -0.00038462068187072873, 0.0004324460169300437, 0.0012495126575231552, 0.0020665794145315886, 0.002883646171540022, 0.0037007126957178116, 0.004517779685556889, 0.005334846209734678, 0.006151912733912468, 0.006968979723751545, 0.007786046247929335, 0.008603112772107124, 0.009420179761946201, 0.010237246751785278, 0.01105431281030178, 0.011871379800140858, 0.012688446789979935, 0.013505512848496437, 0.014322579838335514, 0.015139646828174591, 0.015956712886691093, 0.016773778945207596, 0.017590846866369247, 0.01840791292488575, 0.019224978983402252, 0.020042046904563904, 0.020859112963080406, 0.02167617902159691, 0.02249324694275856, 0.023310313001275063, 0.024127379059791565, 0.024944446980953217]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 11.0, 11.0, 16.0, 35.0, 50.0, 53.0, 78.0, 142.0, 218.0, 320.0, 508.0, 825.0, 1289.0, 1987.0, 3203.0, 5334.0, 8851.0, 15344.0, 26878.0, 49857.0, 97355.0, 219899.0, 768745.0, 2001926.0, 606847.0, 189688.0, 86580.0, 44759.0, 24952.0, 14371.0, 8905.0, 5519.0, 3499.0, 2179.0, 1346.0, 894.0, 575.0, 382.0, 274.0, 212.0, 107.0, 77.0, 61.0, 45.0, 20.0, 16.0, 13.0, 8.0, 8.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-0.037353515625, -0.03620147705078125, -0.0350494384765625, -0.03389739990234375, -0.032745361328125, -0.03159332275390625, -0.0304412841796875, -0.02928924560546875, -0.02813720703125, -0.02698516845703125, -0.0258331298828125, -0.02468109130859375, -0.023529052734375, -0.02237701416015625, -0.0212249755859375, -0.02007293701171875, -0.0189208984375, -0.01776885986328125, -0.0166168212890625, -0.01546478271484375, -0.014312744140625, -0.01316070556640625, -0.0120086669921875, -0.01085662841796875, -0.00970458984375, -0.00855255126953125, -0.0074005126953125, -0.00624847412109375, -0.005096435546875, -0.00394439697265625, -0.0027923583984375, -0.00164031982421875, -0.00048828125, 0.00066375732421875, 0.0018157958984375, 0.00296783447265625, 0.004119873046875, 0.00527191162109375, 0.0064239501953125, 0.00757598876953125, 0.00872802734375, 0.00988006591796875, 0.0110321044921875, 0.01218414306640625, 0.013336181640625, 0.01448822021484375, 0.0156402587890625, 0.01679229736328125, 0.0179443359375, 0.01909637451171875, 0.0202484130859375, 0.02140045166015625, 0.022552490234375, 0.02370452880859375, 0.0248565673828125, 0.02600860595703125, 0.02716064453125, 0.02831268310546875, 0.0294647216796875, 0.03061676025390625, 0.031768798828125, 0.03292083740234375, 0.0340728759765625, 0.03522491455078125, 0.036376953125]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 10.0, 6.0, 13.0, 10.0, 15.0, 13.0, 15.0, 14.0, 22.0, 20.0, 27.0, 18.0, 29.0, 27.0, 37.0, 35.0, 53.0, 46.0, 41.0, 46.0, 46.0, 44.0, 43.0, 39.0, 39.0, 35.0, 30.0, 20.0, 25.0, 31.0, 21.0, 18.0, 20.0, 18.0, 12.0, 23.0, 11.0, 3.0, 3.0, 3.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.0155487060546875, -0.015092134475708008, -0.014635562896728516, -0.014178991317749023, -0.013722419738769531, -0.013265848159790039, -0.012809276580810547, -0.012352705001831055, -0.011896133422851562, -0.01143956184387207, -0.010982990264892578, -0.010526418685913086, -0.010069847106933594, -0.009613275527954102, -0.00915670394897461, -0.008700132369995117, -0.008243560791015625, -0.007786989212036133, -0.007330417633056641, -0.0068738460540771484, -0.006417274475097656, -0.005960702896118164, -0.005504131317138672, -0.00504755973815918, -0.0045909881591796875, -0.004134416580200195, -0.003677845001220703, -0.003221273422241211, -0.0027647018432617188, -0.0023081302642822266, -0.0018515586853027344, -0.0013949871063232422, -0.00093841552734375, -0.0004818439483642578, -2.5272369384765625e-05, 0.00043129920959472656, 0.0008878707885742188, 0.001344442367553711, 0.0018010139465332031, 0.0022575855255126953, 0.0027141571044921875, 0.0031707286834716797, 0.003627300262451172, 0.004083871841430664, 0.004540443420410156, 0.0049970149993896484, 0.005453586578369141, 0.005910158157348633, 0.006366729736328125, 0.006823301315307617, 0.007279872894287109, 0.0077364444732666016, 0.008193016052246094, 0.008649587631225586, 0.009106159210205078, 0.00956273078918457, 0.010019302368164062, 0.010475873947143555, 0.010932445526123047, 0.011389017105102539, 0.011845588684082031, 0.012302160263061523, 0.012758731842041016, 0.013215303421020508, 0.013671875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 5.0, 15.0, 23.0, 24.0, 38.0, 56.0, 93.0, 133.0, 218.0, 352.0, 508.0, 770.0, 1283.0, 1926.0, 3268.0, 5192.0, 8808.0, 15275.0, 27324.0, 51744.0, 105165.0, 243054.0, 693803.0, 1818321.0, 733757.0, 253287.0, 109497.0, 53187.0, 28079.0, 15650.0, 9020.0, 5393.0, 3318.0, 2055.0, 1300.0, 777.0, 559.0, 332.0, 214.0, 163.0, 100.0, 65.0, 41.0, 27.0, 30.0, 5.0, 11.0, 3.0, 6.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0298004150390625, -0.0288240909576416, -0.027847766876220703, -0.026871442794799805, -0.025895118713378906, -0.024918794631958008, -0.02394247055053711, -0.02296614646911621, -0.021989822387695312, -0.021013498306274414, -0.020037174224853516, -0.019060850143432617, -0.01808452606201172, -0.01710820198059082, -0.016131877899169922, -0.015155553817749023, -0.014179229736328125, -0.013202905654907227, -0.012226581573486328, -0.01125025749206543, -0.010273933410644531, -0.009297609329223633, -0.008321285247802734, -0.007344961166381836, -0.0063686370849609375, -0.005392313003540039, -0.004415988922119141, -0.003439664840698242, -0.0024633407592773438, -0.0014870166778564453, -0.0005106925964355469, 0.00046563148498535156, 0.00144195556640625, 0.0024182796478271484, 0.003394603729248047, 0.004370927810668945, 0.005347251892089844, 0.006323575973510742, 0.007299900054931641, 0.008276224136352539, 0.009252548217773438, 0.010228872299194336, 0.011205196380615234, 0.012181520462036133, 0.013157844543457031, 0.01413416862487793, 0.015110492706298828, 0.016086816787719727, 0.017063140869140625, 0.018039464950561523, 0.019015789031982422, 0.01999211311340332, 0.02096843719482422, 0.021944761276245117, 0.022921085357666016, 0.023897409439086914, 0.024873733520507812, 0.02585005760192871, 0.02682638168334961, 0.027802705764770508, 0.028779029846191406, 0.029755353927612305, 0.030731678009033203, 0.0317080020904541, 0.032684326171875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 9.0, 16.0, 16.0, 19.0, 19.0, 17.0, 33.0, 42.0, 43.0, 59.0, 68.0, 87.0, 90.0, 121.0, 137.0, 167.0, 172.0, 204.0, 208.0, 255.0, 275.0, 273.0, 293.0, 218.0, 201.0, 189.0, 157.0, 104.0, 101.0, 88.0, 79.0, 55.0, 47.0, 39.0, 34.0, 24.0, 31.0, 12.0, 10.0, 12.0, 8.0, 9.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.007678985595703125, -0.00744551420211792, -0.007212042808532715, -0.00697857141494751, -0.006745100021362305, -0.0065116286277771, -0.0062781572341918945, -0.0060446858406066895, -0.005811214447021484, -0.005577743053436279, -0.005344271659851074, -0.005110800266265869, -0.004877328872680664, -0.004643857479095459, -0.004410386085510254, -0.004176914691925049, -0.003943443298339844, -0.0037099719047546387, -0.0034765005111694336, -0.0032430291175842285, -0.0030095577239990234, -0.0027760863304138184, -0.0025426149368286133, -0.002309143543243408, -0.002075672149658203, -0.001842200756072998, -0.001608729362487793, -0.0013752579689025879, -0.0011417865753173828, -0.0009083151817321777, -0.0006748437881469727, -0.0004413723945617676, -0.0002079010009765625, 2.5570392608642578e-05, 0.00025904178619384766, 0.0004925131797790527, 0.0007259845733642578, 0.0009594559669494629, 0.001192927360534668, 0.001426398754119873, 0.0016598701477050781, 0.0018933415412902832, 0.0021268129348754883, 0.0023602843284606934, 0.0025937557220458984, 0.0028272271156311035, 0.0030606985092163086, 0.0032941699028015137, 0.0035276412963867188, 0.003761112689971924, 0.003994584083557129, 0.004228055477142334, 0.004461526870727539, 0.004694998264312744, 0.004928469657897949, 0.005161941051483154, 0.005395412445068359, 0.0056288838386535645, 0.0058623552322387695, 0.006095826625823975, 0.00632929801940918, 0.006562769412994385, 0.00679624080657959, 0.007029712200164795, 0.00726318359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 11.0, 14.0, 20.0, 20.0, 38.0, 49.0, 68.0, 86.0, 135.0, 142.0, 104.0, 75.0, 60.0, 34.0, 27.0, 25.0, 17.0, 13.0, 13.0, 7.0, 9.0, 3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02560489997267723, -0.024678954854607582, -0.023753009736537933, -0.022827064618468285, -0.021901119500398636, -0.020975174382328987, -0.02004922926425934, -0.01912328414618969, -0.01819733902812004, -0.017271393910050392, -0.016345448791980743, -0.015419503673911095, -0.014493558555841446, -0.013567613437771797, -0.012641668319702148, -0.0117157232016325, -0.010789777152240276, -0.009863832034170628, -0.008937886916100979, -0.00801194179803133, -0.007085996679961681, -0.006160051096230745, -0.005234105978161097, -0.004308160860091448, -0.003382215742021799, -0.0024562706239521503, -0.0015303253894671798, -0.0006043801549822092, 0.00032156496308743954, 0.001247510313987732, 0.0021734554320573807, 0.0030994005501270294, 0.004025345668196678, 0.004951290786266327, 0.005877235904335976, 0.006803181022405624, 0.007729126140475273, 0.008655071258544922, 0.00958101637661457, 0.01050696149468422, 0.011432906612753868, 0.012358851730823517, 0.013284796848893166, 0.014210741966962814, 0.015136687085032463, 0.016062632203102112, 0.01698857732117176, 0.01791452243924141, 0.018840469419956207, 0.019766414538025856, 0.020692359656095505, 0.021618304774165154, 0.022544249892234802, 0.02347019501030445, 0.0243961401283741, 0.02532208524644375, 0.026248030364513397, 0.027173975482583046, 0.028099920600652695, 0.029025865718722343, 0.029951810836791992, 0.03087775595486164, 0.03180370107293129, 0.03272964805364609, 0.03365559130907059]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 11.0, 16.0, 21.0, 16.0, 24.0, 22.0, 26.0, 32.0, 37.0, 35.0, 25.0, 47.0, 46.0, 32.0, 43.0, 41.0, 50.0, 40.0, 41.0, 43.0, 37.0, 35.0, 33.0, 35.0, 25.0, 28.0, 26.0, 27.0, 14.0, 16.0, 14.0, 10.0, 6.0, 8.0, 7.0, 9.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.02004498615860939, -0.01951558329164982, -0.018986178562045097, -0.018456775695085526, -0.017927370965480804, -0.017397968098521233, -0.01686856336891651, -0.01633916050195694, -0.01580975577235222, -0.015280351974070072, -0.014750948175787926, -0.01422154437750578, -0.013692140579223633, -0.013162737712264061, -0.012633333913981915, -0.012103930115699768, -0.011574527248740196, -0.01104512345045805, -0.010515719652175903, -0.009986315853893757, -0.00945691205561161, -0.008927509188652039, -0.008398105390369892, -0.007868701592087746, -0.007339297793805599, -0.006809893995523453, -0.006280490197241306, -0.005751086864620447, -0.005221683066338301, -0.004692279268056154, -0.004162875935435295, -0.0036334721371531487, -0.0031040702015161514, -0.002574666403234005, -0.002045262837782502, -0.0015158591559156775, -0.000986455474048853, -0.00045705167576670647, 7.235188968479633e-05, 0.0006017554551362991, 0.0011311592534184456, 0.0016605629352852702, 0.002189966617152095, 0.0027193701826035976, 0.003248773980885744, 0.0037781777791678905, 0.00430758111178875, 0.004836984910070896, 0.005366388708353043, 0.005895792506635189, 0.0064251963049173355, 0.006954599637538195, 0.007484003435820341, 0.0080134067684412, 0.008542810566723347, 0.009072214365005493, 0.00960161816328764, 0.010131021961569786, 0.010660425759851933, 0.011189829558134079, 0.01171923242509365, 0.012248637154698372, 0.012778040021657944, 0.01330744381994009, 0.013836847618222237]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 5.0, 8.0, 9.0, 10.0, 12.0, 26.0, 29.0, 65.0, 69.0, 118.0, 135.0, 249.0, 389.0, 570.0, 1011.0, 1772.0, 2998.0, 5475.0, 9999.0, 20034.0, 43453.0, 113556.0, 349730.0, 317041.0, 101513.0, 40189.0, 18485.0, 9387.0, 5110.0, 2904.0, 1653.0, 932.0, 581.0, 376.0, 224.0, 156.0, 96.0, 50.0, 42.0, 28.0, 14.0, 25.0, 10.0, 6.0, 6.0, 6.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0258331298828125, -0.024970531463623047, -0.024107933044433594, -0.02324533462524414, -0.022382736206054688, -0.021520137786865234, -0.02065753936767578, -0.019794940948486328, -0.018932342529296875, -0.018069744110107422, -0.01720714569091797, -0.016344547271728516, -0.015481948852539062, -0.01461935043334961, -0.013756752014160156, -0.012894153594970703, -0.01203155517578125, -0.011168956756591797, -0.010306358337402344, -0.00944375991821289, -0.008581161499023438, -0.007718563079833984, -0.006855964660644531, -0.005993366241455078, -0.005130767822265625, -0.004268169403076172, -0.0034055709838867188, -0.0025429725646972656, -0.0016803741455078125, -0.0008177757263183594, 4.482269287109375e-05, 0.0009074211120605469, 0.00177001953125, 0.002632617950439453, 0.0034952163696289062, 0.004357814788818359, 0.0052204132080078125, 0.006083011627197266, 0.006945610046386719, 0.007808208465576172, 0.008670806884765625, 0.009533405303955078, 0.010396003723144531, 0.011258602142333984, 0.012121200561523438, 0.01298379898071289, 0.013846397399902344, 0.014708995819091797, 0.01557159423828125, 0.016434192657470703, 0.017296791076660156, 0.01815938949584961, 0.019021987915039062, 0.019884586334228516, 0.02074718475341797, 0.021609783172607422, 0.022472381591796875, 0.023334980010986328, 0.02419757843017578, 0.025060176849365234, 0.025922775268554688, 0.02678537368774414, 0.027647972106933594, 0.028510570526123047, 0.0293731689453125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 14.0, 12.0, 16.0, 17.0, 17.0, 24.0, 31.0, 29.0, 33.0, 25.0, 46.0, 40.0, 32.0, 48.0, 38.0, 35.0, 48.0, 39.0, 47.0, 46.0, 41.0, 25.0, 34.0, 40.0, 23.0, 30.0, 28.0, 23.0, 12.0, 19.0, 21.0, 8.0, 9.0, 9.0, 5.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0177764892578125, -0.017272114753723145, -0.01676774024963379, -0.016263365745544434, -0.015758991241455078, -0.015254616737365723, -0.014750242233276367, -0.014245867729187012, -0.013741493225097656, -0.0132371187210083, -0.012732744216918945, -0.01222836971282959, -0.011723995208740234, -0.011219620704650879, -0.010715246200561523, -0.010210871696472168, -0.009706497192382812, -0.009202122688293457, -0.008697748184204102, -0.008193373680114746, -0.007688999176025391, -0.007184624671936035, -0.00668025016784668, -0.006175875663757324, -0.005671501159667969, -0.005167126655578613, -0.004662752151489258, -0.004158377647399902, -0.003654003143310547, -0.0031496286392211914, -0.002645254135131836, -0.0021408796310424805, -0.001636505126953125, -0.0011321306228637695, -0.0006277561187744141, -0.0001233816146850586, 0.0003809928894042969, 0.0008853673934936523, 0.0013897418975830078, 0.0018941164016723633, 0.0023984909057617188, 0.0029028654098510742, 0.0034072399139404297, 0.003911614418029785, 0.004415988922119141, 0.004920363426208496, 0.0054247379302978516, 0.005929112434387207, 0.0064334869384765625, 0.006937861442565918, 0.0074422359466552734, 0.007946610450744629, 0.008450984954833984, 0.00895535945892334, 0.009459733963012695, 0.00996410846710205, 0.010468482971191406, 0.010972857475280762, 0.011477231979370117, 0.011981606483459473, 0.012485980987548828, 0.012990355491638184, 0.013494729995727539, 0.013999104499816895, 0.01450347900390625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 11.0, 15.0, 22.0, 20.0, 41.0, 39.0, 53.0, 63.0, 92.0, 134.0, 220.0, 310.0, 463.0, 720.0, 1190.0, 2118.0, 4000.0, 8551.0, 22363.0, 82211.0, 567714.0, 281682.0, 47446.0, 15031.0, 6245.0, 3126.0, 1747.0, 970.0, 677.0, 401.0, 254.0, 183.0, 116.0, 78.0, 44.0, 47.0, 35.0, 20.0, 25.0, 20.0, 19.0, 10.0, 5.0, 8.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.043060302734375, -0.04170703887939453, -0.04035377502441406, -0.039000511169433594, -0.037647247314453125, -0.036293983459472656, -0.03494071960449219, -0.03358745574951172, -0.03223419189453125, -0.03088092803955078, -0.029527664184570312, -0.028174400329589844, -0.026821136474609375, -0.025467872619628906, -0.024114608764648438, -0.02276134490966797, -0.0214080810546875, -0.02005481719970703, -0.018701553344726562, -0.017348289489746094, -0.015995025634765625, -0.014641761779785156, -0.013288497924804688, -0.011935234069824219, -0.01058197021484375, -0.009228706359863281, -0.007875442504882812, -0.006522178649902344, -0.005168914794921875, -0.0038156509399414062, -0.0024623870849609375, -0.0011091232299804688, 0.000244140625, 0.0015974044799804688, 0.0029506683349609375, 0.004303932189941406, 0.005657196044921875, 0.007010459899902344, 0.008363723754882812, 0.009716987609863281, 0.01107025146484375, 0.012423515319824219, 0.013776779174804688, 0.015130043029785156, 0.016483306884765625, 0.017836570739746094, 0.019189834594726562, 0.02054309844970703, 0.0218963623046875, 0.02324962615966797, 0.024602890014648438, 0.025956153869628906, 0.027309417724609375, 0.028662681579589844, 0.030015945434570312, 0.03136920928955078, 0.03272247314453125, 0.03407573699951172, 0.03542900085449219, 0.036782264709472656, 0.038135528564453125, 0.039488792419433594, 0.04084205627441406, 0.04219532012939453, 0.043548583984375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 12.0, 9.0, 13.0, 12.0, 22.0, 27.0, 15.0, 27.0, 27.0, 39.0, 47.0, 40.0, 31.0, 41.0, 53.0, 35.0, 46.0, 59.0, 45.0, 33.0, 40.0, 39.0, 32.0, 34.0, 31.0, 25.0, 21.0, 20.0, 20.0, 20.0, 11.0, 13.0, 15.0, 10.0, 3.0, 8.0, 8.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01010894775390625, -0.009773731231689453, -0.009438514709472656, -0.00910329818725586, -0.008768081665039062, -0.008432865142822266, -0.008097648620605469, -0.007762432098388672, -0.007427215576171875, -0.007091999053955078, -0.006756782531738281, -0.006421566009521484, -0.0060863494873046875, -0.005751132965087891, -0.005415916442871094, -0.005080699920654297, -0.0047454833984375, -0.004410266876220703, -0.004075050354003906, -0.0037398338317871094, -0.0034046173095703125, -0.0030694007873535156, -0.0027341842651367188, -0.002398967742919922, -0.002063751220703125, -0.0017285346984863281, -0.0013933181762695312, -0.0010581016540527344, -0.0007228851318359375, -0.0003876686096191406, -5.245208740234375e-05, 0.0002827644348144531, 0.00061798095703125, 0.0009531974792480469, 0.0012884140014648438, 0.0016236305236816406, 0.0019588470458984375, 0.0022940635681152344, 0.0026292800903320312, 0.002964496612548828, 0.003299713134765625, 0.003634929656982422, 0.003970146179199219, 0.004305362701416016, 0.0046405792236328125, 0.004975795745849609, 0.005311012268066406, 0.005646228790283203, 0.0059814453125, 0.006316661834716797, 0.006651878356933594, 0.006987094879150391, 0.0073223114013671875, 0.007657527923583984, 0.007992744445800781, 0.008327960968017578, 0.008663177490234375, 0.008998394012451172, 0.009333610534667969, 0.009668827056884766, 0.010004043579101562, 0.01033926010131836, 0.010674476623535156, 0.011009693145751953, 0.01134490966796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 10.0, 4.0, 12.0, 26.0, 15.0, 25.0, 46.0, 43.0, 80.0, 63.0, 134.0, 190.0, 263.0, 399.0, 545.0, 756.0, 1203.0, 1665.0, 2596.0, 4076.0, 6712.0, 11295.0, 21156.0, 46616.0, 133781.0, 485027.0, 207695.0, 62340.0, 26419.0, 13686.0, 7842.0, 4759.0, 2950.0, 1981.0, 1275.0, 857.0, 570.0, 395.0, 287.0, 216.0, 157.0, 95.0, 71.0, 61.0, 51.0, 26.0, 26.0, 14.0, 13.0, 6.0, 7.0, 8.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-0.004367828369140625, -0.0042340755462646484, -0.004100322723388672, -0.003966569900512695, -0.0038328170776367188, -0.003699064254760742, -0.0035653114318847656, -0.003431558609008789, -0.0032978057861328125, -0.003164052963256836, -0.0030303001403808594, -0.002896547317504883, -0.0027627944946289062, -0.0026290416717529297, -0.002495288848876953, -0.0023615360260009766, -0.002227783203125, -0.0020940303802490234, -0.001960277557373047, -0.0018265247344970703, -0.0016927719116210938, -0.0015590190887451172, -0.0014252662658691406, -0.001291513442993164, -0.0011577606201171875, -0.001024007797241211, -0.0008902549743652344, -0.0007565021514892578, -0.0006227493286132812, -0.0004889965057373047, -0.0003552436828613281, -0.00022149085998535156, -8.7738037109375e-05, 4.601478576660156e-05, 0.00017976760864257812, 0.0003135204315185547, 0.00044727325439453125, 0.0005810260772705078, 0.0007147789001464844, 0.0008485317230224609, 0.0009822845458984375, 0.001116037368774414, 0.0012497901916503906, 0.0013835430145263672, 0.0015172958374023438, 0.0016510486602783203, 0.0017848014831542969, 0.0019185543060302734, 0.00205230712890625, 0.0021860599517822266, 0.002319812774658203, 0.0024535655975341797, 0.0025873184204101562, 0.002721071243286133, 0.0028548240661621094, 0.002988576889038086, 0.0031223297119140625, 0.003256082534790039, 0.0033898353576660156, 0.003523588180541992, 0.0036573410034179688, 0.0037910938262939453, 0.003924846649169922, 0.0040585994720458984, 0.004192352294921875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 7.0, 4.0, 3.0, 7.0, 15.0, 23.0, 22.0, 25.0, 25.0, 39.0, 63.0, 89.0, 125.0, 147.0, 91.0, 86.0, 37.0, 36.0, 24.0, 30.0, 22.0, 15.0, 16.0, 13.0, 5.0, 5.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.895427703857422e-05, -1.836474984884262e-05, -1.7775222659111023e-05, -1.7185695469379425e-05, -1.6596168279647827e-05, -1.600664108991623e-05, -1.541711390018463e-05, -1.4827586710453033e-05, -1.4238059520721436e-05, -1.3648532330989838e-05, -1.305900514125824e-05, -1.2469477951526642e-05, -1.1879950761795044e-05, -1.1290423572063446e-05, -1.0700896382331848e-05, -1.011136919260025e-05, -9.521842002868652e-06, -8.932314813137054e-06, -8.342787623405457e-06, -7.753260433673859e-06, -7.163733243942261e-06, -6.574206054210663e-06, -5.984678864479065e-06, -5.395151674747467e-06, -4.805624485015869e-06, -4.216097295284271e-06, -3.6265701055526733e-06, -3.0370429158210754e-06, -2.4475157260894775e-06, -1.8579885363578796e-06, -1.2684613466262817e-06, -6.789341568946838e-07, -8.940696716308594e-08, 5.00120222568512e-07, 1.0896474123001099e-06, 1.6791746020317078e-06, 2.2687017917633057e-06, 2.8582289814949036e-06, 3.4477561712265015e-06, 4.037283360958099e-06, 4.626810550689697e-06, 5.216337740421295e-06, 5.805864930152893e-06, 6.395392119884491e-06, 6.984919309616089e-06, 7.574446499347687e-06, 8.163973689079285e-06, 8.753500878810883e-06, 9.34302806854248e-06, 9.932555258274078e-06, 1.0522082448005676e-05, 1.1111609637737274e-05, 1.1701136827468872e-05, 1.229066401720047e-05, 1.2880191206932068e-05, 1.3469718396663666e-05, 1.4059245586395264e-05, 1.4648772776126862e-05, 1.523829996585846e-05, 1.5827827155590057e-05, 1.6417354345321655e-05, 1.7006881535053253e-05, 1.759640872478485e-05, 1.818593591451645e-05, 1.8775463104248047e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 7.0, 13.0, 12.0, 20.0, 32.0, 29.0, 46.0, 80.0, 123.0, 182.0, 317.0, 442.0, 704.0, 1185.0, 1941.0, 3161.0, 5557.0, 10229.0, 19805.0, 41420.0, 97776.0, 276065.0, 356963.0, 128534.0, 51454.0, 23934.0, 12273.0, 6638.0, 3834.0, 2153.0, 1324.0, 776.0, 518.0, 334.0, 221.0, 138.0, 92.0, 73.0, 48.0, 31.0, 24.0, 13.0, 4.0, 11.0, 8.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0030975341796875, -0.0030011534690856934, -0.0029047727584838867, -0.00280839204788208, -0.0027120113372802734, -0.002615630626678467, -0.00251924991607666, -0.0024228692054748535, -0.002326488494873047, -0.0022301077842712402, -0.0021337270736694336, -0.002037346363067627, -0.0019409656524658203, -0.0018445849418640137, -0.001748204231262207, -0.0016518235206604004, -0.0015554428100585938, -0.0014590620994567871, -0.0013626813888549805, -0.0012663006782531738, -0.0011699199676513672, -0.0010735392570495605, -0.000977158546447754, -0.0008807778358459473, -0.0007843971252441406, -0.000688016414642334, -0.0005916357040405273, -0.0004952549934387207, -0.00039887428283691406, -0.0003024935722351074, -0.00020611286163330078, -0.00010973215103149414, -1.33514404296875e-05, 8.302927017211914e-05, 0.00017940998077392578, 0.0002757906913757324, 0.00037217140197753906, 0.0004685521125793457, 0.0005649328231811523, 0.000661313533782959, 0.0007576942443847656, 0.0008540749549865723, 0.0009504556655883789, 0.0010468363761901855, 0.0011432170867919922, 0.0012395977973937988, 0.0013359785079956055, 0.0014323592185974121, 0.0015287399291992188, 0.0016251206398010254, 0.001721501350402832, 0.0018178820610046387, 0.0019142627716064453, 0.002010643482208252, 0.0021070241928100586, 0.0022034049034118652, 0.002299785614013672, 0.0023961663246154785, 0.002492547035217285, 0.002588927745819092, 0.0026853084564208984, 0.002781689167022705, 0.0028780698776245117, 0.0029744505882263184, 0.003070831298828125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 5.0, 8.0, 4.0, 9.0, 11.0, 9.0, 15.0, 13.0, 22.0, 39.0, 32.0, 44.0, 61.0, 70.0, 72.0, 95.0, 88.0, 82.0, 73.0, 55.0, 36.0, 36.0, 24.0, 19.0, 9.0, 16.0, 6.0, 6.0, 4.0, 4.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0011348724365234375, -0.0011012852191925049, -0.0010676980018615723, -0.0010341107845306396, -0.001000523567199707, -0.0009669363498687744, -0.0009333491325378418, -0.0008997619152069092, -0.0008661746978759766, -0.0008325874805450439, -0.0007990002632141113, -0.0007654130458831787, -0.0007318258285522461, -0.0006982386112213135, -0.0006646513938903809, -0.0006310641765594482, -0.0005974769592285156, -0.000563889741897583, -0.0005303025245666504, -0.0004967153072357178, -0.00046312808990478516, -0.00042954087257385254, -0.0003959536552429199, -0.0003623664379119873, -0.0003287792205810547, -0.00029519200325012207, -0.00026160478591918945, -0.00022801756858825684, -0.00019443035125732422, -0.0001608431339263916, -0.00012725591659545898, -9.366869926452637e-05, -6.008148193359375e-05, -2.6494264602661133e-05, 7.092952728271484e-06, 4.06801700592041e-05, 7.426738739013672e-05, 0.00010785460472106934, 0.00014144182205200195, 0.00017502903938293457, 0.0002086162567138672, 0.0002422034740447998, 0.0002757906913757324, 0.00030937790870666504, 0.00034296512603759766, 0.0003765523433685303, 0.0004101395606994629, 0.0004437267780303955, 0.0004773139953613281, 0.0005109012126922607, 0.0005444884300231934, 0.000578075647354126, 0.0006116628646850586, 0.0006452500820159912, 0.0006788372993469238, 0.0007124245166778564, 0.0007460117340087891, 0.0007795989513397217, 0.0008131861686706543, 0.0008467733860015869, 0.0008803606033325195, 0.0009139478206634521, 0.0009475350379943848, 0.0009811222553253174, 0.00101470947265625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 8.0, 8.0, 12.0, 21.0, 24.0, 26.0, 47.0, 58.0, 94.0, 124.0, 150.0, 119.0, 86.0, 54.0, 25.0, 25.0, 24.0, 21.0, 13.0, 12.0, 6.0, 11.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.022909805178642273, -0.022049417719244957, -0.02118903025984764, -0.020328642800450325, -0.01946825534105301, -0.018607867881655693, -0.017747480422258377, -0.01688709296286106, -0.016026705503463745, -0.01516631804406643, -0.014305930584669113, -0.013445543125271797, -0.012585155665874481, -0.011724768206477165, -0.01086438074707985, -0.010003993287682533, -0.009143604896962643, -0.008283217437565327, -0.007422829978168011, -0.006562442518770695, -0.005702055059373379, -0.0048416671343147755, -0.0039812796749174595, -0.0031208922155201435, -0.0022605047561228275, -0.0014001172967255116, -0.0005397297209128737, 0.00032065785489976406, 0.00118104531429708, 0.0020414330065250397, 0.0029018204659223557, 0.0037622079253196716, 0.004622595384716988, 0.005482982844114304, 0.00634337030351162, 0.0072037577629089355, 0.008064145222306252, 0.008924532681703568, 0.009784920141100883, 0.0106453076004982, 0.011505695059895515, 0.012366082519292831, 0.013226469978690147, 0.014086857438087463, 0.01494724489748478, 0.015807632356882095, 0.01666801981627941, 0.017528407275676727, 0.018388796597719193, 0.01924918405711651, 0.020109571516513824, 0.02096995897591114, 0.021830346435308456, 0.022690733894705772, 0.02355112135410309, 0.024411508813500404, 0.02527189627289772, 0.026132283732295036, 0.026992671191692352, 0.02785305865108967, 0.028713446110486984, 0.0295738335698843, 0.030434221029281616, 0.03129461035132408, 0.03215499594807625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 8.0, 12.0, 18.0, 21.0, 19.0, 18.0, 30.0, 25.0, 34.0, 36.0, 32.0, 27.0, 48.0, 49.0, 35.0, 40.0, 48.0, 43.0, 42.0, 47.0, 37.0, 31.0, 35.0, 40.0, 29.0, 25.0, 33.0, 23.0, 24.0, 15.0, 10.0, 16.0, 9.0, 7.0, 9.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.018828339874744415, -0.018327655270695686, -0.017826968804001808, -0.01732628419995308, -0.01682559959590435, -0.01632491499185562, -0.015824228525161743, -0.015323543921113014, -0.01482285838574171, -0.014322172850370407, -0.013821488246321678, -0.013320802710950375, -0.012820117175579071, -0.012319432571530342, -0.011818747036159039, -0.011318061500787735, -0.010817376896739006, -0.010316691361367702, -0.009816006757318974, -0.00931532122194767, -0.008814636617898941, -0.008313951082527637, -0.007813265547156334, -0.007312580477446318, -0.006811895407736301, -0.006311210338026285, -0.005810525268316269, -0.005309839732944965, -0.004809154663234949, -0.004308469593524933, -0.003807784290984273, -0.003307098988443613, -0.0028064120560884476, -0.0023057269863784313, -0.0018050416838377714, -0.0013043564977124333, -0.0008036713115870953, -0.000302986241877079, 0.0001976990606635809, 0.0006983843632042408, 0.001199069432914257, 0.0016997546190395951, 0.002200439805164933, 0.002701125107705593, 0.0032018101774156094, 0.0037024952471256256, 0.004203180782496929, 0.004703865852206945, 0.005204550921916962, 0.005705235991626978, 0.006205921061336994, 0.006706606596708298, 0.007207291666418314, 0.00770797673612833, 0.008208662271499634, 0.008709346875548363, 0.009210032410919666, 0.00971071794629097, 0.010211402550339699, 0.010712088085711002, 0.011212773621082306, 0.011713458225131035, 0.012214143760502338, 0.012714829295873642, 0.013215513899922371]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 8.0, 9.0, 10.0, 6.0, 9.0, 26.0, 29.0, 46.0, 77.0, 85.0, 144.0, 226.0, 316.0, 446.0, 721.0, 926.0, 1325.0, 2065.0, 3044.0, 4591.0, 6932.0, 10429.0, 16307.0, 26854.0, 44274.0, 77877.0, 141259.0, 234726.0, 202521.0, 112028.0, 62536.0, 36123.0, 22085.0, 13738.0, 8821.0, 5800.0, 3912.0, 2572.0, 1698.0, 1233.0, 852.0, 589.0, 428.0, 275.0, 185.0, 107.0, 87.0, 57.0, 47.0, 36.0, 18.0, 16.0, 16.0, 8.0, 4.0, 5.0, 2.0], "bins": [-0.026580810546875, -0.025817155838012695, -0.02505350112915039, -0.024289846420288086, -0.02352619171142578, -0.022762537002563477, -0.021998882293701172, -0.021235227584838867, -0.020471572875976562, -0.019707918167114258, -0.018944263458251953, -0.01818060874938965, -0.017416954040527344, -0.01665329933166504, -0.015889644622802734, -0.01512598991394043, -0.014362335205078125, -0.01359868049621582, -0.012835025787353516, -0.012071371078491211, -0.011307716369628906, -0.010544061660766602, -0.009780406951904297, -0.009016752243041992, -0.008253097534179688, -0.007489442825317383, -0.006725788116455078, -0.0059621334075927734, -0.005198478698730469, -0.004434823989868164, -0.0036711692810058594, -0.0029075145721435547, -0.00214385986328125, -0.0013802051544189453, -0.0006165504455566406, 0.00014710426330566406, 0.0009107589721679688, 0.0016744136810302734, 0.002438068389892578, 0.003201723098754883, 0.0039653778076171875, 0.004729032516479492, 0.005492687225341797, 0.0062563419342041016, 0.007019996643066406, 0.007783651351928711, 0.008547306060791016, 0.00931096076965332, 0.010074615478515625, 0.01083827018737793, 0.011601924896240234, 0.012365579605102539, 0.013129234313964844, 0.013892889022827148, 0.014656543731689453, 0.015420198440551758, 0.016183853149414062, 0.016947507858276367, 0.017711162567138672, 0.018474817276000977, 0.01923847198486328, 0.020002126693725586, 0.02076578140258789, 0.021529436111450195, 0.0222930908203125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 7.0, 8.0, 14.0, 15.0, 21.0, 24.0, 18.0, 32.0, 24.0, 25.0, 33.0, 39.0, 41.0, 43.0, 42.0, 42.0, 46.0, 43.0, 44.0, 37.0, 42.0, 44.0, 24.0, 35.0, 34.0, 26.0, 33.0, 24.0, 21.0, 24.0, 14.0, 13.0, 9.0, 11.0, 12.0, 5.0, 5.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0144195556640625, -0.014011859893798828, -0.013604164123535156, -0.013196468353271484, -0.012788772583007812, -0.01238107681274414, -0.011973381042480469, -0.011565685272216797, -0.011157989501953125, -0.010750293731689453, -0.010342597961425781, -0.00993490219116211, -0.009527206420898438, -0.009119510650634766, -0.008711814880371094, -0.008304119110107422, -0.00789642333984375, -0.007488727569580078, -0.007081031799316406, -0.006673336029052734, -0.0062656402587890625, -0.005857944488525391, -0.005450248718261719, -0.005042552947998047, -0.004634857177734375, -0.004227161407470703, -0.0038194656372070312, -0.0034117698669433594, -0.0030040740966796875, -0.0025963783264160156, -0.0021886825561523438, -0.0017809867858886719, -0.001373291015625, -0.0009655952453613281, -0.0005578994750976562, -0.00015020370483398438, 0.0002574920654296875, 0.0006651878356933594, 0.0010728836059570312, 0.0014805793762207031, 0.001888275146484375, 0.002295970916748047, 0.0027036666870117188, 0.0031113624572753906, 0.0035190582275390625, 0.003926753997802734, 0.004334449768066406, 0.004742145538330078, 0.00514984130859375, 0.005557537078857422, 0.005965232849121094, 0.006372928619384766, 0.0067806243896484375, 0.007188320159912109, 0.007596015930175781, 0.008003711700439453, 0.008411407470703125, 0.008819103240966797, 0.009226799011230469, 0.00963449478149414, 0.010042190551757812, 0.010449886322021484, 0.010857582092285156, 0.011265277862548828, 0.0116729736328125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 12.0, 15.0, 27.0, 33.0, 40.0, 78.0, 121.0, 185.0, 299.0, 409.0, 670.0, 1053.0, 1743.0, 2798.0, 4747.0, 7798.0, 13645.0, 23851.0, 43319.0, 83165.0, 167329.0, 290758.0, 195492.0, 96330.0, 50000.0, 26922.0, 15177.0, 8893.0, 5226.0, 3228.0, 1853.0, 1209.0, 787.0, 478.0, 285.0, 198.0, 130.0, 84.0, 56.0, 41.0, 24.0, 17.0, 10.0, 5.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02618408203125, -0.025328636169433594, -0.024473190307617188, -0.02361774444580078, -0.022762298583984375, -0.02190685272216797, -0.021051406860351562, -0.020195960998535156, -0.01934051513671875, -0.018485069274902344, -0.017629623413085938, -0.01677417755126953, -0.015918731689453125, -0.015063285827636719, -0.014207839965820312, -0.013352394104003906, -0.0124969482421875, -0.011641502380371094, -0.010786056518554688, -0.009930610656738281, -0.009075164794921875, -0.008219718933105469, -0.0073642730712890625, -0.006508827209472656, -0.00565338134765625, -0.004797935485839844, -0.0039424896240234375, -0.0030870437622070312, -0.002231597900390625, -0.0013761520385742188, -0.0005207061767578125, 0.00033473968505859375, 0.001190185546875, 0.0020456314086914062, 0.0029010772705078125, 0.0037565231323242188, 0.004611968994140625, 0.005467414855957031, 0.0063228607177734375, 0.007178306579589844, 0.00803375244140625, 0.008889198303222656, 0.009744644165039062, 0.010600090026855469, 0.011455535888671875, 0.012310981750488281, 0.013166427612304688, 0.014021873474121094, 0.0148773193359375, 0.015732765197753906, 0.016588211059570312, 0.01744365692138672, 0.018299102783203125, 0.01915454864501953, 0.020009994506835938, 0.020865440368652344, 0.02172088623046875, 0.022576332092285156, 0.023431777954101562, 0.02428722381591797, 0.025142669677734375, 0.02599811553955078, 0.026853561401367188, 0.027709007263183594, 0.028564453125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 7.0, 5.0, 9.0, 17.0, 14.0, 18.0, 20.0, 21.0, 19.0, 28.0, 29.0, 34.0, 35.0, 31.0, 35.0, 41.0, 27.0, 44.0, 44.0, 42.0, 49.0, 30.0, 44.0, 33.0, 42.0, 25.0, 39.0, 35.0, 30.0, 21.0, 23.0, 26.0, 17.0, 7.0, 14.0, 15.0, 9.0, 2.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007568359375, -0.007318854331970215, -0.00706934928894043, -0.0068198442459106445, -0.006570339202880859, -0.006320834159851074, -0.006071329116821289, -0.005821824073791504, -0.005572319030761719, -0.005322813987731934, -0.0050733089447021484, -0.004823803901672363, -0.004574298858642578, -0.004324793815612793, -0.004075288772583008, -0.0038257837295532227, -0.0035762786865234375, -0.0033267736434936523, -0.003077268600463867, -0.002827763557434082, -0.002578258514404297, -0.0023287534713745117, -0.0020792484283447266, -0.0018297433853149414, -0.0015802383422851562, -0.001330733299255371, -0.001081228256225586, -0.0008317232131958008, -0.0005822181701660156, -0.00033271312713623047, -8.320808410644531e-05, 0.00016629695892333984, 0.000415802001953125, 0.0006653070449829102, 0.0009148120880126953, 0.0011643171310424805, 0.0014138221740722656, 0.0016633272171020508, 0.001912832260131836, 0.002162337303161621, 0.0024118423461914062, 0.0026613473892211914, 0.0029108524322509766, 0.0031603574752807617, 0.003409862518310547, 0.003659367561340332, 0.003908872604370117, 0.004158377647399902, 0.0044078826904296875, 0.004657387733459473, 0.004906892776489258, 0.005156397819519043, 0.005405902862548828, 0.005655407905578613, 0.0059049129486083984, 0.006154417991638184, 0.006403923034667969, 0.006653428077697754, 0.006902933120727539, 0.007152438163757324, 0.007401943206787109, 0.0076514482498168945, 0.00790095329284668, 0.008150458335876465, 0.00839996337890625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 10.0, 9.0, 14.0, 19.0, 24.0, 31.0, 41.0, 55.0, 101.0, 134.0, 182.0, 234.0, 388.0, 563.0, 900.0, 1316.0, 2150.0, 3273.0, 5675.0, 10038.0, 19188.0, 42003.0, 753905.0, 134404.0, 34563.0, 16647.0, 8960.0, 4979.0, 3112.0, 1880.0, 1218.0, 830.0, 496.0, 341.0, 279.0, 172.0, 132.0, 81.0, 65.0, 41.0, 32.0, 21.0, 17.0, 15.0, 4.0, 7.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.01300811767578125, -0.012612700462341309, -0.012217283248901367, -0.011821866035461426, -0.011426448822021484, -0.011031031608581543, -0.010635614395141602, -0.01024019718170166, -0.009844779968261719, -0.009449362754821777, -0.009053945541381836, -0.008658528327941895, -0.008263111114501953, -0.007867693901062012, -0.00747227668762207, -0.007076859474182129, -0.0066814422607421875, -0.006286025047302246, -0.005890607833862305, -0.005495190620422363, -0.005099773406982422, -0.0047043561935424805, -0.004308938980102539, -0.003913521766662598, -0.0035181045532226562, -0.003122687339782715, -0.0027272701263427734, -0.002331852912902832, -0.0019364356994628906, -0.0015410184860229492, -0.0011456012725830078, -0.0007501840591430664, -0.000354766845703125, 4.0650367736816406e-05, 0.0004360675811767578, 0.0008314847946166992, 0.0012269020080566406, 0.001622319221496582, 0.0020177364349365234, 0.002413153648376465, 0.0028085708618164062, 0.0032039880752563477, 0.003599405288696289, 0.0039948225021362305, 0.004390239715576172, 0.004785656929016113, 0.005181074142456055, 0.005576491355895996, 0.0059719085693359375, 0.006367325782775879, 0.00676274299621582, 0.007158160209655762, 0.007553577423095703, 0.007948994636535645, 0.008344411849975586, 0.008739829063415527, 0.009135246276855469, 0.00953066349029541, 0.009926080703735352, 0.010321497917175293, 0.010716915130615234, 0.011112332344055176, 0.011507749557495117, 0.011903166770935059, 0.012298583984375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 9.0, 3.0, 8.0, 10.0, 6.0, 14.0, 13.0, 19.0, 20.0, 21.0, 45.0, 55.0, 104.0, 73.0, 121.0, 67.0, 90.0, 78.0, 51.0, 47.0, 29.0, 21.0, 16.0, 8.0, 9.0, 3.0, 9.0, 10.0, 7.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.304813385009766e-06, -5.161389708518982e-06, -5.017966032028198e-06, -4.8745423555374146e-06, -4.731118679046631e-06, -4.587695002555847e-06, -4.4442713260650635e-06, -4.30084764957428e-06, -4.157423973083496e-06, -4.014000296592712e-06, -3.870576620101929e-06, -3.727152943611145e-06, -3.5837292671203613e-06, -3.4403055906295776e-06, -3.296881914138794e-06, -3.1534582376480103e-06, -3.0100345611572266e-06, -2.866610884666443e-06, -2.723187208175659e-06, -2.5797635316848755e-06, -2.436339855194092e-06, -2.292916178703308e-06, -2.1494925022125244e-06, -2.0060688257217407e-06, -1.862645149230957e-06, -1.7192214727401733e-06, -1.5757977962493896e-06, -1.432374119758606e-06, -1.2889504432678223e-06, -1.1455267667770386e-06, -1.0021030902862549e-06, -8.586794137954712e-07, -7.152557373046875e-07, -5.718320608139038e-07, -4.284083843231201e-07, -2.849847078323364e-07, -1.4156103134155273e-07, 1.862645149230957e-09, 1.4528632164001465e-07, 2.8870999813079834e-07, 4.3213367462158203e-07, 5.755573511123657e-07, 7.189810276031494e-07, 8.624047040939331e-07, 1.0058283805847168e-06, 1.1492520570755005e-06, 1.2926757335662842e-06, 1.4360994100570679e-06, 1.5795230865478516e-06, 1.7229467630386353e-06, 1.866370439529419e-06, 2.0097941160202026e-06, 2.1532177925109863e-06, 2.29664146900177e-06, 2.4400651454925537e-06, 2.5834888219833374e-06, 2.726912498474121e-06, 2.8703361749649048e-06, 3.0137598514556885e-06, 3.157183527946472e-06, 3.300607204437256e-06, 3.4440308809280396e-06, 3.5874545574188232e-06, 3.730878233909607e-06, 3.874301910400391e-06]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 7.0, 11.0, 17.0, 18.0, 21.0, 37.0, 43.0, 79.0, 114.0, 179.0, 255.0, 375.0, 564.0, 900.0, 1366.0, 2164.0, 3472.0, 5925.0, 10488.0, 21615.0, 55396.0, 803029.0, 82910.0, 28228.0, 13088.0, 7132.0, 4114.0, 2500.0, 1603.0, 982.0, 642.0, 411.0, 270.0, 183.0, 136.0, 77.0, 63.0, 41.0, 34.0, 16.0, 16.0, 13.0, 9.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.01323699951171875, -0.012843728065490723, -0.012450456619262695, -0.012057185173034668, -0.01166391372680664, -0.011270642280578613, -0.010877370834350586, -0.010484099388122559, -0.010090827941894531, -0.009697556495666504, -0.009304285049438477, -0.00891101360321045, -0.008517742156982422, -0.008124470710754395, -0.007731199264526367, -0.00733792781829834, -0.0069446563720703125, -0.006551384925842285, -0.006158113479614258, -0.0057648420333862305, -0.005371570587158203, -0.004978299140930176, -0.0045850276947021484, -0.004191756248474121, -0.0037984848022460938, -0.0034052133560180664, -0.003011941909790039, -0.0026186704635620117, -0.0022253990173339844, -0.001832127571105957, -0.0014388561248779297, -0.0010455846786499023, -0.000652313232421875, -0.00025904178619384766, 0.0001342296600341797, 0.000527501106262207, 0.0009207725524902344, 0.0013140439987182617, 0.001707315444946289, 0.0021005868911743164, 0.0024938583374023438, 0.002887129783630371, 0.0032804012298583984, 0.0036736726760864258, 0.004066944122314453, 0.0044602155685424805, 0.004853487014770508, 0.005246758460998535, 0.0056400299072265625, 0.00603330135345459, 0.006426572799682617, 0.0068198442459106445, 0.007213115692138672, 0.007606387138366699, 0.007999658584594727, 0.008392930030822754, 0.008786201477050781, 0.009179472923278809, 0.009572744369506836, 0.009966015815734863, 0.01035928726196289, 0.010752558708190918, 0.011145830154418945, 0.011539101600646973, 0.011932373046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 9.0, 5.0, 8.0, 10.0, 15.0, 16.0, 24.0, 24.0, 33.0, 40.0, 472.0, 156.0, 21.0, 30.0, 19.0, 16.0, 20.0, 15.0, 11.0, 3.0, 5.0, 4.0, 5.0, 6.0, 6.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00345611572265625, -0.003354191780090332, -0.003252267837524414, -0.003150343894958496, -0.003048419952392578, -0.00294649600982666, -0.002844572067260742, -0.0027426481246948242, -0.0026407241821289062, -0.0025388002395629883, -0.0024368762969970703, -0.0023349523544311523, -0.0022330284118652344, -0.0021311044692993164, -0.0020291805267333984, -0.0019272565841674805, -0.0018253326416015625, -0.0017234086990356445, -0.0016214847564697266, -0.0015195608139038086, -0.0014176368713378906, -0.0013157129287719727, -0.0012137889862060547, -0.0011118650436401367, -0.0010099411010742188, -0.0009080171585083008, -0.0008060932159423828, -0.0007041692733764648, -0.0006022453308105469, -0.0005003213882446289, -0.00039839744567871094, -0.00029647350311279297, -0.000194549560546875, -9.262561798095703e-05, 9.298324584960938e-06, 0.0001112222671508789, 0.00021314620971679688, 0.00031507015228271484, 0.0004169940948486328, 0.0005189180374145508, 0.0006208419799804688, 0.0007227659225463867, 0.0008246898651123047, 0.0009266138076782227, 0.0010285377502441406, 0.0011304616928100586, 0.0012323856353759766, 0.0013343095779418945, 0.0014362335205078125, 0.0015381574630737305, 0.0016400814056396484, 0.0017420053482055664, 0.0018439292907714844, 0.0019458532333374023, 0.0020477771759033203, 0.0021497011184692383, 0.0022516250610351562, 0.0023535490036010742, 0.002455472946166992, 0.00255739688873291, 0.002659320831298828, 0.002761244773864746, 0.002863168716430664, 0.002965092658996582, 0.0030670166015625]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 11.0, 9.0, 11.0, 18.0, 15.0, 24.0, 45.0, 51.0, 72.0, 98.0, 150.0, 138.0, 89.0, 63.0, 49.0, 31.0, 25.0, 20.0, 9.0, 6.0, 16.0, 11.0, 8.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02014574594795704, -0.019432228058576584, -0.01871870830655098, -0.018005188554525375, -0.01729167066514492, -0.016578152775764465, -0.01586463302373886, -0.015151114203035831, -0.014437595382332802, -0.013724076561629772, -0.013010557740926743, -0.012297038920223713, -0.011583520099520683, -0.010870001278817654, -0.010156482458114624, -0.009442963637411594, -0.008729444816708565, -0.008015925996005535, -0.0073024071753025055, -0.006588888354599476, -0.005875369533896446, -0.005161850713193417, -0.004448331892490387, -0.0037348130717873573, -0.0030212942510843277, -0.002307775430381298, -0.0015942566096782684, -0.0008807377889752388, -0.00016721896827220917, 0.0005462998524308205, 0.00125981867313385, 0.0019733374938368797, 0.0026868563145399094, 0.003400375135242939, 0.004113893955945969, 0.004827412776648998, 0.005540931597352028, 0.0062544504180550575, 0.006967969238758087, 0.007681488059461117, 0.008395006880164146, 0.009108525700867176, 0.009822044521570206, 0.010535563342273235, 0.011249082162976265, 0.011962600983679295, 0.012676119804382324, 0.013389638625085354, 0.014103157445788383, 0.014816676266491413, 0.015530195087194443, 0.016243714839220047, 0.016957232728600502, 0.017670750617980957, 0.01838427037000656, 0.019097790122032166, 0.01981130801141262, 0.020524825900793076, 0.02123834565281868, 0.021951865404844284, 0.02266538329422474, 0.023378901183605194, 0.0240924209356308, 0.024805940687656403, 0.025519458577036858]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 2.0, 2.0, 9.0, 3.0, 5.0, 14.0, 13.0, 16.0, 25.0, 26.0, 24.0, 37.0, 38.0, 26.0, 31.0, 48.0, 46.0, 58.0, 54.0, 45.0, 48.0, 47.0, 55.0, 46.0, 41.0, 34.0, 37.0, 25.0, 32.0, 20.0, 19.0, 18.0, 14.0, 9.0, 14.0, 5.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0], "bins": [-0.0207980889827013, -0.020295774564146996, -0.01979346200823784, -0.019291147589683533, -0.018788833171129227, -0.01828651875257492, -0.017784204334020615, -0.017281891778111458, -0.016779577359557152, -0.016277262941002846, -0.01577495038509369, -0.015272635966539383, -0.014770321547985077, -0.014268007129430771, -0.01376569364219904, -0.013263380154967308, -0.012761065736413002, -0.012258751317858696, -0.011756437830626965, -0.011254124343395233, -0.010751809924840927, -0.010249495506286621, -0.00974718201905489, -0.009244868531823158, -0.008742554113268852, -0.008240239694714546, -0.007737926207482815, -0.007235612254589796, -0.006733298301696777, -0.006230984348803759, -0.00572867039591074, -0.005226356443017721, -0.004724044352769852, -0.004221730399876833, -0.0037194164469838142, -0.0032171024940907955, -0.002714788541197777, -0.002212474588304758, -0.0017101606354117393, -0.0012078466825187206, -0.0007055327296257019, -0.00020321877673268318, 0.00029909517616033554, 0.0008014091290533543, 0.001303723081946373, 0.0018060370348393917, 0.0023083509877324104, 0.002810664940625429, 0.003312978893518448, 0.0038152928464114666, 0.004317606799304485, 0.004819920752197504, 0.005322234705090523, 0.0058245486579835415, 0.00632686261087656, 0.006829176563769579, 0.007331490516662598, 0.007833804935216904, 0.008336118422448635, 0.008838431909680367, 0.009340746328234673, 0.009843060746788979, 0.01034537423402071, 0.010847687721252441, 0.011350002139806747]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 9.0, 11.0, 11.0, 27.0, 45.0, 44.0, 66.0, 102.0, 142.0, 237.0, 328.0, 540.0, 963.0, 1458.0, 2554.0, 4372.0, 7741.0, 14840.0, 28443.0, 60609.0, 148341.0, 501550.0, 2294975.0, 786314.0, 193769.0, 74925.0, 34622.0, 17179.0, 9070.0, 4781.0, 2659.0, 1492.0, 835.0, 495.0, 303.0, 149.0, 107.0, 75.0, 39.0, 17.0, 11.0, 15.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0], "bins": [-0.0311737060546875, -0.03036665916442871, -0.029559612274169922, -0.028752565383911133, -0.027945518493652344, -0.027138471603393555, -0.026331424713134766, -0.025524377822875977, -0.024717330932617188, -0.0239102840423584, -0.02310323715209961, -0.02229619026184082, -0.02148914337158203, -0.020682096481323242, -0.019875049591064453, -0.019068002700805664, -0.018260955810546875, -0.017453908920288086, -0.016646862030029297, -0.015839815139770508, -0.015032768249511719, -0.01422572135925293, -0.01341867446899414, -0.012611627578735352, -0.011804580688476562, -0.010997533798217773, -0.010190486907958984, -0.009383440017700195, -0.008576393127441406, -0.007769346237182617, -0.006962299346923828, -0.006155252456665039, -0.00534820556640625, -0.004541158676147461, -0.003734111785888672, -0.002927064895629883, -0.0021200180053710938, -0.0013129711151123047, -0.0005059242248535156, 0.00030112266540527344, 0.0011081695556640625, 0.0019152164459228516, 0.0027222633361816406, 0.0035293102264404297, 0.004336357116699219, 0.005143404006958008, 0.005950450897216797, 0.006757497787475586, 0.007564544677734375, 0.008371591567993164, 0.009178638458251953, 0.009985685348510742, 0.010792732238769531, 0.01159977912902832, 0.01240682601928711, 0.013213872909545898, 0.014020919799804688, 0.014827966690063477, 0.015635013580322266, 0.016442060470581055, 0.017249107360839844, 0.018056154251098633, 0.018863201141357422, 0.01967024803161621, 0.020477294921875]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 7.0, 6.0, 19.0, 18.0, 13.0, 17.0, 33.0, 28.0, 37.0, 32.0, 35.0, 46.0, 51.0, 50.0, 58.0, 51.0, 48.0, 51.0, 55.0, 42.0, 39.0, 38.0, 37.0, 34.0, 25.0, 16.0, 21.0, 18.0, 16.0, 15.0, 11.0, 4.0, 8.0, 8.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.01309967041015625, -0.012785494327545166, -0.012471318244934082, -0.012157142162322998, -0.011842966079711914, -0.01152878999710083, -0.011214613914489746, -0.010900437831878662, -0.010586261749267578, -0.010272085666656494, -0.00995790958404541, -0.009643733501434326, -0.009329557418823242, -0.009015381336212158, -0.008701205253601074, -0.00838702917098999, -0.008072853088378906, -0.007758677005767822, -0.007444500923156738, -0.007130324840545654, -0.00681614875793457, -0.006501972675323486, -0.006187796592712402, -0.005873620510101318, -0.005559444427490234, -0.00524526834487915, -0.004931092262268066, -0.004616916179656982, -0.0043027400970458984, -0.0039885640144348145, -0.0036743879318237305, -0.0033602118492126465, -0.0030460357666015625, -0.0027318596839904785, -0.0024176836013793945, -0.0021035075187683105, -0.0017893314361572266, -0.0014751553535461426, -0.0011609792709350586, -0.0008468031883239746, -0.0005326271057128906, -0.00021845102310180664, 9.572505950927734e-05, 0.00040990114212036133, 0.0007240772247314453, 0.0010382533073425293, 0.0013524293899536133, 0.0016666054725646973, 0.0019807815551757812, 0.0022949576377868652, 0.0026091337203979492, 0.002923309803009033, 0.003237485885620117, 0.003551661968231201, 0.003865838050842285, 0.004180014133453369, 0.004494190216064453, 0.004808366298675537, 0.005122542381286621, 0.005436718463897705, 0.005750894546508789, 0.006065070629119873, 0.006379246711730957, 0.006693422794342041, 0.007007598876953125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 5.0, 13.0, 14.0, 26.0, 35.0, 49.0, 73.0, 91.0, 133.0, 209.0, 271.0, 371.0, 508.0, 771.0, 1131.0, 1561.0, 2224.0, 3294.0, 4864.0, 7784.0, 11932.0, 19089.0, 30541.0, 50699.0, 88330.0, 166443.0, 352148.0, 894745.0, 1414275.0, 586367.0, 251486.0, 125571.0, 68889.0, 40696.0, 24401.0, 15180.0, 9934.0, 6336.0, 4223.0, 2855.0, 2000.0, 1380.0, 971.0, 714.0, 495.0, 342.0, 243.0, 197.0, 112.0, 84.0, 65.0, 49.0, 25.0, 17.0, 13.0, 5.0, 9.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.013214111328125, -0.012791752815246582, -0.012369394302368164, -0.011947035789489746, -0.011524677276611328, -0.01110231876373291, -0.010679960250854492, -0.010257601737976074, -0.009835243225097656, -0.009412884712219238, -0.00899052619934082, -0.008568167686462402, -0.008145809173583984, -0.007723450660705566, -0.0073010921478271484, -0.0068787336349487305, -0.0064563751220703125, -0.0060340166091918945, -0.0056116580963134766, -0.005189299583435059, -0.004766941070556641, -0.004344582557678223, -0.003922224044799805, -0.0034998655319213867, -0.0030775070190429688, -0.0026551485061645508, -0.002232789993286133, -0.0018104314804077148, -0.0013880729675292969, -0.0009657144546508789, -0.0005433559417724609, -0.00012099742889404297, 0.000301361083984375, 0.000723719596862793, 0.001146078109741211, 0.001568436622619629, 0.001990795135498047, 0.002413153648376465, 0.002835512161254883, 0.0032578706741333008, 0.0036802291870117188, 0.004102587699890137, 0.004524946212768555, 0.004947304725646973, 0.005369663238525391, 0.005792021751403809, 0.0062143802642822266, 0.0066367387771606445, 0.0070590972900390625, 0.0074814558029174805, 0.007903814315795898, 0.008326172828674316, 0.008748531341552734, 0.009170889854431152, 0.00959324836730957, 0.010015606880187988, 0.010437965393066406, 0.010860323905944824, 0.011282682418823242, 0.01170504093170166, 0.012127399444580078, 0.012549757957458496, 0.012972116470336914, 0.013394474983215332, 0.01381683349609375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 7.0, 6.0, 5.0, 6.0, 8.0, 9.0, 12.0, 17.0, 20.0, 37.0, 33.0, 34.0, 55.0, 52.0, 80.0, 98.0, 123.0, 133.0, 145.0, 179.0, 206.0, 223.0, 265.0, 263.0, 309.0, 248.0, 230.0, 215.0, 206.0, 169.0, 129.0, 110.0, 98.0, 82.0, 65.0, 45.0, 29.0, 21.0, 30.0, 18.0, 15.0, 8.0, 8.0, 3.0, 8.0, 4.0, 2.0, 2.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.004161834716796875, -0.004023134708404541, -0.003884434700012207, -0.003745734691619873, -0.003607034683227539, -0.003468334674835205, -0.003329634666442871, -0.003190934658050537, -0.003052234649658203, -0.002913534641265869, -0.002774834632873535, -0.002636134624481201, -0.002497434616088867, -0.002358734607696533, -0.0022200345993041992, -0.0020813345909118652, -0.0019426345825195312, -0.0018039345741271973, -0.0016652345657348633, -0.0015265345573425293, -0.0013878345489501953, -0.0012491345405578613, -0.0011104345321655273, -0.0009717345237731934, -0.0008330345153808594, -0.0006943345069885254, -0.0005556344985961914, -0.0004169344902038574, -0.00027823448181152344, -0.00013953447341918945, -8.344650268554688e-07, 0.00013786554336547852, 0.0002765655517578125, 0.0004152655601501465, 0.0005539655685424805, 0.0006926655769348145, 0.0008313655853271484, 0.0009700655937194824, 0.0011087656021118164, 0.0012474656105041504, 0.0013861656188964844, 0.0015248656272888184, 0.0016635656356811523, 0.0018022656440734863, 0.0019409656524658203, 0.0020796656608581543, 0.0022183656692504883, 0.0023570656776428223, 0.0024957656860351562, 0.0026344656944274902, 0.0027731657028198242, 0.002911865711212158, 0.003050565719604492, 0.003189265727996826, 0.00332796573638916, 0.003466665744781494, 0.003605365753173828, 0.003744065761566162, 0.003882765769958496, 0.00402146577835083, 0.004160165786743164, 0.004298865795135498, 0.004437565803527832, 0.004576265811920166, 0.0047149658203125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 6.0, 5.0, 8.0, 14.0, 20.0, 31.0, 45.0, 62.0, 96.0, 125.0, 145.0, 151.0, 83.0, 56.0, 45.0, 25.0, 20.0, 12.0, 15.0, 4.0, 6.0, 6.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02188003435730934, -0.021284710615873337, -0.02068938873708248, -0.020094066858291626, -0.01949874311685562, -0.018903419375419617, -0.01830809749662876, -0.017712775617837906, -0.0171174518764019, -0.016522128134965897, -0.01592680625617504, -0.015331483446061611, -0.014736160635948181, -0.014140837825834751, -0.013545515015721321, -0.012950192205607891, -0.012354869395494461, -0.011759546585381031, -0.011164223775267601, -0.010568900965154171, -0.009973578155040741, -0.009378255344927311, -0.008782932534813881, -0.008187609724700451, -0.007592286914587021, -0.006996964104473591, -0.006401641294360161, -0.005806318484246731, -0.005210995674133301, -0.004615672864019871, -0.004020350053906441, -0.0034250272437930107, -0.00282970629632473, -0.0022343834862113, -0.0016390606760978699, -0.0010437378659844398, -0.0004484150558710098, 0.0001469077542424202, 0.0007422305643558502, 0.0013375533744692802, 0.0019328761845827103, 0.0025281989946961403, 0.0031235218048095703, 0.0037188446149230003, 0.00431416742503643, 0.00490949023514986, 0.00550481304526329, 0.00610013585537672, 0.0066954586654901505, 0.0072907814756035805, 0.00788610428571701, 0.00848142709583044, 0.00907674990594387, 0.0096720727160573, 0.01026739552617073, 0.01086271833628416, 0.01145804114639759, 0.01205336395651102, 0.01264868676662445, 0.01324400957673788, 0.01383933238685131, 0.01443465519696474, 0.01502997800707817, 0.015625301748514175, 0.01622062362730503]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 11.0, 8.0, 12.0, 14.0, 17.0, 34.0, 26.0, 32.0, 28.0, 40.0, 46.0, 49.0, 57.0, 40.0, 42.0, 50.0, 48.0, 53.0, 41.0, 65.0, 40.0, 35.0, 38.0, 34.0, 23.0, 25.0, 16.0, 18.0, 12.0, 18.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.01368509978055954, -0.013337675482034683, -0.012990251183509827, -0.01264282688498497, -0.012295402586460114, -0.011947978287935257, -0.0116005539894104, -0.011253129690885544, -0.010905705392360687, -0.01055828109383583, -0.010210856795310974, -0.009863432496786118, -0.009516008198261261, -0.009168583899736404, -0.008821159601211548, -0.008473735302686691, -0.008126311004161835, -0.007778886705636978, -0.007431462407112122, -0.007084038108587265, -0.0067366138100624084, -0.006389189511537552, -0.006041765213012695, -0.005694340914487839, -0.005346917547285557, -0.0049994932487607, -0.004652068950235844, -0.004304644651710987, -0.0039572203531861305, -0.003609796054661274, -0.003262371988967061, -0.0029149476904422045, -0.0025675231590867043, -0.0022200988605618477, -0.0018726745620369911, -0.0015252503799274564, -0.0011778260814025998, -0.0008304017828777432, -0.0004829776007682085, -0.00013555330224335194, 0.00021187099628150463, 0.0005592952948063612, 0.0009067195351235569, 0.0012541437754407525, 0.001601568073965609, 0.0019489923724904656, 0.0022964165546000004, 0.002643840853124857, 0.0029912651516497135, 0.00333868945017457, 0.0036861137486994267, 0.004033538047224283, 0.00438096234574914, 0.004728386644273996, 0.005075810477137566, 0.005423234775662422, 0.005770659074187279, 0.006118083372712135, 0.006465507671236992, 0.0068129319697618484, 0.007160356268286705, 0.007507780566811562, 0.007855204865336418, 0.008202629163861275, 0.008550053462386131]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 10.0, 9.0, 10.0, 25.0, 30.0, 45.0, 65.0, 87.0, 152.0, 246.0, 384.0, 601.0, 889.0, 1278.0, 2053.0, 3301.0, 5378.0, 9368.0, 16398.0, 31390.0, 65684.0, 157816.0, 355615.0, 220670.0, 88118.0, 40069.0, 20420.0, 11137.0, 6453.0, 3942.0, 2454.0, 1574.0, 1041.0, 613.0, 421.0, 282.0, 174.0, 122.0, 95.0, 55.0, 28.0, 17.0, 18.0, 13.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.015380859375, -0.014862537384033203, -0.014344215393066406, -0.01382589340209961, -0.013307571411132812, -0.012789249420166016, -0.012270927429199219, -0.011752605438232422, -0.011234283447265625, -0.010715961456298828, -0.010197639465332031, -0.009679317474365234, -0.009160995483398438, -0.00864267349243164, -0.008124351501464844, -0.007606029510498047, -0.00708770751953125, -0.006569385528564453, -0.006051063537597656, -0.005532741546630859, -0.0050144195556640625, -0.004496097564697266, -0.003977775573730469, -0.003459453582763672, -0.002941131591796875, -0.002422809600830078, -0.0019044876098632812, -0.0013861656188964844, -0.0008678436279296875, -0.0003495216369628906, 0.00016880035400390625, 0.0006871223449707031, 0.0012054443359375, 0.0017237663269042969, 0.0022420883178710938, 0.0027604103088378906, 0.0032787322998046875, 0.0037970542907714844, 0.004315376281738281, 0.004833698272705078, 0.005352020263671875, 0.005870342254638672, 0.006388664245605469, 0.006906986236572266, 0.0074253082275390625, 0.00794363021850586, 0.008461952209472656, 0.008980274200439453, 0.00949859619140625, 0.010016918182373047, 0.010535240173339844, 0.01105356216430664, 0.011571884155273438, 0.012090206146240234, 0.012608528137207031, 0.013126850128173828, 0.013645172119140625, 0.014163494110107422, 0.014681816101074219, 0.015200138092041016, 0.015718460083007812, 0.01623678207397461, 0.016755104064941406, 0.017273426055908203, 0.017791748046875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 11.0, 10.0, 14.0, 18.0, 19.0, 23.0, 33.0, 35.0, 28.0, 38.0, 41.0, 50.0, 56.0, 34.0, 45.0, 45.0, 50.0, 48.0, 46.0, 40.0, 49.0, 40.0, 29.0, 42.0, 31.0, 15.0, 23.0, 10.0, 14.0, 13.0, 16.0, 7.0, 9.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.01216888427734375, -0.011868894100189209, -0.011568903923034668, -0.011268913745880127, -0.010968923568725586, -0.010668933391571045, -0.010368943214416504, -0.010068953037261963, -0.009768962860107422, -0.00946897268295288, -0.00916898250579834, -0.008868992328643799, -0.008569002151489258, -0.008269011974334717, -0.007969021797180176, -0.007669031620025635, -0.007369041442871094, -0.007069051265716553, -0.006769061088562012, -0.006469070911407471, -0.00616908073425293, -0.005869090557098389, -0.005569100379943848, -0.005269110202789307, -0.004969120025634766, -0.004669129848480225, -0.004369139671325684, -0.004069149494171143, -0.0037691593170166016, -0.0034691691398620605, -0.0031691789627075195, -0.0028691887855529785, -0.0025691986083984375, -0.0022692084312438965, -0.0019692182540893555, -0.0016692280769348145, -0.0013692378997802734, -0.0010692477226257324, -0.0007692575454711914, -0.0004692673683166504, -0.00016927719116210938, 0.00013071298599243164, 0.00043070316314697266, 0.0007306933403015137, 0.0010306835174560547, 0.0013306736946105957, 0.0016306638717651367, 0.0019306540489196777, 0.0022306442260742188, 0.0025306344032287598, 0.0028306245803833008, 0.003130614757537842, 0.003430604934692383, 0.003730595111846924, 0.004030585289001465, 0.004330575466156006, 0.004630565643310547, 0.004930555820465088, 0.005230545997619629, 0.00553053617477417, 0.005830526351928711, 0.006130516529083252, 0.006430506706237793, 0.006730496883392334, 0.007030487060546875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 4.0, 6.0, 5.0, 12.0, 15.0, 25.0, 23.0, 40.0, 62.0, 98.0, 163.0, 233.0, 371.0, 578.0, 1057.0, 1675.0, 2968.0, 5819.0, 12726.0, 34818.0, 152656.0, 644716.0, 134053.0, 31839.0, 11917.0, 5648.0, 2921.0, 1556.0, 911.0, 566.0, 388.0, 233.0, 157.0, 102.0, 55.0, 39.0, 33.0, 23.0, 18.0, 7.0, 13.0, 4.0, 2.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0219268798828125, -0.021030664443969727, -0.020134449005126953, -0.01923823356628418, -0.018342018127441406, -0.017445802688598633, -0.01654958724975586, -0.015653371810913086, -0.014757156372070312, -0.013860940933227539, -0.012964725494384766, -0.012068510055541992, -0.011172294616699219, -0.010276079177856445, -0.009379863739013672, -0.008483648300170898, -0.007587432861328125, -0.0066912174224853516, -0.005795001983642578, -0.004898786544799805, -0.004002571105957031, -0.003106355667114258, -0.0022101402282714844, -0.001313924789428711, -0.0004177093505859375, 0.00047850608825683594, 0.0013747215270996094, 0.002270936965942383, 0.0031671524047851562, 0.00406336784362793, 0.004959583282470703, 0.0058557987213134766, 0.00675201416015625, 0.0076482295989990234, 0.008544445037841797, 0.00944066047668457, 0.010336875915527344, 0.011233091354370117, 0.01212930679321289, 0.013025522232055664, 0.013921737670898438, 0.014817953109741211, 0.015714168548583984, 0.016610383987426758, 0.01750659942626953, 0.018402814865112305, 0.019299030303955078, 0.02019524574279785, 0.021091461181640625, 0.0219876766204834, 0.022883892059326172, 0.023780107498168945, 0.02467632293701172, 0.025572538375854492, 0.026468753814697266, 0.02736496925354004, 0.028261184692382812, 0.029157400131225586, 0.03005361557006836, 0.030949831008911133, 0.031846046447753906, 0.03274226188659668, 0.03363847732543945, 0.03453469276428223, 0.035430908203125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 3.0, 9.0, 10.0, 13.0, 11.0, 11.0, 15.0, 22.0, 29.0, 23.0, 32.0, 31.0, 29.0, 28.0, 37.0, 34.0, 33.0, 45.0, 43.0, 42.0, 37.0, 45.0, 51.0, 42.0, 40.0, 33.0, 40.0, 33.0, 26.0, 19.0, 22.0, 17.0, 14.0, 12.0, 18.0, 13.0, 5.0, 9.0, 3.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005344390869140625, -0.005178511142730713, -0.005012631416320801, -0.004846751689910889, -0.0046808719635009766, -0.0045149922370910645, -0.004349112510681152, -0.00418323278427124, -0.004017353057861328, -0.003851473331451416, -0.003685593605041504, -0.003519713878631592, -0.0033538341522216797, -0.0031879544258117676, -0.0030220746994018555, -0.0028561949729919434, -0.0026903152465820312, -0.002524435520172119, -0.002358555793762207, -0.002192676067352295, -0.002026796340942383, -0.0018609166145324707, -0.0016950368881225586, -0.0015291571617126465, -0.0013632774353027344, -0.0011973977088928223, -0.0010315179824829102, -0.000865638256072998, -0.0006997585296630859, -0.0005338788032531738, -0.0003679990768432617, -0.0002021193504333496, -3.62396240234375e-05, 0.0001296401023864746, 0.0002955198287963867, 0.00046139955520629883, 0.0006272792816162109, 0.000793159008026123, 0.0009590387344360352, 0.0011249184608459473, 0.0012907981872558594, 0.0014566779136657715, 0.0016225576400756836, 0.0017884373664855957, 0.001954317092895508, 0.00212019681930542, 0.002286076545715332, 0.002451956272125244, 0.0026178359985351562, 0.0027837157249450684, 0.0029495954513549805, 0.0031154751777648926, 0.0032813549041748047, 0.003447234630584717, 0.003613114356994629, 0.003778994083404541, 0.003944873809814453, 0.004110753536224365, 0.004276633262634277, 0.0044425129890441895, 0.0046083927154541016, 0.004774272441864014, 0.004940152168273926, 0.005106031894683838, 0.00527191162109375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 5.0, 11.0, 15.0, 34.0, 35.0, 50.0, 79.0, 101.0, 150.0, 187.0, 266.0, 352.0, 548.0, 845.0, 1147.0, 1608.0, 2476.0, 4293.0, 7091.0, 13079.0, 25865.0, 59848.0, 178687.0, 478350.0, 162338.0, 55637.0, 24488.0, 12293.0, 6694.0, 4065.0, 2544.0, 1681.0, 1129.0, 767.0, 519.0, 375.0, 284.0, 196.0, 136.0, 95.0, 63.0, 44.0, 27.0, 20.0, 8.0, 4.0, 10.0, 1.0, 7.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0], "bins": [-0.003154754638671875, -0.0030575692653656006, -0.002960383892059326, -0.0028631985187530518, -0.0027660131454467773, -0.002668827772140503, -0.0025716423988342285, -0.002474457025527954, -0.0023772716522216797, -0.0022800862789154053, -0.002182900905609131, -0.0020857155323028564, -0.001988530158996582, -0.0018913447856903076, -0.0017941594123840332, -0.0016969740390777588, -0.0015997886657714844, -0.00150260329246521, -0.0014054179191589355, -0.0013082325458526611, -0.0012110471725463867, -0.0011138617992401123, -0.0010166764259338379, -0.0009194910526275635, -0.0008223056793212891, -0.0007251203060150146, -0.0006279349327087402, -0.0005307495594024658, -0.0004335641860961914, -0.000336378812789917, -0.00023919343948364258, -0.00014200806617736816, -4.482269287109375e-05, 5.2362680435180664e-05, 0.00014954805374145508, 0.0002467334270477295, 0.0003439188003540039, 0.0004411041736602783, 0.0005382895469665527, 0.0006354749202728271, 0.0007326602935791016, 0.000829845666885376, 0.0009270310401916504, 0.0010242164134979248, 0.0011214017868041992, 0.0012185871601104736, 0.001315772533416748, 0.0014129579067230225, 0.0015101432800292969, 0.0016073286533355713, 0.0017045140266418457, 0.0018016993999481201, 0.0018988847732543945, 0.001996070146560669, 0.0020932555198669434, 0.0021904408931732178, 0.002287626266479492, 0.0023848116397857666, 0.002481997013092041, 0.0025791823863983154, 0.00267636775970459, 0.0027735531330108643, 0.0028707385063171387, 0.002967923879623413, 0.0030651092529296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 4.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 7.0, 12.0, 22.0, 20.0, 23.0, 23.0, 43.0, 36.0, 37.0, 61.0, 72.0, 94.0, 94.0, 73.0, 70.0, 40.0, 38.0, 40.0, 33.0, 20.0, 26.0, 20.0, 15.0, 10.0, 11.0, 4.0, 2.0, 7.0, 3.0, 6.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9669532775878906e-05, -1.911260187625885e-05, -1.8555670976638794e-05, -1.7998740077018738e-05, -1.744180917739868e-05, -1.6884878277778625e-05, -1.632794737815857e-05, -1.5771016478538513e-05, -1.5214085578918457e-05, -1.4657154679298401e-05, -1.4100223779678345e-05, -1.3543292880058289e-05, -1.2986361980438232e-05, -1.2429431080818176e-05, -1.187250018119812e-05, -1.1315569281578064e-05, -1.0758638381958008e-05, -1.0201707482337952e-05, -9.644776582717896e-06, -9.08784568309784e-06, -8.530914783477783e-06, -7.973983883857727e-06, -7.417052984237671e-06, -6.860122084617615e-06, -6.303191184997559e-06, -5.7462602853775024e-06, -5.189329385757446e-06, -4.63239848613739e-06, -4.075467586517334e-06, -3.518536686897278e-06, -2.9616057872772217e-06, -2.4046748876571655e-06, -1.8477439880371094e-06, -1.2908130884170532e-06, -7.338821887969971e-07, -1.7695128917694092e-07, 3.7997961044311523e-07, 9.369105100631714e-07, 1.4938414096832275e-06, 2.0507723093032837e-06, 2.60770320892334e-06, 3.164634108543396e-06, 3.721565008163452e-06, 4.278495907783508e-06, 4.8354268074035645e-06, 5.392357707023621e-06, 5.949288606643677e-06, 6.506219506263733e-06, 7.063150405883789e-06, 7.620081305503845e-06, 8.177012205123901e-06, 8.733943104743958e-06, 9.290874004364014e-06, 9.84780490398407e-06, 1.0404735803604126e-05, 1.0961666703224182e-05, 1.1518597602844238e-05, 1.2075528502464294e-05, 1.263245940208435e-05, 1.3189390301704407e-05, 1.3746321201324463e-05, 1.4303252100944519e-05, 1.4860183000564575e-05, 1.541711390018463e-05, 1.5974044799804688e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 5.0, 10.0, 11.0, 16.0, 21.0, 28.0, 43.0, 65.0, 80.0, 123.0, 194.0, 257.0, 461.0, 776.0, 1264.0, 2556.0, 5077.0, 10910.0, 23978.0, 58560.0, 163177.0, 437904.0, 214384.0, 73189.0, 29480.0, 12862.0, 6223.0, 3011.0, 1597.0, 853.0, 468.0, 332.0, 213.0, 127.0, 79.0, 65.0, 43.0, 24.0, 28.0, 16.0, 5.0, 11.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002719879150390625, -0.0026364922523498535, -0.002553105354309082, -0.0024697184562683105, -0.002386331558227539, -0.0023029446601867676, -0.002219557762145996, -0.0021361708641052246, -0.002052783966064453, -0.0019693970680236816, -0.0018860101699829102, -0.0018026232719421387, -0.0017192363739013672, -0.0016358494758605957, -0.0015524625778198242, -0.0014690756797790527, -0.0013856887817382812, -0.0013023018836975098, -0.0012189149856567383, -0.0011355280876159668, -0.0010521411895751953, -0.0009687542915344238, -0.0008853673934936523, -0.0008019804954528809, -0.0007185935974121094, -0.0006352066993713379, -0.0005518198013305664, -0.0004684329032897949, -0.00038504600524902344, -0.00030165910720825195, -0.00021827220916748047, -0.00013488531112670898, -5.14984130859375e-05, 3.1888484954833984e-05, 0.00011527538299560547, 0.00019866228103637695, 0.00028204917907714844, 0.0003654360771179199, 0.0004488229751586914, 0.0005322098731994629, 0.0006155967712402344, 0.0006989836692810059, 0.0007823705673217773, 0.0008657574653625488, 0.0009491443634033203, 0.0010325312614440918, 0.0011159181594848633, 0.0011993050575256348, 0.0012826919555664062, 0.0013660788536071777, 0.0014494657516479492, 0.0015328526496887207, 0.0016162395477294922, 0.0016996264457702637, 0.0017830133438110352, 0.0018664002418518066, 0.0019497871398925781, 0.0020331740379333496, 0.002116560935974121, 0.0021999478340148926, 0.002283334732055664, 0.0023667216300964355, 0.002450108528137207, 0.0025334954261779785, 0.00261688232421875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 11.0, 12.0, 29.0, 33.0, 55.0, 57.0, 87.0, 92.0, 106.0, 112.0, 112.0, 85.0, 56.0, 56.0, 42.0, 20.0, 11.0, 7.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008835792541503906, -0.0008452907204627991, -0.0008070021867752075, -0.000768713653087616, -0.0007304251194000244, -0.0006921365857124329, -0.0006538480520248413, -0.0006155595183372498, -0.0005772709846496582, -0.0005389824509620667, -0.0005006939172744751, -0.00046240538358688354, -0.000424116849899292, -0.00038582831621170044, -0.0003475397825241089, -0.00030925124883651733, -0.0002709627151489258, -0.00023267418146133423, -0.00019438564777374268, -0.00015609711408615112, -0.00011780858039855957, -7.952004671096802e-05, -4.1231513023376465e-05, -2.942979335784912e-06, 3.534555435180664e-05, 7.36340880393982e-05, 0.00011192262172698975, 0.0001502111554145813, 0.00018849968910217285, 0.0002267882227897644, 0.00026507675647735596, 0.0003033652901649475, 0.00034165382385253906, 0.0003799423575401306, 0.00041823089122772217, 0.0004565194249153137, 0.0004948079586029053, 0.0005330964922904968, 0.0005713850259780884, 0.0006096735596656799, 0.0006479620933532715, 0.000686250627040863, 0.0007245391607284546, 0.0007628276944160461, 0.0008011162281036377, 0.0008394047617912292, 0.0008776932954788208, 0.0009159818291664124, 0.0009542703628540039, 0.0009925588965415955, 0.001030847430229187, 0.0010691359639167786, 0.0011074244976043701, 0.0011457130312919617, 0.0011840015649795532, 0.0012222900986671448, 0.0012605786323547363, 0.0012988671660423279, 0.0013371556997299194, 0.001375444233417511, 0.0014137327671051025, 0.001452021300792694, 0.0014903098344802856, 0.0015285983681678772, 0.0015668869018554688]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 0.0, 5.0, 6.0, 12.0, 15.0, 26.0, 32.0, 48.0, 72.0, 125.0, 120.0, 162.0, 123.0, 74.0, 49.0, 32.0, 22.0, 21.0, 11.0, 7.0, 7.0, 6.0, 7.0, 3.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01937452331185341, -0.018839702010154724, -0.01830487884581089, -0.017770057544112206, -0.01723523437976837, -0.016700413078069687, -0.016165591776371002, -0.01563076861202717, -0.015095947310328484, -0.014561125077307224, -0.014026302844285965, -0.01349148154258728, -0.012956659309566021, -0.012421837076544762, -0.011887015774846077, -0.011352193541824818, -0.010817371308803558, -0.010282549075782299, -0.00974772684276104, -0.009212905541062355, -0.008678083308041096, -0.008143261075019836, -0.007608439307659864, -0.007073617540299892, -0.006538795307278633, -0.006003973074257374, -0.005469151306897402, -0.00493432953953743, -0.0043995073065161705, -0.003864685306325555, -0.003329863306134939, -0.0027950413059443235, -0.002260221168398857, -0.0017253991682082415, -0.0011905771680176258, -0.0006557551678270102, -0.0001209331676363945, 0.00041388883255422115, 0.0009487108327448368, 0.0014835328329354525, 0.002018354833126068, 0.0025531768333166838, 0.0030879988335072994, 0.003622820833697915, 0.004157642833888531, 0.00469246506690979, 0.005227286834269762, 0.005762108601629734, 0.006296930834650993, 0.006831753067672253, 0.007366574835032225, 0.007901396602392197, 0.008436218835413456, 0.008971041068434715, 0.0095058623701334, 0.01004068460315466, 0.010575506836175919, 0.011110329069197178, 0.011645151302218437, 0.012179972603917122, 0.012714794836938381, 0.01324961706995964, 0.013784438371658325, 0.014319260604679585, 0.014854082837700844]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 6.0, 4.0, 12.0, 10.0, 11.0, 17.0, 25.0, 33.0, 31.0, 30.0, 38.0, 37.0, 52.0, 42.0, 64.0, 44.0, 54.0, 39.0, 49.0, 47.0, 51.0, 46.0, 47.0, 35.0, 33.0, 27.0, 31.0, 15.0, 14.0, 13.0, 20.0, 11.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.012406989932060242, -0.012095599435269833, -0.011784208938479424, -0.011472818441689014, -0.011161427944898605, -0.010850036516785622, -0.010538646019995213, -0.010227255523204803, -0.009915865026414394, -0.009604474529623985, -0.009293084032833576, -0.008981693536043167, -0.008670302107930183, -0.008358911611139774, -0.008047521114349365, -0.007736130617558956, -0.007424740120768547, -0.007113349623978138, -0.006801959127187729, -0.0064905681647360325, -0.006179177667945623, -0.005867787171155214, -0.005556396208703518, -0.005245005711913109, -0.0049336152151227, -0.004622224718332291, -0.0043108342215418816, -0.003999443259090185, -0.003688052762299776, -0.003376662265509367, -0.0030652715358883142, -0.0027538808062672615, -0.0024424903094768524, -0.0021310998126864433, -0.0018197090830653906, -0.0015083184698596597, -0.0011969278566539288, -0.0008855372434481978, -0.0005741466302424669, -0.0002627559006214142, 4.8634596168994904e-05, 0.0003600252093747258, 0.0006714158225804567, 0.0009828064357861876, 0.0012941970489919186, 0.0016055876621976495, 0.0019169782754033804, 0.002228369005024433, 0.0025397595018148422, 0.0028511499986052513, 0.003162540728226304, 0.003473931457847357, 0.003785321954637766, 0.004096712451428175, 0.004408103413879871, 0.0047194939106702805, 0.0050308844074606895, 0.005342274904251099, 0.005653665401041508, 0.005965056363493204, 0.006276446860283613, 0.006587837357074022, 0.006899228319525719, 0.007210618816316128, 0.007522009313106537]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 7.0, 10.0, 19.0, 22.0, 29.0, 51.0, 62.0, 84.0, 132.0, 202.0, 303.0, 512.0, 807.0, 1264.0, 1879.0, 2920.0, 4603.0, 7371.0, 12283.0, 20791.0, 36280.0, 65821.0, 125274.0, 229290.0, 240041.0, 133464.0, 70530.0, 38141.0, 22048.0, 13013.0, 7842.0, 4850.0, 3043.0, 1965.0, 1279.0, 817.0, 513.0, 343.0, 197.0, 147.0, 82.0, 76.0, 48.0, 40.0, 22.0, 15.0, 6.0, 4.0, 2.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.015716552734375, -0.015241026878356934, -0.014765501022338867, -0.0142899751663208, -0.013814449310302734, -0.013338923454284668, -0.012863397598266602, -0.012387871742248535, -0.011912345886230469, -0.011436820030212402, -0.010961294174194336, -0.01048576831817627, -0.010010242462158203, -0.009534716606140137, -0.00905919075012207, -0.008583664894104004, -0.008108139038085938, -0.007632613182067871, -0.007157087326049805, -0.006681561470031738, -0.006206035614013672, -0.0057305097579956055, -0.005254983901977539, -0.004779458045959473, -0.004303932189941406, -0.00382840633392334, -0.0033528804779052734, -0.002877354621887207, -0.0024018287658691406, -0.0019263029098510742, -0.0014507770538330078, -0.0009752511978149414, -0.000499725341796875, -2.4199485778808594e-05, 0.0004513263702392578, 0.0009268522262573242, 0.0014023780822753906, 0.001877903938293457, 0.0023534297943115234, 0.00282895565032959, 0.0033044815063476562, 0.0037800073623657227, 0.004255533218383789, 0.0047310590744018555, 0.005206584930419922, 0.005682110786437988, 0.006157636642456055, 0.006633162498474121, 0.0071086883544921875, 0.007584214210510254, 0.00805974006652832, 0.008535265922546387, 0.009010791778564453, 0.00948631763458252, 0.009961843490600586, 0.010437369346618652, 0.010912895202636719, 0.011388421058654785, 0.011863946914672852, 0.012339472770690918, 0.012814998626708984, 0.01329052448272705, 0.013766050338745117, 0.014241576194763184, 0.01471710205078125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 11.0, 13.0, 18.0, 20.0, 27.0, 31.0, 28.0, 39.0, 40.0, 38.0, 39.0, 39.0, 47.0, 44.0, 55.0, 43.0, 48.0, 48.0, 49.0, 47.0, 38.0, 37.0, 37.0, 29.0, 22.0, 25.0, 15.0, 4.0, 18.0, 15.0, 12.0, 4.0, 4.0, 2.0, 0.0, 2.0, 4.0, 1.0], "bins": [-0.01015472412109375, -0.009905576705932617, -0.009656429290771484, -0.009407281875610352, -0.009158134460449219, -0.008908987045288086, -0.008659839630126953, -0.00841069221496582, -0.008161544799804688, -0.007912397384643555, -0.007663249969482422, -0.007414102554321289, -0.007164955139160156, -0.0069158077239990234, -0.006666660308837891, -0.006417512893676758, -0.006168365478515625, -0.005919218063354492, -0.005670070648193359, -0.0054209232330322266, -0.005171775817871094, -0.004922628402709961, -0.004673480987548828, -0.004424333572387695, -0.0041751861572265625, -0.00392603874206543, -0.003676891326904297, -0.003427743911743164, -0.0031785964965820312, -0.0029294490814208984, -0.0026803016662597656, -0.002431154251098633, -0.0021820068359375, -0.0019328594207763672, -0.0016837120056152344, -0.0014345645904541016, -0.0011854171752929688, -0.0009362697601318359, -0.0006871223449707031, -0.0004379749298095703, -0.0001888275146484375, 6.031990051269531e-05, 0.0003094673156738281, 0.0005586147308349609, 0.0008077621459960938, 0.0010569095611572266, 0.0013060569763183594, 0.0015552043914794922, 0.001804351806640625, 0.002053499221801758, 0.0023026466369628906, 0.0025517940521240234, 0.0028009414672851562, 0.003050088882446289, 0.003299236297607422, 0.0035483837127685547, 0.0037975311279296875, 0.00404667854309082, 0.004295825958251953, 0.004544973373413086, 0.004794120788574219, 0.0050432682037353516, 0.005292415618896484, 0.005541563034057617, 0.00579071044921875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 11.0, 17.0, 31.0, 26.0, 49.0, 84.0, 93.0, 149.0, 219.0, 338.0, 475.0, 657.0, 930.0, 1377.0, 1873.0, 2800.0, 4020.0, 5678.0, 8736.0, 13287.0, 19567.0, 30426.0, 47265.0, 76117.0, 123935.0, 190902.0, 188572.0, 121731.0, 74106.0, 46446.0, 29538.0, 19151.0, 12693.0, 8673.0, 5801.0, 3944.0, 2643.0, 1845.0, 1306.0, 875.0, 650.0, 491.0, 312.0, 229.0, 144.0, 119.0, 84.0, 46.0, 29.0, 26.0, 13.0, 15.0, 7.0, 5.0, 1.0, 1.0, 1.0], "bins": [-0.01110076904296875, -0.010764122009277344, -0.010427474975585938, -0.010090827941894531, -0.009754180908203125, -0.009417533874511719, -0.009080886840820312, -0.008744239807128906, -0.0084075927734375, -0.008070945739746094, -0.0077342987060546875, -0.007397651672363281, -0.007061004638671875, -0.006724357604980469, -0.0063877105712890625, -0.006051063537597656, -0.00571441650390625, -0.005377769470214844, -0.0050411224365234375, -0.004704475402832031, -0.004367828369140625, -0.004031181335449219, -0.0036945343017578125, -0.0033578872680664062, -0.003021240234375, -0.0026845932006835938, -0.0023479461669921875, -0.0020112991333007812, -0.001674652099609375, -0.0013380050659179688, -0.0010013580322265625, -0.0006647109985351562, -0.00032806396484375, 8.58306884765625e-06, 0.0003452301025390625, 0.0006818771362304688, 0.001018524169921875, 0.0013551712036132812, 0.0016918182373046875, 0.0020284652709960938, 0.0023651123046875, 0.0027017593383789062, 0.0030384063720703125, 0.0033750534057617188, 0.003711700439453125, 0.004048347473144531, 0.0043849945068359375, 0.004721641540527344, 0.00505828857421875, 0.005394935607910156, 0.0057315826416015625, 0.006068229675292969, 0.006404876708984375, 0.006741523742675781, 0.0070781707763671875, 0.007414817810058594, 0.00775146484375, 0.008088111877441406, 0.008424758911132812, 0.008761405944824219, 0.009098052978515625, 0.009434700012207031, 0.009771347045898438, 0.010107994079589844, 0.01044464111328125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 9.0, 3.0, 8.0, 5.0, 8.0, 5.0, 7.0, 9.0, 18.0, 8.0, 17.0, 16.0, 15.0, 29.0, 17.0, 20.0, 24.0, 19.0, 36.0, 31.0, 31.0, 32.0, 46.0, 35.0, 36.0, 32.0, 42.0, 33.0, 37.0, 42.0, 35.0, 36.0, 30.0, 31.0, 30.0, 16.0, 30.0, 18.0, 17.0, 16.0, 18.0, 10.0, 10.0, 5.0, 3.0, 5.0, 7.0, 4.0, 2.0, 6.0, 6.0, 2.0, 3.0], "bins": [-0.00443267822265625, -0.004308074712753296, -0.004183471202850342, -0.004058867692947388, -0.003934264183044434, -0.0038096606731414795, -0.0036850571632385254, -0.0035604536533355713, -0.003435850143432617, -0.003311246633529663, -0.003186643123626709, -0.003062039613723755, -0.0029374361038208008, -0.0028128325939178467, -0.0026882290840148926, -0.0025636255741119385, -0.0024390220642089844, -0.0023144185543060303, -0.002189815044403076, -0.002065211534500122, -0.001940608024597168, -0.0018160045146942139, -0.0016914010047912598, -0.0015667974948883057, -0.0014421939849853516, -0.0013175904750823975, -0.0011929869651794434, -0.0010683834552764893, -0.0009437799453735352, -0.0008191764354705811, -0.000694572925567627, -0.0005699694156646729, -0.00044536590576171875, -0.00032076239585876465, -0.00019615888595581055, -7.155537605285645e-05, 5.3048133850097656e-05, 0.00017765164375305176, 0.00030225515365600586, 0.00042685866355895996, 0.0005514621734619141, 0.0006760656833648682, 0.0008006691932678223, 0.0009252727031707764, 0.0010498762130737305, 0.0011744797229766846, 0.0012990832328796387, 0.0014236867427825928, 0.0015482902526855469, 0.001672893762588501, 0.001797497272491455, 0.0019221007823944092, 0.0020467042922973633, 0.0021713078022003174, 0.0022959113121032715, 0.0024205148220062256, 0.0025451183319091797, 0.002669721841812134, 0.002794325351715088, 0.002918928861618042, 0.003043532371520996, 0.00316813588142395, 0.0032927393913269043, 0.0034173429012298584, 0.0035419464111328125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 8.0, 9.0, 12.0, 18.0, 23.0, 27.0, 32.0, 63.0, 63.0, 80.0, 127.0, 173.0, 224.0, 301.0, 429.0, 642.0, 954.0, 1386.0, 2100.0, 3555.0, 6071.0, 11109.0, 22294.0, 64000.0, 854315.0, 40587.0, 17130.0, 9042.0, 5019.0, 2931.0, 1851.0, 1160.0, 828.0, 538.0, 393.0, 269.0, 207.0, 136.0, 127.0, 76.0, 62.0, 47.0, 46.0, 23.0, 24.0, 16.0, 4.0, 9.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00467681884765625, -0.004532158374786377, -0.004387497901916504, -0.004242837429046631, -0.004098176956176758, -0.003953516483306885, -0.0038088560104370117, -0.0036641955375671387, -0.0035195350646972656, -0.0033748745918273926, -0.0032302141189575195, -0.0030855536460876465, -0.0029408931732177734, -0.0027962327003479004, -0.0026515722274780273, -0.0025069117546081543, -0.0023622512817382812, -0.002217590808868408, -0.002072930335998535, -0.0019282698631286621, -0.001783609390258789, -0.001638948917388916, -0.001494288444519043, -0.00134962797164917, -0.0012049674987792969, -0.0010603070259094238, -0.0009156465530395508, -0.0007709860801696777, -0.0006263256072998047, -0.00048166513442993164, -0.0003370046615600586, -0.00019234418869018555, -4.76837158203125e-05, 9.697675704956055e-05, 0.0002416372299194336, 0.00038629770278930664, 0.0005309581756591797, 0.0006756186485290527, 0.0008202791213989258, 0.0009649395942687988, 0.0011096000671386719, 0.001254260540008545, 0.001398921012878418, 0.001543581485748291, 0.001688241958618164, 0.0018329024314880371, 0.00197756290435791, 0.002122223377227783, 0.0022668838500976562, 0.0024115443229675293, 0.0025562047958374023, 0.0027008652687072754, 0.0028455257415771484, 0.0029901862144470215, 0.0031348466873168945, 0.0032795071601867676, 0.0034241676330566406, 0.0035688281059265137, 0.0037134885787963867, 0.0038581490516662598, 0.004002809524536133, 0.004147469997406006, 0.004292130470275879, 0.004436790943145752, 0.004581451416015625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 4.0, 9.0, 11.0, 4.0, 18.0, 10.0, 24.0, 19.0, 23.0, 46.0, 30.0, 38.0, 75.0, 58.0, 67.0, 108.0, 76.0, 61.0, 69.0, 47.0, 55.0, 36.0, 18.0, 24.0, 21.0, 8.0, 10.0, 5.0, 5.0, 5.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.649162292480469e-06, -4.5085325837135315e-06, -4.367902874946594e-06, -4.227273166179657e-06, -4.08664345741272e-06, -3.9460137486457825e-06, -3.8053840398788452e-06, -3.664754331111908e-06, -3.5241246223449707e-06, -3.3834949135780334e-06, -3.242865204811096e-06, -3.102235496044159e-06, -2.9616057872772217e-06, -2.8209760785102844e-06, -2.680346369743347e-06, -2.53971666097641e-06, -2.3990869522094727e-06, -2.2584572434425354e-06, -2.117827534675598e-06, -1.977197825908661e-06, -1.8365681171417236e-06, -1.6959384083747864e-06, -1.5553086996078491e-06, -1.4146789908409119e-06, -1.2740492820739746e-06, -1.1334195733070374e-06, -9.927898645401e-07, -8.521601557731628e-07, -7.115304470062256e-07, -5.709007382392883e-07, -4.302710294723511e-07, -2.896413207054138e-07, -1.4901161193847656e-07, -8.381903171539307e-09, 1.3224780559539795e-07, 2.728775143623352e-07, 4.1350722312927246e-07, 5.541369318962097e-07, 6.94766640663147e-07, 8.353963494300842e-07, 9.760260581970215e-07, 1.1166557669639587e-06, 1.257285475730896e-06, 1.3979151844978333e-06, 1.5385448932647705e-06, 1.6791746020317078e-06, 1.819804310798645e-06, 1.9604340195655823e-06, 2.1010637283325195e-06, 2.2416934370994568e-06, 2.382323145866394e-06, 2.5229528546333313e-06, 2.6635825634002686e-06, 2.804212272167206e-06, 2.944841980934143e-06, 3.0854716897010803e-06, 3.2261013984680176e-06, 3.366731107234955e-06, 3.507360816001892e-06, 3.6479905247688293e-06, 3.7886202335357666e-06, 3.929249942302704e-06, 4.069879651069641e-06, 4.210509359836578e-06, 4.351139068603516e-06]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 4.0, 14.0, 14.0, 33.0, 30.0, 44.0, 71.0, 117.0, 147.0, 257.0, 327.0, 482.0, 714.0, 1091.0, 1652.0, 2747.0, 4793.0, 8071.0, 15194.0, 37444.0, 870509.0, 60272.0, 19936.0, 9765.0, 5563.0, 3331.0, 2023.0, 1273.0, 784.0, 579.0, 400.0, 251.0, 174.0, 127.0, 85.0, 69.0, 53.0, 30.0, 24.0, 12.0, 14.0, 5.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005084991455078125, -0.004901230335235596, -0.004717469215393066, -0.004533708095550537, -0.004349946975708008, -0.0041661858558654785, -0.003982424736022949, -0.00379866361618042, -0.0036149024963378906, -0.0034311413764953613, -0.003247380256652832, -0.0030636191368103027, -0.0028798580169677734, -0.002696096897125244, -0.002512335777282715, -0.0023285746574401855, -0.0021448135375976562, -0.001961052417755127, -0.0017772912979125977, -0.0015935301780700684, -0.001409769058227539, -0.0012260079383850098, -0.0010422468185424805, -0.0008584856986999512, -0.0006747245788574219, -0.0004909634590148926, -0.0003072023391723633, -0.00012344121932983398, 6.031990051269531e-05, 0.0002440810203552246, 0.0004278421401977539, 0.0006116032600402832, 0.0007953643798828125, 0.0009791254997253418, 0.001162886619567871, 0.0013466477394104004, 0.0015304088592529297, 0.001714169979095459, 0.0018979310989379883, 0.0020816922187805176, 0.002265453338623047, 0.002449214458465576, 0.0026329755783081055, 0.0028167366981506348, 0.003000497817993164, 0.0031842589378356934, 0.0033680200576782227, 0.003551781177520752, 0.0037355422973632812, 0.0039193034172058105, 0.00410306453704834, 0.004286825656890869, 0.0044705867767333984, 0.004654347896575928, 0.004838109016418457, 0.005021870136260986, 0.005205631256103516, 0.005389392375946045, 0.005573153495788574, 0.0057569146156311035, 0.005940675735473633, 0.006124436855316162, 0.006308197975158691, 0.006491959095001221, 0.00667572021484375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 6.0, 6.0, 15.0, 8.0, 7.0, 11.0, 19.0, 26.0, 47.0, 694.0, 42.0, 23.0, 20.0, 9.0, 6.0, 8.0, 4.0, 7.0, 9.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00188446044921875, -0.0018329918384552002, -0.0017815232276916504, -0.0017300546169281006, -0.0016785860061645508, -0.001627117395401001, -0.0015756487846374512, -0.0015241801738739014, -0.0014727115631103516, -0.0014212429523468018, -0.001369774341583252, -0.0013183057308197021, -0.0012668371200561523, -0.0012153685092926025, -0.0011638998985290527, -0.001112431287765503, -0.0010609626770019531, -0.0010094940662384033, -0.0009580254554748535, -0.0009065568447113037, -0.0008550882339477539, -0.0008036196231842041, -0.0007521510124206543, -0.0007006824016571045, -0.0006492137908935547, -0.0005977451801300049, -0.0005462765693664551, -0.0004948079586029053, -0.00044333934783935547, -0.00039187073707580566, -0.00034040212631225586, -0.00028893351554870605, -0.00023746490478515625, -0.00018599629402160645, -0.00013452768325805664, -8.305907249450684e-05, -3.159046173095703e-05, 1.9878149032592773e-05, 7.134675979614258e-05, 0.00012281537055969238, 0.0001742839813232422, 0.000225752592086792, 0.0002772212028503418, 0.0003286898136138916, 0.0003801584243774414, 0.0004316270351409912, 0.000483095645904541, 0.0005345642566680908, 0.0005860328674316406, 0.0006375014781951904, 0.0006889700889587402, 0.00074043869972229, 0.0007919073104858398, 0.0008433759212493896, 0.0008948445320129395, 0.0009463131427764893, 0.000997781753540039, 0.0010492503643035889, 0.0011007189750671387, 0.0011521875858306885, 0.0012036561965942383, 0.001255124807357788, 0.0013065934181213379, 0.0013580620288848877, 0.0014095306396484375]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 6.0, 11.0, 18.0, 21.0, 39.0, 59.0, 84.0, 125.0, 177.0, 170.0, 88.0, 57.0, 38.0, 29.0, 21.0, 17.0, 10.0, 10.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020647283643484116, -0.020116202533245087, -0.019585121423006058, -0.01905404031276703, -0.018522959202528, -0.01799187622964382, -0.017460795119404793, -0.016929714009165764, -0.016398632898926735, -0.015867551788687706, -0.015336470678448677, -0.014805388636887074, -0.014274307526648045, -0.013743226416409016, -0.013212144374847412, -0.012681063264608383, -0.012149982154369354, -0.011618901044130325, -0.011087819933891296, -0.010556737892329693, -0.010025656782090664, -0.009494575671851635, -0.008963493630290031, -0.008432412520051003, -0.007901331409811974, -0.007370250299572945, -0.006839168723672628, -0.006308087147772312, -0.005777006037533283, -0.005245924927294254, -0.004714843351393938, -0.004183761775493622, -0.003652682527899742, -0.0031216011848300695, -0.002590519841760397, -0.0020594384986907244, -0.0015283571556210518, -0.0009972758125513792, -0.0004661944694817066, 6.488687358796597e-05, 0.0005959682166576385, 0.0011270495597273111, 0.0016581309027969837, 0.0021892122458666563, 0.002720293588936329, 0.0032513749320060015, 0.003782456275075674, 0.00431353785097599, 0.004844618961215019, 0.005375700071454048, 0.005906781647354364, 0.006437863223254681, 0.0069689443334937096, 0.0075000254437327385, 0.008031107485294342, 0.008562188595533371, 0.0090932697057724, 0.009624350816011429, 0.010155431926250458, 0.010686513967812061, 0.01121759507805109, 0.01174867618829012, 0.012279758229851723, 0.012810839340090752, 0.01334192045032978]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 4.0, 2.0, 4.0, 5.0, 7.0, 16.0, 12.0, 8.0, 23.0, 17.0, 20.0, 28.0, 34.0, 30.0, 35.0, 37.0, 25.0, 34.0, 34.0, 56.0, 49.0, 51.0, 53.0, 45.0, 38.0, 39.0, 44.0, 35.0, 31.0, 23.0, 25.0, 31.0, 27.0, 11.0, 16.0, 16.0, 11.0, 5.0, 11.0, 2.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.008906406350433826, -0.008667942136526108, -0.008429478853940964, -0.008191014640033245, -0.007952550426125526, -0.007714086677879095, -0.007475622929632664, -0.007237158715724945, -0.006998694967478514, -0.006760231219232082, -0.006521767005324364, -0.006283303257077932, -0.006044839043170214, -0.005806375294923782, -0.005567911081016064, -0.005329447332769632, -0.005090983584523201, -0.00485251983627677, -0.004614055622369051, -0.00437559187412262, -0.004137127660214901, -0.0038986639119684696, -0.0036601999308913946, -0.0034217359498143196, -0.003183271735906601, -0.002944807754829526, -0.002706343773752451, -0.0024678800255060196, -0.0022294160444289446, -0.0019909520633518696, -0.0017524880822747946, -0.0015140242176130414, -0.0012755603529512882, -0.0010370963718742132, -0.00079863250721246, -0.000560168526135385, -0.00032170460326597095, -8.324068039655685e-05, 0.00015522330068051815, 0.00039368716534227133, 0.0006321511464193463, 0.0008706150692887604, 0.0011090789921581745, 0.0013475429732352495, 0.0015860069543123245, 0.0018244708189740777, 0.0020629349164664745, 0.002301398664712906, 0.002539862645789981, 0.002778326626867056, 0.003016790607944131, 0.003255254589021206, 0.0034937183372676373, 0.0037321823183447123, 0.003970646299421787, 0.004209110047668219, 0.004447574261575937, 0.004686038009822369, 0.004924502223730087, 0.005162965971976519, 0.005401430185884237, 0.005639893934130669, 0.005878358148038387, 0.006116821896284819, 0.00635528564453125]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 11.0, 10.0, 21.0, 27.0, 54.0, 57.0, 93.0, 126.0, 183.0, 260.0, 386.0, 557.0, 805.0, 1241.0, 1950.0, 2948.0, 4633.0, 7785.0, 12990.0, 22795.0, 40796.0, 79761.0, 170991.0, 453501.0, 1599494.0, 1177211.0, 333454.0, 135987.0, 64709.0, 34206.0, 18838.0, 11090.0, 6743.0, 4071.0, 2380.0, 1497.0, 926.0, 610.0, 371.0, 218.0, 150.0, 88.0, 75.0, 49.0, 26.0, 31.0, 15.0, 17.0, 8.0, 11.0, 9.0, 7.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0091552734375, -0.008826613426208496, -0.008497953414916992, -0.008169293403625488, -0.007840633392333984, -0.0075119733810424805, -0.0071833133697509766, -0.006854653358459473, -0.006525993347167969, -0.006197333335876465, -0.005868673324584961, -0.005540013313293457, -0.005211353302001953, -0.004882693290710449, -0.004554033279418945, -0.004225373268127441, -0.0038967132568359375, -0.0035680532455444336, -0.0032393932342529297, -0.0029107332229614258, -0.002582073211669922, -0.002253413200378418, -0.001924753189086914, -0.0015960931777954102, -0.0012674331665039062, -0.0009387731552124023, -0.0006101131439208984, -0.00028145313262939453, 4.7206878662109375e-05, 0.0003758668899536133, 0.0007045269012451172, 0.001033186912536621, 0.001361846923828125, 0.001690506935119629, 0.002019166946411133, 0.0023478269577026367, 0.0026764869689941406, 0.0030051469802856445, 0.0033338069915771484, 0.0036624670028686523, 0.003991127014160156, 0.00431978702545166, 0.004648447036743164, 0.004977107048034668, 0.005305767059326172, 0.005634427070617676, 0.00596308708190918, 0.006291747093200684, 0.0066204071044921875, 0.006949067115783691, 0.007277727127075195, 0.007606387138366699, 0.007935047149658203, 0.008263707160949707, 0.008592367172241211, 0.008921027183532715, 0.009249687194824219, 0.009578347206115723, 0.009907007217407227, 0.01023566722869873, 0.010564327239990234, 0.010892987251281738, 0.011221647262573242, 0.011550307273864746, 0.01187896728515625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 2.0, 10.0, 7.0, 6.0, 18.0, 16.0, 15.0, 22.0, 15.0, 24.0, 24.0, 34.0, 39.0, 33.0, 28.0, 37.0, 47.0, 42.0, 43.0, 40.0, 46.0, 41.0, 48.0, 45.0, 41.0, 41.0, 29.0, 24.0, 23.0, 18.0, 28.0, 21.0, 22.0, 15.0, 13.0, 12.0, 8.0, 4.0, 3.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.00531768798828125, -0.0051721930503845215, -0.005026698112487793, -0.0048812031745910645, -0.004735708236694336, -0.004590213298797607, -0.004444718360900879, -0.00429922342300415, -0.004153728485107422, -0.004008233547210693, -0.003862738609313965, -0.0037172436714172363, -0.003571748733520508, -0.0034262537956237793, -0.0032807588577270508, -0.0031352639198303223, -0.0029897689819335938, -0.0028442740440368652, -0.0026987791061401367, -0.002553284168243408, -0.0024077892303466797, -0.002262294292449951, -0.0021167993545532227, -0.001971304416656494, -0.0018258094787597656, -0.0016803145408630371, -0.0015348196029663086, -0.00138932466506958, -0.0012438297271728516, -0.001098334789276123, -0.0009528398513793945, -0.000807344913482666, -0.0006618499755859375, -0.000516355037689209, -0.00037086009979248047, -0.00022536516189575195, -7.987022399902344e-05, 6.562471389770508e-05, 0.0002111196517944336, 0.0003566145896911621, 0.0005021095275878906, 0.0006476044654846191, 0.0007930994033813477, 0.0009385943412780762, 0.0010840892791748047, 0.0012295842170715332, 0.0013750791549682617, 0.0015205740928649902, 0.0016660690307617188, 0.0018115639686584473, 0.0019570589065551758, 0.0021025538444519043, 0.002248048782348633, 0.0023935437202453613, 0.00253903865814209, 0.0026845335960388184, 0.002830028533935547, 0.0029755234718322754, 0.003121018409729004, 0.0032665133476257324, 0.003412008285522461, 0.0035575032234191895, 0.003702998161315918, 0.0038484930992126465, 0.003993988037109375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 10.0, 17.0, 35.0, 51.0, 70.0, 112.0, 168.0, 249.0, 372.0, 602.0, 879.0, 1308.0, 2101.0, 3323.0, 5155.0, 8293.0, 12988.0, 22214.0, 38252.0, 67969.0, 127328.0, 256738.0, 583680.0, 1360172.0, 928998.0, 377693.0, 178477.0, 92375.0, 50417.0, 28849.0, 17101.0, 10327.0, 6453.0, 4088.0, 2591.0, 1680.0, 1096.0, 713.0, 476.0, 292.0, 197.0, 135.0, 86.0, 45.0, 39.0, 21.0, 13.0, 14.0, 10.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.00832366943359375, -0.008084118366241455, -0.00784456729888916, -0.007605016231536865, -0.00736546516418457, -0.007125914096832275, -0.0068863630294799805, -0.0066468119621276855, -0.006407260894775391, -0.006167709827423096, -0.005928158760070801, -0.005688607692718506, -0.005449056625366211, -0.005209505558013916, -0.004969954490661621, -0.004730403423309326, -0.004490852355957031, -0.004251301288604736, -0.004011750221252441, -0.0037721991539001465, -0.0035326480865478516, -0.0032930970191955566, -0.0030535459518432617, -0.002813994884490967, -0.002574443817138672, -0.002334892749786377, -0.002095341682434082, -0.0018557906150817871, -0.0016162395477294922, -0.0013766884803771973, -0.0011371374130249023, -0.0008975863456726074, -0.0006580352783203125, -0.0004184842109680176, -0.00017893314361572266, 6.0617923736572266e-05, 0.0003001689910888672, 0.0005397200584411621, 0.000779271125793457, 0.001018822193145752, 0.0012583732604980469, 0.0014979243278503418, 0.0017374753952026367, 0.0019770264625549316, 0.0022165775299072266, 0.0024561285972595215, 0.0026956796646118164, 0.0029352307319641113, 0.0031747817993164062, 0.003414332866668701, 0.003653883934020996, 0.003893435001373291, 0.004132986068725586, 0.004372537136077881, 0.004612088203430176, 0.004851639270782471, 0.005091190338134766, 0.0053307414054870605, 0.0055702924728393555, 0.00580984354019165, 0.006049394607543945, 0.00628894567489624, 0.006528496742248535, 0.00676804780960083, 0.007007598876953125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 5.0, 13.0, 15.0, 16.0, 21.0, 29.0, 22.0, 27.0, 39.0, 61.0, 62.0, 68.0, 89.0, 97.0, 125.0, 160.0, 160.0, 186.0, 202.0, 230.0, 255.0, 267.0, 237.0, 239.0, 195.0, 172.0, 164.0, 159.0, 135.0, 102.0, 102.0, 81.0, 59.0, 60.0, 54.0, 30.0, 29.0, 26.0, 12.0, 13.0, 8.0, 8.0, 9.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0020427703857421875, -0.001973867416381836, -0.0019049644470214844, -0.0018360614776611328, -0.0017671585083007812, -0.0016982555389404297, -0.0016293525695800781, -0.0015604496002197266, -0.001491546630859375, -0.0014226436614990234, -0.0013537406921386719, -0.0012848377227783203, -0.0012159347534179688, -0.0011470317840576172, -0.0010781288146972656, -0.001009225845336914, -0.0009403228759765625, -0.0008714199066162109, -0.0008025169372558594, -0.0007336139678955078, -0.0006647109985351562, -0.0005958080291748047, -0.0005269050598144531, -0.00045800209045410156, -0.00038909912109375, -0.00032019615173339844, -0.0002512931823730469, -0.0001823902130126953, -0.00011348724365234375, -4.458427429199219e-05, 2.4318695068359375e-05, 9.322166442871094e-05, 0.0001621246337890625, 0.00023102760314941406, 0.0002999305725097656, 0.0003688335418701172, 0.00043773651123046875, 0.0005066394805908203, 0.0005755424499511719, 0.0006444454193115234, 0.000713348388671875, 0.0007822513580322266, 0.0008511543273925781, 0.0009200572967529297, 0.0009889602661132812, 0.0010578632354736328, 0.0011267662048339844, 0.001195669174194336, 0.0012645721435546875, 0.001333475112915039, 0.0014023780822753906, 0.0014712810516357422, 0.0015401840209960938, 0.0016090869903564453, 0.0016779899597167969, 0.0017468929290771484, 0.0018157958984375, 0.0018846988677978516, 0.001953601837158203, 0.0020225048065185547, 0.0020914077758789062, 0.002160310745239258, 0.0022292137145996094, 0.002298116683959961, 0.0023670196533203125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 14.0, 7.0, 20.0, 17.0, 26.0, 48.0, 78.0, 97.0, 96.0, 164.0, 128.0, 86.0, 58.0, 41.0, 30.0, 23.0, 18.0, 13.0, 14.0, 4.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.012131369672715664, -0.011809755116701126, -0.011488141492009163, -0.011166526935994625, -0.010844912379980087, -0.010523298755288124, -0.010201684199273586, -0.009880069643259048, -0.009558456018567085, -0.009236841462552547, -0.008915227837860584, -0.008593613281846046, -0.008271999657154083, -0.007950385101139545, -0.007628770545125008, -0.007307156454771757, -0.006985542364418507, -0.006663928274065256, -0.006342314183712006, -0.006020699627697468, -0.005699085537344217, -0.005377471446990967, -0.005055856890976429, -0.0047342428006231785, -0.004412628710269928, -0.0040910146199166775, -0.0037694002967327833, -0.003447785973548889, -0.0031261718831956387, -0.002804557792842388, -0.002482943469658494, -0.0021613291464746, -0.001839715987443924, -0.0015181017806753516, -0.0011964875739067793, -0.000874873367138207, -0.0005532591603696346, -0.0002316449536010623, 8.996925316751003e-05, 0.0004115835763514042, 0.0007331976667046547, 0.001054811873473227, 0.0013764260802417994, 0.0016980402870103717, 0.002019654493778944, 0.0023412685841321945, 0.0026628829073160887, 0.002984497230499983, 0.0033061113208532333, 0.003627725411206484, 0.003949339501559734, 0.004270954057574272, 0.004592568147927523, 0.004914182238280773, 0.005235796794295311, 0.0055574108846485615, 0.005879024975001812, 0.0062006390653550625, 0.006522253155708313, 0.006843867711722851, 0.007165481802076101, 0.007487095892429352, 0.00780871044844389, 0.008130325004458427, 0.00845193862915039]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 6.0, 7.0, 6.0, 6.0, 14.0, 12.0, 20.0, 26.0, 18.0, 19.0, 29.0, 32.0, 37.0, 31.0, 38.0, 39.0, 46.0, 36.0, 48.0, 32.0, 39.0, 46.0, 37.0, 43.0, 43.0, 35.0, 25.0, 30.0, 31.0, 31.0, 20.0, 14.0, 14.0, 22.0, 17.0, 9.0, 10.0, 8.0, 11.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005460231099277735, -0.00530237564817071, -0.005144519731402397, -0.004986664280295372, -0.004828808829188347, -0.004670953378081322, -0.004513097926974297, -0.004355242010205984, -0.004197386559098959, -0.004039531107991934, -0.003881675424054265, -0.0037238197401165962, -0.003565964289009571, -0.003408108837902546, -0.003250253153964877, -0.0030923974700272083, -0.002934542018920183, -0.002776686567813158, -0.0026188308838754892, -0.0024609751999378204, -0.0023031197488307953, -0.00214526429772377, -0.0019874086137861013, -0.0018295530462637544, -0.0016716974787414074, -0.0015138419112190604, -0.0013559863436967134, -0.0011981307761743665, -0.0010402752086520195, -0.0008824196411296725, -0.0007245640736073256, -0.0005667085060849786, -0.0004088529385626316, -0.00025099737104028463, -9.314180351793766e-05, 6.471376400440931e-05, 0.0002225693315267563, 0.00038042489904910326, 0.0005382804665714502, 0.0006961360340937972, 0.0008539916016161442, 0.0010118471691384912, 0.0011697027366608381, 0.001327558304183185, 0.001485413871705532, 0.001643269439227879, 0.001801125006750226, 0.001958980690687895, 0.00211683614179492, 0.002274691592901945, 0.002432547276839614, 0.0025904029607772827, 0.002748258411884308, 0.002906113862991333, 0.003063969546929002, 0.0032218252308666706, 0.0033796806819736958, 0.003537536133080721, 0.0036953918170183897, 0.0038532475009560585, 0.004011102952063084, 0.004168958403170109, 0.004326813854277134, 0.004484669771045446, 0.0046425252221524715]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 6.0, 8.0, 7.0, 6.0, 16.0, 26.0, 43.0, 57.0, 82.0, 111.0, 213.0, 309.0, 519.0, 885.0, 1410.0, 2473.0, 4398.0, 7627.0, 14043.0, 26508.0, 51836.0, 106621.0, 231792.0, 301452.0, 150595.0, 70455.0, 35430.0, 18304.0, 10103.0, 5441.0, 2970.0, 1860.0, 1116.0, 659.0, 427.0, 262.0, 156.0, 106.0, 74.0, 50.0, 34.0, 27.0, 17.0, 12.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010040283203125, -0.009728670120239258, -0.009417057037353516, -0.009105443954467773, -0.008793830871582031, -0.008482217788696289, -0.008170604705810547, -0.007858991622924805, -0.0075473785400390625, -0.00723576545715332, -0.006924152374267578, -0.006612539291381836, -0.006300926208496094, -0.0059893131256103516, -0.005677700042724609, -0.005366086959838867, -0.005054473876953125, -0.004742860794067383, -0.004431247711181641, -0.0041196346282958984, -0.0038080215454101562, -0.003496408462524414, -0.003184795379638672, -0.0028731822967529297, -0.0025615692138671875, -0.0022499561309814453, -0.0019383430480957031, -0.001626729965209961, -0.0013151168823242188, -0.0010035037994384766, -0.0006918907165527344, -0.0003802776336669922, -6.866455078125e-05, 0.0002429485321044922, 0.0005545616149902344, 0.0008661746978759766, 0.0011777877807617188, 0.001489400863647461, 0.0018010139465332031, 0.0021126270294189453, 0.0024242401123046875, 0.0027358531951904297, 0.003047466278076172, 0.003359079360961914, 0.0036706924438476562, 0.0039823055267333984, 0.004293918609619141, 0.004605531692504883, 0.004917144775390625, 0.005228757858276367, 0.005540370941162109, 0.0058519840240478516, 0.006163597106933594, 0.006475210189819336, 0.006786823272705078, 0.00709843635559082, 0.0074100494384765625, 0.007721662521362305, 0.008033275604248047, 0.008344888687133789, 0.008656501770019531, 0.008968114852905273, 0.009279727935791016, 0.009591341018676758, 0.0099029541015625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 4.0, 2.0, 6.0, 14.0, 8.0, 14.0, 20.0, 13.0, 20.0, 26.0, 24.0, 33.0, 40.0, 36.0, 36.0, 44.0, 35.0, 44.0, 37.0, 47.0, 39.0, 46.0, 37.0, 42.0, 52.0, 27.0, 35.0, 44.0, 24.0, 20.0, 18.0, 19.0, 14.0, 16.0, 13.0, 10.0, 12.0, 4.0, 10.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004657745361328125, -0.004510223865509033, -0.004362702369689941, -0.00421518087387085, -0.004067659378051758, -0.003920137882232666, -0.0037726163864135742, -0.0036250948905944824, -0.0034775733947753906, -0.003330051898956299, -0.003182530403137207, -0.0030350089073181152, -0.0028874874114990234, -0.0027399659156799316, -0.00259244441986084, -0.002444922924041748, -0.0022974014282226562, -0.0021498799324035645, -0.0020023584365844727, -0.0018548369407653809, -0.001707315444946289, -0.0015597939491271973, -0.0014122724533081055, -0.0012647509574890137, -0.0011172294616699219, -0.0009697079658508301, -0.0008221864700317383, -0.0006746649742126465, -0.0005271434783935547, -0.0003796219825744629, -0.0002321004867553711, -8.45789909362793e-05, 6.29425048828125e-05, 0.0002104640007019043, 0.0003579854965209961, 0.0005055069923400879, 0.0006530284881591797, 0.0008005499839782715, 0.0009480714797973633, 0.001095592975616455, 0.0012431144714355469, 0.0013906359672546387, 0.0015381574630737305, 0.0016856789588928223, 0.001833200454711914, 0.001980721950531006, 0.0021282434463500977, 0.0022757649421691895, 0.0024232864379882812, 0.002570807933807373, 0.002718329429626465, 0.0028658509254455566, 0.0030133724212646484, 0.0031608939170837402, 0.003308415412902832, 0.003455936908721924, 0.0036034584045410156, 0.0037509799003601074, 0.0038985013961791992, 0.004046022891998291, 0.004193544387817383, 0.004341065883636475, 0.004488587379455566, 0.004636108875274658, 0.00478363037109375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 4.0, 11.0, 8.0, 13.0, 26.0, 21.0, 47.0, 62.0, 106.0, 158.0, 247.0, 400.0, 652.0, 1041.0, 1897.0, 3356.0, 6478.0, 14139.0, 36962.0, 141595.0, 597014.0, 171016.0, 41857.0, 15643.0, 7088.0, 3707.0, 2030.0, 1187.0, 654.0, 395.0, 243.0, 171.0, 114.0, 73.0, 49.0, 26.0, 31.0, 9.0, 8.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013763427734375, -0.013245105743408203, -0.012726783752441406, -0.01220846176147461, -0.011690139770507812, -0.011171817779541016, -0.010653495788574219, -0.010135173797607422, -0.009616851806640625, -0.009098529815673828, -0.008580207824707031, -0.008061885833740234, -0.0075435638427734375, -0.007025241851806641, -0.006506919860839844, -0.005988597869873047, -0.00547027587890625, -0.004951953887939453, -0.004433631896972656, -0.003915309906005859, -0.0033969879150390625, -0.0028786659240722656, -0.0023603439331054688, -0.0018420219421386719, -0.001323699951171875, -0.0008053779602050781, -0.00028705596923828125, 0.00023126602172851562, 0.0007495880126953125, 0.0012679100036621094, 0.0017862319946289062, 0.002304553985595703, 0.0028228759765625, 0.003341197967529297, 0.0038595199584960938, 0.004377841949462891, 0.0048961639404296875, 0.005414485931396484, 0.005932807922363281, 0.006451129913330078, 0.006969451904296875, 0.007487773895263672, 0.008006095886230469, 0.008524417877197266, 0.009042739868164062, 0.00956106185913086, 0.010079383850097656, 0.010597705841064453, 0.01111602783203125, 0.011634349822998047, 0.012152671813964844, 0.01267099380493164, 0.013189315795898438, 0.013707637786865234, 0.014225959777832031, 0.014744281768798828, 0.015262603759765625, 0.015780925750732422, 0.01629924774169922, 0.016817569732666016, 0.017335891723632812, 0.01785421371459961, 0.018372535705566406, 0.018890857696533203, 0.0194091796875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 6.0, 5.0, 12.0, 16.0, 14.0, 11.0, 13.0, 19.0, 21.0, 27.0, 19.0, 28.0, 37.0, 42.0, 36.0, 39.0, 48.0, 41.0, 51.0, 39.0, 41.0, 39.0, 40.0, 44.0, 38.0, 33.0, 24.0, 28.0, 32.0, 30.0, 16.0, 15.0, 23.0, 13.0, 11.0, 8.0, 13.0, 5.0, 4.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.00342559814453125, -0.003329366445541382, -0.0032331347465515137, -0.0031369030475616455, -0.0030406713485717773, -0.002944439649581909, -0.002848207950592041, -0.002751976251602173, -0.0026557445526123047, -0.0025595128536224365, -0.0024632811546325684, -0.0023670494556427, -0.002270817756652832, -0.002174586057662964, -0.0020783543586730957, -0.0019821226596832275, -0.0018858909606933594, -0.0017896592617034912, -0.001693427562713623, -0.0015971958637237549, -0.0015009641647338867, -0.0014047324657440186, -0.0013085007667541504, -0.0012122690677642822, -0.001116037368774414, -0.001019805669784546, -0.0009235739707946777, -0.0008273422718048096, -0.0007311105728149414, -0.0006348788738250732, -0.0005386471748352051, -0.0004424154758453369, -0.00034618377685546875, -0.0002499520778656006, -0.00015372037887573242, -5.748867988586426e-05, 3.8743019104003906e-05, 0.00013497471809387207, 0.00023120641708374023, 0.0003274381160736084, 0.00042366981506347656, 0.0005199015140533447, 0.0006161332130432129, 0.0007123649120330811, 0.0008085966110229492, 0.0009048283100128174, 0.0010010600090026855, 0.0010972917079925537, 0.0011935234069824219, 0.00128975510597229, 0.0013859868049621582, 0.0014822185039520264, 0.0015784502029418945, 0.0016746819019317627, 0.0017709136009216309, 0.001867145299911499, 0.001963376998901367, 0.0020596086978912354, 0.0021558403968811035, 0.0022520720958709717, 0.00234830379486084, 0.002444535493850708, 0.002540767192840576, 0.0026369988918304443, 0.0027332305908203125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 14.0, 8.0, 21.0, 26.0, 23.0, 33.0, 42.0, 77.0, 86.0, 115.0, 165.0, 200.0, 289.0, 363.0, 592.0, 781.0, 1231.0, 1969.0, 3204.0, 5786.0, 11758.0, 29464.0, 108029.0, 616099.0, 192684.0, 42088.0, 15387.0, 7138.0, 3823.0, 2267.0, 1480.0, 944.0, 648.0, 478.0, 348.0, 244.0, 180.0, 136.0, 99.0, 53.0, 39.0, 30.0, 34.0, 22.0, 21.0, 11.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00337982177734375, -0.0032730698585510254, -0.0031663179397583008, -0.003059566020965576, -0.0029528141021728516, -0.002846062183380127, -0.0027393102645874023, -0.0026325583457946777, -0.002525806427001953, -0.0024190545082092285, -0.002312302589416504, -0.0022055506706237793, -0.0020987987518310547, -0.00199204683303833, -0.0018852949142456055, -0.0017785429954528809, -0.0016717910766601562, -0.0015650391578674316, -0.001458287239074707, -0.0013515353202819824, -0.0012447834014892578, -0.0011380314826965332, -0.0010312795639038086, -0.000924527645111084, -0.0008177757263183594, -0.0007110238075256348, -0.0006042718887329102, -0.0004975199699401855, -0.00039076805114746094, -0.00028401613235473633, -0.00017726421356201172, -7.051229476928711e-05, 3.62396240234375e-05, 0.0001429915428161621, 0.0002497434616088867, 0.00035649538040161133, 0.00046324729919433594, 0.0005699992179870605, 0.0006767511367797852, 0.0007835030555725098, 0.0008902549743652344, 0.000997006893157959, 0.0011037588119506836, 0.0012105107307434082, 0.0013172626495361328, 0.0014240145683288574, 0.001530766487121582, 0.0016375184059143066, 0.0017442703247070312, 0.0018510222434997559, 0.0019577741622924805, 0.002064526081085205, 0.0021712779998779297, 0.0022780299186706543, 0.002384781837463379, 0.0024915337562561035, 0.002598285675048828, 0.0027050375938415527, 0.0028117895126342773, 0.002918541431427002, 0.0030252933502197266, 0.003132045269012451, 0.0032387971878051758, 0.0033455491065979004, 0.003452301025390625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 5.0, 7.0, 6.0, 21.0, 18.0, 16.0, 20.0, 23.0, 26.0, 25.0, 41.0, 57.0, 43.0, 42.0, 74.0, 92.0, 75.0, 68.0, 50.0, 36.0, 30.0, 37.0, 29.0, 26.0, 16.0, 20.0, 18.0, 14.0, 6.0, 10.0, 7.0, 7.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.9252300262451172e-05, -1.8700025975704193e-05, -1.8147751688957214e-05, -1.7595477402210236e-05, -1.7043203115463257e-05, -1.6490928828716278e-05, -1.59386545419693e-05, -1.538638025522232e-05, -1.4834105968475342e-05, -1.4281831681728363e-05, -1.3729557394981384e-05, -1.3177283108234406e-05, -1.2625008821487427e-05, -1.2072734534740448e-05, -1.152046024799347e-05, -1.096818596124649e-05, -1.0415911674499512e-05, -9.863637387752533e-06, -9.311363101005554e-06, -8.759088814258575e-06, -8.206814527511597e-06, -7.654540240764618e-06, -7.102265954017639e-06, -6.54999166727066e-06, -5.997717380523682e-06, -5.445443093776703e-06, -4.893168807029724e-06, -4.340894520282745e-06, -3.7886202335357666e-06, -3.236345946788788e-06, -2.684071660041809e-06, -2.1317973732948303e-06, -1.5795230865478516e-06, -1.0272487998008728e-06, -4.7497451305389404e-07, 7.729977369308472e-08, 6.295740604400635e-07, 1.1818483471870422e-06, 1.734122633934021e-06, 2.2863969206809998e-06, 2.8386712074279785e-06, 3.3909454941749573e-06, 3.943219780921936e-06, 4.495494067668915e-06, 5.0477683544158936e-06, 5.600042641162872e-06, 6.152316927909851e-06, 6.70459121465683e-06, 7.256865501403809e-06, 7.809139788150787e-06, 8.361414074897766e-06, 8.913688361644745e-06, 9.465962648391724e-06, 1.0018236935138702e-05, 1.0570511221885681e-05, 1.112278550863266e-05, 1.1675059795379639e-05, 1.2227334082126617e-05, 1.2779608368873596e-05, 1.3331882655620575e-05, 1.3884156942367554e-05, 1.4436431229114532e-05, 1.4988705515861511e-05, 1.554097980260849e-05, 1.609325408935547e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 5.0, 5.0, 3.0, 1.0, 4.0, 16.0, 22.0, 25.0, 34.0, 44.0, 64.0, 83.0, 139.0, 225.0, 278.0, 362.0, 592.0, 906.0, 1586.0, 2575.0, 4632.0, 8603.0, 17277.0, 37264.0, 94181.0, 308150.0, 373276.0, 113608.0, 43280.0, 19372.0, 9448.0, 4998.0, 2771.0, 1665.0, 1046.0, 650.0, 404.0, 284.0, 186.0, 152.0, 86.0, 80.0, 42.0, 25.0, 39.0, 21.0, 20.0, 11.0, 6.0, 11.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0016336441040039062, -0.0015810877084732056, -0.0015285313129425049, -0.0014759749174118042, -0.0014234185218811035, -0.0013708621263504028, -0.0013183057308197021, -0.0012657493352890015, -0.0012131929397583008, -0.0011606365442276, -0.0011080801486968994, -0.0010555237531661987, -0.001002967357635498, -0.0009504109621047974, -0.0008978545665740967, -0.000845298171043396, -0.0007927417755126953, -0.0007401853799819946, -0.0006876289844512939, -0.0006350725889205933, -0.0005825161933898926, -0.0005299597978591919, -0.0004774034023284912, -0.00042484700679779053, -0.00037229061126708984, -0.00031973421573638916, -0.0002671778202056885, -0.0002146214246749878, -0.0001620650291442871, -0.00010950863361358643, -5.695223808288574e-05, -4.395842552185059e-06, 4.8160552978515625e-05, 0.00010071694850921631, 0.000153273344039917, 0.00020582973957061768, 0.00025838613510131836, 0.00031094253063201904, 0.0003634989261627197, 0.0004160553216934204, 0.0004686117172241211, 0.0005211681127548218, 0.0005737245082855225, 0.0006262809038162231, 0.0006788372993469238, 0.0007313936948776245, 0.0007839500904083252, 0.0008365064859390259, 0.0008890628814697266, 0.0009416192770004272, 0.000994175672531128, 0.0010467320680618286, 0.0010992884635925293, 0.00115184485912323, 0.0012044012546539307, 0.0012569576501846313, 0.001309514045715332, 0.0013620704412460327, 0.0014146268367767334, 0.001467183232307434, 0.0015197396278381348, 0.0015722960233688354, 0.0016248524188995361, 0.0016774088144302368, 0.0017299652099609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 3.0, 11.0, 9.0, 9.0, 16.0, 21.0, 19.0, 27.0, 24.0, 42.0, 29.0, 41.0, 44.0, 48.0, 54.0, 44.0, 64.0, 47.0, 56.0, 52.0, 52.0, 42.0, 38.0, 33.0, 34.0, 26.0, 23.0, 16.0, 15.0, 18.0, 3.0, 6.0, 10.0, 3.0, 8.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003590583801269531, -0.0003480352461338043, -0.0003370121121406555, -0.0003259889781475067, -0.0003149658441543579, -0.0003039427101612091, -0.0002929195761680603, -0.0002818964421749115, -0.0002708733081817627, -0.0002598501741886139, -0.0002488270401954651, -0.00023780390620231628, -0.00022678077220916748, -0.00021575763821601868, -0.00020473450422286987, -0.00019371137022972107, -0.00018268823623657227, -0.00017166510224342346, -0.00016064196825027466, -0.00014961883425712585, -0.00013859570026397705, -0.00012757256627082825, -0.00011654943227767944, -0.00010552629828453064, -9.450316429138184e-05, -8.348003029823303e-05, -7.245689630508423e-05, -6.143376231193542e-05, -5.041062831878662e-05, -3.938749432563782e-05, -2.8364360332489014e-05, -1.734122633934021e-05, -6.318092346191406e-06, 4.7050416469573975e-06, 1.57281756401062e-05, 2.6751309633255005e-05, 3.777444362640381e-05, 4.879757761955261e-05, 5.9820711612701416e-05, 7.084384560585022e-05, 8.186697959899902e-05, 9.289011359214783e-05, 0.00010391324758529663, 0.00011493638157844543, 0.00012595951557159424, 0.00013698264956474304, 0.00014800578355789185, 0.00015902891755104065, 0.00017005205154418945, 0.00018107518553733826, 0.00019209831953048706, 0.00020312145352363586, 0.00021414458751678467, 0.00022516772150993347, 0.00023619085550308228, 0.0002472139894962311, 0.0002582371234893799, 0.0002692602574825287, 0.0002802833914756775, 0.0002913065254688263, 0.0003023296594619751, 0.0003133527934551239, 0.0003243759274482727, 0.0003353990614414215, 0.0003464221954345703]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 8.0, 10.0, 15.0, 15.0, 18.0, 19.0, 29.0, 44.0, 61.0, 74.0, 98.0, 128.0, 125.0, 83.0, 67.0, 55.0, 34.0, 18.0, 15.0, 20.0, 14.0, 6.0, 16.0, 8.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.007771916221827269, -0.007542204111814499, -0.007312492001801729, -0.0070827798917889595, -0.0068530673161149025, -0.006623355206102133, -0.006393643096089363, -0.006163930986076593, -0.005934218876063824, -0.005704506766051054, -0.005474794656038284, -0.005245082080364227, -0.005015369970351458, -0.004785657860338688, -0.004555945750325918, -0.0043262336403131485, -0.0040965210646390915, -0.003866808954626322, -0.0036370966117829084, -0.0034073845017701387, -0.0031776721589267254, -0.0029479600489139557, -0.002718247938901186, -0.0024885358288884163, -0.002258823486045003, -0.0020291113760322332, -0.0017993990331888199, -0.0015696869231760502, -0.0013399746967479587, -0.0011102624703198671, -0.0008805503603070974, -0.0006508381338790059, -0.0004211263731122017, -0.00019141417578794062, 3.829802153632045e-05, 0.00026801018975675106, 0.0004977224161848426, 0.0007274346426129341, 0.0009571467526257038, 0.0011868589790537953, 0.0014165712054818869, 0.0016462834319099784, 0.00187599565833807, 0.0021057077683508396, 0.0023354198783636093, 0.0025651322212070227, 0.0027948443312197924, 0.0030245566740632057, 0.0032542687840759754, 0.003483980894088745, 0.0037136932369321585, 0.0039434051141142845, 0.0041731176897883415, 0.004402829799801111, 0.004632541909813881, 0.004862254019826651, 0.00509196612983942, 0.00532167823985219, 0.00555139034986496, 0.005781102925539017, 0.006010815035551786, 0.006240527145564556, 0.006470239255577326, 0.0066999513655900955, 0.0069296639412641525]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 3.0, 9.0, 7.0, 7.0, 8.0, 15.0, 17.0, 21.0, 20.0, 16.0, 33.0, 25.0, 38.0, 32.0, 35.0, 40.0, 52.0, 35.0, 47.0, 40.0, 39.0, 51.0, 37.0, 43.0, 47.0, 30.0, 29.0, 33.0, 34.0, 27.0, 16.0, 17.0, 17.0, 23.0, 16.0, 8.0, 10.0, 7.0, 9.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004885593894869089, -0.004740923643112183, -0.004596253391355276, -0.004451583605259657, -0.00430691335350275, -0.004162243101745844, -0.004017572849988937, -0.003872902598232031, -0.003728232579305768, -0.0035835623275488615, -0.0034388923086225986, -0.003294222056865692, -0.0031495518051087856, -0.0030048817861825228, -0.0028602115344256163, -0.0027155415154993534, -0.002570871263742447, -0.0024262010119855404, -0.0022815309930592775, -0.002136860741302371, -0.001992190722376108, -0.0018475204706192017, -0.0017028502188622952, -0.0015581800835207105, -0.0014135099481791258, -0.001268839812837541, -0.0011241696774959564, -0.00097949942573905, -0.0008348292903974652, -0.0006901591550558805, -0.000545488961506635, -0.00040081876795738935, -0.000256149098277092, -0.00011147893383167684, 3.31912306137383e-05, 0.00017786139505915344, 0.0003225315595045686, 0.00046720169484615326, 0.0006118718883953989, 0.0007565420819446445, 0.0009012122172862291, 0.0010458823526278138, 0.0011905524879693985, 0.001335222739726305, 0.0014798928750678897, 0.0016245630104094744, 0.0017692332621663809, 0.0019139033975079656, 0.0020585735328495502, 0.0022032437846064568, 0.0023479138035327196, 0.002492584055289626, 0.002637254074215889, 0.0027819243259727955, 0.002926594577729702, 0.0030712648294866085, 0.0032159348484128714, 0.003360605100169778, 0.0035052751190960407, 0.0036499453708529472, 0.0037946156226098537, 0.00393928587436676, 0.0040839556604623795, 0.004228625912219286, 0.0043732961639761925]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 6.0, 15.0, 15.0, 22.0, 40.0, 74.0, 104.0, 177.0, 234.0, 388.0, 713.0, 1177.0, 2150.0, 4090.0, 7870.0, 15371.0, 31763.0, 69168.0, 164216.0, 342106.0, 230555.0, 94383.0, 41977.0, 20179.0, 10065.0, 5235.0, 2916.0, 1503.0, 855.0, 491.0, 271.0, 151.0, 101.0, 45.0, 36.0, 19.0, 20.0, 16.0, 11.0, 12.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0125885009765625, -0.012235760688781738, -0.011883020401000977, -0.011530280113220215, -0.011177539825439453, -0.010824799537658691, -0.01047205924987793, -0.010119318962097168, -0.009766578674316406, -0.009413838386535645, -0.009061098098754883, -0.008708357810974121, -0.00835561752319336, -0.008002877235412598, -0.007650136947631836, -0.007297396659851074, -0.0069446563720703125, -0.006591916084289551, -0.006239175796508789, -0.005886435508728027, -0.005533695220947266, -0.005180954933166504, -0.004828214645385742, -0.0044754743576049805, -0.004122734069824219, -0.003769993782043457, -0.0034172534942626953, -0.0030645132064819336, -0.002711772918701172, -0.00235903263092041, -0.0020062923431396484, -0.0016535520553588867, -0.001300811767578125, -0.0009480714797973633, -0.0005953311920166016, -0.00024259090423583984, 0.00011014938354492188, 0.0004628896713256836, 0.0008156299591064453, 0.001168370246887207, 0.0015211105346679688, 0.0018738508224487305, 0.002226591110229492, 0.002579331398010254, 0.0029320716857910156, 0.0032848119735717773, 0.003637552261352539, 0.003990292549133301, 0.0043430328369140625, 0.004695773124694824, 0.005048513412475586, 0.005401253700256348, 0.005753993988037109, 0.006106734275817871, 0.006459474563598633, 0.0068122148513793945, 0.007164955139160156, 0.007517695426940918, 0.00787043571472168, 0.008223176002502441, 0.008575916290283203, 0.008928656578063965, 0.009281396865844727, 0.009634137153625488, 0.00998687744140625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 4.0, 3.0, 8.0, 10.0, 9.0, 14.0, 20.0, 13.0, 27.0, 26.0, 19.0, 31.0, 34.0, 39.0, 36.0, 43.0, 56.0, 44.0, 53.0, 44.0, 46.0, 48.0, 45.0, 42.0, 42.0, 34.0, 32.0, 27.0, 35.0, 23.0, 17.0, 19.0, 19.0, 11.0, 8.0, 8.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004383087158203125, -0.004254519939422607, -0.00412595272064209, -0.003997385501861572, -0.0038688182830810547, -0.003740251064300537, -0.0036116838455200195, -0.003483116626739502, -0.0033545494079589844, -0.003225982189178467, -0.0030974149703979492, -0.0029688477516174316, -0.002840280532836914, -0.0027117133140563965, -0.002583146095275879, -0.0024545788764953613, -0.0023260116577148438, -0.002197444438934326, -0.0020688772201538086, -0.001940310001373291, -0.0018117427825927734, -0.0016831755638122559, -0.0015546083450317383, -0.0014260411262512207, -0.0012974739074707031, -0.0011689066886901855, -0.001040339469909668, -0.0009117722511291504, -0.0007832050323486328, -0.0006546378135681152, -0.0005260705947875977, -0.0003975033760070801, -0.0002689361572265625, -0.00014036893844604492, -1.1801719665527344e-05, 0.00011676549911499023, 0.0002453327178955078, 0.0003738999366760254, 0.000502467155456543, 0.0006310343742370605, 0.0007596015930175781, 0.0008881688117980957, 0.0010167360305786133, 0.0011453032493591309, 0.0012738704681396484, 0.001402437686920166, 0.0015310049057006836, 0.0016595721244812012, 0.0017881393432617188, 0.0019167065620422363, 0.002045273780822754, 0.0021738409996032715, 0.002302408218383789, 0.0024309754371643066, 0.0025595426559448242, 0.002688109874725342, 0.0028166770935058594, 0.002945244312286377, 0.0030738115310668945, 0.003202378749847412, 0.0033309459686279297, 0.0034595131874084473, 0.003588080406188965, 0.0037166476249694824, 0.00384521484375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 10.0, 10.0, 11.0, 24.0, 45.0, 56.0, 107.0, 133.0, 176.0, 290.0, 415.0, 659.0, 1159.0, 1748.0, 2644.0, 4027.0, 6168.0, 9040.0, 14048.0, 22013.0, 34977.0, 58530.0, 98610.0, 165503.0, 223401.0, 159672.0, 94838.0, 55715.0, 33806.0, 21036.0, 13530.0, 8934.0, 6009.0, 3856.0, 2565.0, 1770.0, 1082.0, 659.0, 444.0, 290.0, 200.0, 109.0, 84.0, 55.0, 38.0, 17.0, 17.0, 8.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.007076263427734375, -0.006870925426483154, -0.006665587425231934, -0.006460249423980713, -0.006254911422729492, -0.0060495734214782715, -0.005844235420227051, -0.00563889741897583, -0.005433559417724609, -0.005228221416473389, -0.005022883415222168, -0.004817545413970947, -0.0046122074127197266, -0.004406869411468506, -0.004201531410217285, -0.0039961934089660645, -0.0037908554077148438, -0.003585517406463623, -0.0033801794052124023, -0.0031748414039611816, -0.002969503402709961, -0.0027641654014587402, -0.0025588274002075195, -0.002353489398956299, -0.002148151397705078, -0.0019428133964538574, -0.0017374753952026367, -0.001532137393951416, -0.0013267993927001953, -0.0011214613914489746, -0.0009161233901977539, -0.0007107853889465332, -0.0005054473876953125, -0.0003001093864440918, -9.47713851928711e-05, 0.00011056661605834961, 0.0003159046173095703, 0.000521242618560791, 0.0007265806198120117, 0.0009319186210632324, 0.0011372566223144531, 0.0013425946235656738, 0.0015479326248168945, 0.0017532706260681152, 0.001958608627319336, 0.0021639466285705566, 0.0023692846298217773, 0.002574622631072998, 0.0027799606323242188, 0.0029852986335754395, 0.00319063663482666, 0.003395974636077881, 0.0036013126373291016, 0.0038066506385803223, 0.004011988639831543, 0.004217326641082764, 0.004422664642333984, 0.004628002643585205, 0.004833340644836426, 0.0050386786460876465, 0.005244016647338867, 0.005449354648590088, 0.005654692649841309, 0.005860030651092529, 0.00606536865234375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 6.0, 10.0, 9.0, 10.0, 26.0, 17.0, 23.0, 24.0, 16.0, 34.0, 36.0, 36.0, 31.0, 45.0, 29.0, 37.0, 46.0, 34.0, 45.0, 46.0, 35.0, 44.0, 42.0, 39.0, 33.0, 43.0, 23.0, 20.0, 24.0, 24.0, 23.0, 15.0, 16.0, 11.0, 10.0, 10.0, 4.0, 7.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0022525787353515625, -0.0021780431270599365, -0.0021035075187683105, -0.0020289719104766846, -0.0019544363021850586, -0.0018799006938934326, -0.0018053650856018066, -0.0017308294773101807, -0.0016562938690185547, -0.0015817582607269287, -0.0015072226524353027, -0.0014326870441436768, -0.0013581514358520508, -0.0012836158275604248, -0.0012090802192687988, -0.0011345446109771729, -0.0010600090026855469, -0.000985473394393921, -0.0009109377861022949, -0.0008364021778106689, -0.000761866569519043, -0.000687330961227417, -0.000612795352935791, -0.000538259744644165, -0.00046372413635253906, -0.0003891885280609131, -0.0003146529197692871, -0.00024011731147766113, -0.00016558170318603516, -9.104609489440918e-05, -1.6510486602783203e-05, 5.8025121688842773e-05, 0.00013256072998046875, 0.00020709633827209473, 0.0002816319465637207, 0.0003561675548553467, 0.00043070316314697266, 0.0005052387714385986, 0.0005797743797302246, 0.0006543099880218506, 0.0007288455963134766, 0.0008033812046051025, 0.0008779168128967285, 0.0009524524211883545, 0.0010269880294799805, 0.0011015236377716064, 0.0011760592460632324, 0.0012505948543548584, 0.0013251304626464844, 0.0013996660709381104, 0.0014742016792297363, 0.0015487372875213623, 0.0016232728958129883, 0.0016978085041046143, 0.0017723441123962402, 0.0018468797206878662, 0.0019214153289794922, 0.001995950937271118, 0.002070486545562744, 0.00214502215385437, 0.002219557762145996, 0.002294093370437622, 0.002368628978729248, 0.002443164587020874, 0.0025177001953125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 6.0, 8.0, 11.0, 16.0, 21.0, 31.0, 38.0, 59.0, 71.0, 121.0, 136.0, 209.0, 271.0, 373.0, 566.0, 742.0, 1175.0, 1831.0, 2962.0, 5142.0, 9349.0, 19373.0, 59916.0, 852997.0, 52792.0, 18138.0, 8990.0, 4816.0, 2849.0, 1785.0, 1165.0, 740.0, 544.0, 352.0, 259.0, 192.0, 120.0, 102.0, 80.0, 58.0, 40.0, 36.0, 20.0, 17.0, 11.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0009598731994628906, -0.0009293630719184875, -0.0008988529443740845, -0.0008683428168296814, -0.0008378326892852783, -0.0008073225617408752, -0.0007768124341964722, -0.0007463023066520691, -0.000715792179107666, -0.0006852820515632629, -0.0006547719240188599, -0.0006242617964744568, -0.0005937516689300537, -0.0005632415413856506, -0.0005327314138412476, -0.0005022212862968445, -0.0004717111587524414, -0.00044120103120803833, -0.00041069090366363525, -0.0003801807761192322, -0.0003496706485748291, -0.000319160521030426, -0.00028865039348602295, -0.0002581402659416199, -0.0002276301383972168, -0.00019712001085281372, -0.00016660988330841064, -0.00013609975576400757, -0.00010558962821960449, -7.507950067520142e-05, -4.456937313079834e-05, -1.4059245586395264e-05, 1.6450881958007812e-05, 4.696100950241089e-05, 7.747113704681396e-05, 0.00010798126459121704, 0.00013849139213562012, 0.0001690015196800232, 0.00019951164722442627, 0.00023002177476882935, 0.0002605319023132324, 0.0002910420298576355, 0.0003215521574020386, 0.00035206228494644165, 0.0003825724124908447, 0.0004130825400352478, 0.0004435926675796509, 0.00047410279512405396, 0.000504612922668457, 0.0005351230502128601, 0.0005656331777572632, 0.0005961433053016663, 0.0006266534328460693, 0.0006571635603904724, 0.0006876736879348755, 0.0007181838154792786, 0.0007486939430236816, 0.0007792040705680847, 0.0008097141981124878, 0.0008402243256568909, 0.0008707344532012939, 0.000901244580745697, 0.0009317547082901001, 0.0009622648358345032, 0.0009927749633789062]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 7.0, 9.0, 7.0, 21.0, 15.0, 40.0, 68.0, 64.0, 85.0, 136.0, 121.0, 95.0, 83.0, 76.0, 42.0, 32.0, 26.0, 12.0, 11.0, 10.0, 2.0, 4.0, 3.0, 6.0, 1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.781650543212891e-06, -5.584210157394409e-06, -5.386769771575928e-06, -5.189329385757446e-06, -4.991888999938965e-06, -4.794448614120483e-06, -4.597008228302002e-06, -4.3995678424835205e-06, -4.202127456665039e-06, -4.004687070846558e-06, -3.807246685028076e-06, -3.6098062992095947e-06, -3.4123659133911133e-06, -3.214925527572632e-06, -3.0174851417541504e-06, -2.820044755935669e-06, -2.6226043701171875e-06, -2.425163984298706e-06, -2.2277235984802246e-06, -2.030283212661743e-06, -1.8328428268432617e-06, -1.6354024410247803e-06, -1.4379620552062988e-06, -1.2405216693878174e-06, -1.043081283569336e-06, -8.456408977508545e-07, -6.48200511932373e-07, -4.507601261138916e-07, -2.5331974029541016e-07, -5.587935447692871e-08, 1.4156103134155273e-07, 3.390014171600342e-07, 5.364418029785156e-07, 7.338821887969971e-07, 9.313225746154785e-07, 1.12876296043396e-06, 1.3262033462524414e-06, 1.5236437320709229e-06, 1.7210841178894043e-06, 1.9185245037078857e-06, 2.115964889526367e-06, 2.3134052753448486e-06, 2.51084566116333e-06, 2.7082860469818115e-06, 2.905726432800293e-06, 3.1031668186187744e-06, 3.300607204437256e-06, 3.4980475902557373e-06, 3.6954879760742188e-06, 3.8929283618927e-06, 4.090368747711182e-06, 4.287809133529663e-06, 4.4852495193481445e-06, 4.682689905166626e-06, 4.880130290985107e-06, 5.077570676803589e-06, 5.27501106262207e-06, 5.472451448440552e-06, 5.669891834259033e-06, 5.867332220077515e-06, 6.064772605895996e-06, 6.2622129917144775e-06, 6.459653377532959e-06, 6.6570937633514404e-06, 6.854534149169922e-06]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 6.0, 15.0, 32.0, 34.0, 44.0, 71.0, 94.0, 129.0, 230.0, 313.0, 451.0, 694.0, 1183.0, 1893.0, 3134.0, 5652.0, 10035.0, 20344.0, 53243.0, 843529.0, 60436.0, 21924.0, 10645.0, 5760.0, 3204.0, 1997.0, 1212.0, 721.0, 477.0, 337.0, 211.0, 158.0, 115.0, 64.0, 55.0, 29.0, 17.0, 12.0, 21.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000949859619140625, -0.0009187608957290649, -0.0008876621723175049, -0.0008565634489059448, -0.0008254647254943848, -0.0007943660020828247, -0.0007632672786712646, -0.0007321685552597046, -0.0007010698318481445, -0.0006699711084365845, -0.0006388723850250244, -0.0006077736616134644, -0.0005766749382019043, -0.0005455762147903442, -0.0005144774913787842, -0.0004833787679672241, -0.00045228004455566406, -0.000421181321144104, -0.00039008259773254395, -0.0003589838743209839, -0.00032788515090942383, -0.00029678642749786377, -0.0002656877040863037, -0.00023458898067474365, -0.0002034902572631836, -0.00017239153385162354, -0.00014129281044006348, -0.00011019408702850342, -7.909536361694336e-05, -4.79966402053833e-05, -1.6897916793823242e-05, 1.4200806617736816e-05, 4.5299530029296875e-05, 7.639825344085693e-05, 0.00010749697685241699, 0.00013859570026397705, 0.0001696944236755371, 0.00020079314708709717, 0.00023189187049865723, 0.0002629905939102173, 0.00029408931732177734, 0.0003251880407333374, 0.00035628676414489746, 0.0003873854875564575, 0.0004184842109680176, 0.00044958293437957764, 0.0004806816577911377, 0.0005117803812026978, 0.0005428791046142578, 0.0005739778280258179, 0.0006050765514373779, 0.000636175274848938, 0.000667273998260498, 0.0006983727216720581, 0.0007294714450836182, 0.0007605701684951782, 0.0007916688919067383, 0.0008227676153182983, 0.0008538663387298584, 0.0008849650621414185, 0.0009160637855529785, 0.0009471625089645386, 0.0009782612323760986, 0.0010093599557876587, 0.0010404586791992188]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 4.0, 4.0, 10.0, 5.0, 6.0, 8.0, 5.0, 13.0, 13.0, 15.0, 16.0, 24.0, 199.0, 480.0, 63.0, 19.0, 21.0, 9.0, 10.0, 14.0, 11.0, 9.0, 4.0, 7.0, 11.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00025844573974609375, -0.000251108780503273, -0.00024377182126045227, -0.00023643486201763153, -0.0002290979027748108, -0.00022176094353199005, -0.0002144239842891693, -0.00020708702504634857, -0.00019975006580352783, -0.0001924131065607071, -0.00018507614731788635, -0.0001777391880750656, -0.00017040222883224487, -0.00016306526958942413, -0.0001557283103466034, -0.00014839135110378265, -0.00014105439186096191, -0.00013371743261814117, -0.00012638047337532043, -0.0001190435141324997, -0.00011170655488967896, -0.00010436959564685822, -9.703263640403748e-05, -8.969567716121674e-05, -8.2358717918396e-05, -7.502175867557526e-05, -6.768479943275452e-05, -6.034784018993378e-05, -5.301088094711304e-05, -4.56739217042923e-05, -3.833696246147156e-05, -3.100000321865082e-05, -2.3663043975830078e-05, -1.632608473300934e-05, -8.989125490188599e-06, -1.6521662473678589e-06, 5.684792995452881e-06, 1.302175223827362e-05, 2.035871148109436e-05, 2.76956707239151e-05, 3.503262996673584e-05, 4.236958920955658e-05, 4.970654845237732e-05, 5.704350769519806e-05, 6.43804669380188e-05, 7.171742618083954e-05, 7.905438542366028e-05, 8.639134466648102e-05, 9.372830390930176e-05, 0.0001010652631521225, 0.00010840222239494324, 0.00011573918163776398, 0.00012307614088058472, 0.00013041310012340546, 0.0001377500593662262, 0.00014508701860904694, 0.00015242397785186768, 0.00015976093709468842, 0.00016709789633750916, 0.0001744348555803299, 0.00018177181482315063, 0.00018910877406597137, 0.00019644573330879211, 0.00020378269255161285, 0.0002111196517944336]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 9.0, 8.0, 18.0, 18.0, 21.0, 28.0, 50.0, 49.0, 75.0, 84.0, 121.0, 118.0, 100.0, 80.0, 47.0, 24.0, 32.0, 29.0, 18.0, 17.0, 12.0, 10.0, 6.0, 2.0, 6.0, 2.0, 4.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005534959491342306, -0.005338046699762344, -0.005141133908182383, -0.004944221116602421, -0.004747308790683746, -0.0045503959991037846, -0.004353483207523823, -0.004156570415943861, -0.003959657624363899, -0.0037627448327839375, -0.0035658322740346193, -0.0033689194824546576, -0.0031720069237053394, -0.0029750941321253777, -0.002778181340545416, -0.002581268548965454, -0.0023843562230467796, -0.002187443431466818, -0.0019905308727174997, -0.001793618081137538, -0.001596705405972898, -0.001399792730808258, -0.0012028799392282963, -0.0010059672640636563, -0.0008090545888990164, -0.0006121419137343764, -0.00041522918036207557, -0.0002183164469897747, -2.1403771825134754e-05, 0.0001755089033395052, 0.00037242169491946697, 0.0005693343700841069, 0.0007662470452487469, 0.0009631597204133868, 0.0011600723955780268, 0.0013569851871579885, 0.0015538978623226285, 0.0017508105374872684, 0.0019477233290672302, 0.002144636120647192, 0.00234154867939651, 0.002538461470976472, 0.00273537402972579, 0.002932286821305752, 0.0031291996128857136, 0.0033261121716350317, 0.0035230249632149935, 0.0037199375219643116, 0.003916850313544273, 0.004113763105124235, 0.004310675896704197, 0.004507588222622871, 0.004704501014202833, 0.004901413805782795, 0.005098326597362757, 0.0052952393889427185, 0.005492151714861393, 0.005689064506441355, 0.0058859772980213165, 0.006082889623939991, 0.006279802415519953, 0.0064767152070999146, 0.006673627998679876, 0.006870540790259838, 0.0070674535818398]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 3.0, 7.0, 8.0, 11.0, 11.0, 20.0, 16.0, 13.0, 12.0, 20.0, 14.0, 24.0, 27.0, 30.0, 29.0, 33.0, 27.0, 30.0, 35.0, 46.0, 45.0, 44.0, 39.0, 47.0, 30.0, 36.0, 24.0, 35.0, 30.0, 29.0, 32.0, 24.0, 23.0, 19.0, 19.0, 22.0, 19.0, 17.0, 11.0, 7.0, 8.0, 9.0, 5.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00321229943074286, -0.0031003376934677362, -0.002988375723361969, -0.0028764139860868454, -0.002764452248811722, -0.002652490511536598, -0.002540528541430831, -0.0024285668041557074, -0.00231660483404994, -0.0022046430967748165, -0.0020926811266690493, -0.0019807193893939257, -0.001868757652118802, -0.0017567957984283566, -0.0016448339447379112, -0.0015328722074627876, -0.001420910470187664, -0.0013089486164972186, -0.001196986879222095, -0.0010850250255316496, -0.0009730632300488651, -0.0008611014345660806, -0.0007491395808756351, -0.0006371777853928506, -0.0005252159899100661, -0.0004132541944272816, -0.00030129236984066665, -0.00018933054525405169, -7.736874977126718e-05, 3.4593045711517334e-05, 0.00014655489940196276, 0.00025851669488474727, 0.00037047872319817543, 0.00048244051868095994, 0.0005944023141637444, 0.0007063641678541899, 0.0008183259633369744, 0.0009302877588197589, 0.0010422496125102043, 0.001154211349785328, 0.0012661732034757733, 0.0013781350571662188, 0.0014900967944413424, 0.0016020586481317878, 0.0017140205018222332, 0.0018259822390973568, 0.0019379440927878022, 0.0020499059464782476, 0.0021618676837533712, 0.002273829421028495, 0.002385791391134262, 0.0024977531284093857, 0.0026097148656845093, 0.002721676602959633, 0.0028336385730654, 0.0029456003103405237, 0.003057562280446291, 0.0031695240177214146, 0.003281485987827182, 0.0033934477251023054, 0.003505409462377429, 0.0036173714324831963, 0.00372933316975832, 0.0038412949070334435, 0.003953256644308567]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 8.0, 9.0, 11.0, 15.0, 33.0, 50.0, 74.0, 98.0, 143.0, 192.0, 290.0, 448.0, 631.0, 883.0, 1300.0, 1836.0, 2932.0, 4253.0, 6413.0, 10014.0, 15349.0, 24449.0, 40664.0, 70239.0, 129311.0, 266951.0, 704612.0, 1510322.0, 774910.0, 295217.0, 142399.0, 76904.0, 43432.0, 25694.0, 15826.0, 9807.0, 6371.0, 4129.0, 2690.0, 1795.0, 1250.0, 763.0, 517.0, 364.0, 215.0, 157.0, 107.0, 69.0, 42.0, 34.0, 19.0, 12.0, 12.0, 9.0, 4.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.004138946533203125, -0.003998875617980957, -0.003858804702758789, -0.003718733787536621, -0.003578662872314453, -0.003438591957092285, -0.003298521041870117, -0.0031584501266479492, -0.0030183792114257812, -0.0028783082962036133, -0.0027382373809814453, -0.0025981664657592773, -0.0024580955505371094, -0.0023180246353149414, -0.0021779537200927734, -0.0020378828048706055, -0.0018978118896484375, -0.0017577409744262695, -0.0016176700592041016, -0.0014775991439819336, -0.0013375282287597656, -0.0011974573135375977, -0.0010573863983154297, -0.0009173154830932617, -0.0007772445678710938, -0.0006371736526489258, -0.0004971027374267578, -0.00035703182220458984, -0.00021696090698242188, -7.68899917602539e-05, 6.318092346191406e-05, 0.00020325183868408203, 0.00034332275390625, 0.00048339366912841797, 0.0006234645843505859, 0.0007635354995727539, 0.0009036064147949219, 0.0010436773300170898, 0.0011837482452392578, 0.0013238191604614258, 0.0014638900756835938, 0.0016039609909057617, 0.0017440319061279297, 0.0018841028213500977, 0.0020241737365722656, 0.0021642446517944336, 0.0023043155670166016, 0.0024443864822387695, 0.0025844573974609375, 0.0027245283126831055, 0.0028645992279052734, 0.0030046701431274414, 0.0031447410583496094, 0.0032848119735717773, 0.0034248828887939453, 0.0035649538040161133, 0.0037050247192382812, 0.0038450956344604492, 0.003985166549682617, 0.004125237464904785, 0.004265308380126953, 0.004405379295349121, 0.004545450210571289, 0.004685521125793457, 0.004825592041015625]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 1.0, 2.0, 6.0, 6.0, 6.0, 10.0, 14.0, 16.0, 11.0, 11.0, 13.0, 17.0, 10.0, 23.0, 21.0, 19.0, 30.0, 30.0, 36.0, 32.0, 31.0, 35.0, 27.0, 48.0, 36.0, 47.0, 43.0, 34.0, 33.0, 30.0, 29.0, 28.0, 33.0, 29.0, 33.0, 21.0, 18.0, 11.0, 13.0, 21.0, 17.0, 14.0, 12.0, 9.0, 6.0, 11.0, 6.0, 5.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002124786376953125, -0.0020564496517181396, -0.0019881129264831543, -0.001919776201248169, -0.0018514394760131836, -0.0017831027507781982, -0.0017147660255432129, -0.0016464293003082275, -0.0015780925750732422, -0.0015097558498382568, -0.0014414191246032715, -0.0013730823993682861, -0.0013047456741333008, -0.0012364089488983154, -0.00116807222366333, -0.0010997354984283447, -0.0010313987731933594, -0.000963062047958374, -0.0008947253227233887, -0.0008263885974884033, -0.000758051872253418, -0.0006897151470184326, -0.0006213784217834473, -0.0005530416965484619, -0.00048470497131347656, -0.0004163682460784912, -0.00034803152084350586, -0.0002796947956085205, -0.00021135807037353516, -0.0001430213451385498, -7.468461990356445e-05, -6.3478946685791016e-06, 6.198883056640625e-05, 0.0001303255558013916, 0.00019866228103637695, 0.0002669990062713623, 0.00033533573150634766, 0.000403672456741333, 0.00047200918197631836, 0.0005403459072113037, 0.0006086826324462891, 0.0006770193576812744, 0.0007453560829162598, 0.0008136928081512451, 0.0008820295333862305, 0.0009503662586212158, 0.0010187029838562012, 0.0010870397090911865, 0.0011553764343261719, 0.0012237131595611572, 0.0012920498847961426, 0.001360386610031128, 0.0014287233352661133, 0.0014970600605010986, 0.001565396785736084, 0.0016337335109710693, 0.0017020702362060547, 0.00177040696144104, 0.0018387436866760254, 0.0019070804119110107, 0.001975417137145996, 0.0020437538623809814, 0.002112090587615967, 0.002180427312850952, 0.0022487640380859375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 9.0, 8.0, 12.0, 8.0, 19.0, 27.0, 43.0, 52.0, 58.0, 84.0, 126.0, 221.0, 305.0, 438.0, 658.0, 959.0, 1442.0, 2186.0, 3430.0, 5410.0, 8683.0, 14680.0, 24608.0, 43081.0, 77906.0, 147070.0, 296448.0, 678876.0, 1389109.0, 793754.0, 337002.0, 164463.0, 86042.0, 47934.0, 27228.0, 15900.0, 9305.0, 5914.0, 3750.0, 2333.0, 1503.0, 1051.0, 668.0, 469.0, 307.0, 226.0, 142.0, 88.0, 76.0, 51.0, 45.0, 25.0, 22.0, 13.0, 9.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0], "bins": [-0.004055023193359375, -0.003926634788513184, -0.003798246383666992, -0.0036698579788208008, -0.0035414695739746094, -0.003413081169128418, -0.0032846927642822266, -0.003156304359436035, -0.0030279159545898438, -0.0028995275497436523, -0.002771139144897461, -0.0026427507400512695, -0.002514362335205078, -0.0023859739303588867, -0.0022575855255126953, -0.002129197120666504, -0.0020008087158203125, -0.001872420310974121, -0.0017440319061279297, -0.0016156435012817383, -0.0014872550964355469, -0.0013588666915893555, -0.001230478286743164, -0.0011020898818969727, -0.0009737014770507812, -0.0008453130722045898, -0.0007169246673583984, -0.000588536262512207, -0.0004601478576660156, -0.0003317594528198242, -0.0002033710479736328, -7.49826431274414e-05, 5.340576171875e-05, 0.0001817941665649414, 0.0003101825714111328, 0.0004385709762573242, 0.0005669593811035156, 0.000695347785949707, 0.0008237361907958984, 0.0009521245956420898, 0.0010805130004882812, 0.0012089014053344727, 0.001337289810180664, 0.0014656782150268555, 0.0015940666198730469, 0.0017224550247192383, 0.0018508434295654297, 0.001979231834411621, 0.0021076202392578125, 0.002236008644104004, 0.0023643970489501953, 0.0024927854537963867, 0.002621173858642578, 0.0027495622634887695, 0.002877950668334961, 0.0030063390731811523, 0.0031347274780273438, 0.003263115882873535, 0.0033915042877197266, 0.003519892692565918, 0.0036482810974121094, 0.0037766695022583008, 0.003905057907104492, 0.004033446311950684, 0.004161834716796875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 3.0, 4.0, 5.0, 5.0, 9.0, 18.0, 20.0, 17.0, 22.0, 27.0, 52.0, 34.0, 51.0, 75.0, 86.0, 119.0, 118.0, 147.0, 139.0, 188.0, 232.0, 255.0, 205.0, 248.0, 240.0, 228.0, 231.0, 194.0, 179.0, 161.0, 127.0, 124.0, 93.0, 74.0, 73.0, 71.0, 49.0, 36.0, 30.0, 18.0, 13.0, 12.0, 14.0, 5.0, 3.0, 7.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0012636184692382812, -0.0012249499559402466, -0.001186281442642212, -0.0011476129293441772, -0.0011089444160461426, -0.001070275902748108, -0.0010316073894500732, -0.0009929388761520386, -0.0009542703628540039, -0.0009156018495559692, -0.0008769333362579346, -0.0008382648229598999, -0.0007995963096618652, -0.0007609277963638306, -0.0007222592830657959, -0.0006835907697677612, -0.0006449222564697266, -0.0006062537431716919, -0.0005675852298736572, -0.0005289167165756226, -0.0004902482032775879, -0.0004515796899795532, -0.00041291117668151855, -0.0003742426633834839, -0.0003355741500854492, -0.00029690563678741455, -0.0002582371234893799, -0.00021956861019134521, -0.00018090009689331055, -0.00014223158359527588, -0.00010356307029724121, -6.489455699920654e-05, -2.6226043701171875e-05, 1.2442469596862793e-05, 5.111098289489746e-05, 8.977949619293213e-05, 0.0001284480094909668, 0.00016711652278900146, 0.00020578503608703613, 0.0002444535493850708, 0.00028312206268310547, 0.00032179057598114014, 0.0003604590892791748, 0.00039912760257720947, 0.00043779611587524414, 0.0004764646291732788, 0.0005151331424713135, 0.0005538016557693481, 0.0005924701690673828, 0.0006311386823654175, 0.0006698071956634521, 0.0007084757089614868, 0.0007471442222595215, 0.0007858127355575562, 0.0008244812488555908, 0.0008631497621536255, 0.0009018182754516602, 0.0009404867887496948, 0.0009791553020477295, 0.0010178238153457642, 0.0010564923286437988, 0.0010951608419418335, 0.0011338293552398682, 0.0011724978685379028, 0.0012111663818359375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 9.0, 5.0, 12.0, 10.0, 21.0, 29.0, 40.0, 49.0, 73.0, 122.0, 165.0, 158.0, 116.0, 65.0, 43.0, 33.0, 19.0, 12.0, 11.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005865850951522589, -0.005662374664098024, -0.00545889837667346, -0.005255422554910183, -0.005051946267485619, -0.004848469980061054, -0.00464499369263649, -0.0044415174052119255, -0.0042380415834486485, -0.004034565296024084, -0.0038310892414301634, -0.003627612954005599, -0.0034241368994116783, -0.003220660611987114, -0.0030171843245625496, -0.002813708269968629, -0.0026102319825440645, -0.0024067556951195, -0.0022032796405255795, -0.001999803353101015, -0.0017963272985070944, -0.00159285101108253, -0.0013893748400732875, -0.001185898669064045, -0.0009824224980548024, -0.0007789463270455599, -0.0005754701560363173, -0.0003719939268194139, -0.00016851775581017137, 3.495847340673208e-05, 0.00023843464441597462, 0.00044191081542521715, 0.0006453869864344597, 0.0008488631574437022, 0.0010523393284529448, 0.0012558156158775091, 0.0014592916704714298, 0.0016627679578959942, 0.0018662441289052367, 0.0020697202999144793, 0.0022731963545084, 0.0024766726419329643, 0.002680148696526885, 0.0028836249839514494, 0.00308710103854537, 0.0032905773259699345, 0.003494053613394499, 0.0036975296679884195, 0.003901005955412984, 0.004104482010006905, 0.004307958297431469, 0.004511434584856033, 0.004714910872280598, 0.004918387159705162, 0.005121862981468439, 0.0053253392688930035, 0.005528815556317568, 0.005732291843742132, 0.0059357681311666965, 0.006139243952929974, 0.006342720240354538, 0.006546196527779102, 0.006749672815203667, 0.006953149102628231, 0.007156624924391508]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 6.0, 1.0, 4.0, 10.0, 8.0, 13.0, 11.0, 18.0, 16.0, 16.0, 16.0, 17.0, 19.0, 15.0, 33.0, 31.0, 27.0, 33.0, 40.0, 38.0, 39.0, 42.0, 61.0, 42.0, 37.0, 32.0, 44.0, 37.0, 37.0, 32.0, 34.0, 29.0, 30.0, 23.0, 24.0, 20.0, 13.0, 10.0, 12.0, 11.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025942407082766294, -0.0025094933807849884, -0.0024247460532933474, -0.0023399987258017063, -0.0022552513983100653, -0.0021705040708184242, -0.002085756743326783, -0.002001009415835142, -0.001916262088343501, -0.00183151476085186, -0.001746767433360219, -0.001662020105868578, -0.001577272778376937, -0.0014925254508852959, -0.0014077781233936548, -0.0013230307959020138, -0.0012382834684103727, -0.0011535361409187317, -0.0010687888134270906, -0.0009840414859354496, -0.0008992941584438086, -0.0008145468309521675, -0.0007297995034605265, -0.0006450521759688854, -0.0005603048484772444, -0.00047555752098560333, -0.0003908101934939623, -0.00030606286600232124, -0.0002213155385106802, -0.00013656821101903915, -5.182088352739811e-05, 3.2926443964242935e-05, 0.00011767353862524033, 0.00020242086611688137, 0.0002871681936085224, 0.00037191552110016346, 0.0004566628485918045, 0.0005414101760834455, 0.0006261575035750866, 0.0007109048310667276, 0.0007956521585583687, 0.0008803994860500097, 0.0009651468135416508, 0.0010498941410332918, 0.0011346414685249329, 0.001219388796016574, 0.001304136123508215, 0.001388883450999856, 0.001473630778491497, 0.001558378105983138, 0.0016431254334747791, 0.0017278727609664202, 0.0018126200884580612, 0.0018973674159497023, 0.0019821147434413433, 0.0020668620709329844, 0.0021516093984246254, 0.0022363567259162664, 0.0023211040534079075, 0.0024058513808995485, 0.0024905987083911896, 0.0025753460358828306, 0.0026600933633744717, 0.0027448406908661127, 0.0028295880183577538]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 10.0, 18.0, 30.0, 70.0, 79.0, 124.0, 226.0, 371.0, 609.0, 949.0, 1677.0, 2916.0, 5060.0, 8876.0, 16217.0, 29885.0, 55315.0, 108634.0, 230467.0, 287692.0, 144141.0, 71033.0, 37634.0, 20189.0, 11068.0, 6270.0, 3623.0, 2114.0, 1298.0, 744.0, 448.0, 293.0, 170.0, 84.0, 79.0, 51.0, 33.0, 19.0, 12.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00579071044921875, -0.005616247653961182, -0.005441784858703613, -0.005267322063446045, -0.0050928592681884766, -0.004918396472930908, -0.00474393367767334, -0.0045694708824157715, -0.004395008087158203, -0.004220545291900635, -0.004046082496643066, -0.003871619701385498, -0.0036971569061279297, -0.0035226941108703613, -0.003348231315612793, -0.0031737685203552246, -0.0029993057250976562, -0.002824842929840088, -0.0026503801345825195, -0.002475917339324951, -0.002301454544067383, -0.0021269917488098145, -0.001952528953552246, -0.0017780661582946777, -0.0016036033630371094, -0.001429140567779541, -0.0012546777725219727, -0.0010802149772644043, -0.0009057521820068359, -0.0007312893867492676, -0.0005568265914916992, -0.00038236379623413086, -0.0002079010009765625, -3.343820571899414e-05, 0.00014102458953857422, 0.0003154873847961426, 0.0004899501800537109, 0.0006644129753112793, 0.0008388757705688477, 0.001013338565826416, 0.0011878013610839844, 0.0013622641563415527, 0.001536726951599121, 0.0017111897468566895, 0.0018856525421142578, 0.002060115337371826, 0.0022345781326293945, 0.002409040927886963, 0.0025835037231445312, 0.0027579665184020996, 0.002932429313659668, 0.0031068921089172363, 0.0032813549041748047, 0.003455817699432373, 0.0036302804946899414, 0.0038047432899475098, 0.003979206085205078, 0.0041536688804626465, 0.004328131675720215, 0.004502594470977783, 0.0046770572662353516, 0.00485152006149292, 0.005025982856750488, 0.005200445652008057, 0.005374908447265625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 4.0, 7.0, 2.0, 5.0, 8.0, 11.0, 18.0, 9.0, 14.0, 16.0, 16.0, 20.0, 19.0, 31.0, 33.0, 26.0, 37.0, 33.0, 30.0, 50.0, 34.0, 37.0, 64.0, 47.0, 35.0, 38.0, 45.0, 38.0, 38.0, 36.0, 38.0, 30.0, 23.0, 32.0, 13.0, 15.0, 13.0, 8.0, 14.0, 6.0, 5.0, 5.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00258636474609375, -0.0025066733360290527, -0.0024269819259643555, -0.002347290515899658, -0.002267599105834961, -0.0021879076957702637, -0.0021082162857055664, -0.002028524875640869, -0.0019488334655761719, -0.0018691420555114746, -0.0017894506454467773, -0.00170975923538208, -0.0016300678253173828, -0.0015503764152526855, -0.0014706850051879883, -0.001390993595123291, -0.0013113021850585938, -0.0012316107749938965, -0.0011519193649291992, -0.001072227954864502, -0.0009925365447998047, -0.0009128451347351074, -0.0008331537246704102, -0.0007534623146057129, -0.0006737709045410156, -0.0005940794944763184, -0.0005143880844116211, -0.00043469667434692383, -0.00035500526428222656, -0.0002753138542175293, -0.00019562244415283203, -0.00011593103408813477, -3.62396240234375e-05, 4.3451786041259766e-05, 0.00012314319610595703, 0.0002028346061706543, 0.00028252601623535156, 0.00036221742630004883, 0.0004419088363647461, 0.0005216002464294434, 0.0006012916564941406, 0.0006809830665588379, 0.0007606744766235352, 0.0008403658866882324, 0.0009200572967529297, 0.000999748706817627, 0.0010794401168823242, 0.0011591315269470215, 0.0012388229370117188, 0.001318514347076416, 0.0013982057571411133, 0.0014778971672058105, 0.0015575885772705078, 0.001637279987335205, 0.0017169713973999023, 0.0017966628074645996, 0.0018763542175292969, 0.001956045627593994, 0.0020357370376586914, 0.0021154284477233887, 0.002195119857788086, 0.002274811267852783, 0.0023545026779174805, 0.0024341940879821777, 0.002513885498046875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 9.0, 18.0, 20.0, 30.0, 52.0, 83.0, 165.0, 239.0, 408.0, 671.0, 1223.0, 2199.0, 4364.0, 9044.0, 22729.0, 77282.0, 531563.0, 312133.0, 53596.0, 17353.0, 7257.0, 3549.0, 1919.0, 1064.0, 672.0, 376.0, 211.0, 127.0, 78.0, 46.0, 26.0, 13.0, 7.0, 7.0, 3.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0087127685546875, -0.008388519287109375, -0.00806427001953125, -0.007740020751953125, -0.007415771484375, -0.007091522216796875, -0.00676727294921875, -0.006443023681640625, -0.0061187744140625, -0.005794525146484375, -0.00547027587890625, -0.005146026611328125, -0.00482177734375, -0.004497528076171875, -0.00417327880859375, -0.003849029541015625, -0.0035247802734375, -0.003200531005859375, -0.00287628173828125, -0.002552032470703125, -0.002227783203125, -0.001903533935546875, -0.00157928466796875, -0.001255035400390625, -0.0009307861328125, -0.000606536865234375, -0.00028228759765625, 4.1961669921875e-05, 0.0003662109375, 0.000690460205078125, 0.00101470947265625, 0.001338958740234375, 0.0016632080078125, 0.001987457275390625, 0.00231170654296875, 0.002635955810546875, 0.002960205078125, 0.003284454345703125, 0.00360870361328125, 0.003932952880859375, 0.0042572021484375, 0.004581451416015625, 0.00490570068359375, 0.005229949951171875, 0.00555419921875, 0.005878448486328125, 0.00620269775390625, 0.006526947021484375, 0.0068511962890625, 0.007175445556640625, 0.00749969482421875, 0.007823944091796875, 0.008148193359375, 0.008472442626953125, 0.00879669189453125, 0.009120941162109375, 0.0094451904296875, 0.009769439697265625, 0.01009368896484375, 0.010417938232421875, 0.0107421875, 0.011066436767578125, 0.01139068603515625, 0.011714935302734375, 0.0120391845703125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 3.0, 3.0, 9.0, 9.0, 13.0, 14.0, 18.0, 12.0, 27.0, 19.0, 36.0, 27.0, 38.0, 35.0, 36.0, 49.0, 50.0, 47.0, 41.0, 46.0, 31.0, 44.0, 51.0, 52.0, 31.0, 39.0, 33.0, 40.0, 30.0, 18.0, 15.0, 21.0, 19.0, 12.0, 16.0, 6.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016317367553710938, -0.0015757977962493896, -0.0015198588371276855, -0.0014639198780059814, -0.0014079809188842773, -0.0013520419597625732, -0.0012961030006408691, -0.001240164041519165, -0.001184225082397461, -0.0011282861232757568, -0.0010723471641540527, -0.0010164082050323486, -0.0009604692459106445, -0.0009045302867889404, -0.0008485913276672363, -0.0007926523685455322, -0.0007367134094238281, -0.000680774450302124, -0.0006248354911804199, -0.0005688965320587158, -0.0005129575729370117, -0.0004570186138153076, -0.0004010796546936035, -0.0003451406955718994, -0.0002892017364501953, -0.0002332627773284912, -0.0001773238182067871, -0.00012138485908508301, -6.54458999633789e-05, -9.506940841674805e-06, 4.64320182800293e-05, 0.0001023709774017334, 0.0001583099365234375, 0.0002142488956451416, 0.0002701878547668457, 0.0003261268138885498, 0.0003820657730102539, 0.000438004732131958, 0.0004939436912536621, 0.0005498826503753662, 0.0006058216094970703, 0.0006617605686187744, 0.0007176995277404785, 0.0007736384868621826, 0.0008295774459838867, 0.0008855164051055908, 0.0009414553642272949, 0.000997394323348999, 0.0010533332824707031, 0.0011092722415924072, 0.0011652112007141113, 0.0012211501598358154, 0.0012770891189575195, 0.0013330280780792236, 0.0013889670372009277, 0.0014449059963226318, 0.001500844955444336, 0.00155678391456604, 0.0016127228736877441, 0.0016686618328094482, 0.0017246007919311523, 0.0017805397510528564, 0.0018364787101745605, 0.0018924176692962646, 0.0019483566284179688]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 11.0, 13.0, 15.0, 31.0, 61.0, 65.0, 110.0, 160.0, 286.0, 414.0, 707.0, 1144.0, 1744.0, 3018.0, 5835.0, 13528.0, 41447.0, 231453.0, 629631.0, 79426.0, 21337.0, 8051.0, 4070.0, 2296.0, 1388.0, 848.0, 502.0, 361.0, 204.0, 140.0, 73.0, 57.0, 36.0, 22.0, 22.0, 16.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.0024471282958984375, -0.0023813843727111816, -0.0023156404495239258, -0.00224989652633667, -0.002184152603149414, -0.002118408679962158, -0.0020526647567749023, -0.0019869208335876465, -0.0019211769104003906, -0.0018554329872131348, -0.001789689064025879, -0.001723945140838623, -0.0016582012176513672, -0.0015924572944641113, -0.0015267133712768555, -0.0014609694480895996, -0.0013952255249023438, -0.0013294816017150879, -0.001263737678527832, -0.0011979937553405762, -0.0011322498321533203, -0.0010665059089660645, -0.0010007619857788086, -0.0009350180625915527, -0.0008692741394042969, -0.000803530216217041, -0.0007377862930297852, -0.0006720423698425293, -0.0006062984466552734, -0.0005405545234680176, -0.0004748106002807617, -0.00040906667709350586, -0.00034332275390625, -0.00027757883071899414, -0.00021183490753173828, -0.00014609098434448242, -8.034706115722656e-05, -1.4603137969970703e-05, 5.1140785217285156e-05, 0.00011688470840454102, 0.00018262863159179688, 0.00024837255477905273, 0.0003141164779663086, 0.00037986040115356445, 0.0004456043243408203, 0.0005113482475280762, 0.000577092170715332, 0.0006428360939025879, 0.0007085800170898438, 0.0007743239402770996, 0.0008400678634643555, 0.0009058117866516113, 0.0009715557098388672, 0.001037299633026123, 0.001103043556213379, 0.0011687874794006348, 0.0012345314025878906, 0.0013002753257751465, 0.0013660192489624023, 0.0014317631721496582, 0.001497507095336914, 0.00156325101852417, 0.0016289949417114258, 0.0016947388648986816, 0.0017604827880859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 0.0, 6.0, 7.0, 7.0, 11.0, 12.0, 18.0, 24.0, 37.0, 42.0, 68.0, 59.0, 75.0, 91.0, 102.0, 95.0, 82.0, 55.0, 52.0, 38.0, 39.0, 21.0, 9.0, 16.0, 6.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.0517578125e-05, -2.971850335597992e-05, -2.891942858695984e-05, -2.8120353817939758e-05, -2.7321279048919678e-05, -2.6522204279899597e-05, -2.5723129510879517e-05, -2.4924054741859436e-05, -2.4124979972839355e-05, -2.3325905203819275e-05, -2.2526830434799194e-05, -2.1727755665779114e-05, -2.0928680896759033e-05, -2.0129606127738953e-05, -1.9330531358718872e-05, -1.853145658969879e-05, -1.773238182067871e-05, -1.693330705165863e-05, -1.613423228263855e-05, -1.533515751361847e-05, -1.4536082744598389e-05, -1.3737007975578308e-05, -1.2937933206558228e-05, -1.2138858437538147e-05, -1.1339783668518066e-05, -1.0540708899497986e-05, -9.741634130477905e-06, -8.942559361457825e-06, -8.143484592437744e-06, -7.3444098234176636e-06, -6.545335054397583e-06, -5.7462602853775024e-06, -4.947185516357422e-06, -4.148110747337341e-06, -3.3490359783172607e-06, -2.54996120929718e-06, -1.7508864402770996e-06, -9.51811671257019e-07, -1.5273690223693848e-07, 6.463378667831421e-07, 1.4454126358032227e-06, 2.2444874048233032e-06, 3.043562173843384e-06, 3.842636942863464e-06, 4.641711711883545e-06, 5.4407864809036255e-06, 6.239861249923706e-06, 7.038936018943787e-06, 7.838010787963867e-06, 8.637085556983948e-06, 9.436160326004028e-06, 1.0235235095024109e-05, 1.103430986404419e-05, 1.183338463306427e-05, 1.263245940208435e-05, 1.3431534171104431e-05, 1.4230608940124512e-05, 1.5029683709144592e-05, 1.5828758478164673e-05, 1.6627833247184753e-05, 1.7426908016204834e-05, 1.8225982785224915e-05, 1.9025057554244995e-05, 1.9824132323265076e-05, 2.0623207092285156e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 13.0, 19.0, 23.0, 33.0, 43.0, 82.0, 106.0, 179.0, 247.0, 359.0, 560.0, 748.0, 1193.0, 1716.0, 2618.0, 4330.0, 6808.0, 12029.0, 22412.0, 47493.0, 121749.0, 419535.0, 250934.0, 79218.0, 33992.0, 16986.0, 9357.0, 5523.0, 3484.0, 2255.0, 1479.0, 1013.0, 643.0, 389.0, 320.0, 217.0, 131.0, 93.0, 87.0, 39.0, 34.0, 17.0, 9.0, 12.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0008344650268554688, -0.000809013843536377, -0.0007835626602172852, -0.0007581114768981934, -0.0007326602935791016, -0.0007072091102600098, -0.000681757926940918, -0.0006563067436218262, -0.0006308555603027344, -0.0006054043769836426, -0.0005799531936645508, -0.000554502010345459, -0.0005290508270263672, -0.0005035996437072754, -0.0004781484603881836, -0.0004526972770690918, -0.00042724609375, -0.0004017949104309082, -0.0003763437271118164, -0.0003508925437927246, -0.0003254413604736328, -0.000299990177154541, -0.0002745389938354492, -0.0002490878105163574, -0.00022363662719726562, -0.00019818544387817383, -0.00017273426055908203, -0.00014728307723999023, -0.00012183189392089844, -9.638071060180664e-05, -7.092952728271484e-05, -4.547834396362305e-05, -2.002716064453125e-05, 5.424022674560547e-06, 3.0875205993652344e-05, 5.632638931274414e-05, 8.177757263183594e-05, 0.00010722875595092773, 0.00013267993927001953, 0.00015813112258911133, 0.00018358230590820312, 0.00020903348922729492, 0.00023448467254638672, 0.0002599358558654785, 0.0002853870391845703, 0.0003108382225036621, 0.0003362894058227539, 0.0003617405891418457, 0.0003871917724609375, 0.0004126429557800293, 0.0004380941390991211, 0.0004635453224182129, 0.0004889965057373047, 0.0005144476890563965, 0.0005398988723754883, 0.0005653500556945801, 0.0005908012390136719, 0.0006162524223327637, 0.0006417036056518555, 0.0006671547889709473, 0.0006926059722900391, 0.0007180571556091309, 0.0007435083389282227, 0.0007689595222473145, 0.0007944107055664062]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 8.0, 1.0, 8.0, 9.0, 8.0, 14.0, 21.0, 18.0, 21.0, 26.0, 20.0, 35.0, 51.0, 46.0, 59.0, 69.0, 73.0, 68.0, 82.0, 67.0, 46.0, 63.0, 28.0, 35.0, 22.0, 27.0, 25.0, 11.0, 9.0, 9.0, 9.0, 6.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00020945072174072266, -0.00020335428416728973, -0.0001972578465938568, -0.0001911614090204239, -0.00018506497144699097, -0.00017896853387355804, -0.00017287209630012512, -0.0001667756587266922, -0.00016067922115325928, -0.00015458278357982635, -0.00014848634600639343, -0.0001423899084329605, -0.0001362934708595276, -0.00013019703328609467, -0.00012410059571266174, -0.00011800415813922882, -0.0001119077205657959, -0.00010581128299236298, -9.971484541893005e-05, -9.361840784549713e-05, -8.752197027206421e-05, -8.142553269863129e-05, -7.532909512519836e-05, -6.923265755176544e-05, -6.313621997833252e-05, -5.70397824048996e-05, -5.0943344831466675e-05, -4.484690725803375e-05, -3.875046968460083e-05, -3.265403211116791e-05, -2.6557594537734985e-05, -2.0461156964302063e-05, -1.436471939086914e-05, -8.268281817436218e-06, -2.171844244003296e-06, 3.9245933294296265e-06, 1.0021030902862549e-05, 1.611746847629547e-05, 2.2213906049728394e-05, 2.8310343623161316e-05, 3.440678119659424e-05, 4.050321877002716e-05, 4.659965634346008e-05, 5.2696093916893005e-05, 5.879253149032593e-05, 6.488896906375885e-05, 7.098540663719177e-05, 7.70818442106247e-05, 8.317828178405762e-05, 8.927471935749054e-05, 9.537115693092346e-05, 0.00010146759450435638, 0.0001075640320777893, 0.00011366046965122223, 0.00011975690722465515, 0.00012585334479808807, 0.000131949782371521, 0.00013804621994495392, 0.00014414265751838684, 0.00015023909509181976, 0.00015633553266525269, 0.0001624319702386856, 0.00016852840781211853, 0.00017462484538555145, 0.00018072128295898438]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 7.0, 12.0, 8.0, 17.0, 20.0, 27.0, 38.0, 43.0, 79.0, 119.0, 163.0, 128.0, 110.0, 63.0, 45.0, 33.0, 26.0, 12.0, 15.0, 8.0, 5.0, 8.0, 6.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003399189794436097, -0.0032499174121767282, -0.003100645262748003, -0.002951372880488634, -0.002802100731059909, -0.00265282834880054, -0.0025035561993718147, -0.002354283817112446, -0.002205011434853077, -0.002055739052593708, -0.0019064669031649828, -0.001757194520905614, -0.0016079223714768887, -0.0014586499892175198, -0.0013093777233734727, -0.0011601054575294256, -0.0010108333081007004, -0.0008615610422566533, -0.0007122887764126062, -0.0005630164523608983, -0.0004137441865168512, -0.0002644719206728041, -0.00011519959662109613, 3.4072669222950935e-05, 0.000183344935066998, 0.0003326172009110451, 0.0004818894958589226, 0.0006311617908068001, 0.0007804340566508472, 0.0009297063224948943, 0.0010789786465466022, 0.0012282509123906493, 0.00137752341106534, 0.0015267956769093871, 0.0016760679427534342, 0.001825340325012803, 0.0019746124744415283, 0.002123884856700897, 0.002273157238960266, 0.0024224293883889914, 0.0025717015378177166, 0.0027209739200770855, 0.0028702460695058107, 0.0030195184517651796, 0.003168790601193905, 0.0033180629834532738, 0.0034673353657126427, 0.003616607515141368, 0.003765879897400737, 0.003915152046829462, 0.004064424429088831, 0.0042136968113482, 0.004362969193607569, 0.00451224111020565, 0.004661513492465019, 0.004810785874724388, 0.004960058256983757, 0.005109330639243126, 0.005258603021502495, 0.005407874938100576, 0.005557147320359945, 0.005706419702619314, 0.005855692084878683, 0.006004964001476765, 0.006154236383736134]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 9.0, 9.0, 17.0, 16.0, 17.0, 17.0, 15.0, 16.0, 17.0, 21.0, 30.0, 28.0, 29.0, 35.0, 44.0, 40.0, 39.0, 43.0, 57.0, 46.0, 29.0, 41.0, 39.0, 39.0, 34.0, 40.0, 26.0, 34.0, 29.0, 30.0, 18.0, 20.0, 11.0, 10.0, 9.0, 13.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002225827192887664, -0.0021506878547370434, -0.0020755482837557793, -0.002000408945605159, -0.0019252696074545383, -0.001850130152888596, -0.0017749906983226538, -0.0016998513601720333, -0.001624711905606091, -0.0015495724510401487, -0.0014744331128895283, -0.001399293658323586, -0.0013241542037576437, -0.0012490148656070232, -0.001173875411041081, -0.0010987359564751387, -0.0010235966183245182, -0.0009484572219662368, -0.0008733178256079555, -0.0007981783710420132, -0.0007230389746837318, -0.0006478995783254504, -0.0005727601237595081, -0.0004976207274012268, -0.0004224813310429454, -0.000347341934684664, -0.0002722025092225522, -0.00019706309831235558, -0.00012192368740215898, -4.67842910438776e-05, 2.835513441823423e-05, 0.00010349455988034606, 0.0001786341890692711, 0.00025377358542755246, 0.0003289130108896643, 0.0004040524363517761, 0.0004791918327100575, 0.0005543312290683389, 0.0006294706836342812, 0.0007046100799925625, 0.0007797494763508439, 0.0008548888727091253, 0.0009300282690674067, 0.001005167723633349, 0.0010803071781992912, 0.0011554465163499117, 0.001230585970915854, 0.0013057254254817963, 0.0013808647636324167, 0.001456004218198359, 0.0015311435563489795, 0.0016062830109149218, 0.0016814223490655422, 0.0017565618036314845, 0.0018317012581974268, 0.0019068405963480473, 0.0019819801673293114, 0.002057119505479932, 0.002132259076461196, 0.0022073984146118164, 0.002282537752762437, 0.0023576770909130573, 0.0024328166618943214, 0.002507956000044942, 0.0025830953381955624]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 12.0, 6.0, 13.0, 20.0, 31.0, 26.0, 47.0, 68.0, 112.0, 138.0, 214.0, 307.0, 515.0, 764.0, 1195.0, 1914.0, 3294.0, 5271.0, 8605.0, 13354.0, 22422.0, 37395.0, 64783.0, 116266.0, 210795.0, 236668.0, 137883.0, 75991.0, 43434.0, 25742.0, 15729.0, 9614.0, 6085.0, 3630.0, 2293.0, 1378.0, 843.0, 569.0, 374.0, 244.0, 153.0, 93.0, 84.0, 54.0, 33.0, 36.0, 19.0, 11.0, 9.0, 9.0, 3.0, 3.0, 1.0, 0.0, 4.0, 4.0], "bins": [-0.004436492919921875, -0.004302620887756348, -0.00416874885559082, -0.004034876823425293, -0.0039010047912597656, -0.0037671327590942383, -0.003633260726928711, -0.0034993886947631836, -0.0033655166625976562, -0.003231644630432129, -0.0030977725982666016, -0.0029639005661010742, -0.002830028533935547, -0.0026961565017700195, -0.002562284469604492, -0.002428412437438965, -0.0022945404052734375, -0.00216066837310791, -0.002026796340942383, -0.0018929243087768555, -0.0017590522766113281, -0.0016251802444458008, -0.0014913082122802734, -0.001357436180114746, -0.0012235641479492188, -0.0010896921157836914, -0.0009558200836181641, -0.0008219480514526367, -0.0006880760192871094, -0.000554203987121582, -0.0004203319549560547, -0.00028645992279052734, -0.000152587890625, -1.8715858459472656e-05, 0.00011515617370605469, 0.00024902820587158203, 0.0003829002380371094, 0.0005167722702026367, 0.0006506443023681641, 0.0007845163345336914, 0.0009183883666992188, 0.001052260398864746, 0.0011861324310302734, 0.0013200044631958008, 0.0014538764953613281, 0.0015877485275268555, 0.0017216205596923828, 0.0018554925918579102, 0.0019893646240234375, 0.002123236656188965, 0.002257108688354492, 0.0023909807205200195, 0.002524852752685547, 0.0026587247848510742, 0.0027925968170166016, 0.002926468849182129, 0.0030603408813476562, 0.0031942129135131836, 0.003328084945678711, 0.0034619569778442383, 0.0035958290100097656, 0.003729701042175293, 0.0038635730743408203, 0.003997445106506348, 0.004131317138671875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 4.0, 10.0, 9.0, 10.0, 16.0, 12.0, 16.0, 15.0, 17.0, 21.0, 21.0, 21.0, 39.0, 24.0, 27.0, 35.0, 60.0, 22.0, 46.0, 36.0, 44.0, 41.0, 34.0, 42.0, 50.0, 34.0, 37.0, 25.0, 35.0, 29.0, 20.0, 22.0, 15.0, 26.0, 10.0, 12.0, 11.0, 10.0, 11.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0018672943115234375, -0.0018113404512405396, -0.0017553865909576416, -0.0016994327306747437, -0.0016434788703918457, -0.0015875250101089478, -0.0015315711498260498, -0.0014756172895431519, -0.001419663429260254, -0.001363709568977356, -0.001307755708694458, -0.00125180184841156, -0.0011958479881286621, -0.0011398941278457642, -0.0010839402675628662, -0.0010279864072799683, -0.0009720325469970703, -0.0009160786867141724, -0.0008601248264312744, -0.0008041709661483765, -0.0007482171058654785, -0.0006922632455825806, -0.0006363093852996826, -0.0005803555250167847, -0.0005244016647338867, -0.00046844780445098877, -0.0004124939441680908, -0.00035654008388519287, -0.0003005862236022949, -0.00024463236331939697, -0.00018867850303649902, -0.00013272464275360107, -7.677078247070312e-05, -2.0816922187805176e-05, 3.5136938095092773e-05, 9.109079837799072e-05, 0.00014704465866088867, 0.00020299851894378662, 0.00025895237922668457, 0.0003149062395095825, 0.00037086009979248047, 0.0004268139600753784, 0.00048276782035827637, 0.0005387216806411743, 0.0005946755409240723, 0.0006506294012069702, 0.0007065832614898682, 0.0007625371217727661, 0.0008184909820556641, 0.000874444842338562, 0.00093039870262146, 0.000986352562904358, 0.0010423064231872559, 0.0010982602834701538, 0.0011542141437530518, 0.0012101680040359497, 0.0012661218643188477, 0.0013220757246017456, 0.0013780295848846436, 0.0014339834451675415, 0.0014899373054504395, 0.0015458911657333374, 0.0016018450260162354, 0.0016577988862991333, 0.0017137527465820312]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 9.0, 13.0, 8.0, 22.0, 42.0, 45.0, 89.0, 95.0, 193.0, 309.0, 519.0, 845.0, 1352.0, 2448.0, 4053.0, 6751.0, 11174.0, 19624.0, 34149.0, 63495.0, 125192.0, 249357.0, 253434.0, 127864.0, 64415.0, 34955.0, 19590.0, 11490.0, 6941.0, 4126.0, 2349.0, 1429.0, 848.0, 520.0, 308.0, 185.0, 101.0, 85.0, 36.0, 35.0, 25.0, 15.0, 11.0, 3.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00466156005859375, -0.00452035665512085, -0.004379153251647949, -0.004237949848175049, -0.0040967464447021484, -0.003955543041229248, -0.0038143396377563477, -0.0036731362342834473, -0.003531932830810547, -0.0033907294273376465, -0.003249526023864746, -0.0031083226203918457, -0.0029671192169189453, -0.002825915813446045, -0.0026847124099731445, -0.002543509006500244, -0.0024023056030273438, -0.0022611021995544434, -0.002119898796081543, -0.0019786953926086426, -0.0018374919891357422, -0.0016962885856628418, -0.0015550851821899414, -0.001413881778717041, -0.0012726783752441406, -0.0011314749717712402, -0.0009902715682983398, -0.0008490681648254395, -0.0007078647613525391, -0.0005666613578796387, -0.0004254579544067383, -0.0002842545509338379, -0.0001430511474609375, -1.8477439880371094e-06, 0.00013935565948486328, 0.00028055906295776367, 0.00042176246643066406, 0.0005629658699035645, 0.0007041692733764648, 0.0008453726768493652, 0.0009865760803222656, 0.001127779483795166, 0.0012689828872680664, 0.0014101862907409668, 0.0015513896942138672, 0.0016925930976867676, 0.001833796501159668, 0.0019749999046325684, 0.0021162033081054688, 0.002257406711578369, 0.0023986101150512695, 0.00253981351852417, 0.0026810169219970703, 0.0028222203254699707, 0.002963423728942871, 0.0031046271324157715, 0.003245830535888672, 0.0033870339393615723, 0.0035282373428344727, 0.003669440746307373, 0.0038106441497802734, 0.003951847553253174, 0.004093050956726074, 0.004234254360198975, 0.004375457763671875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 7.0, 11.0, 9.0, 8.0, 16.0, 20.0, 10.0, 21.0, 22.0, 28.0, 22.0, 19.0, 34.0, 34.0, 39.0, 30.0, 49.0, 43.0, 43.0, 41.0, 33.0, 30.0, 40.0, 35.0, 41.0, 36.0, 27.0, 28.0, 26.0, 30.0, 33.0, 20.0, 16.0, 23.0, 18.0, 8.0, 6.0, 8.0, 4.0, 9.0, 5.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001110076904296875, -0.0010740309953689575, -0.00103798508644104, -0.0010019391775131226, -0.0009658932685852051, -0.0009298473596572876, -0.0008938014507293701, -0.0008577555418014526, -0.0008217096328735352, -0.0007856637239456177, -0.0007496178150177002, -0.0007135719060897827, -0.0006775259971618652, -0.0006414800882339478, -0.0006054341793060303, -0.0005693882703781128, -0.0005333423614501953, -0.0004972964525222778, -0.00046125054359436035, -0.00042520463466644287, -0.0003891587257385254, -0.0003531128168106079, -0.00031706690788269043, -0.00028102099895477295, -0.00024497509002685547, -0.000208929181098938, -0.0001728832721710205, -0.00013683736324310303, -0.00010079145431518555, -6.474554538726807e-05, -2.8699636459350586e-05, 7.3462724685668945e-06, 4.3392181396484375e-05, 7.943809032440186e-05, 0.00011548399925231934, 0.00015152990818023682, 0.0001875758171081543, 0.00022362172603607178, 0.00025966763496398926, 0.00029571354389190674, 0.0003317594528198242, 0.0003678053617477417, 0.0004038512706756592, 0.00043989717960357666, 0.00047594308853149414, 0.0005119889974594116, 0.0005480349063873291, 0.0005840808153152466, 0.0006201267242431641, 0.0006561726331710815, 0.000692218542098999, 0.0007282644510269165, 0.000764310359954834, 0.0008003562688827515, 0.0008364021778106689, 0.0008724480867385864, 0.0009084939956665039, 0.0009445399045944214, 0.0009805858135223389, 0.0010166317224502563, 0.0010526776313781738, 0.0010887235403060913, 0.0011247694492340088, 0.0011608153581619263, 0.0011968612670898438]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 5.0, 9.0, 20.0, 20.0, 27.0, 38.0, 55.0, 74.0, 101.0, 146.0, 186.0, 222.0, 304.0, 425.0, 588.0, 823.0, 1182.0, 1919.0, 3096.0, 5750.0, 10881.0, 27598.0, 929868.0, 36025.0, 12682.0, 6304.0, 3527.0, 2086.0, 1299.0, 906.0, 634.0, 451.0, 338.0, 272.0, 159.0, 125.0, 123.0, 70.0, 67.0, 42.0, 30.0, 19.0, 22.0, 7.0, 7.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0008387565612792969, -0.000813022255897522, -0.0007872879505157471, -0.0007615536451339722, -0.0007358193397521973, -0.0007100850343704224, -0.0006843507289886475, -0.0006586164236068726, -0.0006328821182250977, -0.0006071478128433228, -0.0005814135074615479, -0.000555679202079773, -0.000529944896697998, -0.0005042105913162231, -0.00047847628593444824, -0.00045274198055267334, -0.00042700767517089844, -0.00040127336978912354, -0.00037553906440734863, -0.00034980475902557373, -0.00032407045364379883, -0.0002983361482620239, -0.000272601842880249, -0.0002468675374984741, -0.00022113323211669922, -0.00019539892673492432, -0.00016966462135314941, -0.0001439303159713745, -0.00011819601058959961, -9.246170520782471e-05, -6.67273998260498e-05, -4.09930944442749e-05, -1.52587890625e-05, 1.0475516319274902e-05, 3.6209821701049805e-05, 6.194412708282471e-05, 8.767843246459961e-05, 0.00011341273784637451, 0.00013914704322814941, 0.00016488134860992432, 0.00019061565399169922, 0.00021634995937347412, 0.00024208426475524902, 0.0002678185701370239, 0.00029355287551879883, 0.00031928718090057373, 0.00034502148628234863, 0.00037075579166412354, 0.00039649009704589844, 0.00042222440242767334, 0.00044795870780944824, 0.00047369301319122314, 0.000499427318572998, 0.000525161623954773, 0.0005508959293365479, 0.0005766302347183228, 0.0006023645401000977, 0.0006280988454818726, 0.0006538331508636475, 0.0006795674562454224, 0.0007053017616271973, 0.0007310360670089722, 0.0007567703723907471, 0.000782504677772522, 0.0008082389831542969]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 10.0, 6.0, 6.0, 18.0, 8.0, 8.0, 23.0, 11.0, 25.0, 11.0, 21.0, 45.0, 24.0, 71.0, 52.0, 56.0, 109.0, 64.0, 89.0, 38.0, 24.0, 66.0, 27.0, 41.0, 18.0, 16.0, 32.0, 8.0, 7.0, 17.0, 7.0, 8.0, 2.0, 4.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8014183044433594e-06, -2.7185305953025818e-06, -2.635642886161804e-06, -2.5527551770210266e-06, -2.469867467880249e-06, -2.3869797587394714e-06, -2.304092049598694e-06, -2.2212043404579163e-06, -2.1383166313171387e-06, -2.055428922176361e-06, -1.9725412130355835e-06, -1.889653503894806e-06, -1.8067657947540283e-06, -1.7238780856132507e-06, -1.6409903764724731e-06, -1.5581026673316956e-06, -1.475214958190918e-06, -1.3923272490501404e-06, -1.3094395399093628e-06, -1.2265518307685852e-06, -1.1436641216278076e-06, -1.06077641248703e-06, -9.778887033462524e-07, -8.950009942054749e-07, -8.121132850646973e-07, -7.292255759239197e-07, -6.463378667831421e-07, -5.634501576423645e-07, -4.805624485015869e-07, -3.976747393608093e-07, -3.1478703022003174e-07, -2.3189932107925415e-07, -1.4901161193847656e-07, -6.612390279769897e-08, 1.6763806343078613e-08, 9.96515154838562e-08, 1.825392246246338e-07, 2.654269337654114e-07, 3.4831464290618896e-07, 4.3120235204696655e-07, 5.140900611877441e-07, 5.969777703285217e-07, 6.798654794692993e-07, 7.627531886100769e-07, 8.456408977508545e-07, 9.285286068916321e-07, 1.0114163160324097e-06, 1.0943040251731873e-06, 1.1771917343139648e-06, 1.2600794434547424e-06, 1.34296715259552e-06, 1.4258548617362976e-06, 1.5087425708770752e-06, 1.5916302800178528e-06, 1.6745179891586304e-06, 1.757405698299408e-06, 1.8402934074401855e-06, 1.923181116580963e-06, 2.0060688257217407e-06, 2.0889565348625183e-06, 2.171844244003296e-06, 2.2547319531440735e-06, 2.337619662284851e-06, 2.4205073714256287e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0, 9.0, 12.0, 17.0, 18.0, 27.0, 36.0, 59.0, 73.0, 104.0, 154.0, 224.0, 273.0, 404.0, 555.0, 811.0, 1094.0, 1538.0, 2285.0, 3474.0, 5420.0, 9156.0, 16593.0, 99242.0, 858121.0, 20131.0, 10315.0, 6162.0, 3784.0, 2543.0, 1736.0, 1194.0, 841.0, 581.0, 456.0, 322.0, 226.0, 168.0, 112.0, 85.0, 52.0, 43.0, 31.0, 22.0, 19.0, 10.0, 6.0, 6.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.0007710456848144531, -0.0007470399141311646, -0.000723034143447876, -0.0006990283727645874, -0.0006750226020812988, -0.0006510168313980103, -0.0006270110607147217, -0.0006030052900314331, -0.0005789995193481445, -0.000554993748664856, -0.0005309879779815674, -0.0005069822072982788, -0.00048297643661499023, -0.00045897066593170166, -0.0004349648952484131, -0.0004109591245651245, -0.00038695335388183594, -0.00036294758319854736, -0.0003389418125152588, -0.0003149360418319702, -0.00029093027114868164, -0.00026692450046539307, -0.0002429187297821045, -0.00021891295909881592, -0.00019490718841552734, -0.00017090141773223877, -0.0001468956470489502, -0.00012288987636566162, -9.888410568237305e-05, -7.487833499908447e-05, -5.08725643157959e-05, -2.6866793632507324e-05, -2.86102294921875e-06, 2.1144747734069824e-05, 4.51505184173584e-05, 6.915628910064697e-05, 9.316205978393555e-05, 0.00011716783046722412, 0.0001411736011505127, 0.00016517937183380127, 0.00018918514251708984, 0.00021319091320037842, 0.000237196683883667, 0.00026120245456695557, 0.00028520822525024414, 0.0003092139959335327, 0.0003332197666168213, 0.00035722553730010986, 0.00038123130798339844, 0.000405237078666687, 0.0004292428493499756, 0.00045324862003326416, 0.00047725439071655273, 0.0005012601613998413, 0.0005252659320831299, 0.0005492717027664185, 0.000573277473449707, 0.0005972832441329956, 0.0006212890148162842, 0.0006452947854995728, 0.0006693005561828613, 0.0006933063268661499, 0.0007173120975494385, 0.000741317868232727, 0.0007653236389160156]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 7.0, 5.0, 6.0, 13.0, 10.0, 23.0, 579.0, 250.0, 21.0, 8.0, 2.0, 6.0, 10.0, 7.0, 4.0, 1.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00021564960479736328, -0.00020887888967990875, -0.00020210817456245422, -0.0001953374594449997, -0.00018856674432754517, -0.00018179602921009064, -0.0001750253140926361, -0.00016825459897518158, -0.00016148388385772705, -0.00015471316874027252, -0.000147942453622818, -0.00014117173850536346, -0.00013440102338790894, -0.0001276303082704544, -0.00012085959315299988, -0.00011408887803554535, -0.00010731816291809082, -0.00010054744780063629, -9.377673268318176e-05, -8.700601756572723e-05, -8.02353024482727e-05, -7.346458733081818e-05, -6.669387221336365e-05, -5.992315709590912e-05, -5.315244197845459e-05, -4.638172686100006e-05, -3.961101174354553e-05, -3.2840296626091003e-05, -2.6069581508636475e-05, -1.9298866391181946e-05, -1.2528151273727417e-05, -5.757436156272888e-06, 1.0132789611816406e-06, 7.78399407863617e-06, 1.4554709196090698e-05, 2.1325424313545227e-05, 2.8096139430999756e-05, 3.4866854548454285e-05, 4.1637569665908813e-05, 4.840828478336334e-05, 5.517899990081787e-05, 6.19497150182724e-05, 6.872043013572693e-05, 7.549114525318146e-05, 8.226186037063599e-05, 8.903257548809052e-05, 9.580329060554504e-05, 0.00010257400572299957, 0.0001093447208404541, 0.00011611543595790863, 0.00012288615107536316, 0.0001296568661928177, 0.00013642758131027222, 0.00014319829642772675, 0.00014996901154518127, 0.0001567397266626358, 0.00016351044178009033, 0.00017028115689754486, 0.0001770518720149994, 0.00018382258713245392, 0.00019059330224990845, 0.00019736401736736298, 0.0002041347324848175, 0.00021090544760227203, 0.00021767616271972656]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 8.0, 2.0, 9.0, 12.0, 12.0, 13.0, 27.0, 26.0, 46.0, 59.0, 71.0, 103.0, 103.0, 103.0, 93.0, 69.0, 49.0, 45.0, 34.0, 25.0, 16.0, 18.0, 11.0, 12.0, 11.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0025737187825143337, -0.002476002089679241, -0.002378285164013505, -0.0022805684711784124, -0.0021828515455126762, -0.0020851348526775837, -0.001987418159842491, -0.0018897013505920768, -0.0017919845413416624, -0.001694267732091248, -0.0015965509228408337, -0.0014988342300057411, -0.0014011174207553267, -0.0013034006115049124, -0.0012056839186698198, -0.0011079671094194055, -0.001010250300168991, -0.0009125334909185767, -0.0008148167398758233, -0.0007170999888330698, -0.0006193831795826554, -0.0005216663703322411, -0.0004239496192894876, -0.00032623286824673414, -0.00022851605899631977, -0.00013079927884973586, -3.308249870315194e-05, 6.463428144343197e-05, 0.0001623510615900159, 0.00026006787084043026, 0.0003577846218831837, 0.0004555013729259372, 0.0005532179493457079, 0.0006509347585961223, 0.0007486515096388757, 0.0008463682606816292, 0.0009440850699320436, 0.001041801879182458, 0.0011395185720175505, 0.0012372353812679648, 0.0013349521905183792, 0.0014326689997687936, 0.001530385809019208, 0.0016281025018543005, 0.0017258193111047149, 0.0018235361203551292, 0.0019212528131902218, 0.0020189695060253143, 0.0021166864316910505, 0.002214403124526143, 0.0023121200501918793, 0.002409836743026972, 0.0025075534358620644, 0.0026052703615278006, 0.002702987054362893, 0.0028007039800286293, 0.002898420672863722, 0.0029961373656988144, 0.0030938542913645506, 0.003191570984199643, 0.0032892879098653793, 0.003387004602700472, 0.0034847212955355644, 0.003582437988370657, 0.003680154914036393]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 7.0, 8.0, 7.0, 5.0, 6.0, 21.0, 17.0, 18.0, 23.0, 22.0, 32.0, 36.0, 23.0, 33.0, 47.0, 38.0, 43.0, 36.0, 43.0, 42.0, 49.0, 49.0, 54.0, 41.0, 46.0, 47.0, 32.0, 36.0, 24.0, 17.0, 20.0, 12.0, 18.0, 14.0, 13.0, 8.0, 7.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00232955371029675, -0.002257940825074911, -0.002186327939853072, -0.002114715054631233, -0.0020431019365787506, -0.0019714890513569117, -0.0018998761661350727, -0.0018282632809132338, -0.0017566503956913948, -0.0016850375104695559, -0.001613424625247717, -0.0015418116236105561, -0.0014701987383887172, -0.0013985858531668782, -0.0013269728515297174, -0.0012553599663078785, -0.0011837470810860395, -0.0011121341958642006, -0.0010405213106423616, -0.0009689083090052009, -0.0008972954237833619, -0.000825682538561523, -0.0007540695951320231, -0.0006824566517025232, -0.0006108437664806843, -0.0005392308812588453, -0.00046761793782934546, -0.00039600502350367606, -0.00032439210917800665, -0.00025277919485233724, -0.00018116628052666783, -0.00010955333709716797, -3.794068470597267e-05, 3.3672229619696736e-05, 0.00010528514394536614, 0.00017689805827103555, 0.00024851097259670496, 0.00032012388692237437, 0.0003917368012480438, 0.00046334974467754364, 0.0005349626298993826, 0.0006065755151212215, 0.0006781884585507214, 0.0007498014019802213, 0.0008214142872020602, 0.0008930271724238992, 0.000964640115853399, 0.001036253059282899, 0.0011078659445047379, 0.0011794788297265768, 0.0012510917149484158, 0.0013227047165855765, 0.0013943176018074155, 0.0014659304870292544, 0.0015375434886664152, 0.0016091563738882542, 0.0016807692591100931, 0.001752382144331932, 0.001823995029553771, 0.0018956080311909318, 0.0019672210328280926, 0.0020388339180499315, 0.0021104468032717705, 0.0021820596884936094, 0.0022536725737154484]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 15.0, 38.0, 53.0, 77.0, 115.0, 239.0, 391.0, 636.0, 1033.0, 1752.0, 2825.0, 4720.0, 8158.0, 13950.0, 25519.0, 47470.0, 95633.0, 213680.0, 654258.0, 1870906.0, 782423.0, 254415.0, 109351.0, 51623.0, 25475.0, 13230.0, 7153.0, 3993.0, 2137.0, 1172.0, 691.0, 356.0, 253.0, 154.0, 101.0, 65.0, 54.0, 42.0, 21.0, 25.0, 15.0, 17.0, 14.0, 5.0, 6.0, 12.0, 5.0, 3.0, 7.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025177001953125, -0.0024191737174987793, -0.0023206472396850586, -0.002222120761871338, -0.002123594284057617, -0.0020250678062438965, -0.0019265413284301758, -0.001828014850616455, -0.0017294883728027344, -0.0016309618949890137, -0.001532435417175293, -0.0014339089393615723, -0.0013353824615478516, -0.0012368559837341309, -0.0011383295059204102, -0.0010398030281066895, -0.0009412765502929688, -0.000842750072479248, -0.0007442235946655273, -0.0006456971168518066, -0.0005471706390380859, -0.00044864416122436523, -0.00035011768341064453, -0.00025159120559692383, -0.00015306472778320312, -5.453824996948242e-05, 4.398822784423828e-05, 0.00014251470565795898, 0.0002410411834716797, 0.0003395676612854004, 0.0004380941390991211, 0.0005366206169128418, 0.0006351470947265625, 0.0007336735725402832, 0.0008322000503540039, 0.0009307265281677246, 0.0010292530059814453, 0.001127779483795166, 0.0012263059616088867, 0.0013248324394226074, 0.0014233589172363281, 0.0015218853950500488, 0.0016204118728637695, 0.0017189383506774902, 0.001817464828491211, 0.0019159913063049316, 0.0020145177841186523, 0.002113044261932373, 0.0022115707397460938, 0.0023100972175598145, 0.002408623695373535, 0.002507150173187256, 0.0026056766510009766, 0.0027042031288146973, 0.002802729606628418, 0.0029012560844421387, 0.0029997825622558594, 0.00309830904006958, 0.0031968355178833008, 0.0032953619956970215, 0.003393888473510742, 0.003492414951324463, 0.0035909414291381836, 0.0036894679069519043, 0.003787994384765625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 7.0, 17.0, 13.0, 12.0, 21.0, 27.0, 28.0, 25.0, 36.0, 29.0, 37.0, 42.0, 43.0, 38.0, 44.0, 47.0, 43.0, 45.0, 46.0, 47.0, 46.0, 46.0, 35.0, 37.0, 26.0, 29.0, 22.0, 16.0, 11.0, 11.0, 12.0, 14.0, 8.0, 7.0, 4.0, 0.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0014657974243164062, -0.0014225095510482788, -0.0013792216777801514, -0.001335933804512024, -0.0012926459312438965, -0.001249358057975769, -0.0012060701847076416, -0.0011627823114395142, -0.0011194944381713867, -0.0010762065649032593, -0.0010329186916351318, -0.0009896308183670044, -0.000946342945098877, -0.0009030550718307495, -0.0008597671985626221, -0.0008164793252944946, -0.0007731914520263672, -0.0007299035787582397, -0.0006866157054901123, -0.0006433278322219849, -0.0006000399589538574, -0.00055675208568573, -0.0005134642124176025, -0.0004701763391494751, -0.00042688846588134766, -0.0003836005926132202, -0.0003403127193450928, -0.00029702484607696533, -0.0002537369728088379, -0.00021044909954071045, -0.000167161226272583, -0.00012387335300445557, -8.058547973632812e-05, -3.7297606468200684e-05, 5.990266799926758e-06, 4.92781400680542e-05, 9.256601333618164e-05, 0.00013585388660430908, 0.00017914175987243652, 0.00022242963314056396, 0.0002657175064086914, 0.00030900537967681885, 0.0003522932529449463, 0.00039558112621307373, 0.00043886899948120117, 0.0004821568727493286, 0.0005254447460174561, 0.0005687326192855835, 0.0006120204925537109, 0.0006553083658218384, 0.0006985962390899658, 0.0007418841123580933, 0.0007851719856262207, 0.0008284598588943481, 0.0008717477321624756, 0.000915035605430603, 0.0009583234786987305, 0.001001611351966858, 0.0010448992252349854, 0.0010881870985031128, 0.0011314749717712402, 0.0011747628450393677, 0.0012180507183074951, 0.0012613385915756226, 0.00130462646484375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 9.0, 7.0, 12.0, 17.0, 29.0, 39.0, 39.0, 68.0, 112.0, 179.0, 260.0, 352.0, 564.0, 795.0, 1287.0, 1965.0, 3159.0, 4658.0, 7478.0, 11610.0, 18364.0, 29430.0, 49374.0, 84929.0, 152625.0, 293847.0, 638751.0, 1295778.0, 810448.0, 358731.0, 181348.0, 98856.0, 57240.0, 33871.0, 21212.0, 13265.0, 8256.0, 5437.0, 3397.0, 2210.0, 1418.0, 995.0, 614.0, 432.0, 257.0, 172.0, 135.0, 86.0, 59.0, 37.0, 12.0, 21.0, 14.0, 12.0, 7.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.001842498779296875, -0.0017803311347961426, -0.0017181634902954102, -0.0016559958457946777, -0.0015938282012939453, -0.0015316605567932129, -0.0014694929122924805, -0.001407325267791748, -0.0013451576232910156, -0.0012829899787902832, -0.0012208223342895508, -0.0011586546897888184, -0.001096487045288086, -0.0010343194007873535, -0.0009721517562866211, -0.0009099841117858887, -0.0008478164672851562, -0.0007856488227844238, -0.0007234811782836914, -0.000661313533782959, -0.0005991458892822266, -0.0005369782447814941, -0.0004748106002807617, -0.0004126429557800293, -0.0003504753112792969, -0.00028830766677856445, -0.00022614002227783203, -0.0001639723777770996, -0.00010180473327636719, -3.9637088775634766e-05, 2.2530555725097656e-05, 8.469820022583008e-05, 0.0001468658447265625, 0.00020903348922729492, 0.00027120113372802734, 0.00033336877822875977, 0.0003955364227294922, 0.0004577040672302246, 0.000519871711730957, 0.0005820393562316895, 0.0006442070007324219, 0.0007063746452331543, 0.0007685422897338867, 0.0008307099342346191, 0.0008928775787353516, 0.000955045223236084, 0.0010172128677368164, 0.0010793805122375488, 0.0011415481567382812, 0.0012037158012390137, 0.001265883445739746, 0.0013280510902404785, 0.001390218734741211, 0.0014523863792419434, 0.0015145540237426758, 0.0015767216682434082, 0.0016388893127441406, 0.001701056957244873, 0.0017632246017456055, 0.0018253922462463379, 0.0018875598907470703, 0.0019497275352478027, 0.002011895179748535, 0.0020740628242492676, 0.00213623046875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 8.0, 11.0, 7.0, 8.0, 20.0, 20.0, 27.0, 32.0, 30.0, 53.0, 69.0, 64.0, 69.0, 101.0, 101.0, 131.0, 158.0, 182.0, 196.0, 222.0, 237.0, 245.0, 233.0, 244.0, 250.0, 199.0, 199.0, 169.0, 145.0, 111.0, 106.0, 98.0, 77.0, 54.0, 51.0, 24.0, 26.0, 18.0, 22.0, 16.0, 10.0, 10.0, 5.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.000728607177734375, -0.0007084012031555176, -0.0006881952285766602, -0.0006679892539978027, -0.0006477832794189453, -0.0006275773048400879, -0.0006073713302612305, -0.000587165355682373, -0.0005669593811035156, -0.0005467534065246582, -0.0005265474319458008, -0.0005063414573669434, -0.00048613548278808594, -0.0004659295082092285, -0.0004457235336303711, -0.00042551755905151367, -0.00040531158447265625, -0.00038510560989379883, -0.0003648996353149414, -0.000344693660736084, -0.00032448768615722656, -0.00030428171157836914, -0.0002840757369995117, -0.0002638697624206543, -0.00024366378784179688, -0.00022345781326293945, -0.00020325183868408203, -0.0001830458641052246, -0.0001628398895263672, -0.00014263391494750977, -0.00012242794036865234, -0.00010222196578979492, -8.20159912109375e-05, -6.181001663208008e-05, -4.1604042053222656e-05, -2.1398067474365234e-05, -1.1920928955078125e-06, 1.901388168334961e-05, 3.921985626220703e-05, 5.942583084106445e-05, 7.963180541992188e-05, 9.98377799987793e-05, 0.00012004375457763672, 0.00014024972915649414, 0.00016045570373535156, 0.00018066167831420898, 0.0002008676528930664, 0.00022107362747192383, 0.00024127960205078125, 0.00026148557662963867, 0.0002816915512084961, 0.0003018975257873535, 0.00032210350036621094, 0.00034230947494506836, 0.0003625154495239258, 0.0003827214241027832, 0.0004029273986816406, 0.00042313337326049805, 0.00044333934783935547, 0.0004635453224182129, 0.0004837512969970703, 0.0005039572715759277, 0.0005241632461547852, 0.0005443692207336426, 0.0005645751953125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 2.0, 4.0, 3.0, 5.0, 9.0, 5.0, 6.0, 13.0, 8.0, 16.0, 24.0, 34.0, 56.0, 60.0, 64.0, 94.0, 103.0, 97.0, 84.0, 60.0, 57.0, 46.0, 43.0, 18.0, 15.0, 10.0, 17.0, 13.0, 4.0, 5.0, 7.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001890539308078587, -0.0018278262577950954, -0.0017651133239269257, -0.001702400273643434, -0.0016396872233599424, -0.0015769742894917727, -0.001514261239208281, -0.0014515481889247894, -0.0013888352550566196, -0.001326122204773128, -0.0012634092709049582, -0.0012006962206214666, -0.001137983170337975, -0.0010752701200544834, -0.0010125571861863136, -0.000949844135902822, -0.0008871310856193304, -0.0008244180935434997, -0.0007617050432600081, -0.0006989920511841774, -0.0006362790009006858, -0.0005735660088248551, -0.0005108530167490244, -0.00044813999556936324, -0.0003854269743897021, -0.0003227139532100409, -0.00026000093203037977, -0.00019728793995454907, -0.00013457491877488792, -7.186189759522676e-05, -9.148905519396067e-06, 5.356411566026509e-05, 0.00011627725325524807, 0.00017899027443490922, 0.00024170328106265515, 0.0003044162876904011, 0.00036712930887006223, 0.0004298423300497234, 0.0004925553221255541, 0.0005552683724090457, 0.0006179813644848764, 0.0006806943565607071, 0.0007434074068441987, 0.0008061203989200294, 0.0008688333909958601, 0.0009315464412793517, 0.0009942594915628433, 0.001056972425431013, 0.0011196854757145047, 0.0011823985259979963, 0.0012451114598661661, 0.0013078245101496577, 0.0013705375604331493, 0.0014332504943013191, 0.0014959635445848107, 0.0015586765948683023, 0.0016213895287364721, 0.0016841025790199637, 0.0017468155128881335, 0.0018095285631716251, 0.0018722416134551167, 0.0019349546637386084, 0.001997667597606778, 0.002060380531474948, 0.0021230936981737614]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 8.0, 4.0, 8.0, 13.0, 12.0, 16.0, 16.0, 17.0, 24.0, 34.0, 16.0, 25.0, 31.0, 30.0, 27.0, 34.0, 26.0, 46.0, 41.0, 35.0, 46.0, 37.0, 43.0, 38.0, 33.0, 43.0, 36.0, 34.0, 30.0, 17.0, 24.0, 21.0, 19.0, 23.0, 25.0, 5.0, 11.0, 9.0, 11.0, 6.0, 6.0, 4.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013730599312111735, -0.0013317173579707742, -0.0012903747847303748, -0.0012490322114899755, -0.0012076895218342543, -0.001166346948593855, -0.0011250043753534555, -0.0010836618021130562, -0.0010423192288726568, -0.0010009766556322575, -0.0009596340823918581, -0.0009182914509437978, -0.0008769488777033985, -0.0008356063044629991, -0.0007942636730149388, -0.0007529210997745395, -0.0007115785265341401, -0.0006702359532937407, -0.0006288933800533414, -0.0005875507486052811, -0.0005462081753648818, -0.0005048656021244824, -0.0004635229997802526, -0.00042218039743602276, -0.0003808378241956234, -0.00033949525095522404, -0.0002981526486109942, -0.0002568100462667644, -0.00021546747302636504, -0.00017412488523405045, -0.00013278229744173586, -9.143969509750605e-05, -5.0097121857106686e-05, -8.754534064792097e-06, 3.258805372752249e-05, 7.393064151983708e-05, 0.00011527322931215167, 0.00015661581710446626, 0.00019795840489678085, 0.00023930100724101067, 0.00028064358048141, 0.0003219861537218094, 0.0003633287560660392, 0.000404671358410269, 0.0004460139316506684, 0.00048735650489106774, 0.000528699136339128, 0.0005700417095795274, 0.0006113842828199267, 0.0006527268560603261, 0.0006940694293007255, 0.0007354120607487857, 0.0007767546339891851, 0.0008180972072295845, 0.0008594398386776447, 0.0009007824119180441, 0.0009421249851584435, 0.0009834675583988428, 0.0010248101316392422, 0.0010661527048796415, 0.001107495278120041, 0.001148837967775762, 0.0011901805410161614, 0.0012315231142565608, 0.0012728656874969602]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 7.0, 7.0, 10.0, 20.0, 21.0, 32.0, 58.0, 76.0, 118.0, 157.0, 279.0, 394.0, 520.0, 764.0, 1175.0, 1762.0, 2670.0, 3943.0, 5994.0, 9033.0, 14137.0, 20681.0, 32035.0, 49537.0, 75854.0, 116684.0, 168298.0, 177251.0, 126846.0, 83593.0, 53992.0, 35126.0, 23131.0, 14992.0, 9741.0, 6508.0, 4403.0, 2797.0, 1925.0, 1264.0, 929.0, 606.0, 378.0, 265.0, 178.0, 114.0, 79.0, 61.0, 38.0, 28.0, 21.0, 12.0, 7.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0018558502197265625, -0.0017961859703063965, -0.0017365217208862305, -0.0016768574714660645, -0.0016171932220458984, -0.0015575289726257324, -0.0014978647232055664, -0.0014382004737854004, -0.0013785362243652344, -0.0013188719749450684, -0.0012592077255249023, -0.0011995434761047363, -0.0011398792266845703, -0.0010802149772644043, -0.0010205507278442383, -0.0009608864784240723, -0.0009012222290039062, -0.0008415579795837402, -0.0007818937301635742, -0.0007222294807434082, -0.0006625652313232422, -0.0006029009819030762, -0.0005432367324829102, -0.00048357248306274414, -0.0004239082336425781, -0.0003642439842224121, -0.0003045797348022461, -0.0002449154853820801, -0.00018525123596191406, -0.00012558698654174805, -6.592273712158203e-05, -6.258487701416016e-06, 5.340576171875e-05, 0.00011307001113891602, 0.00017273426055908203, 0.00023239850997924805, 0.00029206275939941406, 0.0003517270088195801, 0.0004113912582397461, 0.0004710555076599121, 0.0005307197570800781, 0.0005903840065002441, 0.0006500482559204102, 0.0007097125053405762, 0.0007693767547607422, 0.0008290410041809082, 0.0008887052536010742, 0.0009483695030212402, 0.0010080337524414062, 0.0010676980018615723, 0.0011273622512817383, 0.0011870265007019043, 0.0012466907501220703, 0.0013063549995422363, 0.0013660192489624023, 0.0014256834983825684, 0.0014853477478027344, 0.0015450119972229004, 0.0016046762466430664, 0.0016643404960632324, 0.0017240047454833984, 0.0017836689949035645, 0.0018433332443237305, 0.0019029974937438965, 0.0019626617431640625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 1.0, 4.0, 5.0, 6.0, 8.0, 13.0, 9.0, 17.0, 9.0, 23.0, 20.0, 21.0, 24.0, 26.0, 35.0, 26.0, 35.0, 26.0, 32.0, 26.0, 32.0, 36.0, 39.0, 46.0, 36.0, 38.0, 36.0, 46.0, 33.0, 46.0, 32.0, 21.0, 17.0, 36.0, 19.0, 21.0, 22.0, 19.0, 16.0, 9.0, 6.0, 4.0, 14.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0011987686157226562, -0.001163586974143982, -0.0011284053325653076, -0.0010932236909866333, -0.001058042049407959, -0.0010228604078292847, -0.0009876787662506104, -0.000952497124671936, -0.0009173154830932617, -0.0008821338415145874, -0.0008469521999359131, -0.0008117705583572388, -0.0007765889167785645, -0.0007414072751998901, -0.0007062256336212158, -0.0006710439920425415, -0.0006358623504638672, -0.0006006807088851929, -0.0005654990673065186, -0.0005303174257278442, -0.0004951357841491699, -0.0004599541425704956, -0.0004247725009918213, -0.00038959085941314697, -0.00035440921783447266, -0.00031922757625579834, -0.000284045934677124, -0.0002488642930984497, -0.0002136826515197754, -0.00017850100994110107, -0.00014331936836242676, -0.00010813772678375244, -7.295608520507812e-05, -3.777444362640381e-05, -2.592802047729492e-06, 3.2588839530944824e-05, 6.777048110961914e-05, 0.00010295212268829346, 0.00013813376426696777, 0.0001733154058456421, 0.0002084970474243164, 0.00024367868900299072, 0.00027886033058166504, 0.00031404197216033936, 0.00034922361373901367, 0.000384405255317688, 0.0004195868968963623, 0.0004547685384750366, 0.0004899501800537109, 0.0005251318216323853, 0.0005603134632110596, 0.0005954951047897339, 0.0006306767463684082, 0.0006658583879470825, 0.0007010400295257568, 0.0007362216711044312, 0.0007714033126831055, 0.0008065849542617798, 0.0008417665958404541, 0.0008769482374191284, 0.0009121298789978027, 0.000947311520576477, 0.0009824931621551514, 0.0010176748037338257, 0.0010528564453125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 5.0, 5.0, 8.0, 9.0, 23.0, 27.0, 30.0, 75.0, 102.0, 150.0, 224.0, 366.0, 575.0, 885.0, 1482.0, 2539.0, 4363.0, 8057.0, 15843.0, 35894.0, 110614.0, 506397.0, 250879.0, 60855.0, 23605.0, 11234.0, 5966.0, 3353.0, 1860.0, 1155.0, 718.0, 449.0, 276.0, 150.0, 143.0, 78.0, 58.0, 32.0, 26.0, 15.0, 12.0, 11.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00438690185546875, -0.00426068902015686, -0.004134476184844971, -0.004008263349533081, -0.0038820505142211914, -0.0037558376789093018, -0.003629624843597412, -0.0035034120082855225, -0.003377199172973633, -0.003250986337661743, -0.0031247735023498535, -0.002998560667037964, -0.0028723478317260742, -0.0027461349964141846, -0.002619922161102295, -0.0024937093257904053, -0.0023674964904785156, -0.002241283655166626, -0.0021150708198547363, -0.0019888579845428467, -0.001862645149230957, -0.0017364323139190674, -0.0016102194786071777, -0.001484006643295288, -0.0013577938079833984, -0.0012315809726715088, -0.0011053681373596191, -0.0009791553020477295, -0.0008529424667358398, -0.0007267296314239502, -0.0006005167961120605, -0.0004743039608001709, -0.00034809112548828125, -0.0002218782901763916, -9.566545486450195e-05, 3.0547380447387695e-05, 0.00015676021575927734, 0.000282973051071167, 0.00040918588638305664, 0.0005353987216949463, 0.0006616115570068359, 0.0007878243923187256, 0.0009140372276306152, 0.0010402500629425049, 0.0011664628982543945, 0.0012926757335662842, 0.0014188885688781738, 0.0015451014041900635, 0.0016713142395019531, 0.0017975270748138428, 0.0019237399101257324, 0.002049952745437622, 0.0021761655807495117, 0.0023023784160614014, 0.002428591251373291, 0.0025548040866851807, 0.0026810169219970703, 0.00280722975730896, 0.0029334425926208496, 0.0030596554279327393, 0.003185868263244629, 0.0033120810985565186, 0.003438293933868408, 0.003564506769180298, 0.0036907196044921875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 4.0, 5.0, 7.0, 9.0, 16.0, 5.0, 13.0, 18.0, 15.0, 13.0, 18.0, 24.0, 25.0, 32.0, 25.0, 36.0, 38.0, 38.0, 33.0, 37.0, 39.0, 45.0, 50.0, 48.0, 42.0, 41.0, 27.0, 38.0, 36.0, 27.0, 26.0, 31.0, 22.0, 12.0, 18.0, 15.0, 15.0, 18.0, 12.0, 7.0, 10.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000736236572265625, -0.0007123500108718872, -0.0006884634494781494, -0.0006645768880844116, -0.0006406903266906738, -0.000616803765296936, -0.0005929172039031982, -0.0005690306425094604, -0.0005451440811157227, -0.0005212575197219849, -0.0004973709583282471, -0.0004734843969345093, -0.0004495978355407715, -0.0004257112741470337, -0.0004018247127532959, -0.0003779381513595581, -0.0003540515899658203, -0.0003301650285720825, -0.0003062784671783447, -0.00028239190578460693, -0.00025850534439086914, -0.00023461878299713135, -0.00021073222160339355, -0.00018684566020965576, -0.00016295909881591797, -0.00013907253742218018, -0.00011518597602844238, -9.129941463470459e-05, -6.74128532409668e-05, -4.3526291847229004e-05, -1.963973045349121e-05, 4.246830940246582e-06, 2.8133392333984375e-05, 5.201995372772217e-05, 7.590651512145996e-05, 9.979307651519775e-05, 0.00012367963790893555, 0.00014756619930267334, 0.00017145276069641113, 0.00019533932209014893, 0.00021922588348388672, 0.0002431124448776245, 0.0002669990062713623, 0.0002908855676651001, 0.0003147721290588379, 0.0003386586904525757, 0.0003625452518463135, 0.00038643181324005127, 0.00041031837463378906, 0.00043420493602752686, 0.00045809149742126465, 0.00048197805881500244, 0.0005058646202087402, 0.000529751181602478, 0.0005536377429962158, 0.0005775243043899536, 0.0006014108657836914, 0.0006252974271774292, 0.000649183988571167, 0.0006730705499649048, 0.0006969571113586426, 0.0007208436727523804, 0.0007447302341461182, 0.000768616795539856, 0.0007925033569335938]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 18.0, 19.0, 21.0, 30.0, 35.0, 50.0, 85.0, 106.0, 181.0, 251.0, 406.0, 578.0, 837.0, 1376.0, 2118.0, 3452.0, 6125.0, 12079.0, 30034.0, 96018.0, 520571.0, 270040.0, 60787.0, 20931.0, 9340.0, 4941.0, 2848.0, 1728.0, 1130.0, 739.0, 513.0, 371.0, 256.0, 149.0, 115.0, 86.0, 58.0, 44.0, 28.0, 14.0, 17.0, 10.0, 7.0, 8.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008230209350585938, -0.0007963180541992188, -0.0007696151733398438, -0.0007429122924804688, -0.0007162094116210938, -0.0006895065307617188, -0.0006628036499023438, -0.0006361007690429688, -0.0006093978881835938, -0.0005826950073242188, -0.0005559921264648438, -0.0005292892456054688, -0.0005025863647460938, -0.00047588348388671875, -0.00044918060302734375, -0.00042247772216796875, -0.00039577484130859375, -0.00036907196044921875, -0.00034236907958984375, -0.00031566619873046875, -0.00028896331787109375, -0.00026226043701171875, -0.00023555755615234375, -0.00020885467529296875, -0.00018215179443359375, -0.00015544891357421875, -0.00012874603271484375, -0.00010204315185546875, -7.534027099609375e-05, -4.863739013671875e-05, -2.193450927734375e-05, 4.76837158203125e-06, 3.147125244140625e-05, 5.817413330078125e-05, 8.487701416015625e-05, 0.00011157989501953125, 0.00013828277587890625, 0.00016498565673828125, 0.00019168853759765625, 0.00021839141845703125, 0.00024509429931640625, 0.00027179718017578125, 0.00029850006103515625, 0.00032520294189453125, 0.00035190582275390625, 0.00037860870361328125, 0.00040531158447265625, 0.00043201446533203125, 0.00045871734619140625, 0.00048542022705078125, 0.0005121231079101562, 0.0005388259887695312, 0.0005655288696289062, 0.0005922317504882812, 0.0006189346313476562, 0.0006456375122070312, 0.0006723403930664062, 0.0006990432739257812, 0.0007257461547851562, 0.0007524490356445312, 0.0007791519165039062, 0.0008058547973632812, 0.0008325576782226562, 0.0008592605590820312, 0.0008859634399414062]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 2.0, 8.0, 9.0, 6.0, 13.0, 16.0, 14.0, 22.0, 22.0, 32.0, 30.0, 44.0, 37.0, 38.0, 41.0, 61.0, 61.0, 45.0, 69.0, 50.0, 50.0, 46.0, 40.0, 42.0, 25.0, 36.0, 18.0, 24.0, 14.0, 19.0, 13.0, 9.0, 4.0, 11.0, 6.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4185905456542969e-05, -1.3724900782108307e-05, -1.3263896107673645e-05, -1.2802891433238983e-05, -1.2341886758804321e-05, -1.188088208436966e-05, -1.1419877409934998e-05, -1.0958872735500336e-05, -1.0497868061065674e-05, -1.0036863386631012e-05, -9.57585871219635e-06, -9.114854037761688e-06, -8.653849363327026e-06, -8.192844688892365e-06, -7.731840014457703e-06, -7.270835340023041e-06, -6.809830665588379e-06, -6.348825991153717e-06, -5.887821316719055e-06, -5.426816642284393e-06, -4.9658119678497314e-06, -4.50480729341507e-06, -4.043802618980408e-06, -3.582797944545746e-06, -3.121793270111084e-06, -2.660788595676422e-06, -2.1997839212417603e-06, -1.7387792468070984e-06, -1.2777745723724365e-06, -8.167698979377747e-07, -3.557652235031128e-07, 1.0523945093154907e-07, 5.662441253662109e-07, 1.0272487998008728e-06, 1.4882534742355347e-06, 1.9492581486701965e-06, 2.4102628231048584e-06, 2.8712674975395203e-06, 3.332272171974182e-06, 3.793276846408844e-06, 4.254281520843506e-06, 4.715286195278168e-06, 5.17629086971283e-06, 5.6372955441474915e-06, 6.098300218582153e-06, 6.559304893016815e-06, 7.020309567451477e-06, 7.481314241886139e-06, 7.9423189163208e-06, 8.403323590755463e-06, 8.864328265190125e-06, 9.325332939624786e-06, 9.786337614059448e-06, 1.024734228849411e-05, 1.0708346962928772e-05, 1.1169351637363434e-05, 1.1630356311798096e-05, 1.2091360986232758e-05, 1.255236566066742e-05, 1.3013370335102081e-05, 1.3474375009536743e-05, 1.3935379683971405e-05, 1.4396384358406067e-05, 1.4857389032840729e-05, 1.531839370727539e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 17.0, 11.0, 26.0, 39.0, 65.0, 88.0, 169.0, 210.0, 360.0, 481.0, 784.0, 1188.0, 1917.0, 3205.0, 5139.0, 8942.0, 15938.0, 28981.0, 56006.0, 124156.0, 317067.0, 268078.0, 104748.0, 50077.0, 25833.0, 14232.0, 8131.0, 4806.0, 2946.0, 1720.0, 1101.0, 696.0, 530.0, 316.0, 186.0, 115.0, 74.0, 60.0, 43.0, 24.0, 19.0, 13.0, 5.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003600120544433594, -0.0003493949770927429, -0.00033877789974212646, -0.00032816082239151, -0.00031754374504089355, -0.0003069266676902771, -0.00029630959033966064, -0.0002856925129890442, -0.00027507543563842773, -0.0002644583582878113, -0.0002538412809371948, -0.00024322420358657837, -0.00023260712623596191, -0.00022199004888534546, -0.000211372971534729, -0.00020075589418411255, -0.0001901388168334961, -0.00017952173948287964, -0.00016890466213226318, -0.00015828758478164673, -0.00014767050743103027, -0.00013705343008041382, -0.00012643635272979736, -0.00011581927537918091, -0.00010520219802856445, -9.4585120677948e-05, -8.396804332733154e-05, -7.335096597671509e-05, -6.273388862609863e-05, -5.211681127548218e-05, -4.149973392486572e-05, -3.088265657424927e-05, -2.0265579223632812e-05, -9.648501873016357e-06, 9.685754776000977e-07, 1.1585652828216553e-05, 2.2202730178833008e-05, 3.281980752944946e-05, 4.343688488006592e-05, 5.405396223068237e-05, 6.467103958129883e-05, 7.528811693191528e-05, 8.590519428253174e-05, 9.65222716331482e-05, 0.00010713934898376465, 0.0001177564263343811, 0.00012837350368499756, 0.00013899058103561401, 0.00014960765838623047, 0.00016022473573684692, 0.00017084181308746338, 0.00018145889043807983, 0.0001920759677886963, 0.00020269304513931274, 0.0002133101224899292, 0.00022392719984054565, 0.0002345442771911621, 0.00024516135454177856, 0.000255778431892395, 0.0002663955092430115, 0.00027701258659362793, 0.0002876296639442444, 0.00029824674129486084, 0.0003088638186454773, 0.00031948089599609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 5.0, 3.0, 7.0, 6.0, 7.0, 9.0, 9.0, 11.0, 15.0, 20.0, 19.0, 35.0, 38.0, 42.0, 43.0, 45.0, 43.0, 54.0, 68.0, 52.0, 55.0, 54.0, 60.0, 50.0, 43.0, 40.0, 21.0, 27.0, 21.0, 16.0, 19.0, 15.0, 7.0, 6.0, 4.0, 7.0, 8.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.113550186157227e-05, -8.814781904220581e-05, -8.516013622283936e-05, -8.21724534034729e-05, -7.918477058410645e-05, -7.619708776473999e-05, -7.320940494537354e-05, -7.022172212600708e-05, -6.723403930664062e-05, -6.424635648727417e-05, -6.125867366790771e-05, -5.827099084854126e-05, -5.5283308029174805e-05, -5.229562520980835e-05, -4.9307942390441895e-05, -4.632025957107544e-05, -4.3332576751708984e-05, -4.034489393234253e-05, -3.7357211112976074e-05, -3.436952829360962e-05, -3.1381845474243164e-05, -2.839416265487671e-05, -2.5406479835510254e-05, -2.24187970161438e-05, -1.9431114196777344e-05, -1.644343137741089e-05, -1.3455748558044434e-05, -1.0468065738677979e-05, -7.4803829193115234e-06, -4.492700099945068e-06, -1.5050172805786133e-06, 1.4826655387878418e-06, 4.470348358154297e-06, 7.458031177520752e-06, 1.0445713996887207e-05, 1.3433396816253662e-05, 1.6421079635620117e-05, 1.9408762454986572e-05, 2.2396445274353027e-05, 2.5384128093719482e-05, 2.8371810913085938e-05, 3.135949373245239e-05, 3.434717655181885e-05, 3.73348593711853e-05, 4.032254219055176e-05, 4.331022500991821e-05, 4.629790782928467e-05, 4.928559064865112e-05, 5.227327346801758e-05, 5.526095628738403e-05, 5.824863910675049e-05, 6.123632192611694e-05, 6.42240047454834e-05, 6.721168756484985e-05, 7.019937038421631e-05, 7.318705320358276e-05, 7.617473602294922e-05, 7.916241884231567e-05, 8.215010166168213e-05, 8.513778448104858e-05, 8.812546730041504e-05, 9.11131501197815e-05, 9.410083293914795e-05, 9.70885157585144e-05, 0.00010007619857788086]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 7.0, 8.0, 8.0, 11.0, 20.0, 15.0, 26.0, 37.0, 51.0, 69.0, 109.0, 117.0, 128.0, 94.0, 74.0, 46.0, 38.0, 36.0, 17.0, 11.0, 15.0, 12.0, 10.0, 13.0, 7.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016265162266790867, -0.00156866863835603, -0.0015108210500329733, -0.0014529735781252384, -0.0013951259898021817, -0.001337278401479125, -0.0012794309295713902, -0.0012215833412483335, -0.0011637357529252768, -0.00110588816460222, -0.0010480405762791634, -0.0009901931043714285, -0.0009323455160483718, -0.0008744979277253151, -0.0008166503976099193, -0.0007588028674945235, -0.0007009552791714668, -0.0006431076908484101, -0.0005852601607330143, -0.0005274126306176186, -0.00046956504229456186, -0.0004117174830753356, -0.0003538699238561094, -0.00029602236463688314, -0.0002381748054176569, -0.00018032724619843066, -0.00012247968697920442, -6.463212775997818e-05, -6.784568540751934e-06, 5.106299067847431e-05, 0.00010891054989770055, 0.0001667581091169268, 0.00022460566833615303, 0.00028245322755537927, 0.0003403007867746055, 0.00039814834599383175, 0.000455995905213058, 0.0005138434935361147, 0.0005716910236515105, 0.0006295385537669063, 0.000687386142089963, 0.0007452337304130197, 0.0008030812605284154, 0.0008609287906438112, 0.0009187763789668679, 0.0009766239672899246, 0.0010344714391976595, 0.0010923190275207162, 0.0011501666158437729, 0.0012080142041668296, 0.0012658617924898863, 0.0013237092643976212, 0.0013815568527206779, 0.0014394044410437346, 0.0014972519129514694, 0.0015550995012745261, 0.0016129470895975828, 0.0016707946779206395, 0.0017286422662436962, 0.001786489738151431, 0.0018443373264744878, 0.0019021849147975445, 0.0019600323867052794, 0.002017880091443658, 0.0020757275633513927]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 11.0, 3.0, 5.0, 8.0, 7.0, 13.0, 12.0, 12.0, 16.0, 23.0, 21.0, 28.0, 19.0, 28.0, 34.0, 19.0, 30.0, 42.0, 26.0, 36.0, 34.0, 48.0, 48.0, 28.0, 40.0, 38.0, 40.0, 29.0, 41.0, 36.0, 35.0, 16.0, 21.0, 30.0, 15.0, 23.0, 25.0, 8.0, 9.0, 9.0, 10.0, 7.0, 7.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010892567224800587, -0.0010554756736382842, -0.001021694508381188, -0.0009879134595394135, -0.0009541322942823172, -0.0009203512454405427, -0.0008865701383911073, -0.0008527890313416719, -0.0008190079242922366, -0.0007852268172428012, -0.0007514457101933658, -0.0007176646031439304, -0.000683883554302156, -0.0006501023890450597, -0.0006163213402032852, -0.0005825402331538498, -0.0005487591261044145, -0.0005149780190549791, -0.0004811969120055437, -0.0004474158340599388, -0.0004136347270105034, -0.00037985361996106803, -0.0003460725420154631, -0.00031229143496602774, -0.00027851032791659236, -0.000244729220867157, -0.00021094812836963683, -0.00017716703587211668, -0.0001433859288226813, -0.00010960482177324593, -7.582372927572578e-05, -4.204263677820563e-05, -8.261529728770256e-06, 2.5519570044707507e-05, 5.930066981818527e-05, 9.308176959166303e-05, 0.0001268628693651408, 0.00016064397641457617, 0.00019442506891209632, 0.00022820616140961647, 0.00026198726845905185, 0.0002957683755084872, 0.0003295494825579226, 0.0003633305605035275, 0.0003971116675529629, 0.0004308927746023983, 0.0004646738525480032, 0.0004984549595974386, 0.000532236066646874, 0.0005660171736963093, 0.0005997982807457447, 0.0006335793877951801, 0.0006673604948446155, 0.0007011415436863899, 0.0007349226507358253, 0.0007687037577852607, 0.0008024848648346961, 0.0008362659718841314, 0.0008700470789335668, 0.0009038281859830022, 0.0009376092348247766, 0.0009713904000818729, 0.0010051714489236474, 0.0010389524977654219, 0.0010727336630225182]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 16.0, 20.0, 32.0, 42.0, 66.0, 102.0, 145.0, 191.0, 301.0, 458.0, 719.0, 1029.0, 1553.0, 2285.0, 3520.0, 5448.0, 8385.0, 12650.0, 20363.0, 33435.0, 55931.0, 98031.0, 170118.0, 230204.0, 165415.0, 94777.0, 54669.0, 32572.0, 19873.0, 12485.0, 8079.0, 5359.0, 3411.0, 2269.0, 1500.0, 968.0, 678.0, 485.0, 319.0, 202.0, 141.0, 97.0, 61.0, 42.0, 34.0, 27.0, 16.0, 9.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0019893646240234375, -0.0019281059503555298, -0.001866847276687622, -0.0018055886030197144, -0.0017443299293518066, -0.001683071255683899, -0.0016218125820159912, -0.0015605539083480835, -0.0014992952346801758, -0.001438036561012268, -0.0013767778873443604, -0.0013155192136764526, -0.001254260540008545, -0.0011930018663406372, -0.0011317431926727295, -0.0010704845190048218, -0.001009225845336914, -0.0009479671716690063, -0.0008867084980010986, -0.0008254498243331909, -0.0007641911506652832, -0.0007029324769973755, -0.0006416738033294678, -0.0005804151296615601, -0.0005191564559936523, -0.00045789778232574463, -0.0003966391086578369, -0.0003353804349899292, -0.0002741217613220215, -0.00021286308765411377, -0.00015160441398620605, -9.034574031829834e-05, -2.9087066650390625e-05, 3.217160701751709e-05, 9.34302806854248e-05, 0.00015468895435333252, 0.00021594762802124023, 0.00027720630168914795, 0.00033846497535705566, 0.0003997236490249634, 0.0004609823226928711, 0.0005222409963607788, 0.0005834996700286865, 0.0006447583436965942, 0.000706017017364502, 0.0007672756910324097, 0.0008285343647003174, 0.0008897930383682251, 0.0009510517120361328, 0.0010123103857040405, 0.0010735690593719482, 0.001134827733039856, 0.0011960864067077637, 0.0012573450803756714, 0.001318603754043579, 0.0013798624277114868, 0.0014411211013793945, 0.0015023797750473022, 0.00156363844871521, 0.0016248971223831177, 0.0016861557960510254, 0.001747414469718933, 0.0018086731433868408, 0.0018699318170547485, 0.0019311904907226562]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 7.0, 5.0, 15.0, 13.0, 17.0, 8.0, 16.0, 20.0, 29.0, 13.0, 25.0, 26.0, 31.0, 27.0, 43.0, 34.0, 30.0, 41.0, 41.0, 37.0, 54.0, 33.0, 38.0, 28.0, 33.0, 25.0, 40.0, 27.0, 31.0, 26.0, 29.0, 23.0, 19.0, 15.0, 24.0, 14.0, 6.0, 9.0, 9.0, 9.0, 5.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007987022399902344, -0.0007727816700935364, -0.0007468611001968384, -0.0007209405303001404, -0.0006950199604034424, -0.0006690993905067444, -0.0006431788206100464, -0.0006172582507133484, -0.0005913376808166504, -0.0005654171109199524, -0.0005394965410232544, -0.0005135759711265564, -0.0004876554012298584, -0.0004617348313331604, -0.0004358142614364624, -0.0004098936915397644, -0.0003839731216430664, -0.0003580525517463684, -0.0003321319818496704, -0.0003062114119529724, -0.0002802908420562744, -0.0002543702721595764, -0.00022844970226287842, -0.00020252913236618042, -0.00017660856246948242, -0.00015068799257278442, -0.00012476742267608643, -9.884685277938843e-05, -7.292628288269043e-05, -4.700571298599243e-05, -2.1085143089294434e-05, 4.8354268074035645e-06, 3.075599670410156e-05, 5.667656660079956e-05, 8.259713649749756e-05, 0.00010851770639419556, 0.00013443827629089355, 0.00016035884618759155, 0.00018627941608428955, 0.00021219998598098755, 0.00023812055587768555, 0.00026404112577438354, 0.00028996169567108154, 0.00031588226556777954, 0.00034180283546447754, 0.00036772340536117554, 0.00039364397525787354, 0.00041956454515457153, 0.00044548511505126953, 0.00047140568494796753, 0.0004973262548446655, 0.0005232468247413635, 0.0005491673946380615, 0.0005750879645347595, 0.0006010085344314575, 0.0006269291043281555, 0.0006528496742248535, 0.0006787702441215515, 0.0007046908140182495, 0.0007306113839149475, 0.0007565319538116455, 0.0007824525237083435, 0.0008083730936050415, 0.0008342936635017395, 0.0008602142333984375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 5.0, 10.0, 8.0, 12.0, 20.0, 35.0, 34.0, 67.0, 83.0, 125.0, 196.0, 291.0, 432.0, 595.0, 845.0, 1374.0, 2012.0, 2994.0, 4337.0, 6379.0, 9489.0, 14294.0, 21572.0, 32192.0, 49954.0, 80213.0, 130017.0, 192299.0, 179009.0, 115637.0, 71225.0, 44563.0, 28957.0, 19378.0, 13153.0, 8817.0, 5765.0, 3916.0, 2702.0, 1804.0, 1160.0, 793.0, 562.0, 405.0, 290.0, 175.0, 132.0, 77.0, 57.0, 36.0, 30.0, 17.0, 7.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00144195556640625, -0.0013952553272247314, -0.0013485550880432129, -0.0013018548488616943, -0.0012551546096801758, -0.0012084543704986572, -0.0011617541313171387, -0.0011150538921356201, -0.0010683536529541016, -0.001021653413772583, -0.0009749531745910645, -0.0009282529354095459, -0.0008815526962280273, -0.0008348524570465088, -0.0007881522178649902, -0.0007414519786834717, -0.0006947517395019531, -0.0006480515003204346, -0.000601351261138916, -0.0005546510219573975, -0.0005079507827758789, -0.00046125054359436035, -0.0004145503044128418, -0.00036785006523132324, -0.0003211498260498047, -0.00027444958686828613, -0.00022774934768676758, -0.00018104910850524902, -0.00013434886932373047, -8.764863014221191e-05, -4.094839096069336e-05, 5.751848220825195e-06, 5.245208740234375e-05, 9.91523265838623e-05, 0.00014585256576538086, 0.00019255280494689941, 0.00023925304412841797, 0.0002859532833099365, 0.0003326535224914551, 0.00037935376167297363, 0.0004260540008544922, 0.00047275424003601074, 0.0005194544792175293, 0.0005661547183990479, 0.0006128549575805664, 0.000659555196762085, 0.0007062554359436035, 0.0007529556751251221, 0.0007996559143066406, 0.0008463561534881592, 0.0008930563926696777, 0.0009397566318511963, 0.0009864568710327148, 0.0010331571102142334, 0.001079857349395752, 0.0011265575885772705, 0.001173257827758789, 0.0012199580669403076, 0.0012666583061218262, 0.0013133585453033447, 0.0013600587844848633, 0.0014067590236663818, 0.0014534592628479004, 0.001500159502029419, 0.0015468597412109375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 4.0, 10.0, 6.0, 8.0, 11.0, 14.0, 19.0, 22.0, 20.0, 32.0, 34.0, 34.0, 37.0, 31.0, 34.0, 36.0, 32.0, 32.0, 41.0, 32.0, 48.0, 37.0, 43.0, 40.0, 29.0, 32.0, 25.0, 26.0, 32.0, 32.0, 20.0, 21.0, 16.0, 21.0, 26.0, 10.0, 8.0, 10.0, 5.0, 3.0, 3.0, 6.0, 1.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00048470497131347656, -0.0004676990211009979, -0.0004506930708885193, -0.00043368712067604065, -0.000416681170463562, -0.0003996752202510834, -0.00038266927003860474, -0.0003656633198261261, -0.00034865736961364746, -0.0003316514194011688, -0.0003146454691886902, -0.00029763951897621155, -0.0002806335687637329, -0.00026362761855125427, -0.00024662166833877563, -0.000229615718126297, -0.00021260976791381836, -0.00019560381770133972, -0.00017859786748886108, -0.00016159191727638245, -0.0001445859670639038, -0.00012758001685142517, -0.00011057406663894653, -9.35681164264679e-05, -7.656216621398926e-05, -5.955621600151062e-05, -4.255026578903198e-05, -2.5544315576553345e-05, -8.538365364074707e-06, 8.46758484840393e-06, 2.547353506088257e-05, 4.2479485273361206e-05, 5.9485435485839844e-05, 7.649138569831848e-05, 9.349733591079712e-05, 0.00011050328612327576, 0.0001275092363357544, 0.00014451518654823303, 0.00016152113676071167, 0.0001785270869731903, 0.00019553303718566895, 0.00021253898739814758, 0.00022954493761062622, 0.00024655088782310486, 0.0002635568380355835, 0.00028056278824806213, 0.00029756873846054077, 0.0003145746886730194, 0.00033158063888549805, 0.0003485865890979767, 0.0003655925393104553, 0.00038259848952293396, 0.0003996044397354126, 0.00041661038994789124, 0.0004336163401603699, 0.0004506222903728485, 0.00046762824058532715, 0.0004846341907978058, 0.0005016401410102844, 0.0005186460912227631, 0.0005356520414352417, 0.0005526579916477203, 0.000569663941860199, 0.0005866698920726776, 0.0006036758422851562]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 7.0, 14.0, 9.0, 15.0, 21.0, 40.0, 62.0, 66.0, 104.0, 135.0, 172.0, 227.0, 344.0, 485.0, 693.0, 1013.0, 1395.0, 2071.0, 3109.0, 4524.0, 7129.0, 12028.0, 23662.0, 138347.0, 784951.0, 29439.0, 14313.0, 8110.0, 5249.0, 3232.0, 2295.0, 1571.0, 1077.0, 745.0, 542.0, 388.0, 264.0, 196.0, 131.0, 77.0, 76.0, 57.0, 37.0, 37.0, 23.0, 18.0, 12.0, 10.0, 5.0, 1.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.00023508071899414062, -0.00022776424884796143, -0.00022044777870178223, -0.00021313130855560303, -0.00020581483840942383, -0.00019849836826324463, -0.00019118189811706543, -0.00018386542797088623, -0.00017654895782470703, -0.00016923248767852783, -0.00016191601753234863, -0.00015459954738616943, -0.00014728307723999023, -0.00013996660709381104, -0.00013265013694763184, -0.00012533366680145264, -0.00011801719665527344, -0.00011070072650909424, -0.00010338425636291504, -9.606778621673584e-05, -8.875131607055664e-05, -8.143484592437744e-05, -7.411837577819824e-05, -6.680190563201904e-05, -5.9485435485839844e-05, -5.2168965339660645e-05, -4.4852495193481445e-05, -3.7536025047302246e-05, -3.0219554901123047e-05, -2.2903084754943848e-05, -1.558661460876465e-05, -8.27014446258545e-06, -9.5367431640625e-07, 6.362795829772949e-06, 1.3679265975952148e-05, 2.0995736122131348e-05, 2.8312206268310547e-05, 3.5628676414489746e-05, 4.2945146560668945e-05, 5.0261616706848145e-05, 5.7578086853027344e-05, 6.489455699920654e-05, 7.221102714538574e-05, 7.952749729156494e-05, 8.684396743774414e-05, 9.416043758392334e-05, 0.00010147690773010254, 0.00010879337787628174, 0.00011610984802246094, 0.00012342631816864014, 0.00013074278831481934, 0.00013805925846099854, 0.00014537572860717773, 0.00015269219875335693, 0.00016000866889953613, 0.00016732513904571533, 0.00017464160919189453, 0.00018195807933807373, 0.00018927454948425293, 0.00019659101963043213, 0.00020390748977661133, 0.00021122395992279053, 0.00021854043006896973, 0.00022585690021514893, 0.00023317337036132812]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 7.0, 8.0, 3.0, 23.0, 16.0, 17.0, 54.0, 38.0, 36.0, 44.0, 75.0, 55.0, 60.0, 50.0, 126.0, 46.0, 49.0, 93.0, 29.0, 27.0, 22.0, 41.0, 17.0, 5.0, 17.0, 12.0, 6.0, 3.0, 7.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-06, -2.3078173398971558e-06, -2.2314488887786865e-06, -2.1550804376602173e-06, -2.078711986541748e-06, -2.002343535423279e-06, -1.9259750843048096e-06, -1.8496066331863403e-06, -1.773238182067871e-06, -1.6968697309494019e-06, -1.6205012798309326e-06, -1.5441328287124634e-06, -1.4677643775939941e-06, -1.391395926475525e-06, -1.3150274753570557e-06, -1.2386590242385864e-06, -1.1622905731201172e-06, -1.085922122001648e-06, -1.0095536708831787e-06, -9.331852197647095e-07, -8.568167686462402e-07, -7.80448317527771e-07, -7.040798664093018e-07, -6.277114152908325e-07, -5.513429641723633e-07, -4.7497451305389404e-07, -3.986060619354248e-07, -3.2223761081695557e-07, -2.4586915969848633e-07, -1.695007085800171e-07, -9.313225746154785e-08, -1.6763806343078613e-08, 5.960464477539063e-08, 1.3597309589385986e-07, 2.123415470123291e-07, 2.8870999813079834e-07, 3.650784492492676e-07, 4.414469003677368e-07, 5.178153514862061e-07, 5.941838026046753e-07, 6.705522537231445e-07, 7.469207048416138e-07, 8.23289155960083e-07, 8.996576070785522e-07, 9.760260581970215e-07, 1.0523945093154907e-06, 1.12876296043396e-06, 1.2051314115524292e-06, 1.2814998626708984e-06, 1.3578683137893677e-06, 1.434236764907837e-06, 1.5106052160263062e-06, 1.5869736671447754e-06, 1.6633421182632446e-06, 1.7397105693817139e-06, 1.816079020500183e-06, 1.8924474716186523e-06, 1.9688159227371216e-06, 2.045184373855591e-06, 2.12155282497406e-06, 2.1979212760925293e-06, 2.2742897272109985e-06, 2.3506581783294678e-06, 2.427026629447937e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 8.0, 8.0, 12.0, 8.0, 26.0, 20.0, 43.0, 61.0, 81.0, 102.0, 158.0, 222.0, 322.0, 482.0, 734.0, 1091.0, 1601.0, 2287.0, 3446.0, 5253.0, 8340.0, 15281.0, 32246.0, 882928.0, 47708.0, 18380.0, 9782.0, 5835.0, 3967.0, 2596.0, 1776.0, 1181.0, 805.0, 534.0, 383.0, 246.0, 186.0, 126.0, 89.0, 59.0, 35.0, 35.0, 24.0, 10.0, 17.0, 6.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0003044605255126953, -0.0002941899001598358, -0.0002839192748069763, -0.0002736486494541168, -0.0002633780241012573, -0.00025310739874839783, -0.00024283677339553833, -0.00023256614804267883, -0.00022229552268981934, -0.00021202489733695984, -0.00020175427198410034, -0.00019148364663124084, -0.00018121302127838135, -0.00017094239592552185, -0.00016067177057266235, -0.00015040114521980286, -0.00014013051986694336, -0.00012985989451408386, -0.00011958926916122437, -0.00010931864380836487, -9.904801845550537e-05, -8.877739310264587e-05, -7.850676774978638e-05, -6.823614239692688e-05, -5.796551704406738e-05, -4.7694891691207886e-05, -3.742426633834839e-05, -2.715364098548889e-05, -1.6883015632629395e-05, -6.6123902797698975e-06, 3.6582350730895996e-06, 1.3928860425949097e-05, 2.4199485778808594e-05, 3.447011113166809e-05, 4.474073648452759e-05, 5.5011361837387085e-05, 6.528198719024658e-05, 7.555261254310608e-05, 8.582323789596558e-05, 9.609386324882507e-05, 0.00010636448860168457, 0.00011663511395454407, 0.00012690573930740356, 0.00013717636466026306, 0.00014744699001312256, 0.00015771761536598206, 0.00016798824071884155, 0.00017825886607170105, 0.00018852949142456055, 0.00019880011677742004, 0.00020907074213027954, 0.00021934136748313904, 0.00022961199283599854, 0.00023988261818885803, 0.00025015324354171753, 0.000260423868894577, 0.0002706944942474365, 0.000280965119600296, 0.0002912357449531555, 0.000301506370306015, 0.0003117769956588745, 0.000322047621011734, 0.0003323182463645935, 0.000342588871717453, 0.0003528594970703125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 6.0, 2.0, 4.0, 8.0, 9.0, 9.0, 5.0, 10.0, 21.0, 38.0, 632.0, 149.0, 10.0, 12.0, 9.0, 13.0, 10.0, 5.0, 3.0, 2.0, 2.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.147954940795898e-05, -7.85384327173233e-05, -7.559731602668762e-05, -7.265619933605194e-05, -6.971508264541626e-05, -6.677396595478058e-05, -6.38328492641449e-05, -6.0891732573509216e-05, -5.7950615882873535e-05, -5.5009499192237854e-05, -5.206838250160217e-05, -4.912726581096649e-05, -4.618614912033081e-05, -4.324503242969513e-05, -4.030391573905945e-05, -3.736279904842377e-05, -3.4421682357788086e-05, -3.1480565667152405e-05, -2.8539448976516724e-05, -2.5598332285881042e-05, -2.265721559524536e-05, -1.971609890460968e-05, -1.6774982213974e-05, -1.3833865523338318e-05, -1.0892748832702637e-05, -7.951632142066956e-06, -5.010515451431274e-06, -2.0693987607955933e-06, 8.717179298400879e-07, 3.812834620475769e-06, 6.75395131111145e-06, 9.695068001747131e-06, 1.2636184692382812e-05, 1.5577301383018494e-05, 1.8518418073654175e-05, 2.1459534764289856e-05, 2.4400651454925537e-05, 2.7341768145561218e-05, 3.02828848361969e-05, 3.322400152683258e-05, 3.616511821746826e-05, 3.910623490810394e-05, 4.2047351598739624e-05, 4.4988468289375305e-05, 4.7929584980010986e-05, 5.087070167064667e-05, 5.381181836128235e-05, 5.675293505191803e-05, 5.969405174255371e-05, 6.263516843318939e-05, 6.557628512382507e-05, 6.851740181446075e-05, 7.145851850509644e-05, 7.439963519573212e-05, 7.73407518863678e-05, 8.028186857700348e-05, 8.322298526763916e-05, 8.616410195827484e-05, 8.910521864891052e-05, 9.20463353395462e-05, 9.498745203018188e-05, 9.792856872081757e-05, 0.00010086968541145325, 0.00010381080210208893, 0.00010675191879272461]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 4.0, 6.0, 4.0, 11.0, 17.0, 9.0, 12.0, 18.0, 16.0, 34.0, 44.0, 38.0, 46.0, 100.0, 109.0, 108.0, 98.0, 87.0, 53.0, 44.0, 34.0, 29.0, 19.0, 8.0, 12.0, 6.0, 10.0, 5.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015584576176479459, -0.0015129238599911332, -0.0014673902187496424, -0.0014218564610928297, -0.001376322703436017, -0.0013307890621945262, -0.0012852553045377135, -0.0012397216632962227, -0.00119418790563941, -0.0011486541479825974, -0.0011031205067411065, -0.0010575867490842938, -0.0010120529914274812, -0.0009665193501859903, -0.0009209855925291777, -0.0008754518930800259, -0.0008299181354232132, -0.0007843844359740615, -0.0007388506783172488, -0.0006933169788680971, -0.0006477832794189453, -0.0006022495217621326, -0.0005567158223129809, -0.0005111821228638291, -0.0004656483943108469, -0.0004201146657578647, -0.00037458096630871296, -0.00032904723775573075, -0.00028351350920274854, -0.00023797980975359678, -0.00019244608120061457, -0.00014691238175146282, -0.0001013786531984806, -5.5844935559434816e-05, -1.0311217920389026e-05, 3.522250335663557e-05, 8.075621735770255e-05, 0.00012628993135876954, 0.00017182365991175175, 0.0002173573593609035, 0.0002628910879138857, 0.0003084248164668679, 0.0003539585159160197, 0.0003994922444690019, 0.0004450259730219841, 0.0004905596724711359, 0.0005360933719202876, 0.0005816271295771003, 0.000627160829026252, 0.0006726945284754038, 0.0007182282861322165, 0.0007637619855813682, 0.00080929568503052, 0.0008548294426873326, 0.0009003631421364844, 0.0009458968415856361, 0.0009914305992424488, 0.0010369643568992615, 0.0010824979981407523, 0.001128031755797565, 0.0011735655134543777, 0.0012190991546958685, 0.0012646329123526812, 0.0013101666700094938, 0.0013557003112509847]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 6.0, 7.0, 7.0, 9.0, 9.0, 10.0, 14.0, 22.0, 13.0, 18.0, 21.0, 19.0, 34.0, 29.0, 42.0, 33.0, 37.0, 32.0, 31.0, 45.0, 33.0, 51.0, 34.0, 38.0, 32.0, 42.0, 36.0, 29.0, 39.0, 39.0, 33.0, 21.0, 18.0, 24.0, 12.0, 11.0, 15.0, 13.0, 6.0, 9.0, 8.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000905559107195586, -0.0008773088338784873, -0.0008490585605613887, -0.0008208082872442901, -0.0007925580721348524, -0.0007643077988177538, -0.0007360575255006552, -0.0007078072521835566, -0.0006795569788664579, -0.0006513067055493593, -0.0006230564322322607, -0.0005948061589151621, -0.0005665558855980635, -0.0005383056122809649, -0.0005100553971715271, -0.00048180512385442853, -0.0004535548505373299, -0.0004253045772202313, -0.0003970543039031327, -0.0003688040596898645, -0.0003405537863727659, -0.0003123035130556673, -0.0002840532688423991, -0.0002558029955253005, -0.00022755272220820189, -0.00019930244889110327, -0.00017105219012591988, -0.0001428019313607365, -0.00011455165804363787, -8.630138472653925e-05, -5.8051125961355865e-05, -2.9800867196172476e-05, -1.5505938790738583e-06, 2.6699672162067145e-05, 5.494993820320815e-05, 8.320020424434915e-05, 0.00011145047028549016, 0.00013970074360258877, 0.00016795100236777216, 0.00019620126113295555, 0.00022445153445005417, 0.0002527018077671528, 0.0002809520810842514, 0.00030920232529751956, 0.0003374525986146182, 0.0003657028719317168, 0.00039395311614498496, 0.0004222033894620836, 0.0004504536627791822, 0.0004787039360962808, 0.0005069542094133794, 0.000535204482730478, 0.0005634546978399158, 0.0005917049711570144, 0.000619955244474113, 0.0006482055177912116, 0.0006764557911083102, 0.0007047060644254088, 0.0007329563377425075, 0.0007612066110596061, 0.0007894568843767047, 0.0008177071576938033, 0.000845957372803241, 0.0008742076461203396, 0.0009024579194374382]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 5.0, 11.0, 20.0, 25.0, 44.0, 46.0, 71.0, 117.0, 174.0, 258.0, 400.0, 575.0, 923.0, 1323.0, 2072.0, 3168.0, 5105.0, 8172.0, 13380.0, 22299.0, 37829.0, 67779.0, 128501.0, 278962.0, 829547.0, 1669209.0, 628268.0, 236266.0, 113571.0, 60099.0, 33571.0, 19744.0, 12011.0, 7467.0, 4594.0, 2982.0, 1933.0, 1340.0, 822.0, 513.0, 375.0, 253.0, 155.0, 103.0, 70.0, 47.0, 31.0, 13.0, 15.0, 12.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0012884140014648438, -0.0012498199939727783, -0.0012112259864807129, -0.0011726319789886475, -0.001134037971496582, -0.0010954439640045166, -0.0010568499565124512, -0.0010182559490203857, -0.0009796619415283203, -0.0009410679340362549, -0.0009024739265441895, -0.000863879919052124, -0.0008252859115600586, -0.0007866919040679932, -0.0007480978965759277, -0.0007095038890838623, -0.0006709098815917969, -0.0006323158740997314, -0.000593721866607666, -0.0005551278591156006, -0.0005165338516235352, -0.0004779398441314697, -0.0004393458366394043, -0.00040075182914733887, -0.00036215782165527344, -0.000323563814163208, -0.0002849698066711426, -0.00024637579917907715, -0.00020778179168701172, -0.0001691877841949463, -0.00013059377670288086, -9.199976921081543e-05, -5.340576171875e-05, -1.481175422668457e-05, 2.378225326538086e-05, 6.237626075744629e-05, 0.00010097026824951172, 0.00013956427574157715, 0.00017815828323364258, 0.000216752290725708, 0.00025534629821777344, 0.00029394030570983887, 0.0003325343132019043, 0.0003711283206939697, 0.00040972232818603516, 0.0004483163356781006, 0.000486910343170166, 0.0005255043506622314, 0.0005640983581542969, 0.0006026923656463623, 0.0006412863731384277, 0.0006798803806304932, 0.0007184743881225586, 0.000757068395614624, 0.0007956624031066895, 0.0008342564105987549, 0.0008728504180908203, 0.0009114444255828857, 0.0009500384330749512, 0.0009886324405670166, 0.001027226448059082, 0.0010658204555511475, 0.0011044144630432129, 0.0011430084705352783, 0.0011816024780273438]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 3.0, 6.0, 5.0, 6.0, 3.0, 10.0, 15.0, 14.0, 11.0, 16.0, 24.0, 14.0, 18.0, 24.0, 25.0, 28.0, 30.0, 30.0, 34.0, 29.0, 37.0, 29.0, 49.0, 34.0, 38.0, 35.0, 18.0, 36.0, 51.0, 41.0, 24.0, 35.0, 29.0, 27.0, 19.0, 23.0, 10.0, 20.0, 16.0, 12.0, 10.0, 11.0, 7.0, 10.0, 4.0, 6.0, 9.0, 2.0, 0.0, 3.0, 5.0, 3.0, 2.0, 4.0], "bins": [-0.0005316734313964844, -0.0005159229040145874, -0.0005001723766326904, -0.00048442184925079346, -0.0004686713218688965, -0.0004529207944869995, -0.00043717026710510254, -0.00042141973972320557, -0.0004056692123413086, -0.0003899186849594116, -0.00037416815757751465, -0.0003584176301956177, -0.0003426671028137207, -0.00032691657543182373, -0.00031116604804992676, -0.0002954155206680298, -0.0002796649932861328, -0.00026391446590423584, -0.00024816393852233887, -0.0002324134111404419, -0.00021666288375854492, -0.00020091235637664795, -0.00018516182899475098, -0.000169411301612854, -0.00015366077423095703, -0.00013791024684906006, -0.00012215971946716309, -0.00010640919208526611, -9.065866470336914e-05, -7.490813732147217e-05, -5.9157609939575195e-05, -4.340708255767822e-05, -2.765655517578125e-05, -1.1906027793884277e-05, 3.844499588012695e-06, 1.9595026969909668e-05, 3.534555435180664e-05, 5.109608173370361e-05, 6.684660911560059e-05, 8.259713649749756e-05, 9.834766387939453e-05, 0.0001140981912612915, 0.00012984871864318848, 0.00014559924602508545, 0.00016134977340698242, 0.0001771003007888794, 0.00019285082817077637, 0.00020860135555267334, 0.0002243518829345703, 0.00024010241031646729, 0.00025585293769836426, 0.00027160346508026123, 0.0002873539924621582, 0.0003031045198440552, 0.00031885504722595215, 0.0003346055746078491, 0.0003503561019897461, 0.00036610662937164307, 0.00038185715675354004, 0.000397607684135437, 0.000413358211517334, 0.00042910873889923096, 0.00044485926628112793, 0.0004606097936630249, 0.0004763603210449219]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 8.0, 4.0, 2.0, 3.0, 14.0, 11.0, 20.0, 34.0, 41.0, 83.0, 110.0, 192.0, 297.0, 484.0, 735.0, 1186.0, 2019.0, 3106.0, 5421.0, 9191.0, 15936.0, 27947.0, 50469.0, 93098.0, 183016.0, 398642.0, 1017669.0, 1348534.0, 539505.0, 236587.0, 117092.0, 61745.0, 34214.0, 19301.0, 11012.0, 6543.0, 3939.0, 2288.0, 1433.0, 870.0, 567.0, 336.0, 198.0, 141.0, 98.0, 51.0, 37.0, 26.0, 11.0, 8.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00098419189453125, -0.0009515732526779175, -0.000918954610824585, -0.0008863359689712524, -0.0008537173271179199, -0.0008210986852645874, -0.0007884800434112549, -0.0007558614015579224, -0.0007232427597045898, -0.0006906241178512573, -0.0006580054759979248, -0.0006253868341445923, -0.0005927681922912598, -0.0005601495504379272, -0.0005275309085845947, -0.0004949122667312622, -0.0004622936248779297, -0.00042967498302459717, -0.00039705634117126465, -0.00036443769931793213, -0.0003318190574645996, -0.0002992004156112671, -0.00026658177375793457, -0.00023396313190460205, -0.00020134449005126953, -0.000168725848197937, -0.0001361072063446045, -0.00010348856449127197, -7.086992263793945e-05, -3.8251280784606934e-05, -5.632638931274414e-06, 2.6986002922058105e-05, 5.9604644775390625e-05, 9.222328662872314e-05, 0.00012484192848205566, 0.00015746057033538818, 0.0001900792121887207, 0.00022269785404205322, 0.00025531649589538574, 0.00028793513774871826, 0.0003205537796020508, 0.0003531724214553833, 0.0003857910633087158, 0.00041840970516204834, 0.00045102834701538086, 0.0004836469888687134, 0.0005162656307220459, 0.0005488842725753784, 0.0005815029144287109, 0.0006141215562820435, 0.000646740198135376, 0.0006793588399887085, 0.000711977481842041, 0.0007445961236953735, 0.0007772147655487061, 0.0008098334074020386, 0.0008424520492553711, 0.0008750706911087036, 0.0009076893329620361, 0.0009403079748153687, 0.0009729266166687012, 0.0010055452585220337, 0.0010381639003753662, 0.0010707825422286987, 0.0011034011840820312]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 10.0, 5.0, 10.0, 19.0, 25.0, 36.0, 32.0, 42.0, 58.0, 66.0, 90.0, 85.0, 116.0, 156.0, 176.0, 188.0, 253.0, 261.0, 264.0, 281.0, 281.0, 256.0, 218.0, 203.0, 188.0, 141.0, 130.0, 106.0, 105.0, 68.0, 45.0, 47.0, 23.0, 27.0, 19.0, 12.0, 4.0, 12.0, 3.0, 7.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028634071350097656, -0.0002759285271167755, -0.00026551634073257446, -0.0002551041543483734, -0.00024469196796417236, -0.0002342797815799713, -0.00022386759519577026, -0.00021345540881156921, -0.00020304322242736816, -0.00019263103604316711, -0.00018221884965896606, -0.00017180666327476501, -0.00016139447689056396, -0.00015098229050636292, -0.00014057010412216187, -0.00013015791773796082, -0.00011974573135375977, -0.00010933354496955872, -9.892135858535767e-05, -8.850917220115662e-05, -7.809698581695557e-05, -6.768479943275452e-05, -5.727261304855347e-05, -4.686042666435242e-05, -3.644824028015137e-05, -2.6036053895950317e-05, -1.5623867511749268e-05, -5.211681127548218e-06, 5.200505256652832e-06, 1.5612691640853882e-05, 2.602487802505493e-05, 3.643706440925598e-05, 4.684925079345703e-05, 5.726143717765808e-05, 6.767362356185913e-05, 7.808580994606018e-05, 8.849799633026123e-05, 9.891018271446228e-05, 0.00010932236909866333, 0.00011973455548286438, 0.00013014674186706543, 0.00014055892825126648, 0.00015097111463546753, 0.00016138330101966858, 0.00017179548740386963, 0.00018220767378807068, 0.00019261986017227173, 0.00020303204655647278, 0.00021344423294067383, 0.00022385641932487488, 0.00023426860570907593, 0.000244680792093277, 0.00025509297847747803, 0.0002655051648616791, 0.0002759173512458801, 0.0002863295376300812, 0.0002967417240142822, 0.0003071539103984833, 0.0003175660967826843, 0.0003279782831668854, 0.0003383904695510864, 0.0003488026559352875, 0.0003592148423194885, 0.0003696270287036896, 0.0003800392150878906]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 8.0, 19.0, 23.0, 16.0, 34.0, 38.0, 60.0, 77.0, 100.0, 139.0, 118.0, 87.0, 88.0, 55.0, 43.0, 22.0, 13.0, 11.0, 10.0, 11.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012677049962803721, -0.001231212168931961, -0.00119471934158355, -0.001158226397819817, -0.001121733570471406, -0.001085240743122995, -0.0010487479157745838, -0.0010122550884261727, -0.0009757622028701007, -0.0009392693755216897, -0.0009027764899656177, -0.0008662836626172066, -0.0008297908352687955, -0.0007932979497127235, -0.0007568051223643124, -0.0007203122368082404, -0.0006838194094598293, -0.0006473265821114182, -0.0006108336965553463, -0.0005743408692069352, -0.0005378479836508632, -0.0005013551563024521, -0.000464862328954041, -0.00042836947250179946, -0.0003918766160495579, -0.0003553837595973164, -0.00031889090314507484, -0.00028239807579666376, -0.0002459052193444222, -0.00020941236289218068, -0.00017291952099185437, -0.00013642667909152806, -9.993370622396469e-05, -6.344085704768077e-05, -2.694800787139684e-05, 9.544841304887086e-06, 4.603769048117101e-05, 8.253054693341255e-05, 0.00011902338883373886, 0.00015551623073406518, 0.00019200908718630672, 0.00022850194363854825, 0.0002649948000907898, 0.0003014876274392009, 0.0003379804838914424, 0.00037447334034368396, 0.00041096616769209504, 0.0004474590241443366, 0.0004839518805965781, 0.0005204447079449892, 0.0005569375935010612, 0.0005934304208494723, 0.0006299233064055443, 0.0006664161337539554, 0.0007029089611023664, 0.0007394017884507775, 0.0007758946740068495, 0.0008123875013552606, 0.0008488803869113326, 0.0008853732142597437, 0.0009218660416081548, 0.0009583589271642268, 0.0009948518127202988, 0.0010313446400687099, 0.001067837467417121]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 2.0, 4.0, 11.0, 15.0, 12.0, 13.0, 13.0, 25.0, 29.0, 20.0, 29.0, 25.0, 25.0, 31.0, 29.0, 48.0, 16.0, 36.0, 38.0, 36.0, 44.0, 32.0, 45.0, 33.0, 33.0, 39.0, 29.0, 25.0, 33.0, 27.0, 22.0, 33.0, 23.0, 16.0, 15.0, 14.0, 19.0, 11.0, 6.0, 6.0, 8.0, 10.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.0006234552711248398, -0.0006053918041288853, -0.0005873283371329308, -0.0005692648701369762, -0.0005512014031410217, -0.0005331379943527281, -0.0005150745273567736, -0.0004970110603608191, -0.0004789475933648646, -0.0004608841263689101, -0.00044282065937295556, -0.0004247572214808315, -0.000406693754484877, -0.0003886302874889225, -0.0003705668495967984, -0.0003525033826008439, -0.0003344399156048894, -0.0003163764486089349, -0.00029831298161298037, -0.0002802495437208563, -0.0002621860767249018, -0.00024412260972894728, -0.000226059157284908, -0.0002079957048408687, -0.0001899322378449142, -0.00017186877084895968, -0.0001538053184049204, -0.00013574186596088111, -0.0001176783989649266, -9.96149392449297e-05, -8.15514795249328e-05, -6.348802708089352e-05, -4.5424560084939e-05, -2.7361100364942104e-05, -9.297640644945204e-06, 8.765819075051695e-06, 2.6829278795048594e-05, 4.4892738515045494e-05, 6.295619823504239e-05, 8.101965067908168e-05, 9.908311767503619e-05, 0.00011714657739503309, 0.00013521003711503, 0.00015327348955906928, 0.0001713369565550238, 0.0001894004235509783, 0.0002074638759950176, 0.00022552732843905687, 0.0002435907954350114, 0.0002616542624309659, 0.0002797177294269204, 0.00029778116731904447, 0.000315844634314999, 0.0003339081013109535, 0.00035197153920307755, 0.00037003500619903207, 0.0003880984731949866, 0.0004061619401909411, 0.0004242254071868956, 0.00044228884507901967, 0.0004603523120749742, 0.0004784157790709287, 0.0004964792169630527, 0.0005145426839590073, 0.0005326061509549618]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 8.0, 5.0, 12.0, 15.0, 25.0, 44.0, 70.0, 115.0, 177.0, 258.0, 387.0, 560.0, 940.0, 1483.0, 2347.0, 3957.0, 6652.0, 11535.0, 19886.0, 36821.0, 69033.0, 132243.0, 239451.0, 237772.0, 131146.0, 68868.0, 36628.0, 19728.0, 11421.0, 6669.0, 3939.0, 2311.0, 1462.0, 857.0, 600.0, 411.0, 254.0, 149.0, 115.0, 75.0, 45.0, 31.0, 13.0, 13.0, 9.0, 13.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012025833129882812, -0.0011661350727081299, -0.0011296868324279785, -0.0010932385921478271, -0.0010567903518676758, -0.0010203421115875244, -0.000983893871307373, -0.0009474456310272217, -0.0009109973907470703, -0.0008745491504669189, -0.0008381009101867676, -0.0008016526699066162, -0.0007652044296264648, -0.0007287561893463135, -0.0006923079490661621, -0.0006558597087860107, -0.0006194114685058594, -0.000582963228225708, -0.0005465149879455566, -0.0005100667476654053, -0.0004736185073852539, -0.00043717026710510254, -0.00040072202682495117, -0.0003642737865447998, -0.00032782554626464844, -0.00029137730598449707, -0.0002549290657043457, -0.00021848082542419434, -0.00018203258514404297, -0.0001455843448638916, -0.00010913610458374023, -7.268786430358887e-05, -3.62396240234375e-05, 2.086162567138672e-07, 3.6656856536865234e-05, 7.31050968170166e-05, 0.00010955333709716797, 0.00014600157737731934, 0.0001824498176574707, 0.00021889805793762207, 0.00025534629821777344, 0.0002917945384979248, 0.00032824277877807617, 0.00036469101905822754, 0.0004011392593383789, 0.0004375874996185303, 0.00047403573989868164, 0.000510483980178833, 0.0005469322204589844, 0.0005833804607391357, 0.0006198287010192871, 0.0006562769412994385, 0.0006927251815795898, 0.0007291734218597412, 0.0007656216621398926, 0.0008020699024200439, 0.0008385181427001953, 0.0008749663829803467, 0.000911414623260498, 0.0009478628635406494, 0.0009843111038208008, 0.0010207593441009521, 0.0010572075843811035, 0.0010936558246612549, 0.0011301040649414062]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 16.0, 8.0, 17.0, 16.0, 19.0, 17.0, 24.0, 15.0, 28.0, 30.0, 31.0, 31.0, 41.0, 34.0, 36.0, 37.0, 37.0, 45.0, 39.0, 29.0, 51.0, 54.0, 40.0, 19.0, 39.0, 42.0, 24.0, 22.0, 22.0, 26.0, 17.0, 18.0, 13.0, 11.0, 5.0, 5.0, 6.0, 7.0, 10.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0005669593811035156, -0.0005502030253410339, -0.0005334466695785522, -0.0005166903138160706, -0.0004999339580535889, -0.0004831776022911072, -0.0004664212465286255, -0.0004496648907661438, -0.0004329085350036621, -0.0004161521792411804, -0.00039939582347869873, -0.00038263946771621704, -0.00036588311195373535, -0.00034912675619125366, -0.00033237040042877197, -0.0003156140446662903, -0.0002988576889038086, -0.0002821013331413269, -0.0002653449773788452, -0.0002485886216163635, -0.00023183226585388184, -0.00021507591009140015, -0.00019831955432891846, -0.00018156319856643677, -0.00016480684280395508, -0.0001480504870414734, -0.0001312941312789917, -0.00011453777551651001, -9.778141975402832e-05, -8.102506399154663e-05, -6.426870822906494e-05, -4.751235246658325e-05, -3.075599670410156e-05, -1.3999640941619873e-05, 2.7567148208618164e-06, 1.9513070583343506e-05, 3.6269426345825195e-05, 5.3025782108306885e-05, 6.978213787078857e-05, 8.653849363327026e-05, 0.00010329484939575195, 0.00012005120515823364, 0.00013680756092071533, 0.00015356391668319702, 0.0001703202724456787, 0.0001870766282081604, 0.0002038329839706421, 0.00022058933973312378, 0.00023734569549560547, 0.00025410205125808716, 0.00027085840702056885, 0.00028761476278305054, 0.0003043711185455322, 0.0003211274743080139, 0.0003378838300704956, 0.0003546401858329773, 0.000371396541595459, 0.0003881528973579407, 0.00040490925312042236, 0.00042166560888290405, 0.00043842196464538574, 0.00045517832040786743, 0.0004719346761703491, 0.0004886910319328308, 0.0005054473876953125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 5.0, 4.0, 14.0, 18.0, 21.0, 30.0, 49.0, 60.0, 121.0, 141.0, 242.0, 366.0, 507.0, 773.0, 1120.0, 1774.0, 2771.0, 4480.0, 7671.0, 14178.0, 30532.0, 86351.0, 388288.0, 363390.0, 82383.0, 29523.0, 14124.0, 7352.0, 4413.0, 2714.0, 1750.0, 1062.0, 742.0, 487.0, 335.0, 245.0, 160.0, 112.0, 74.0, 59.0, 26.0, 17.0, 13.0, 18.0, 8.0, 1.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0015764236450195312, -0.0015255361795425415, -0.0014746487140655518, -0.001423761248588562, -0.0013728737831115723, -0.0013219863176345825, -0.0012710988521575928, -0.001220211386680603, -0.0011693239212036133, -0.0011184364557266235, -0.0010675489902496338, -0.001016661524772644, -0.0009657740592956543, -0.0009148865938186646, -0.0008639991283416748, -0.0008131116628646851, -0.0007622241973876953, -0.0007113367319107056, -0.0006604492664337158, -0.0006095618009567261, -0.0005586743354797363, -0.0005077868700027466, -0.00045689940452575684, -0.0004060119390487671, -0.00035512447357177734, -0.0003042370080947876, -0.00025334954261779785, -0.0002024620771408081, -0.00015157461166381836, -0.00010068714618682861, -4.979968070983887e-05, 1.087784767150879e-06, 5.1975250244140625e-05, 0.00010286271572113037, 0.00015375018119812012, 0.00020463764667510986, 0.0002555251121520996, 0.00030641257762908936, 0.0003573000431060791, 0.00040818750858306885, 0.0004590749740600586, 0.0005099624395370483, 0.0005608499050140381, 0.0006117373704910278, 0.0006626248359680176, 0.0007135123014450073, 0.0007643997669219971, 0.0008152872323989868, 0.0008661746978759766, 0.0009170621633529663, 0.0009679496288299561, 0.0010188370943069458, 0.0010697245597839355, 0.0011206120252609253, 0.001171499490737915, 0.0012223869562149048, 0.0012732744216918945, 0.0013241618871688843, 0.001375049352645874, 0.0014259368181228638, 0.0014768242835998535, 0.0015277117490768433, 0.001578599214553833, 0.0016294866800308228, 0.0016803741455078125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 9.0, 5.0, 8.0, 10.0, 10.0, 20.0, 17.0, 22.0, 19.0, 29.0, 18.0, 28.0, 18.0, 31.0, 28.0, 37.0, 38.0, 38.0, 44.0, 38.0, 45.0, 39.0, 38.0, 34.0, 46.0, 46.0, 40.0, 35.0, 25.0, 16.0, 26.0, 26.0, 17.0, 15.0, 17.0, 12.0, 9.0, 7.0, 7.0, 8.0, 3.0, 2.0, 3.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0003409385681152344, -0.0003301352262496948, -0.0003193318843841553, -0.0003085285425186157, -0.00029772520065307617, -0.0002869218587875366, -0.00027611851692199707, -0.0002653151750564575, -0.00025451183319091797, -0.00024370849132537842, -0.00023290514945983887, -0.00022210180759429932, -0.00021129846572875977, -0.00020049512386322021, -0.00018969178199768066, -0.0001788884401321411, -0.00016808509826660156, -0.000157281756401062, -0.00014647841453552246, -0.0001356750726699829, -0.00012487173080444336, -0.00011406838893890381, -0.00010326504707336426, -9.246170520782471e-05, -8.165836334228516e-05, -7.08550214767456e-05, -6.0051679611206055e-05, -4.9248337745666504e-05, -3.844499588012695e-05, -2.7641654014587402e-05, -1.683831214904785e-05, -6.034970283508301e-06, 4.76837158203125e-06, 1.55717134475708e-05, 2.637505531311035e-05, 3.71783971786499e-05, 4.798173904418945e-05, 5.8785080909729004e-05, 6.958842277526855e-05, 8.03917646408081e-05, 9.119510650634766e-05, 0.00010199844837188721, 0.00011280179023742676, 0.0001236051321029663, 0.00013440847396850586, 0.0001452118158340454, 0.00015601515769958496, 0.0001668184995651245, 0.00017762184143066406, 0.0001884251832962036, 0.00019922852516174316, 0.00021003186702728271, 0.00022083520889282227, 0.00023163855075836182, 0.00024244189262390137, 0.0002532452344894409, 0.00026404857635498047, 0.00027485191822052, 0.00028565526008605957, 0.0002964586019515991, 0.00030726194381713867, 0.0003180652856826782, 0.0003288686275482178, 0.0003396719694137573, 0.0003504753112792969]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 8.0, 3.0, 8.0, 5.0, 15.0, 22.0, 22.0, 44.0, 55.0, 69.0, 126.0, 175.0, 260.0, 387.0, 523.0, 828.0, 1337.0, 2403.0, 4734.0, 10711.0, 30747.0, 136655.0, 677194.0, 131176.0, 29811.0, 10417.0, 4525.0, 2397.0, 1381.0, 797.0, 549.0, 375.0, 234.0, 178.0, 112.0, 96.0, 58.0, 35.0, 25.0, 19.0, 16.0, 10.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005893707275390625, -0.0005717724561691284, -0.0005541741847991943, -0.0005365759134292603, -0.0005189776420593262, -0.0005013793706893921, -0.000483781099319458, -0.0004661828279495239, -0.00044858455657958984, -0.00043098628520965576, -0.0004133880138397217, -0.0003957897424697876, -0.0003781914710998535, -0.00036059319972991943, -0.00034299492835998535, -0.00032539665699005127, -0.0003077983856201172, -0.0002902001142501831, -0.000272601842880249, -0.00025500357151031494, -0.00023740530014038086, -0.00021980702877044678, -0.0002022087574005127, -0.0001846104860305786, -0.00016701221466064453, -0.00014941394329071045, -0.00013181567192077637, -0.00011421740055084229, -9.66191291809082e-05, -7.902085781097412e-05, -6.142258644104004e-05, -4.382431507110596e-05, -2.6226043701171875e-05, -8.627772331237793e-06, 8.970499038696289e-06, 2.656877040863037e-05, 4.416704177856445e-05, 6.176531314849854e-05, 7.936358451843262e-05, 9.69618558883667e-05, 0.00011456012725830078, 0.00013215839862823486, 0.00014975666999816895, 0.00016735494136810303, 0.0001849532127380371, 0.0002025514841079712, 0.00022014975547790527, 0.00023774802684783936, 0.00025534629821777344, 0.0002729445695877075, 0.0002905428409576416, 0.0003081411123275757, 0.00032573938369750977, 0.00034333765506744385, 0.00036093592643737793, 0.000378534197807312, 0.0003961324691772461, 0.0004137307405471802, 0.00043132901191711426, 0.00044892728328704834, 0.0004665255546569824, 0.0004841238260269165, 0.0005017220973968506, 0.0005193203687667847, 0.0005369186401367188]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 4.0, 5.0, 8.0, 13.0, 17.0, 22.0, 30.0, 19.0, 40.0, 45.0, 63.0, 88.0, 111.0, 112.0, 99.0, 70.0, 53.0, 30.0, 23.0, 37.0, 19.0, 15.0, 17.0, 11.0, 3.0, 11.0, 4.0, 3.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.6510486602783203e-05, -1.5994533896446228e-05, -1.5478581190109253e-05, -1.4962628483772278e-05, -1.4446675777435303e-05, -1.3930723071098328e-05, -1.3414770364761353e-05, -1.2898817658424377e-05, -1.2382864952087402e-05, -1.1866912245750427e-05, -1.1350959539413452e-05, -1.0835006833076477e-05, -1.0319054126739502e-05, -9.803101420402527e-06, -9.287148714065552e-06, -8.771196007728577e-06, -8.255243301391602e-06, -7.739290595054626e-06, -7.223337888717651e-06, -6.707385182380676e-06, -6.191432476043701e-06, -5.675479769706726e-06, -5.159527063369751e-06, -4.643574357032776e-06, -4.127621650695801e-06, -3.6116689443588257e-06, -3.0957162380218506e-06, -2.5797635316848755e-06, -2.0638108253479004e-06, -1.5478581190109253e-06, -1.0319054126739502e-06, -5.159527063369751e-07, 0.0, 5.159527063369751e-07, 1.0319054126739502e-06, 1.5478581190109253e-06, 2.0638108253479004e-06, 2.5797635316848755e-06, 3.0957162380218506e-06, 3.6116689443588257e-06, 4.127621650695801e-06, 4.643574357032776e-06, 5.159527063369751e-06, 5.675479769706726e-06, 6.191432476043701e-06, 6.707385182380676e-06, 7.223337888717651e-06, 7.739290595054626e-06, 8.255243301391602e-06, 8.771196007728577e-06, 9.287148714065552e-06, 9.803101420402527e-06, 1.0319054126739502e-05, 1.0835006833076477e-05, 1.1350959539413452e-05, 1.1866912245750427e-05, 1.2382864952087402e-05, 1.2898817658424377e-05, 1.3414770364761353e-05, 1.3930723071098328e-05, 1.4446675777435303e-05, 1.4962628483772278e-05, 1.5478581190109253e-05, 1.5994533896446228e-05, 1.6510486602783203e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 11.0, 11.0, 18.0, 22.0, 29.0, 48.0, 67.0, 81.0, 97.0, 189.0, 274.0, 359.0, 545.0, 800.0, 1147.0, 1745.0, 2541.0, 4061.0, 6453.0, 10273.0, 17303.0, 31036.0, 57391.0, 119485.0, 300799.0, 262580.0, 107055.0, 52225.0, 28544.0, 16199.0, 9689.0, 6218.0, 3853.0, 2395.0, 1590.0, 1053.0, 734.0, 455.0, 370.0, 239.0, 182.0, 131.0, 78.0, 58.0, 43.0, 37.0, 16.0, 14.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00015056133270263672, -0.00014535710215568542, -0.00014015287160873413, -0.00013494864106178284, -0.00012974441051483154, -0.00012454017996788025, -0.00011933594942092896, -0.00011413171887397766, -0.00010892748832702637, -0.00010372325778007507, -9.851902723312378e-05, -9.331479668617249e-05, -8.811056613922119e-05, -8.29063355922699e-05, -7.77021050453186e-05, -7.249787449836731e-05, -6.729364395141602e-05, -6.208941340446472e-05, -5.688518285751343e-05, -5.1680952310562134e-05, -4.647672176361084e-05, -4.1272491216659546e-05, -3.606826066970825e-05, -3.086403012275696e-05, -2.5659799575805664e-05, -2.045556902885437e-05, -1.5251338481903076e-05, -1.0047107934951782e-05, -4.842877388000488e-06, 3.6135315895080566e-07, 5.5655837059021e-06, 1.0769814252853394e-05, 1.5974044799804688e-05, 2.117827534675598e-05, 2.6382505893707275e-05, 3.158673644065857e-05, 3.679096698760986e-05, 4.199519753456116e-05, 4.719942808151245e-05, 5.2403658628463745e-05, 5.760788917541504e-05, 6.281211972236633e-05, 6.801635026931763e-05, 7.322058081626892e-05, 7.842481136322021e-05, 8.362904191017151e-05, 8.88332724571228e-05, 9.40375030040741e-05, 9.924173355102539e-05, 0.00010444596409797668, 0.00010965019464492798, 0.00011485442519187927, 0.00012005865573883057, 0.00012526288628578186, 0.00013046711683273315, 0.00013567134737968445, 0.00014087557792663574, 0.00014607980847358704, 0.00015128403902053833, 0.00015648826956748962, 0.00016169250011444092, 0.0001668967306613922, 0.0001721009612083435, 0.0001773051917552948, 0.0001825094223022461]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 8.0, 3.0, 6.0, 8.0, 2.0, 7.0, 14.0, 12.0, 20.0, 23.0, 32.0, 43.0, 37.0, 80.0, 62.0, 100.0, 94.0, 93.0, 78.0, 41.0, 50.0, 45.0, 27.0, 28.0, 18.0, 18.0, 7.0, 9.0, 8.0, 4.0, 1.0, 6.0, 2.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.543231964111328e-05, -5.347002297639847e-05, -5.1507726311683655e-05, -4.954542964696884e-05, -4.758313298225403e-05, -4.5620836317539215e-05, -4.36585396528244e-05, -4.169624298810959e-05, -3.9733946323394775e-05, -3.777164965867996e-05, -3.580935299396515e-05, -3.3847056329250336e-05, -3.188475966453552e-05, -2.992246299982071e-05, -2.7960166335105896e-05, -2.5997869670391083e-05, -2.403557300567627e-05, -2.2073276340961456e-05, -2.0110979676246643e-05, -1.814868301153183e-05, -1.6186386346817017e-05, -1.4224089682102203e-05, -1.226179301738739e-05, -1.0299496352672577e-05, -8.337199687957764e-06, -6.3749030232429504e-06, -4.412606358528137e-06, -2.450309693813324e-06, -4.880130290985107e-07, 1.4742836356163025e-06, 3.4365803003311157e-06, 5.398876965045929e-06, 7.361173629760742e-06, 9.323470294475555e-06, 1.1285766959190369e-05, 1.3248063623905182e-05, 1.5210360288619995e-05, 1.717265695333481e-05, 1.913495361804962e-05, 2.1097250282764435e-05, 2.3059546947479248e-05, 2.502184361219406e-05, 2.6984140276908875e-05, 2.8946436941623688e-05, 3.09087336063385e-05, 3.2871030271053314e-05, 3.483332693576813e-05, 3.679562360048294e-05, 3.8757920265197754e-05, 4.072021692991257e-05, 4.268251359462738e-05, 4.4644810259342194e-05, 4.660710692405701e-05, 4.856940358877182e-05, 5.053170025348663e-05, 5.2493996918201447e-05, 5.445629358291626e-05, 5.641859024763107e-05, 5.8380886912345886e-05, 6.03431835770607e-05, 6.230548024177551e-05, 6.426777690649033e-05, 6.623007357120514e-05, 6.819237023591995e-05, 7.015466690063477e-05]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 3.0, 1.0, 5.0, 1.0, 11.0, 9.0, 14.0, 20.0, 21.0, 37.0, 29.0, 49.0, 59.0, 79.0, 124.0, 124.0, 92.0, 97.0, 57.0, 37.0, 33.0, 28.0, 15.0, 7.0, 8.0, 12.0, 9.0, 6.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000870297197252512, -0.0008431752794422209, -0.0008160533616319299, -0.0007889314438216388, -0.0007618095260113478, -0.0007346876082010567, -0.0007075656903907657, -0.0006804438307881355, -0.0006533218547701836, -0.0006261999369598925, -0.0005990780191496015, -0.0005719561013393104, -0.0005448341835290194, -0.0005177122657187283, -0.0004905903479084373, -0.00046346845920197666, -0.00043634657049551606, -0.000409224652685225, -0.00038210273487493396, -0.0003549808170646429, -0.00032785889925435185, -0.0003007369814440608, -0.0002736150927376002, -0.00024649317492730916, -0.0002193712571170181, -0.00019224933930672705, -0.000165127421496436, -0.00013800551823806018, -0.00011088360042776912, -8.376168261747807e-05, -5.663977935910225e-05, -2.9517861548811197e-05, -2.395885530859232e-06, 2.4726028641453013e-05, 5.184794281376526e-05, 7.89698533480987e-05, 0.00010609177115838975, 0.0001332136889686808, 0.00016033559222705662, 0.00018745751003734767, 0.00021457942784763873, 0.00024170134565792978, 0.00026882326346822083, 0.0002959451521746814, 0.0003230670699849725, 0.00035018898779526353, 0.0003773109056055546, 0.00040443282341584563, 0.0004315547412261367, 0.00045867665903642774, 0.0004857985768467188, 0.0005129204946570098, 0.0005400424124673009, 0.0005671643302775919, 0.000594286248087883, 0.0006214081076905131, 0.0006485300837084651, 0.0006756520015187562, 0.0007027739193290472, 0.0007298958371393383, 0.0007570177549496293, 0.0007841396727599204, 0.0008112615905702114, 0.0008383834501728415, 0.0008655053679831326]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 3.0, 12.0, 7.0, 12.0, 16.0, 12.0, 19.0, 23.0, 23.0, 27.0, 33.0, 25.0, 25.0, 34.0, 35.0, 28.0, 34.0, 46.0, 42.0, 30.0, 33.0, 43.0, 36.0, 43.0, 41.0, 21.0, 31.0, 37.0, 25.0, 24.0, 28.0, 25.0, 19.0, 20.0, 10.0, 13.0, 14.0, 7.0, 8.0, 8.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.0005403722170740366, -0.0005248453235253692, -0.0005093184299767017, -0.0004937915364280343, -0.0004782646428793669, -0.00046273774933069944, -0.000447210855782032, -0.0004316839622333646, -0.00041615706868469715, -0.0004006301751360297, -0.0003851032815873623, -0.00036957638803869486, -0.00035404949449002743, -0.00033852260094136, -0.00032299570739269257, -0.00030746881384402514, -0.0002919419202953577, -0.0002764150267466903, -0.00026088813319802284, -0.0002453612396493554, -0.00022983434610068798, -0.00021430745255202055, -0.00019878055900335312, -0.0001832536654546857, -0.00016772677190601826, -0.00015219987835735083, -0.0001366729848086834, -0.00012114609126001596, -0.00010561919771134853, -9.00923041626811e-05, -7.456541061401367e-05, -5.903851706534624e-05, -4.35115653090179e-05, -2.7984671760350466e-05, -1.2457778211683035e-05, 3.069115336984396e-06, 1.8596008885651827e-05, 3.412290243431926e-05, 4.964979598298669e-05, 6.517668953165412e-05, 8.070358308032155e-05, 9.623047662898898e-05, 0.00011175737017765641, 0.00012728426372632384, 0.00014281115727499127, 0.0001583380508236587, 0.00017386494437232614, 0.00018939183792099357, 0.000204918731469661, 0.00022044562501832843, 0.00023597251856699586, 0.0002514994121156633, 0.0002670263056643307, 0.00028255319921299815, 0.0002980800927616656, 0.000313606986310333, 0.00032913387985900044, 0.0003446607734076679, 0.0003601876669563353, 0.00037571456050500274, 0.00039124145405367017, 0.0004067683476023376, 0.00042229524115100503, 0.00043782213469967246, 0.0004533490282483399]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 13.0, 13.0, 22.0, 33.0, 48.0, 73.0, 109.0, 145.0, 193.0, 288.0, 433.0, 699.0, 991.0, 1509.0, 2275.0, 3437.0, 5510.0, 8453.0, 13378.0, 20628.0, 33758.0, 57520.0, 103321.0, 192325.0, 248467.0, 150180.0, 81087.0, 46716.0, 28066.0, 17286.0, 11045.0, 7039.0, 4615.0, 2979.0, 1955.0, 1311.0, 850.0, 625.0, 382.0, 277.0, 164.0, 116.0, 68.0, 40.0, 33.0, 31.0, 15.0, 9.0, 13.0, 7.0, 6.0, 3.0, 1.0, 4.0], "bins": [-0.00102996826171875, -0.000999942421913147, -0.0009699165821075439, -0.0009398907423019409, -0.0009098649024963379, -0.0008798390626907349, -0.0008498132228851318, -0.0008197873830795288, -0.0007897615432739258, -0.0007597357034683228, -0.0007297098636627197, -0.0006996840238571167, -0.0006696581840515137, -0.0006396323442459106, -0.0006096065044403076, -0.0005795806646347046, -0.0005495548248291016, -0.0005195289850234985, -0.0004895031452178955, -0.0004594773054122925, -0.00042945146560668945, -0.0003994256258010864, -0.0003693997859954834, -0.00033937394618988037, -0.00030934810638427734, -0.0002793222665786743, -0.0002492964267730713, -0.00021927058696746826, -0.00018924474716186523, -0.0001592189073562622, -0.00012919306755065918, -9.916722774505615e-05, -6.914138793945312e-05, -3.91155481338501e-05, -9.08970832824707e-06, 2.0936131477355957e-05, 5.0961971282958984e-05, 8.098781108856201e-05, 0.00011101365089416504, 0.00014103949069976807, 0.0001710653305053711, 0.00020109117031097412, 0.00023111701011657715, 0.0002611428499221802, 0.0002911686897277832, 0.00032119452953338623, 0.00035122036933898926, 0.0003812462091445923, 0.0004112720489501953, 0.00044129788875579834, 0.00047132372856140137, 0.0005013495683670044, 0.0005313754081726074, 0.0005614012479782104, 0.0005914270877838135, 0.0006214529275894165, 0.0006514787673950195, 0.0006815046072006226, 0.0007115304470062256, 0.0007415562868118286, 0.0007715821266174316, 0.0008016079664230347, 0.0008316338062286377, 0.0008616596460342407, 0.0008916854858398438]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 8.0, 10.0, 4.0, 10.0, 12.0, 17.0, 20.0, 14.0, 20.0, 19.0, 22.0, 24.0, 28.0, 31.0, 29.0, 33.0, 29.0, 43.0, 35.0, 37.0, 33.0, 52.0, 44.0, 25.0, 41.0, 36.0, 25.0, 26.0, 37.0, 31.0, 29.0, 15.0, 19.0, 23.0, 11.0, 18.0, 11.0, 13.0, 15.0, 9.0, 9.0, 11.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.00041794776916503906, -0.0004060231149196625, -0.0003940984606742859, -0.0003821738064289093, -0.0003702491521835327, -0.00035832449793815613, -0.00034639984369277954, -0.00033447518944740295, -0.00032255053520202637, -0.0003106258809566498, -0.0002987012267112732, -0.0002867765724658966, -0.00027485191822052, -0.00026292726397514343, -0.00025100260972976685, -0.00023907795548439026, -0.00022715330123901367, -0.00021522864699363708, -0.0002033039927482605, -0.0001913793385028839, -0.00017945468425750732, -0.00016753003001213074, -0.00015560537576675415, -0.00014368072152137756, -0.00013175606727600098, -0.00011983141303062439, -0.0001079067587852478, -9.598210453987122e-05, -8.405745029449463e-05, -7.213279604911804e-05, -6.0208141803741455e-05, -4.828348755836487e-05, -3.635883331298828e-05, -2.4434179067611694e-05, -1.2509524822235107e-05, -5.848705768585205e-07, 1.1339783668518066e-05, 2.3264437913894653e-05, 3.518909215927124e-05, 4.711374640464783e-05, 5.9038400650024414e-05, 7.0963054895401e-05, 8.288770914077759e-05, 9.481236338615417e-05, 0.00010673701763153076, 0.00011866167187690735, 0.00013058632612228394, 0.00014251098036766052, 0.0001544356346130371, 0.0001663602888584137, 0.00017828494310379028, 0.00019020959734916687, 0.00020213425159454346, 0.00021405890583992004, 0.00022598356008529663, 0.00023790821433067322, 0.0002498328685760498, 0.0002617575228214264, 0.000273682177066803, 0.00028560683131217957, 0.00029753148555755615, 0.00030945613980293274, 0.0003213807940483093, 0.0003333054482936859, 0.0003452301025390625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 9.0, 7.0, 9.0, 19.0, 18.0, 45.0, 51.0, 104.0, 130.0, 216.0, 304.0, 419.0, 599.0, 877.0, 1265.0, 1838.0, 2742.0, 4232.0, 6203.0, 9089.0, 14285.0, 22114.0, 34788.0, 55137.0, 88080.0, 140504.0, 197683.0, 169619.0, 109480.0, 68256.0, 42465.0, 26864.0, 17242.0, 11174.0, 7378.0, 4904.0, 3322.0, 2180.0, 1581.0, 1049.0, 710.0, 475.0, 347.0, 237.0, 165.0, 120.0, 80.0, 54.0, 32.0, 25.0, 18.0, 13.0, 7.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0007696151733398438, -0.0007467940449714661, -0.0007239729166030884, -0.0007011517882347107, -0.000678330659866333, -0.0006555095314979553, -0.0006326884031295776, -0.0006098672747612, -0.0005870461463928223, -0.0005642250180244446, -0.0005414038896560669, -0.0005185827612876892, -0.0004957616329193115, -0.00047294050455093384, -0.00045011937618255615, -0.00042729824781417847, -0.0004044771194458008, -0.0003816559910774231, -0.0003588348627090454, -0.0003360137343406677, -0.00031319260597229004, -0.00029037147760391235, -0.00026755034923553467, -0.000244729220867157, -0.0002219080924987793, -0.0001990869641304016, -0.00017626583576202393, -0.00015344470739364624, -0.00013062357902526855, -0.00010780245065689087, -8.498132228851318e-05, -6.21601939201355e-05, -3.933906555175781e-05, -1.6517937183380127e-05, 6.303191184997559e-06, 2.9124319553375244e-05, 5.194544792175293e-05, 7.476657629013062e-05, 9.75877046585083e-05, 0.00012040883302688599, 0.00014322996139526367, 0.00016605108976364136, 0.00018887221813201904, 0.00021169334650039673, 0.00023451447486877441, 0.0002573356032371521, 0.0002801567316055298, 0.00030297785997390747, 0.00032579898834228516, 0.00034862011671066284, 0.00037144124507904053, 0.0003942623734474182, 0.0004170835018157959, 0.0004399046301841736, 0.00046272575855255127, 0.00048554688692092896, 0.0005083680152893066, 0.0005311891436576843, 0.000554010272026062, 0.0005768314003944397, 0.0005996525287628174, 0.0006224736571311951, 0.0006452947854995728, 0.0006681159138679504, 0.0006909370422363281]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 2.0, 7.0, 12.0, 12.0, 13.0, 17.0, 12.0, 18.0, 18.0, 15.0, 26.0, 23.0, 23.0, 32.0, 32.0, 33.0, 26.0, 32.0, 32.0, 31.0, 26.0, 34.0, 35.0, 38.0, 40.0, 32.0, 44.0, 36.0, 29.0, 23.0, 32.0, 22.0, 28.0, 35.0, 21.0, 17.0, 17.0, 9.0, 9.0, 17.0, 11.0, 11.0, 2.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002532005310058594, -0.0002452731132507324, -0.00023734569549560547, -0.00022941827774047852, -0.00022149085998535156, -0.0002135634422302246, -0.00020563602447509766, -0.0001977086067199707, -0.00018978118896484375, -0.0001818537712097168, -0.00017392635345458984, -0.0001659989356994629, -0.00015807151794433594, -0.00015014410018920898, -0.00014221668243408203, -0.00013428926467895508, -0.00012636184692382812, -0.00011843442916870117, -0.00011050701141357422, -0.00010257959365844727, -9.465217590332031e-05, -8.672475814819336e-05, -7.87973403930664e-05, -7.086992263793945e-05, -6.29425048828125e-05, -5.501508712768555e-05, -4.7087669372558594e-05, -3.916025161743164e-05, -3.123283386230469e-05, -2.3305416107177734e-05, -1.537799835205078e-05, -7.450580596923828e-06, 4.76837158203125e-07, 8.404254913330078e-06, 1.633167266845703e-05, 2.4259090423583984e-05, 3.218650817871094e-05, 4.011392593383789e-05, 4.8041343688964844e-05, 5.59687614440918e-05, 6.389617919921875e-05, 7.18235969543457e-05, 7.975101470947266e-05, 8.767843246459961e-05, 9.560585021972656e-05, 0.00010353326797485352, 0.00011146068572998047, 0.00011938810348510742, 0.00012731552124023438, 0.00013524293899536133, 0.00014317035675048828, 0.00015109777450561523, 0.0001590251922607422, 0.00016695261001586914, 0.0001748800277709961, 0.00018280744552612305, 0.00019073486328125, 0.00019866228103637695, 0.0002065896987915039, 0.00021451711654663086, 0.0002224445343017578, 0.00023037195205688477, 0.00023829936981201172, 0.00024622678756713867, 0.0002541542053222656]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 9.0, 17.0, 16.0, 18.0, 32.0, 59.0, 87.0, 132.0, 155.0, 238.0, 327.0, 467.0, 620.0, 951.0, 1411.0, 2054.0, 3157.0, 4765.0, 7983.0, 14140.0, 31484.0, 908913.0, 33915.0, 14423.0, 8313.0, 4892.0, 3215.0, 2092.0, 1368.0, 997.0, 658.0, 484.0, 300.0, 252.0, 173.0, 141.0, 81.0, 60.0, 39.0, 30.0, 17.0, 18.0, 9.0, 8.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.00019121170043945312, -0.00018514692783355713, -0.00017908215522766113, -0.00017301738262176514, -0.00016695261001586914, -0.00016088783740997314, -0.00015482306480407715, -0.00014875829219818115, -0.00014269351959228516, -0.00013662874698638916, -0.00013056397438049316, -0.00012449920177459717, -0.00011843442916870117, -0.00011236965656280518, -0.00010630488395690918, -0.00010024011135101318, -9.417533874511719e-05, -8.811056613922119e-05, -8.20457935333252e-05, -7.59810209274292e-05, -6.99162483215332e-05, -6.385147571563721e-05, -5.778670310974121e-05, -5.1721930503845215e-05, -4.565715789794922e-05, -3.959238529205322e-05, -3.3527612686157227e-05, -2.746284008026123e-05, -2.1398067474365234e-05, -1.5333294868469238e-05, -9.268522262573242e-06, -3.203749656677246e-06, 2.86102294921875e-06, 8.925795555114746e-06, 1.4990568161010742e-05, 2.1055340766906738e-05, 2.7120113372802734e-05, 3.318488597869873e-05, 3.9249658584594727e-05, 4.531443119049072e-05, 5.137920379638672e-05, 5.7443976402282715e-05, 6.350874900817871e-05, 6.957352161407471e-05, 7.56382942199707e-05, 8.17030668258667e-05, 8.77678394317627e-05, 9.383261203765869e-05, 9.989738464355469e-05, 0.00010596215724945068, 0.00011202692985534668, 0.00011809170246124268, 0.00012415647506713867, 0.00013022124767303467, 0.00013628602027893066, 0.00014235079288482666, 0.00014841556549072266, 0.00015448033809661865, 0.00016054511070251465, 0.00016660988330841064, 0.00017267465591430664, 0.00017873942852020264, 0.00018480420112609863, 0.00019086897373199463, 0.00019693374633789062]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 7.0, 2.0, 7.0, 13.0, 26.0, 20.0, 26.0, 45.0, 51.0, 61.0, 69.0, 88.0, 209.0, 84.0, 60.0, 36.0, 40.0, 28.0, 26.0, 16.0, 20.0, 9.0, 12.0, 4.0, 4.0, 4.0, 4.0, 7.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.1457672119140625e-06, -2.078711986541748e-06, -2.0116567611694336e-06, -1.944601535797119e-06, -1.8775463104248047e-06, -1.8104910850524902e-06, -1.7434358596801758e-06, -1.6763806343078613e-06, -1.6093254089355469e-06, -1.5422701835632324e-06, -1.475214958190918e-06, -1.4081597328186035e-06, -1.341104507446289e-06, -1.2740492820739746e-06, -1.2069940567016602e-06, -1.1399388313293457e-06, -1.0728836059570312e-06, -1.0058283805847168e-06, -9.387731552124023e-07, -8.717179298400879e-07, -8.046627044677734e-07, -7.37607479095459e-07, -6.705522537231445e-07, -6.034970283508301e-07, -5.364418029785156e-07, -4.6938657760620117e-07, -4.023313522338867e-07, -3.3527612686157227e-07, -2.682209014892578e-07, -2.0116567611694336e-07, -1.341104507446289e-07, -6.705522537231445e-08, 0.0, 6.705522537231445e-08, 1.341104507446289e-07, 2.0116567611694336e-07, 2.682209014892578e-07, 3.3527612686157227e-07, 4.023313522338867e-07, 4.6938657760620117e-07, 5.364418029785156e-07, 6.034970283508301e-07, 6.705522537231445e-07, 7.37607479095459e-07, 8.046627044677734e-07, 8.717179298400879e-07, 9.387731552124023e-07, 1.0058283805847168e-06, 1.0728836059570312e-06, 1.1399388313293457e-06, 1.2069940567016602e-06, 1.2740492820739746e-06, 1.341104507446289e-06, 1.4081597328186035e-06, 1.475214958190918e-06, 1.5422701835632324e-06, 1.6093254089355469e-06, 1.6763806343078613e-06, 1.7434358596801758e-06, 1.8104910850524902e-06, 1.8775463104248047e-06, 1.944601535797119e-06, 2.0116567611694336e-06, 2.078711986541748e-06, 2.1457672119140625e-06]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 12.0, 6.0, 29.0, 24.0, 49.0, 65.0, 80.0, 138.0, 167.0, 239.0, 365.0, 546.0, 765.0, 1193.0, 1697.0, 2687.0, 4123.0, 6763.0, 10969.0, 18350.0, 40353.0, 895614.0, 25720.0, 14473.0, 8788.0, 5364.0, 3295.0, 2195.0, 1423.0, 960.0, 627.0, 452.0, 319.0, 206.0, 142.0, 128.0, 62.0, 57.0, 38.0, 18.0, 16.0, 10.0, 13.0, 5.0, 2.0, 8.0, 1.0, 1.0, 3.0], "bins": [-0.0002951622009277344, -0.0002870243042707443, -0.00027888640761375427, -0.0002707485109567642, -0.00026261061429977417, -0.0002544727176427841, -0.00024633482098579407, -0.00023819692432880402, -0.00023005902767181396, -0.00022192113101482391, -0.00021378323435783386, -0.0002056453377008438, -0.00019750744104385376, -0.0001893695443868637, -0.00018123164772987366, -0.0001730937510728836, -0.00016495585441589355, -0.0001568179577589035, -0.00014868006110191345, -0.0001405421644449234, -0.00013240426778793335, -0.0001242663711309433, -0.00011612847447395325, -0.0001079905778169632, -9.985268115997314e-05, -9.17147845029831e-05, -8.357688784599304e-05, -7.543899118900299e-05, -6.730109453201294e-05, -5.916319787502289e-05, -5.102530121803284e-05, -4.2887404561042786e-05, -3.4749507904052734e-05, -2.6611611247062683e-05, -1.8473714590072632e-05, -1.033581793308258e-05, -2.1979212760925293e-06, 5.939975380897522e-06, 1.4077872037887573e-05, 2.2215768694877625e-05, 3.0353665351867676e-05, 3.849156200885773e-05, 4.662945866584778e-05, 5.476735532283783e-05, 6.290525197982788e-05, 7.104314863681793e-05, 7.918104529380798e-05, 8.731894195079803e-05, 9.545683860778809e-05, 0.00010359473526477814, 0.00011173263192176819, 0.00011987052857875824, 0.0001280084252357483, 0.00013614632189273834, 0.0001442842185497284, 0.00015242211520671844, 0.0001605600118637085, 0.00016869790852069855, 0.0001768358051776886, 0.00018497370183467865, 0.0001931115984916687, 0.00020124949514865875, 0.0002093873918056488, 0.00021752528846263885, 0.0002256631851196289]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 3.0, 6.0, 9.0, 8.0, 7.0, 8.0, 6.0, 6.0, 619.0, 216.0, 12.0, 2.0, 10.0, 3.0, 5.0, 9.0, 7.0, 8.0, 5.0, 3.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.195638656616211e-05, -7.967185229063034e-05, -7.738731801509857e-05, -7.51027837395668e-05, -7.281824946403503e-05, -7.053371518850327e-05, -6.82491809129715e-05, -6.596464663743973e-05, -6.368011236190796e-05, -6.139557808637619e-05, -5.911104381084442e-05, -5.682650953531265e-05, -5.4541975259780884e-05, -5.2257440984249115e-05, -4.9972906708717346e-05, -4.768837243318558e-05, -4.540383815765381e-05, -4.311930388212204e-05, -4.083476960659027e-05, -3.85502353310585e-05, -3.6265701055526733e-05, -3.3981166779994965e-05, -3.1696632504463196e-05, -2.9412098228931427e-05, -2.7127563953399658e-05, -2.484302967786789e-05, -2.255849540233612e-05, -2.0273961126804352e-05, -1.7989426851272583e-05, -1.5704892575740814e-05, -1.3420358300209045e-05, -1.1135824024677277e-05, -8.851289749145508e-06, -6.566755473613739e-06, -4.28222119808197e-06, -1.9976869225502014e-06, 2.868473529815674e-07, 2.571381628513336e-06, 4.855915904045105e-06, 7.140450179576874e-06, 9.424984455108643e-06, 1.1709518730640411e-05, 1.399405300617218e-05, 1.627858728170395e-05, 1.8563121557235718e-05, 2.0847655832767487e-05, 2.3132190108299255e-05, 2.5416724383831024e-05, 2.7701258659362793e-05, 2.9985792934894562e-05, 3.227032721042633e-05, 3.45548614859581e-05, 3.683939576148987e-05, 3.912393003702164e-05, 4.1408464312553406e-05, 4.3692998588085175e-05, 4.597753286361694e-05, 4.826206713914871e-05, 5.054660141468048e-05, 5.283113569021225e-05, 5.511566996574402e-05, 5.740020424127579e-05, 5.9684738516807556e-05, 6.196927279233932e-05, 6.42538070678711e-05]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 10.0, 6.0, 14.0, 9.0, 19.0, 21.0, 24.0, 34.0, 48.0, 68.0, 77.0, 120.0, 121.0, 83.0, 77.0, 74.0, 57.0, 32.0, 21.0, 19.0, 16.0, 14.0, 3.0, 3.0, 5.0, 5.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007306183688342571, -0.0007079864153638482, -0.0006853545201011002, -0.0006627225666306913, -0.0006400906713679433, -0.0006174587178975344, -0.0005948267644271255, -0.0005721948109567165, -0.0005495629156939685, -0.0005269309622235596, -0.0005042990669608116, -0.0004816671134904027, -0.00045903518912382424, -0.0004364032647572458, -0.00041377131128683686, -0.0003911393869202584, -0.00036850746255367994, -0.0003458755381871015, -0.000323243613820523, -0.0003006116603501141, -0.00027797973598353565, -0.0002553478116169572, -0.0002327158726984635, -0.0002100839337799698, -0.00018745200941339135, -0.0001648200850468129, -0.0001421881461283192, -0.00011955621448578313, -9.692428284324706e-05, -7.429235120071098e-05, -5.166041955817491e-05, -2.902848063968122e-05, -6.39655627310276e-06, 1.6235375369433314e-05, 3.886730701196939e-05, 6.149923865450546e-05, 8.413117029704154e-05, 0.00010676310193957761, 0.00012939503358211368, 0.00015202697250060737, 0.00017465889686718583, 0.0001972908212337643, 0.00021992276015225798, 0.00024255469907075167, 0.0002651866234373301, 0.0002878185478039086, 0.0003104505012743175, 0.00033308242564089596, 0.0003557143500074744, 0.0003783462743740529, 0.00040097819874063134, 0.00042361015221104026, 0.0004462420765776187, 0.0004688740009441972, 0.0004915059544146061, 0.000514137907885015, 0.000536769803147763, 0.0005594017566181719, 0.0005820336518809199, 0.0006046656053513288, 0.0006272975588217378, 0.0006499294540844858, 0.0006725614075548947, 0.0006951933028176427, 0.0007178252562880516]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 7.0, 9.0, 3.0, 5.0, 13.0, 16.0, 13.0, 18.0, 21.0, 16.0, 25.0, 27.0, 28.0, 42.0, 39.0, 34.0, 35.0, 34.0, 29.0, 43.0, 31.0, 34.0, 43.0, 53.0, 39.0, 47.0, 26.0, 26.0, 17.0, 29.0, 27.0, 19.0, 16.0, 21.0, 20.0, 13.0, 13.0, 7.0, 12.0, 8.0, 7.0, 9.0, 6.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00042779522482305765, -0.0004148656444158405, -0.0004019360349047929, -0.00038900645449757576, -0.00037607684498652816, -0.000363147264579311, -0.00035021768417209387, -0.00033728807466104627, -0.00032435846514999866, -0.0003114288847427815, -0.0002984992752317339, -0.0002855696948245168, -0.00027264008531346917, -0.000259710504906252, -0.0002467809244990349, -0.00023385131498798728, -0.00022092173458077013, -0.00020799213962163776, -0.0001950625446625054, -0.00018213296425528824, -0.00016920335474424064, -0.0001562737743370235, -0.00014334417937789112, -0.00013041458441875875, -0.00011748498945962638, -0.000104555394500494, -9.162579954136163e-05, -7.869621185818687e-05, -6.57666168990545e-05, -5.2837021939922124e-05, -3.9907434256747365e-05, -2.697783929761499e-05, -1.4048244338482618e-05, -1.1186511983396485e-06, 1.1810941941803321e-05, 2.4740533262956887e-05, 3.767012822208926e-05, 5.0599723181221634e-05, 6.35293108643964e-05, 7.645890582352877e-05, 8.938850078266114e-05, 0.00010231809574179351, 0.00011524769070092589, 0.00012817728566005826, 0.0001411068660672754, 0.000154036475578323, 0.00016696605598554015, 0.00017989565094467252, 0.0001928252459038049, 0.00020575484086293727, 0.00021868443582206964, 0.0002316140162292868, 0.0002445436257403344, 0.00025747320614755154, 0.00027040281565859914, 0.0002833323960658163, 0.00029626197647303343, 0.0003091915568802506, 0.0003221211663912982, 0.0003350507467985153, 0.0003479803563095629, 0.00036090993671678007, 0.0003738395171239972, 0.0003867691266350448, 0.0003996987361460924]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 10.0, 8.0, 21.0, 21.0, 34.0, 45.0, 84.0, 110.0, 159.0, 234.0, 330.0, 444.0, 725.0, 1052.0, 1632.0, 2402.0, 3579.0, 5567.0, 8864.0, 13684.0, 22462.0, 36918.0, 64420.0, 117720.0, 246308.0, 700900.0, 1658987.0, 751339.0, 263843.0, 125610.0, 67660.0, 38445.0, 22940.0, 13866.0, 8509.0, 5565.0, 3433.0, 2141.0, 1475.0, 962.0, 621.0, 393.0, 269.0, 179.0, 119.0, 68.0, 44.0, 33.0, 22.0, 12.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0005669593811035156, -0.0005495250225067139, -0.0005320906639099121, -0.0005146563053131104, -0.0004972219467163086, -0.00047978758811950684, -0.0004623532295227051, -0.0004449188709259033, -0.00042748451232910156, -0.0004100501537322998, -0.00039261579513549805, -0.0003751814365386963, -0.00035774707794189453, -0.0003403127193450928, -0.000322878360748291, -0.00030544400215148926, -0.0002880096435546875, -0.00027057528495788574, -0.000253140926361084, -0.00023570656776428223, -0.00021827220916748047, -0.0002008378505706787, -0.00018340349197387695, -0.0001659691333770752, -0.00014853477478027344, -0.00013110041618347168, -0.00011366605758666992, -9.623169898986816e-05, -7.87973403930664e-05, -6.136298179626465e-05, -4.392862319946289e-05, -2.6494264602661133e-05, -9.059906005859375e-06, 8.374452590942383e-06, 2.580881118774414e-05, 4.32431697845459e-05, 6.0677528381347656e-05, 7.811188697814941e-05, 9.554624557495117e-05, 0.00011298060417175293, 0.0001304149627685547, 0.00014784932136535645, 0.0001652836799621582, 0.00018271803855895996, 0.00020015239715576172, 0.00021758675575256348, 0.00023502111434936523, 0.000252455472946167, 0.00026988983154296875, 0.0002873241901397705, 0.00030475854873657227, 0.000322192907333374, 0.0003396272659301758, 0.00035706162452697754, 0.0003744959831237793, 0.00039193034172058105, 0.0004093647003173828, 0.00042679905891418457, 0.00044423341751098633, 0.0004616677761077881, 0.00047910213470458984, 0.0004965364933013916, 0.0005139708518981934, 0.0005314052104949951, 0.0005488395690917969]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 5.0, 4.0, 4.0, 7.0, 10.0, 14.0, 14.0, 14.0, 20.0, 17.0, 16.0, 23.0, 32.0, 36.0, 23.0, 38.0, 28.0, 38.0, 42.0, 33.0, 39.0, 43.0, 46.0, 36.0, 48.0, 41.0, 36.0, 38.0, 20.0, 32.0, 24.0, 24.0, 21.0, 22.0, 10.0, 18.0, 14.0, 12.0, 6.0, 13.0, 7.0, 5.0, 2.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0], "bins": [-0.0002617835998535156, -0.00025396794080734253, -0.00024615228176116943, -0.00023833662271499634, -0.00023052096366882324, -0.00022270530462265015, -0.00021488964557647705, -0.00020707398653030396, -0.00019925832748413086, -0.00019144266843795776, -0.00018362700939178467, -0.00017581135034561157, -0.00016799569129943848, -0.00016018003225326538, -0.00015236437320709229, -0.0001445487141609192, -0.0001367330551147461, -0.000128917396068573, -0.0001211017370223999, -0.0001132860779762268, -0.00010547041893005371, -9.765475988388062e-05, -8.983910083770752e-05, -8.202344179153442e-05, -7.420778274536133e-05, -6.639212369918823e-05, -5.857646465301514e-05, -5.076080560684204e-05, -4.2945146560668945e-05, -3.512948751449585e-05, -2.7313828468322754e-05, -1.9498169422149658e-05, -1.1682510375976562e-05, -3.866851329803467e-06, 3.948807716369629e-06, 1.1764466762542725e-05, 1.958012580871582e-05, 2.7395784854888916e-05, 3.521144390106201e-05, 4.302710294723511e-05, 5.08427619934082e-05, 5.86584210395813e-05, 6.64740800857544e-05, 7.428973913192749e-05, 8.210539817810059e-05, 8.992105722427368e-05, 9.773671627044678e-05, 0.00010555237531661987, 0.00011336803436279297, 0.00012118369340896606, 0.00012899935245513916, 0.00013681501150131226, 0.00014463067054748535, 0.00015244632959365845, 0.00016026198863983154, 0.00016807764768600464, 0.00017589330673217773, 0.00018370896577835083, 0.00019152462482452393, 0.00019934028387069702, 0.00020715594291687012, 0.0002149716019630432, 0.0002227872610092163, 0.0002306029200553894, 0.0002384185791015625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 8.0, 12.0, 18.0, 30.0, 50.0, 61.0, 92.0, 165.0, 233.0, 311.0, 521.0, 830.0, 1213.0, 2002.0, 3312.0, 5268.0, 8580.0, 14591.0, 24372.0, 41830.0, 75303.0, 141019.0, 287353.0, 680622.0, 1456191.0, 780824.0, 320811.0, 155169.0, 82134.0, 45546.0, 25901.0, 15682.0, 9249.0, 5602.0, 3445.0, 2115.0, 1400.0, 809.0, 560.0, 369.0, 233.0, 142.0, 103.0, 66.0, 43.0, 30.0, 21.0, 11.0, 13.0, 10.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004813671112060547, -0.0004661194980144501, -0.00045087188482284546, -0.00043562427163124084, -0.00042037665843963623, -0.0004051290452480316, -0.000389881432056427, -0.0003746338188648224, -0.0003593862056732178, -0.00034413859248161316, -0.00032889097929000854, -0.00031364336609840393, -0.0002983957529067993, -0.0002831481397151947, -0.0002679005265235901, -0.0002526529133319855, -0.00023740530014038086, -0.00022215768694877625, -0.00020691007375717163, -0.00019166246056556702, -0.0001764148473739624, -0.0001611672341823578, -0.00014591962099075317, -0.00013067200779914856, -0.00011542439460754395, -0.00010017678141593933, -8.492916822433472e-05, -6.96815550327301e-05, -5.443394184112549e-05, -3.9186328649520874e-05, -2.393871545791626e-05, -8.691102266311646e-06, 6.556510925292969e-06, 2.1804124116897583e-05, 3.70517373085022e-05, 5.229935050010681e-05, 6.754696369171143e-05, 8.279457688331604e-05, 9.804219007492065e-05, 0.00011328980326652527, 0.00012853741645812988, 0.0001437850296497345, 0.0001590326428413391, 0.00017428025603294373, 0.00018952786922454834, 0.00020477548241615295, 0.00022002309560775757, 0.00023527070879936218, 0.0002505183219909668, 0.0002657659351825714, 0.000281013548374176, 0.00029626116156578064, 0.00031150877475738525, 0.00032675638794898987, 0.0003420040011405945, 0.0003572516143321991, 0.0003724992275238037, 0.0003877468407154083, 0.00040299445390701294, 0.00041824206709861755, 0.00043348968029022217, 0.0004487372934818268, 0.0004639849066734314, 0.000479232519865036, 0.0004944801330566406]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 15.0, 11.0, 16.0, 31.0, 28.0, 36.0, 59.0, 71.0, 88.0, 96.0, 111.0, 120.0, 176.0, 188.0, 224.0, 261.0, 281.0, 282.0, 293.0, 270.0, 231.0, 218.0, 181.0, 153.0, 126.0, 118.0, 74.0, 56.0, 58.0, 41.0, 38.0, 30.0, 25.0, 12.0, 11.0, 8.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00015616416931152344, -0.00015125423669815063, -0.00014634430408477783, -0.00014143437147140503, -0.00013652443885803223, -0.00013161450624465942, -0.00012670457363128662, -0.00012179464101791382, -0.00011688470840454102, -0.00011197477579116821, -0.00010706484317779541, -0.00010215491056442261, -9.72449779510498e-05, -9.2335045337677e-05, -8.74251127243042e-05, -8.25151801109314e-05, -7.76052474975586e-05, -7.269531488418579e-05, -6.778538227081299e-05, -6.287544965744019e-05, -5.796551704406738e-05, -5.305558443069458e-05, -4.814565181732178e-05, -4.3235719203948975e-05, -3.832578659057617e-05, -3.341585397720337e-05, -2.8505921363830566e-05, -2.3595988750457764e-05, -1.868605613708496e-05, -1.3776123523712158e-05, -8.866190910339355e-06, -3.956258296966553e-06, 9.5367431640625e-07, 5.863606929779053e-06, 1.0773539543151855e-05, 1.5683472156524658e-05, 2.059340476989746e-05, 2.5503337383270264e-05, 3.0413269996643066e-05, 3.532320261001587e-05, 4.023313522338867e-05, 4.5143067836761475e-05, 5.005300045013428e-05, 5.496293306350708e-05, 5.987286567687988e-05, 6.478279829025269e-05, 6.969273090362549e-05, 7.460266351699829e-05, 7.95125961303711e-05, 8.44225287437439e-05, 8.93324613571167e-05, 9.42423939704895e-05, 9.91523265838623e-05, 0.00010406225919723511, 0.00010897219181060791, 0.00011388212442398071, 0.00011879205703735352, 0.00012370198965072632, 0.00012861192226409912, 0.00013352185487747192, 0.00013843178749084473, 0.00014334172010421753, 0.00014825165271759033, 0.00015316158533096313, 0.00015807151794433594]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 7.0, 7.0, 12.0, 11.0, 19.0, 17.0, 26.0, 22.0, 32.0, 45.0, 63.0, 73.0, 71.0, 85.0, 86.0, 78.0, 66.0, 56.0, 43.0, 43.0, 26.0, 24.0, 24.0, 10.0, 10.0, 7.0, 5.0, 7.0, 3.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00044371484545990825, -0.00043095386354252696, -0.0004181928525213152, -0.00040543187060393393, -0.0003926708595827222, -0.0003799098776653409, -0.0003671488957479596, -0.00035438788472674787, -0.0003416269028093666, -0.0003288659208919853, -0.00031610490987077355, -0.00030334392795339227, -0.0002905829169321805, -0.00027782193501479924, -0.0002650609239935875, -0.0002522999420762062, -0.0002395389456069097, -0.00022677794913761318, -0.00021401695266831666, -0.00020125595619902015, -0.00018849497428163886, -0.00017573397781234235, -0.00016297298134304583, -0.00015021199942566454, -0.0001374509884044528, -0.00012468999193515629, -0.00011192900274181738, -9.916800627252087e-05, -8.640701707918197e-05, -7.364602060988545e-05, -6.088502414058894e-05, -4.812403494725004e-05, -3.536304575391114e-05, -2.260205292259343e-05, -9.841058272286318e-06, 2.919936378020793e-06, 1.56809292093385e-05, 2.844192204065621e-05, 4.1202918509952724e-05, 5.3963907703291625e-05, 6.672490417258814e-05, 7.948590064188465e-05, 9.224688983522356e-05, 0.00010500788630452007, 0.00011776888277381659, 0.00013052986469119787, 0.00014329087571240962, 0.0001560518576297909, 0.00016881285409908742, 0.00018157385056838393, 0.00019433484703768045, 0.00020709584350697696, 0.00021985682542435825, 0.00023261782189365476, 0.0002453788183629513, 0.00025813980028033257, 0.0002709008113015443, 0.0002836617932189256, 0.00029642280424013734, 0.0003091837861575186, 0.00032194479717873037, 0.00033470577909611166, 0.0003474667901173234, 0.0003602277720347047, 0.00037298875395208597]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 2.0, 5.0, 2.0, 6.0, 6.0, 8.0, 13.0, 17.0, 11.0, 14.0, 14.0, 24.0, 23.0, 23.0, 28.0, 33.0, 29.0, 32.0, 35.0, 36.0, 34.0, 45.0, 32.0, 29.0, 30.0, 34.0, 38.0, 46.0, 41.0, 35.0, 26.0, 30.0, 17.0, 29.0, 23.0, 24.0, 12.0, 21.0, 15.0, 14.0, 7.0, 8.0, 11.0, 10.0, 10.0, 5.0, 7.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0002826947020366788, -0.00027439312543720007, -0.00026609154883772135, -0.0002577899722382426, -0.0002494883956387639, -0.00024118681903928518, -0.0002328852569917217, -0.00022458368039224297, -0.00021628210379276425, -0.00020798052719328552, -0.0001996789505938068, -0.00019137737399432808, -0.0001830758119467646, -0.00017477423534728587, -0.00016647265874780715, -0.00015817108214832842, -0.0001498695055488497, -0.00014156792894937098, -0.00013326635234989226, -0.00012496477575041354, -0.00011666320642689243, -0.00010836162982741371, -0.0001000600605038926, -9.175848390441388e-05, -8.345690730493516e-05, -7.515533070545644e-05, -6.685375410597771e-05, -5.855218478245661e-05, -5.0250608182977885e-05, -4.1949031583499163e-05, -3.364745862199925e-05, -2.5345885660499334e-05, -1.704433816485107e-05, -8.742763384361751e-06, -4.411886038724333e-07, 7.860386176616885e-06, 1.6161960957106203e-05, 2.4463537556584924e-05, 3.276511051808484e-05, 4.1066683479584754e-05, 4.9368260079063475e-05, 5.76698366785422e-05, 6.597141327802092e-05, 7.427298260154203e-05, 8.257455920102075e-05, 9.087613580049947e-05, 9.917770512402058e-05, 0.0001074792817234993, 0.00011578085832297802, 0.00012408243492245674, 0.00013238401152193546, 0.00014068558812141418, 0.0001489871647208929, 0.00015728874132037163, 0.00016559030336793512, 0.00017389187996741384, 0.00018219345656689256, 0.00019049503316637129, 0.00019879660976585, 0.00020709818636532873, 0.00021539974841289222, 0.00022370132501237094, 0.00023200290161184967, 0.0002403044782113284, 0.0002486060548108071]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 2.0, 7.0, 18.0, 22.0, 38.0, 55.0, 69.0, 103.0, 174.0, 261.0, 446.0, 642.0, 1055.0, 1833.0, 3052.0, 5113.0, 8677.0, 15314.0, 26756.0, 48405.0, 88402.0, 158182.0, 243155.0, 194833.0, 111306.0, 61004.0, 33977.0, 18934.0, 10913.0, 6252.0, 3829.0, 2210.0, 1338.0, 754.0, 510.0, 331.0, 198.0, 136.0, 88.0, 47.0, 40.0, 21.0, 18.0, 11.0, 10.0, 10.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0005984306335449219, -0.0005811825394630432, -0.0005639344453811646, -0.0005466863512992859, -0.0005294382572174072, -0.0005121901631355286, -0.0004949420690536499, -0.00047769397497177124, -0.0004604458808898926, -0.0004431977868080139, -0.00042594969272613525, -0.0004087015986442566, -0.00039145350456237793, -0.00037420541048049927, -0.0003569573163986206, -0.00033970922231674194, -0.0003224611282348633, -0.0003052130341529846, -0.00028796494007110596, -0.0002707168459892273, -0.00025346875190734863, -0.00023622065782546997, -0.0002189725637435913, -0.00020172446966171265, -0.00018447637557983398, -0.00016722828149795532, -0.00014998018741607666, -0.000132732093334198, -0.00011548399925231934, -9.823590517044067e-05, -8.098781108856201e-05, -6.373971700668335e-05, -4.649162292480469e-05, -2.9243528842926025e-05, -1.1995434761047363e-05, 5.252659320831299e-06, 2.250075340270996e-05, 3.974884748458862e-05, 5.6996941566467285e-05, 7.424503564834595e-05, 9.149312973022461e-05, 0.00010874122381210327, 0.00012598931789398193, 0.0001432374119758606, 0.00016048550605773926, 0.00017773360013961792, 0.00019498169422149658, 0.00021222978830337524, 0.0002294778823852539, 0.00024672597646713257, 0.00026397407054901123, 0.0002812221646308899, 0.00029847025871276855, 0.0003157183527946472, 0.0003329664468765259, 0.00035021454095840454, 0.0003674626350402832, 0.00038471072912216187, 0.00040195882320404053, 0.0004192069172859192, 0.00043645501136779785, 0.0004537031054496765, 0.0004709511995315552, 0.00048819929361343384, 0.0005054473876953125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 9.0, 5.0, 14.0, 10.0, 6.0, 7.0, 19.0, 11.0, 25.0, 23.0, 32.0, 21.0, 27.0, 39.0, 33.0, 26.0, 34.0, 44.0, 34.0, 38.0, 25.0, 30.0, 44.0, 33.0, 44.0, 43.0, 30.0, 38.0, 24.0, 30.0, 22.0, 23.0, 21.0, 23.0, 13.0, 24.0, 10.0, 12.0, 8.0, 9.0, 9.0, 4.0, 8.0, 3.0, 3.0, 1.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.00023627281188964844, -0.0002291649580001831, -0.00022205710411071777, -0.00021494925022125244, -0.0002078413963317871, -0.00020073354244232178, -0.00019362568855285645, -0.0001865178346633911, -0.00017940998077392578, -0.00017230212688446045, -0.00016519427299499512, -0.00015808641910552979, -0.00015097856521606445, -0.00014387071132659912, -0.0001367628574371338, -0.00012965500354766846, -0.00012254714965820312, -0.00011543929576873779, -0.00010833144187927246, -0.00010122358798980713, -9.41157341003418e-05, -8.700788021087646e-05, -7.990002632141113e-05, -7.27921724319458e-05, -6.568431854248047e-05, -5.857646465301514e-05, -5.1468610763549805e-05, -4.436075687408447e-05, -3.725290298461914e-05, -3.014504909515381e-05, -2.3037195205688477e-05, -1.5929341316223145e-05, -8.821487426757812e-06, -1.7136335372924805e-06, 5.3942203521728516e-06, 1.2502074241638184e-05, 1.9609928131103516e-05, 2.6717782020568848e-05, 3.382563591003418e-05, 4.093348979949951e-05, 4.8041343688964844e-05, 5.5149197578430176e-05, 6.225705146789551e-05, 6.936490535736084e-05, 7.647275924682617e-05, 8.35806131362915e-05, 9.068846702575684e-05, 9.779632091522217e-05, 0.0001049041748046875, 0.00011201202869415283, 0.00011911988258361816, 0.0001262277364730835, 0.00013333559036254883, 0.00014044344425201416, 0.0001475512981414795, 0.00015465915203094482, 0.00016176700592041016, 0.0001688748598098755, 0.00017598271369934082, 0.00018309056758880615, 0.00019019842147827148, 0.00019730627536773682, 0.00020441412925720215, 0.00021152198314666748, 0.0002186298370361328]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 13.0, 10.0, 17.0, 19.0, 37.0, 67.0, 89.0, 167.0, 240.0, 399.0, 691.0, 1223.0, 1983.0, 3554.0, 6710.0, 13745.0, 31972.0, 112327.0, 599752.0, 196001.0, 43726.0, 17402.0, 8220.0, 4379.0, 2334.0, 1370.0, 846.0, 470.0, 294.0, 177.0, 102.0, 74.0, 51.0, 26.0, 14.0, 17.0, 13.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010204315185546875, -0.0009901076555252075, -0.0009597837924957275, -0.0009294599294662476, -0.0008991360664367676, -0.0008688122034072876, -0.0008384883403778076, -0.0008081644773483276, -0.0007778406143188477, -0.0007475167512893677, -0.0007171928882598877, -0.0006868690252304077, -0.0006565451622009277, -0.0006262212991714478, -0.0005958974361419678, -0.0005655735731124878, -0.0005352497100830078, -0.0005049258470535278, -0.00047460198402404785, -0.00044427812099456787, -0.0004139542579650879, -0.0003836303949356079, -0.00035330653190612793, -0.00032298266887664795, -0.00029265880584716797, -0.000262334942817688, -0.000232011079788208, -0.00020168721675872803, -0.00017136335372924805, -0.00014103949069976807, -0.00011071562767028809, -8.03917646408081e-05, -5.0067901611328125e-05, -1.9744038581848145e-05, 1.0579824447631836e-05, 4.0903687477111816e-05, 7.12275505065918e-05, 0.00010155141353607178, 0.00013187527656555176, 0.00016219913959503174, 0.00019252300262451172, 0.0002228468656539917, 0.0002531707286834717, 0.00028349459171295166, 0.00031381845474243164, 0.0003441423177719116, 0.0003744661808013916, 0.0004047900438308716, 0.00043511390686035156, 0.00046543776988983154, 0.0004957616329193115, 0.0005260854959487915, 0.0005564093589782715, 0.0005867332220077515, 0.0006170570850372314, 0.0006473809480667114, 0.0006777048110961914, 0.0007080286741256714, 0.0007383525371551514, 0.0007686764001846313, 0.0007990002632141113, 0.0008293241262435913, 0.0008596479892730713, 0.0008899718523025513, 0.0009202957153320312]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 4.0, 7.0, 5.0, 11.0, 13.0, 9.0, 12.0, 12.0, 23.0, 16.0, 21.0, 23.0, 25.0, 33.0, 42.0, 21.0, 32.0, 41.0, 39.0, 30.0, 33.0, 29.0, 29.0, 39.0, 44.0, 43.0, 38.0, 43.0, 33.0, 27.0, 22.0, 19.0, 24.0, 25.0, 23.0, 21.0, 7.0, 18.0, 14.0, 7.0, 9.0, 10.0, 6.0, 5.0, 5.0, 7.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.00014972686767578125, -0.00014508888125419617, -0.00014045089483261108, -0.000135812908411026, -0.00013117492198944092, -0.00012653693556785583, -0.00012189894914627075, -0.00011726096272468567, -0.00011262297630310059, -0.0001079849898815155, -0.00010334700345993042, -9.870901703834534e-05, -9.407103061676025e-05, -8.943304419517517e-05, -8.479505777359009e-05, -8.0157071352005e-05, -7.551908493041992e-05, -7.088109850883484e-05, -6.624311208724976e-05, -6.160512566566467e-05, -5.696713924407959e-05, -5.232915282249451e-05, -4.7691166400909424e-05, -4.305317997932434e-05, -3.841519355773926e-05, -3.3777207136154175e-05, -2.9139220714569092e-05, -2.450123429298401e-05, -1.9863247871398926e-05, -1.5225261449813843e-05, -1.058727502822876e-05, -5.949288606643677e-06, -1.3113021850585938e-06, 3.3266842365264893e-06, 7.964670658111572e-06, 1.2602657079696655e-05, 1.7240643501281738e-05, 2.187862992286682e-05, 2.6516616344451904e-05, 3.115460276603699e-05, 3.579258918762207e-05, 4.043057560920715e-05, 4.5068562030792236e-05, 4.970654845237732e-05, 5.43445348739624e-05, 5.8982521295547485e-05, 6.362050771713257e-05, 6.825849413871765e-05, 7.289648056030273e-05, 7.753446698188782e-05, 8.21724534034729e-05, 8.681043982505798e-05, 9.144842624664307e-05, 9.608641266822815e-05, 0.00010072439908981323, 0.00010536238551139832, 0.0001100003719329834, 0.00011463835835456848, 0.00011927634477615356, 0.00012391433119773865, 0.00012855231761932373, 0.0001331903040409088, 0.0001378282904624939, 0.00014246627688407898, 0.00014710426330566406]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 9.0, 13.0, 21.0, 25.0, 43.0, 54.0, 78.0, 111.0, 175.0, 254.0, 395.0, 610.0, 979.0, 1573.0, 2933.0, 5861.0, 13402.0, 45023.0, 446596.0, 458027.0, 45825.0, 13544.0, 5697.0, 2886.0, 1610.0, 953.0, 612.0, 408.0, 251.0, 183.0, 108.0, 79.0, 66.0, 38.0, 29.0, 14.0, 17.0, 15.0, 3.0, 5.0, 6.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0003705024719238281, -0.000359605997800827, -0.00034870952367782593, -0.00033781304955482483, -0.00032691657543182373, -0.00031602010130882263, -0.00030512362718582153, -0.00029422715306282043, -0.00028333067893981934, -0.00027243420481681824, -0.00026153773069381714, -0.00025064125657081604, -0.00023974478244781494, -0.00022884830832481384, -0.00021795183420181274, -0.00020705536007881165, -0.00019615888595581055, -0.00018526241183280945, -0.00017436593770980835, -0.00016346946358680725, -0.00015257298946380615, -0.00014167651534080505, -0.00013078004121780396, -0.00011988356709480286, -0.00010898709297180176, -9.809061884880066e-05, -8.719414472579956e-05, -7.629767060279846e-05, -6.540119647979736e-05, -5.4504722356796265e-05, -4.3608248233795166e-05, -3.271177411079407e-05, -2.181529998779297e-05, -1.091882586479187e-05, -2.2351741790771484e-08, 1.0874122381210327e-05, 2.1770596504211426e-05, 3.2667070627212524e-05, 4.356354475021362e-05, 5.446001887321472e-05, 6.535649299621582e-05, 7.625296711921692e-05, 8.714944124221802e-05, 9.804591536521912e-05, 0.00010894238948822021, 0.00011983886361122131, 0.0001307353377342224, 0.0001416318118572235, 0.0001525282859802246, 0.0001634247601032257, 0.0001743212342262268, 0.0001852177083492279, 0.000196114182472229, 0.0002070106565952301, 0.0002179071307182312, 0.0002288036048412323, 0.0002397000789642334, 0.0002505965530872345, 0.0002614930272102356, 0.0002723895013332367, 0.0002832859754562378, 0.0002941824495792389, 0.00030507892370224, 0.0003159753978252411, 0.0003268718719482422]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 4.0, 5.0, 8.0, 7.0, 8.0, 15.0, 19.0, 10.0, 31.0, 31.0, 75.0, 97.0, 151.0, 171.0, 114.0, 78.0, 45.0, 42.0, 18.0, 20.0, 10.0, 6.0, 5.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2576580047607422e-05, -1.2184493243694305e-05, -1.1792406439781189e-05, -1.1400319635868073e-05, -1.1008232831954956e-05, -1.061614602804184e-05, -1.0224059224128723e-05, -9.831972420215607e-06, -9.43988561630249e-06, -9.047798812389374e-06, -8.655712008476257e-06, -8.263625204563141e-06, -7.871538400650024e-06, -7.479451596736908e-06, -7.0873647928237915e-06, -6.695277988910675e-06, -6.303191184997559e-06, -5.911104381084442e-06, -5.519017577171326e-06, -5.126930773258209e-06, -4.734843969345093e-06, -4.342757165431976e-06, -3.95067036151886e-06, -3.5585835576057434e-06, -3.166496753692627e-06, -2.7744099497795105e-06, -2.382323145866394e-06, -1.9902363419532776e-06, -1.5981495380401611e-06, -1.2060627341270447e-06, -8.139759302139282e-07, -4.2188912630081177e-07, -2.9802322387695312e-08, 3.6228448152542114e-07, 7.543712854385376e-07, 1.146458089351654e-06, 1.5385448932647705e-06, 1.930631697177887e-06, 2.3227185010910034e-06, 2.71480530500412e-06, 3.1068921089172363e-06, 3.4989789128303528e-06, 3.891065716743469e-06, 4.283152520656586e-06, 4.675239324569702e-06, 5.067326128482819e-06, 5.459412932395935e-06, 5.8514997363090515e-06, 6.243586540222168e-06, 6.6356733441352844e-06, 7.027760148048401e-06, 7.419846951961517e-06, 7.811933755874634e-06, 8.20402055978775e-06, 8.596107363700867e-06, 8.988194167613983e-06, 9.3802809715271e-06, 9.772367775440216e-06, 1.0164454579353333e-05, 1.0556541383266449e-05, 1.0948628187179565e-05, 1.1340714991092682e-05, 1.1732801795005798e-05, 1.2124888598918915e-05, 1.2516975402832031e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 1.0, 6.0, 11.0, 14.0, 27.0, 28.0, 46.0, 56.0, 53.0, 90.0, 126.0, 177.0, 215.0, 286.0, 412.0, 530.0, 722.0, 1056.0, 1496.0, 2271.0, 3679.0, 5569.0, 9147.0, 15994.0, 29832.0, 67478.0, 186225.0, 428301.0, 165566.0, 61444.0, 27900.0, 14828.0, 8835.0, 5315.0, 3406.0, 2259.0, 1493.0, 972.0, 676.0, 569.0, 352.0, 276.0, 203.0, 182.0, 119.0, 80.0, 63.0, 48.0, 44.0, 26.0, 17.0, 12.0, 8.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.00010633468627929688, -0.00010284222662448883, -9.934976696968079e-05, -9.585730731487274e-05, -9.23648476600647e-05, -8.887238800525665e-05, -8.537992835044861e-05, -8.188746869564056e-05, -7.839500904083252e-05, -7.490254938602448e-05, -7.141008973121643e-05, -6.791763007640839e-05, -6.442517042160034e-05, -6.09327107667923e-05, -5.744025111198425e-05, -5.394779145717621e-05, -5.0455331802368164e-05, -4.696287214756012e-05, -4.3470412492752075e-05, -3.997795283794403e-05, -3.6485493183135986e-05, -3.299303352832794e-05, -2.9500573873519897e-05, -2.6008114218711853e-05, -2.251565456390381e-05, -1.9023194909095764e-05, -1.553073525428772e-05, -1.2038275599479675e-05, -8.545815944671631e-06, -5.0533562898635864e-06, -1.560896635055542e-06, 1.9315630197525024e-06, 5.424022674560547e-06, 8.916482329368591e-06, 1.2408941984176636e-05, 1.590140163898468e-05, 1.9393861293792725e-05, 2.288632094860077e-05, 2.6378780603408813e-05, 2.9871240258216858e-05, 3.33636999130249e-05, 3.685615956783295e-05, 4.034861922264099e-05, 4.3841078877449036e-05, 4.733353853225708e-05, 5.0825998187065125e-05, 5.431845784187317e-05, 5.781091749668121e-05, 6.130337715148926e-05, 6.47958368062973e-05, 6.828829646110535e-05, 7.178075611591339e-05, 7.527321577072144e-05, 7.876567542552948e-05, 8.225813508033752e-05, 8.575059473514557e-05, 8.924305438995361e-05, 9.273551404476166e-05, 9.62279736995697e-05, 9.972043335437775e-05, 0.00010321289300918579, 0.00010670535266399384, 0.00011019781231880188, 0.00011369027197360992, 0.00011718273162841797]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 4.0, 6.0, 14.0, 10.0, 14.0, 13.0, 23.0, 25.0, 27.0, 43.0, 51.0, 63.0, 80.0, 71.0, 89.0, 95.0, 70.0, 68.0, 54.0, 42.0, 29.0, 26.0, 21.0, 14.0, 13.0, 6.0, 10.0, 6.0, 6.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5033950805664062e-05, -2.4049542844295502e-05, -2.306513488292694e-05, -2.208072692155838e-05, -2.109631896018982e-05, -2.011191099882126e-05, -1.9127503037452698e-05, -1.8143095076084137e-05, -1.7158687114715576e-05, -1.6174279153347015e-05, -1.5189871191978455e-05, -1.4205463230609894e-05, -1.3221055269241333e-05, -1.2236647307872772e-05, -1.1252239346504211e-05, -1.026783138513565e-05, -9.28342342376709e-06, -8.299015462398529e-06, -7.314607501029968e-06, -6.3301995396614075e-06, -5.345791578292847e-06, -4.361383616924286e-06, -3.376975655555725e-06, -2.3925676941871643e-06, -1.4081597328186035e-06, -4.237517714500427e-07, 5.606561899185181e-07, 1.5450641512870789e-06, 2.5294721126556396e-06, 3.5138800740242004e-06, 4.498288035392761e-06, 5.482695996761322e-06, 6.467103958129883e-06, 7.451511919498444e-06, 8.435919880867004e-06, 9.420327842235565e-06, 1.0404735803604126e-05, 1.1389143764972687e-05, 1.2373551726341248e-05, 1.3357959687709808e-05, 1.4342367649078369e-05, 1.532677561044693e-05, 1.631118357181549e-05, 1.729559153318405e-05, 1.8279999494552612e-05, 1.9264407455921173e-05, 2.0248815417289734e-05, 2.1233223378658295e-05, 2.2217631340026855e-05, 2.3202039301395416e-05, 2.4186447262763977e-05, 2.5170855224132538e-05, 2.61552631855011e-05, 2.713967114686966e-05, 2.812407910823822e-05, 2.910848706960678e-05, 3.0092895030975342e-05, 3.10773029923439e-05, 3.206171095371246e-05, 3.3046118915081024e-05, 3.4030526876449585e-05, 3.5014934837818146e-05, 3.5999342799186707e-05, 3.698375076055527e-05, 3.796815872192383e-05]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 9.0, 7.0, 12.0, 12.0, 17.0, 16.0, 25.0, 35.0, 33.0, 40.0, 59.0, 70.0, 68.0, 91.0, 75.0, 89.0, 72.0, 45.0, 41.0, 24.0, 35.0, 26.0, 22.0, 17.0, 9.0, 7.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0003416316758375615, -0.00033181466278620064, -0.00032199762063100934, -0.0003121806075796485, -0.00030236359452828765, -0.0002925465814769268, -0.00028272956842556596, -0.00027291252627037466, -0.0002630955132190138, -0.00025327850016765296, -0.0002434614725643769, -0.00023364444496110082, -0.00022382743190973997, -0.00021401041885837913, -0.00020419339125510305, -0.00019437636365182698, -0.00018455935060046613, -0.0001747423375491053, -0.0001649253099458292, -0.00015510828234255314, -0.0001452912692911923, -0.00013547425623983145, -0.00012565722863655537, -0.00011584020830923691, -0.00010602318798191845, -9.62061676546e-05, -8.638914732728153e-05, -7.657212699996307e-05, -6.675510667264462e-05, -5.6938086345326155e-05, -4.7121066018007696e-05, -3.7304045690689236e-05, -2.748699625954032e-05, -1.766997593222186e-05, -7.8529556049034e-06, 1.96406472241506e-06, 1.178108504973352e-05, 2.159810537705198e-05, 3.141512570437044e-05, 4.12321460316889e-05, 5.104916635900736e-05, 6.086618668632582e-05, 7.068320701364428e-05, 8.050022734096274e-05, 9.03172476682812e-05, 0.00010013426799559966, 0.00010995128832291812, 0.00011976830865023658, 0.00012958532897755504, 0.00013940234202891588, 0.00014921936963219196, 0.00015903639723546803, 0.00016885341028682888, 0.00017867042333818972, 0.0001884874509414658, 0.00019830447854474187, 0.00020812149159610271, 0.00021793850464746356, 0.00022775553225073963, 0.0002375725598540157, 0.00024738957290537655, 0.0002572065859567374, 0.0002670236281119287, 0.00027684064116328955, 0.0002866576542146504]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 2.0, 8.0, 6.0, 9.0, 14.0, 9.0, 17.0, 15.0, 19.0, 19.0, 17.0, 26.0, 34.0, 34.0, 30.0, 31.0, 30.0, 42.0, 37.0, 35.0, 37.0, 35.0, 31.0, 31.0, 41.0, 45.0, 46.0, 25.0, 26.0, 26.0, 29.0, 26.0, 17.0, 22.0, 20.0, 20.0, 11.0, 11.0, 10.0, 11.0, 10.0, 10.0, 6.0, 3.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00023243452596943825, -0.00022555378382094204, -0.00021867304167244583, -0.00021179229952394962, -0.0002049115573754534, -0.0001980308152269572, -0.00019115005852654576, -0.00018426933092996478, -0.00017738857422955334, -0.00017050783208105713, -0.00016362708993256092, -0.0001567463477840647, -0.0001498656056355685, -0.0001429848634870723, -0.00013610412133857608, -0.00012922336463816464, -0.00012234263704158366, -0.00011546189489308745, -0.00010858115274459124, -0.00010170041059609503, -9.481966844759881e-05, -8.79389262991026e-05, -8.105817687464878e-05, -7.417743472615257e-05, -6.729669257765636e-05, -6.041595042916015e-05, -5.353520828066394e-05, -4.665446249418892e-05, -3.977372034569271e-05, -3.28929781971965e-05, -2.601223241072148e-05, -1.913149026222527e-05, -1.2250733561813831e-05, -5.369990503822919e-06, 1.5107525541679934e-06, 8.391496521653607e-06, 1.5272238670149818e-05, 2.215298081864603e-05, 2.9033726605121046e-05, 3.591446875361726e-05, 4.279521090211347e-05, 4.967595305060968e-05, 5.655669519910589e-05, 6.343744462355971e-05, 7.031818677205592e-05, 7.719892892055213e-05, 8.407967106904835e-05, 9.096041321754456e-05, 9.784115536604077e-05, 0.00010472189751453698, 0.00011160263966303319, 0.0001184833818115294, 0.0001253641239600256, 0.00013224486610852182, 0.00013912562280893326, 0.00014600635040551424, 0.00015288710710592568, 0.0001597678492544219, 0.0001666485914029181, 0.0001735293335514143, 0.00018041007569991052, 0.00018729081784840673, 0.00019417155999690294, 0.00020105231669731438, 0.00020793304429389536]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 5.0, 12.0, 17.0, 35.0, 33.0, 48.0, 62.0, 114.0, 138.0, 180.0, 258.0, 355.0, 546.0, 696.0, 1001.0, 1444.0, 1909.0, 2715.0, 3708.0, 5258.0, 7138.0, 10367.0, 14543.0, 21198.0, 30364.0, 45420.0, 67450.0, 101662.0, 146587.0, 169525.0, 133569.0, 90139.0, 60009.0, 40202.0, 27135.0, 18989.0, 13234.0, 9264.0, 6484.0, 4773.0, 3336.0, 2426.0, 1673.0, 1329.0, 933.0, 663.0, 512.0, 316.0, 220.0, 166.0, 112.0, 89.0, 67.0, 51.0, 35.0, 20.0, 11.0, 13.0, 4.0, 4.0, 2.0], "bins": [-0.0003173351287841797, -0.00030752643942832947, -0.00029771775007247925, -0.00028790906071662903, -0.0002781003713607788, -0.0002682916820049286, -0.00025848299264907837, -0.00024867430329322815, -0.00023886561393737793, -0.0002290569245815277, -0.0002192482352256775, -0.00020943954586982727, -0.00019963085651397705, -0.00018982216715812683, -0.0001800134778022766, -0.0001702047884464264, -0.00016039609909057617, -0.00015058740973472595, -0.00014077872037887573, -0.0001309700310230255, -0.00012116134166717529, -0.00011135265231132507, -0.00010154396295547485, -9.173527359962463e-05, -8.192658424377441e-05, -7.21178948879242e-05, -6.230920553207397e-05, -5.2500516176223755e-05, -4.2691826820373535e-05, -3.2883137464523315e-05, -2.3074448108673096e-05, -1.3265758752822876e-05, -3.4570693969726562e-06, 6.3516199588775635e-06, 1.6160309314727783e-05, 2.5968998670578003e-05, 3.577768802642822e-05, 4.558637738227844e-05, 5.539506673812866e-05, 6.520375609397888e-05, 7.50124454498291e-05, 8.482113480567932e-05, 9.462982416152954e-05, 0.00010443851351737976, 0.00011424720287322998, 0.0001240558922290802, 0.00013386458158493042, 0.00014367327094078064, 0.00015348196029663086, 0.00016329064965248108, 0.0001730993390083313, 0.00018290802836418152, 0.00019271671772003174, 0.00020252540707588196, 0.00021233409643173218, 0.0002221427857875824, 0.00023195147514343262, 0.00024176016449928284, 0.00025156885385513306, 0.0002613775432109833, 0.0002711862325668335, 0.0002809949219226837, 0.00029080361127853394, 0.00030061230063438416, 0.0003104209899902344]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 3.0, 12.0, 5.0, 14.0, 11.0, 14.0, 14.0, 12.0, 22.0, 30.0, 26.0, 27.0, 45.0, 29.0, 32.0, 44.0, 39.0, 38.0, 46.0, 36.0, 44.0, 31.0, 54.0, 36.0, 34.0, 45.0, 29.0, 25.0, 35.0, 23.0, 23.0, 22.0, 18.0, 10.0, 11.0, 6.0, 17.0, 10.0, 8.0, 6.0, 5.0, 8.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020694732666015625, -0.0002005062997341156, -0.00019406527280807495, -0.0001876242458820343, -0.00018118321895599365, -0.000174742192029953, -0.00016830116510391235, -0.0001618601381778717, -0.00015541911125183105, -0.0001489780843257904, -0.00014253705739974976, -0.0001360960304737091, -0.00012965500354766846, -0.0001232139766216278, -0.00011677294969558716, -0.00011033192276954651, -0.00010389089584350586, -9.744986891746521e-05, -9.100884199142456e-05, -8.456781506538391e-05, -7.812678813934326e-05, -7.168576121330261e-05, -6.524473428726196e-05, -5.8803707361221313e-05, -5.2362680435180664e-05, -4.5921653509140015e-05, -3.9480626583099365e-05, -3.3039599657058716e-05, -2.6598572731018066e-05, -2.0157545804977417e-05, -1.3716518878936768e-05, -7.275491952896118e-06, -8.344650268554688e-07, 5.606561899185181e-06, 1.204758882522583e-05, 1.848861575126648e-05, 2.492964267730713e-05, 3.137066960334778e-05, 3.781169652938843e-05, 4.425272345542908e-05, 5.0693750381469727e-05, 5.7134777307510376e-05, 6.357580423355103e-05, 7.001683115959167e-05, 7.645785808563232e-05, 8.289888501167297e-05, 8.933991193771362e-05, 9.578093886375427e-05, 0.00010222196578979492, 0.00010866299271583557, 0.00011510401964187622, 0.00012154504656791687, 0.00012798607349395752, 0.00013442710041999817, 0.00014086812734603882, 0.00014730915427207947, 0.00015375018119812012, 0.00016019120812416077, 0.00016663223505020142, 0.00017307326197624207, 0.00017951428890228271, 0.00018595531582832336, 0.00019239634275436401, 0.00019883736968040466, 0.0002052783966064453]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 8.0, 4.0, 9.0, 13.0, 18.0, 33.0, 48.0, 54.0, 90.0, 116.0, 175.0, 229.0, 368.0, 521.0, 817.0, 1182.0, 1729.0, 2742.0, 4255.0, 6896.0, 10750.0, 17135.0, 27855.0, 46017.0, 75889.0, 126003.0, 198284.0, 200965.0, 127943.0, 76448.0, 46229.0, 28088.0, 17262.0, 10929.0, 6816.0, 4347.0, 2755.0, 1843.0, 1184.0, 825.0, 520.0, 351.0, 244.0, 183.0, 114.0, 87.0, 53.0, 42.0, 29.0, 23.0, 19.0, 8.0, 2.0, 10.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.0003821849822998047, -0.00037024542689323425, -0.0003583058714866638, -0.0003463663160800934, -0.00033442676067352295, -0.0003224872052669525, -0.0003105476498603821, -0.00029860809445381165, -0.0002866685390472412, -0.0002747289836406708, -0.00026278942823410034, -0.0002508498728275299, -0.00023891031742095947, -0.00022697076201438904, -0.0002150312066078186, -0.00020309165120124817, -0.00019115209579467773, -0.0001792125403881073, -0.00016727298498153687, -0.00015533342957496643, -0.000143393874168396, -0.00013145431876182556, -0.00011951476335525513, -0.00010757520794868469, -9.563565254211426e-05, -8.369609713554382e-05, -7.175654172897339e-05, -5.9816986322402954e-05, -4.787743091583252e-05, -3.5937875509262085e-05, -2.399832010269165e-05, -1.2058764696121216e-05, -1.1920928955078125e-07, 1.1820346117019653e-05, 2.3759901523590088e-05, 3.569945693016052e-05, 4.763901233673096e-05, 5.957856774330139e-05, 7.151812314987183e-05, 8.345767855644226e-05, 9.53972339630127e-05, 0.00010733678936958313, 0.00011927634477615356, 0.000131215900182724, 0.00014315545558929443, 0.00015509501099586487, 0.0001670345664024353, 0.00017897412180900574, 0.00019091367721557617, 0.0002028532326221466, 0.00021479278802871704, 0.00022673234343528748, 0.0002386718988418579, 0.00025061145424842834, 0.0002625510096549988, 0.0002744905650615692, 0.00028643012046813965, 0.0002983696758747101, 0.0003103092312812805, 0.00032224878668785095, 0.0003341883420944214, 0.0003461278975009918, 0.00035806745290756226, 0.0003700070083141327, 0.0003819465637207031]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 8.0, 7.0, 6.0, 13.0, 13.0, 10.0, 20.0, 18.0, 21.0, 19.0, 28.0, 34.0, 35.0, 30.0, 42.0, 35.0, 24.0, 37.0, 30.0, 39.0, 50.0, 34.0, 43.0, 37.0, 37.0, 44.0, 30.0, 39.0, 29.0, 28.0, 21.0, 29.0, 15.0, 23.0, 10.0, 12.0, 7.0, 7.0, 7.0, 4.0, 6.0, 6.0, 1.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00013756752014160156, -0.0001335740089416504, -0.00012958049774169922, -0.00012558698654174805, -0.00012159347534179688, -0.0001175999641418457, -0.00011360645294189453, -0.00010961294174194336, -0.00010561943054199219, -0.00010162591934204102, -9.763240814208984e-05, -9.363889694213867e-05, -8.96453857421875e-05, -8.565187454223633e-05, -8.165836334228516e-05, -7.766485214233398e-05, -7.367134094238281e-05, -6.967782974243164e-05, -6.568431854248047e-05, -6.16908073425293e-05, -5.7697296142578125e-05, -5.370378494262695e-05, -4.971027374267578e-05, -4.571676254272461e-05, -4.172325134277344e-05, -3.7729740142822266e-05, -3.3736228942871094e-05, -2.9742717742919922e-05, -2.574920654296875e-05, -2.1755695343017578e-05, -1.7762184143066406e-05, -1.3768672943115234e-05, -9.775161743164062e-06, -5.781650543212891e-06, -1.7881393432617188e-06, 2.205371856689453e-06, 6.198883056640625e-06, 1.0192394256591797e-05, 1.4185905456542969e-05, 1.817941665649414e-05, 2.2172927856445312e-05, 2.6166439056396484e-05, 3.0159950256347656e-05, 3.415346145629883e-05, 3.814697265625e-05, 4.214048385620117e-05, 4.6133995056152344e-05, 5.0127506256103516e-05, 5.412101745605469e-05, 5.811452865600586e-05, 6.210803985595703e-05, 6.61015510559082e-05, 7.009506225585938e-05, 7.408857345581055e-05, 7.808208465576172e-05, 8.207559585571289e-05, 8.606910705566406e-05, 9.006261825561523e-05, 9.40561294555664e-05, 9.804964065551758e-05, 0.00010204315185546875, 0.00010603666305541992, 0.0001100301742553711, 0.00011402368545532227, 0.00011801719665527344]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 10.0, 4.0, 10.0, 10.0, 24.0, 26.0, 29.0, 51.0, 77.0, 90.0, 135.0, 202.0, 248.0, 441.0, 670.0, 1014.0, 1584.0, 2471.0, 4504.0, 8555.0, 19616.0, 66238.0, 859586.0, 48481.0, 16481.0, 7465.0, 3997.0, 2317.0, 1396.0, 954.0, 590.0, 403.0, 279.0, 169.0, 113.0, 100.0, 47.0, 45.0, 40.0, 17.0, 20.0, 12.0, 8.0, 10.0, 2.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00013959407806396484, -0.00013528577983379364, -0.00013097748160362244, -0.00012666918337345123, -0.00012236088514328003, -0.00011805258691310883, -0.00011374428868293762, -0.00010943599045276642, -0.00010512769222259521, -0.00010081939399242401, -9.651109576225281e-05, -9.22027975320816e-05, -8.78944993019104e-05, -8.35862010717392e-05, -7.927790284156799e-05, -7.496960461139679e-05, -7.066130638122559e-05, -6.635300815105438e-05, -6.204470992088318e-05, -5.7736411690711975e-05, -5.342811346054077e-05, -4.911981523036957e-05, -4.4811517000198364e-05, -4.050321877002716e-05, -3.619492053985596e-05, -3.1886622309684753e-05, -2.757832407951355e-05, -2.3270025849342346e-05, -1.8961727619171143e-05, -1.4653429388999939e-05, -1.0345131158828735e-05, -6.036832928657532e-06, -1.7285346984863281e-06, 2.5797635316848755e-06, 6.888061761856079e-06, 1.1196359992027283e-05, 1.5504658222198486e-05, 1.981295645236969e-05, 2.4121254682540894e-05, 2.8429552912712097e-05, 3.27378511428833e-05, 3.7046149373054504e-05, 4.135444760322571e-05, 4.566274583339691e-05, 4.9971044063568115e-05, 5.427934229373932e-05, 5.858764052391052e-05, 6.289593875408173e-05, 6.720423698425293e-05, 7.151253521442413e-05, 7.582083344459534e-05, 8.012913167476654e-05, 8.443742990493774e-05, 8.874572813510895e-05, 9.305402636528015e-05, 9.736232459545135e-05, 0.00010167062282562256, 0.00010597892105579376, 0.00011028721928596497, 0.00011459551751613617, 0.00011890381574630737, 0.00012321211397647858, 0.00012752041220664978, 0.00013182871043682098, 0.0001361370086669922]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 13.0, 0.0, 12.0, 29.0, 39.0, 64.0, 92.0, 158.0, 151.0, 145.0, 0.0, 86.0, 59.0, 43.0, 29.0, 16.0, 12.0, 9.0, 6.0, 0.0, 5.0, 5.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8477439880371094e-06, -1.794658601284027e-06, -1.7415732145309448e-06, -1.6884878277778625e-06, -1.6354024410247803e-06, -1.582317054271698e-06, -1.5292316675186157e-06, -1.4761462807655334e-06, -1.4230608940124512e-06, -1.369975507259369e-06, -1.3168901205062866e-06, -1.2638047337532043e-06, -1.210719347000122e-06, -1.1576339602470398e-06, -1.1045485734939575e-06, -1.0514631867408752e-06, -9.98377799987793e-07, -9.452924132347107e-07, -8.922070264816284e-07, -8.391216397285461e-07, -7.860362529754639e-07, -7.329508662223816e-07, -6.798654794692993e-07, -6.26780092716217e-07, -5.736947059631348e-07, -5.206093192100525e-07, -4.675239324569702e-07, -4.1443854570388794e-07, -3.6135315895080566e-07, -3.082677721977234e-07, -2.551823854446411e-07, -2.0209699869155884e-07, -1.4901161193847656e-07, -9.592622518539429e-08, -4.284083843231201e-08, 1.0244548320770264e-08, 6.332993507385254e-08, 1.1641532182693481e-07, 1.695007085800171e-07, 2.2258609533309937e-07, 2.7567148208618164e-07, 3.287568688392639e-07, 3.818422555923462e-07, 4.3492764234542847e-07, 4.880130290985107e-07, 5.41098415851593e-07, 5.941838026046753e-07, 6.472691893577576e-07, 7.003545761108398e-07, 7.534399628639221e-07, 8.065253496170044e-07, 8.596107363700867e-07, 9.126961231231689e-07, 9.657815098762512e-07, 1.0188668966293335e-06, 1.0719522833824158e-06, 1.125037670135498e-06, 1.1781230568885803e-06, 1.2312084436416626e-06, 1.2842938303947449e-06, 1.3373792171478271e-06, 1.3904646039009094e-06, 1.4435499906539917e-06, 1.496635377407074e-06, 1.5497207641601562e-06]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 10.0, 8.0, 14.0, 16.0, 29.0, 35.0, 40.0, 43.0, 42.0, 69.0, 98.0, 144.0, 172.0, 247.0, 302.0, 347.0, 474.0, 629.0, 889.0, 1274.0, 1626.0, 2285.0, 3464.0, 5070.0, 8060.0, 13315.0, 24947.0, 63680.0, 803549.0, 57118.0, 23326.0, 12705.0, 7675.0, 5089.0, 3167.0, 2325.0, 1591.0, 1140.0, 881.0, 628.0, 433.0, 350.0, 275.0, 304.0, 212.0, 116.0, 80.0, 55.0, 44.0, 45.0, 38.0, 20.0, 22.0, 6.0, 19.0, 5.0, 11.0, 10.0, 0.0, 2.0], "bins": [-0.00011903047561645508, -0.00011536292731761932, -0.00011169537901878357, -0.00010802783071994781, -0.00010436028242111206, -0.0001006927341222763, -9.702518582344055e-05, -9.33576375246048e-05, -8.969008922576904e-05, -8.602254092693329e-05, -8.235499262809753e-05, -7.868744432926178e-05, -7.501989603042603e-05, -7.135234773159027e-05, -6.768479943275452e-05, -6.401725113391876e-05, -6.034970283508301e-05, -5.6682154536247253e-05, -5.30146062374115e-05, -4.9347057938575745e-05, -4.567950963973999e-05, -4.2011961340904236e-05, -3.834441304206848e-05, -3.467686474323273e-05, -3.100931644439697e-05, -2.7341768145561218e-05, -2.3674219846725464e-05, -2.000667154788971e-05, -1.6339123249053955e-05, -1.26715749502182e-05, -9.004026651382446e-06, -5.336478352546692e-06, -1.6689300537109375e-06, 1.998618245124817e-06, 5.666166543960571e-06, 9.333714842796326e-06, 1.300126314163208e-05, 1.6668811440467834e-05, 2.033635973930359e-05, 2.4003908038139343e-05, 2.7671456336975098e-05, 3.133900463581085e-05, 3.5006552934646606e-05, 3.867410123348236e-05, 4.2341649532318115e-05, 4.600919783115387e-05, 4.9676746129989624e-05, 5.334429442882538e-05, 5.701184272766113e-05, 6.067939102649689e-05, 6.434693932533264e-05, 6.80144876241684e-05, 7.168203592300415e-05, 7.53495842218399e-05, 7.901713252067566e-05, 8.268468081951141e-05, 8.635222911834717e-05, 9.001977741718292e-05, 9.368732571601868e-05, 9.735487401485443e-05, 0.00010102242231369019, 0.00010468997061252594, 0.0001083575189113617, 0.00011202506721019745, 0.0001156926155090332]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 5.0, 7.0, 12.0, 11.0, 6.0, 9.0, 18.0, 16.0, 26.0, 27.0, 89.0, 571.0, 63.0, 20.0, 17.0, 14.0, 15.0, 12.0, 3.0, 7.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4749507904052734e-05, -3.360491245985031e-05, -3.246031701564789e-05, -3.1315721571445465e-05, -3.0171126127243042e-05, -2.902653068304062e-05, -2.7881935238838196e-05, -2.6737339794635773e-05, -2.559274435043335e-05, -2.4448148906230927e-05, -2.3303553462028503e-05, -2.215895801782608e-05, -2.1014362573623657e-05, -1.9869767129421234e-05, -1.872517168521881e-05, -1.7580576241016388e-05, -1.6435980796813965e-05, -1.5291385352611542e-05, -1.4146789908409119e-05, -1.3002194464206696e-05, -1.1857599020004272e-05, -1.071300357580185e-05, -9.568408131599426e-06, -8.423812687397003e-06, -7.27921724319458e-06, -6.134621798992157e-06, -4.990026354789734e-06, -3.845430910587311e-06, -2.7008354663848877e-06, -1.5562400221824646e-06, -4.116445779800415e-07, 7.329508662223816e-07, 1.8775463104248047e-06, 3.0221417546272278e-06, 4.166737198829651e-06, 5.311332643032074e-06, 6.455928087234497e-06, 7.60052353143692e-06, 8.745118975639343e-06, 9.889714419841766e-06, 1.103430986404419e-05, 1.2178905308246613e-05, 1.3323500752449036e-05, 1.4468096196651459e-05, 1.5612691640853882e-05, 1.6757287085056305e-05, 1.7901882529258728e-05, 1.904647797346115e-05, 2.0191073417663574e-05, 2.1335668861865997e-05, 2.248026430606842e-05, 2.3624859750270844e-05, 2.4769455194473267e-05, 2.591405063867569e-05, 2.7058646082878113e-05, 2.8203241527080536e-05, 2.934783697128296e-05, 3.0492432415485382e-05, 3.1637027859687805e-05, 3.278162330389023e-05, 3.392621874809265e-05, 3.5070814192295074e-05, 3.62154096364975e-05, 3.736000508069992e-05, 3.8504600524902344e-05]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 7.0, 10.0, 10.0, 12.0, 11.0, 12.0, 21.0, 24.0, 38.0, 48.0, 66.0, 87.0, 100.0, 103.0, 78.0, 67.0, 71.0, 49.0, 38.0, 47.0, 26.0, 10.0, 6.0, 11.0, 7.0, 6.0, 8.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0003639767237473279, -0.00035393895814195275, -0.00034390122164040804, -0.00033386345603503287, -0.0003238256904296577, -0.0003137879248242825, -0.00030375015921890736, -0.00029371242271736264, -0.00028367465711198747, -0.0002736368915066123, -0.0002635991550050676, -0.0002535613893996924, -0.00024352362379431725, -0.00023348585818894207, -0.00022344810713548213, -0.0002134103560820222, -0.00020337259047664702, -0.00019333482487127185, -0.0001832970738178119, -0.00017325932276435196, -0.0001632215571589768, -0.00015318379155360162, -0.00014314604050014168, -0.00013310828944668174, -0.00012307052384130657, -0.00011303276551188901, -0.00010299500718247145, -9.29572488530539e-05, -8.291949052363634e-05, -7.288173219421878e-05, -6.284397386480123e-05, -5.280621553538367e-05, -4.276842810213566e-05, -3.27306697727181e-05, -2.2692911443300545e-05, -1.2655153113882989e-05, -2.617394784465432e-06, 7.420363544952124e-06, 1.745812187436968e-05, 2.7495880203787237e-05, 3.7533638533204794e-05, 4.757139686262235e-05, 5.760915519203991e-05, 6.764691352145746e-05, 7.768467185087502e-05, 8.772243018029258e-05, 9.776018850971013e-05, 0.00010779794683912769, 0.00011783570516854525, 0.00012787347077392042, 0.00013791122182738036, 0.0001479489728808403, 0.00015798673848621547, 0.00016802450409159064, 0.00017806225514505059, 0.00018810000619851053, 0.0001981377718038857, 0.00020817553740926087, 0.0002182132884627208, 0.00022825103951618075, 0.00023828880512155592, 0.0002483265707269311, 0.0002583643072284758, 0.000268402072833851, 0.00027843983843922615]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 1.0, 9.0, 7.0, 5.0, 7.0, 14.0, 11.0, 17.0, 26.0, 18.0, 19.0, 26.0, 35.0, 29.0, 29.0, 41.0, 29.0, 32.0, 33.0, 52.0, 42.0, 45.0, 44.0, 31.0, 39.0, 38.0, 32.0, 32.0, 34.0, 27.0, 30.0, 24.0, 28.0, 22.0, 17.0, 16.0, 10.0, 8.0, 12.0, 4.0, 7.0, 6.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00021589358220808208, -0.00020922219846397638, -0.0002025508147198707, -0.000195879430975765, -0.00018920806178357452, -0.00018253667803946882, -0.00017586529429536313, -0.00016919391055125743, -0.00016252254135906696, -0.00015585115761496127, -0.00014917977387085557, -0.00014250839012674987, -0.0001358370209345594, -0.0001291656371904537, -0.000122494253446348, -0.00011582286970224231, -0.00010915148595813662, -0.00010248010221403092, -9.580872574588284e-05, -8.913734200177714e-05, -8.246596553362906e-05, -7.579458178952336e-05, -6.912319804541767e-05, -6.245181430131197e-05, -5.578043783316389e-05, -4.9109057727037e-05, -4.243767762091011e-05, -3.576629387680441e-05, -2.9094913770677522e-05, -2.2423533664550632e-05, -1.5752149920444936e-05, -9.080769814318046e-06, -2.4093897081911564e-06, 4.261991307430435e-06, 1.0933372323052026e-05, 1.760475424816832e-05, 2.427613435429521e-05, 3.09475144604221e-05, 3.7618898204527795e-05, 4.4290278310654685e-05, 5.0961658416781574e-05, 5.7633038522908464e-05, 6.430441862903535e-05, 7.097580237314105e-05, 7.764718611724675e-05, 8.431856258539483e-05, 9.098994632950053e-05, 9.766132279764861e-05, 0.0001043327065417543, 0.00011100409028586, 0.00011767546675400808, 0.00012434684322215617, 0.00013101822696626186, 0.00013768961071036756, 0.00014436099445447326, 0.00015103237819857895, 0.00015770376194268465, 0.00016437514568679035, 0.00017104652943089604, 0.00017771791317500174, 0.0001843892823671922, 0.0001910606661112979, 0.0001977320498554036, 0.0002044034335995093, 0.00021107480279169977]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 5.0, 5.0, 8.0, 11.0, 14.0, 25.0, 35.0, 55.0, 51.0, 110.0, 133.0, 192.0, 299.0, 423.0, 571.0, 833.0, 1212.0, 1691.0, 2499.0, 3671.0, 5356.0, 8032.0, 12088.0, 18259.0, 28315.0, 44858.0, 73105.0, 125162.0, 230084.0, 534736.0, 1285427.0, 990603.0, 375935.0, 179828.0, 101126.0, 60526.0, 37651.0, 24136.0, 15232.0, 10165.0, 6777.0, 4659.0, 3089.0, 2232.0, 1510.0, 1070.0, 746.0, 551.0, 362.0, 259.0, 167.0, 119.0, 110.0, 61.0, 38.0, 26.0, 27.0, 15.0, 7.0, 1.0, 3.0], "bins": [-0.00024008750915527344, -0.00023298710584640503, -0.00022588670253753662, -0.0002187862992286682, -0.0002116858959197998, -0.0002045854926109314, -0.000197485089302063, -0.00019038468599319458, -0.00018328428268432617, -0.00017618387937545776, -0.00016908347606658936, -0.00016198307275772095, -0.00015488266944885254, -0.00014778226613998413, -0.00014068186283111572, -0.00013358145952224731, -0.0001264810562133789, -0.0001193806529045105, -0.00011228024959564209, -0.00010517984628677368, -9.807944297790527e-05, -9.097903966903687e-05, -8.387863636016846e-05, -7.677823305130005e-05, -6.967782974243164e-05, -6.257742643356323e-05, -5.5477023124694824e-05, -4.8376619815826416e-05, -4.127621650695801e-05, -3.41758131980896e-05, -2.707540988922119e-05, -1.9975006580352783e-05, -1.2874603271484375e-05, -5.774199962615967e-06, 1.3262033462524414e-06, 8.42660665512085e-06, 1.5527009963989258e-05, 2.2627413272857666e-05, 2.9727816581726074e-05, 3.682821989059448e-05, 4.392862319946289e-05, 5.10290265083313e-05, 5.812942981719971e-05, 6.522983312606812e-05, 7.233023643493652e-05, 7.943063974380493e-05, 8.653104305267334e-05, 9.363144636154175e-05, 0.00010073184967041016, 0.00010783225297927856, 0.00011493265628814697, 0.00012203305959701538, 0.0001291334629058838, 0.0001362338662147522, 0.0001433342695236206, 0.00015043467283248901, 0.00015753507614135742, 0.00016463547945022583, 0.00017173588275909424, 0.00017883628606796265, 0.00018593668937683105, 0.00019303709268569946, 0.00020013749599456787, 0.00020723789930343628, 0.0002143383026123047]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 4.0, 12.0, 9.0, 11.0, 15.0, 10.0, 17.0, 18.0, 18.0, 22.0, 28.0, 31.0, 14.0, 38.0, 30.0, 33.0, 37.0, 40.0, 47.0, 47.0, 30.0, 33.0, 39.0, 41.0, 29.0, 41.0, 32.0, 28.0, 27.0, 32.0, 22.0, 20.0, 27.0, 19.0, 15.0, 16.0, 8.0, 8.0, 8.0, 11.0, 7.0, 4.0, 3.0, 3.0, 1.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00011134147644042969, -0.0001075640320777893, -0.00010378658771514893, -0.00010000914335250854, -9.623169898986816e-05, -9.245425462722778e-05, -8.86768102645874e-05, -8.489936590194702e-05, -8.112192153930664e-05, -7.734447717666626e-05, -7.356703281402588e-05, -6.97895884513855e-05, -6.601214408874512e-05, -6.223469972610474e-05, -5.8457255363464355e-05, -5.4679811000823975e-05, -5.0902366638183594e-05, -4.712492227554321e-05, -4.334747791290283e-05, -3.957003355026245e-05, -3.579258918762207e-05, -3.201514482498169e-05, -2.823770046234131e-05, -2.4460256099700928e-05, -2.0682811737060547e-05, -1.6905367374420166e-05, -1.3127923011779785e-05, -9.350478649139404e-06, -5.5730342864990234e-06, -1.7955899238586426e-06, 1.9818544387817383e-06, 5.759298801422119e-06, 9.5367431640625e-06, 1.3314187526702881e-05, 1.7091631889343262e-05, 2.0869076251983643e-05, 2.4646520614624023e-05, 2.8423964977264404e-05, 3.2201409339904785e-05, 3.5978853702545166e-05, 3.975629806518555e-05, 4.353374242782593e-05, 4.731118679046631e-05, 5.108863115310669e-05, 5.486607551574707e-05, 5.864351987838745e-05, 6.242096424102783e-05, 6.619840860366821e-05, 6.99758529663086e-05, 7.375329732894897e-05, 7.753074169158936e-05, 8.130818605422974e-05, 8.508563041687012e-05, 8.88630747795105e-05, 9.264051914215088e-05, 9.641796350479126e-05, 0.00010019540786743164, 0.00010397285223007202, 0.0001077502965927124, 0.00011152774095535278, 0.00011530518531799316, 0.00011908262968063354, 0.00012286007404327393, 0.0001266375184059143, 0.0001304149627685547]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 7.0, 10.0, 12.0, 15.0, 37.0, 60.0, 42.0, 86.0, 149.0, 188.0, 310.0, 486.0, 677.0, 1012.0, 1645.0, 2525.0, 3776.0, 6075.0, 9606.0, 15733.0, 25531.0, 42646.0, 71562.0, 127239.0, 237039.0, 502610.0, 1193080.0, 1026507.0, 434528.0, 212070.0, 112773.0, 65469.0, 38761.0, 22973.0, 14271.0, 9002.0, 5471.0, 3524.0, 2405.0, 1480.0, 943.0, 645.0, 413.0, 298.0, 194.0, 122.0, 86.0, 76.0, 40.0, 32.0, 12.0, 14.0, 6.0, 5.0, 6.0, 4.0, 2.0], "bins": [-0.0002256631851196289, -0.0002190079540014267, -0.0002123527228832245, -0.00020569749176502228, -0.00019904226064682007, -0.00019238702952861786, -0.00018573179841041565, -0.00017907656729221344, -0.00017242133617401123, -0.00016576610505580902, -0.0001591108739376068, -0.0001524556428194046, -0.0001458004117012024, -0.00013914518058300018, -0.00013248994946479797, -0.00012583471834659576, -0.00011917948722839355, -0.00011252425611019135, -0.00010586902499198914, -9.921379387378693e-05, -9.255856275558472e-05, -8.590333163738251e-05, -7.92481005191803e-05, -7.259286940097809e-05, -6.593763828277588e-05, -5.928240716457367e-05, -5.262717604637146e-05, -4.597194492816925e-05, -3.931671380996704e-05, -3.266148269176483e-05, -2.6006251573562622e-05, -1.9351020455360413e-05, -1.2695789337158203e-05, -6.040558218955994e-06, 6.146728992462158e-07, 7.269904017448425e-06, 1.3925135135650635e-05, 2.0580366253852844e-05, 2.7235597372055054e-05, 3.389082849025726e-05, 4.054605960845947e-05, 4.720129072666168e-05, 5.385652184486389e-05, 6.05117529630661e-05, 6.716698408126831e-05, 7.382221519947052e-05, 8.047744631767273e-05, 8.713267743587494e-05, 9.378790855407715e-05, 0.00010044313967227936, 0.00010709837079048157, 0.00011375360190868378, 0.00012040883302688599, 0.0001270640641450882, 0.0001337192952632904, 0.00014037452638149261, 0.00014702975749969482, 0.00015368498861789703, 0.00016034021973609924, 0.00016699545085430145, 0.00017365068197250366, 0.00018030591309070587, 0.00018696114420890808, 0.0001936163753271103, 0.0002002716064453125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 11.0, 14.0, 20.0, 20.0, 25.0, 33.0, 33.0, 66.0, 72.0, 79.0, 92.0, 100.0, 109.0, 138.0, 175.0, 203.0, 218.0, 225.0, 240.0, 252.0, 242.0, 248.0, 216.0, 205.0, 177.0, 135.0, 113.0, 96.0, 92.0, 79.0, 58.0, 52.0, 56.0, 45.0, 30.0, 26.0, 20.0, 11.0, 10.0, 6.0, 7.0, 3.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.216764450073242e-05, -6.006751209497452e-05, -5.7967379689216614e-05, -5.586724728345871e-05, -5.3767114877700806e-05, -5.16669824719429e-05, -4.9566850066185e-05, -4.7466717660427094e-05, -4.536658525466919e-05, -4.3266452848911285e-05, -4.116632044315338e-05, -3.906618803739548e-05, -3.696605563163757e-05, -3.486592322587967e-05, -3.2765790820121765e-05, -3.066565841436386e-05, -2.8565526008605957e-05, -2.6465393602848053e-05, -2.436526119709015e-05, -2.2265128791332245e-05, -2.016499638557434e-05, -1.8064863979816437e-05, -1.5964731574058533e-05, -1.3864599168300629e-05, -1.1764466762542725e-05, -9.66433435678482e-06, -7.5642019510269165e-06, -5.4640695452690125e-06, -3.3639371395111084e-06, -1.2638047337532043e-06, 8.363276720046997e-07, 2.9364600777626038e-06, 5.036592483520508e-06, 7.136724889278412e-06, 9.236857295036316e-06, 1.133698970079422e-05, 1.3437122106552124e-05, 1.5537254512310028e-05, 1.7637386918067932e-05, 1.9737519323825836e-05, 2.183765172958374e-05, 2.3937784135341644e-05, 2.603791654109955e-05, 2.8138048946857452e-05, 3.0238181352615356e-05, 3.233831375837326e-05, 3.4438446164131165e-05, 3.653857856988907e-05, 3.863871097564697e-05, 4.073884338140488e-05, 4.283897578716278e-05, 4.4939108192920685e-05, 4.703924059867859e-05, 4.913937300443649e-05, 5.12395054101944e-05, 5.33396378159523e-05, 5.5439770221710205e-05, 5.753990262746811e-05, 5.964003503322601e-05, 6.174016743898392e-05, 6.384029984474182e-05, 6.594043225049973e-05, 6.804056465625763e-05, 7.014069706201553e-05, 7.224082946777344e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 5.0, 6.0, 5.0, 9.0, 5.0, 11.0, 12.0, 15.0, 24.0, 17.0, 33.0, 40.0, 43.0, 59.0, 62.0, 97.0, 92.0, 73.0, 66.0, 55.0, 55.0, 35.0, 33.0, 24.0, 27.0, 21.0, 9.0, 10.0, 15.0, 4.0, 6.0, 6.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.00020644454343710095, -0.00020093427156098187, -0.0001954239996848628, -0.00018991372780874372, -0.00018440347048453987, -0.0001788931986084208, -0.0001733829267323017, -0.00016787265485618263, -0.00016236238298006356, -0.00015685211110394448, -0.0001513418392278254, -0.00014583156735170633, -0.00014032129547558725, -0.0001348110381513834, -0.00012930076627526432, -0.00012379049439914525, -0.00011828022252302617, -0.00011276995064690709, -0.00010725967877078801, -0.00010174941417062655, -9.623914229450747e-05, -9.07288704183884e-05, -8.521860581822693e-05, -7.970833394210786e-05, -7.419806206598878e-05, -6.86877901898697e-05, -6.317751831375062e-05, -5.766725371358916e-05, -5.2156981837470084e-05, -4.664670996135101e-05, -4.113644172321074e-05, -3.562617348507047e-05, -3.011590160895139e-05, -2.4605631551821716e-05, -1.9095361494692042e-05, -1.3585091437562369e-05, -8.074821380432695e-06, -2.5645513233030215e-06, 2.945718733826652e-06, 8.455986971966922e-06, 1.3966258848086e-05, 1.9476528905215673e-05, 2.4986798962345347e-05, 3.049706901947502e-05, 3.6007339076604694e-05, 4.151761095272377e-05, 4.702787919086404e-05, 5.253814742900431e-05, 5.804841930512339e-05, 6.355869118124247e-05, 6.906896305736154e-05, 7.4579227657523e-05, 8.008949953364208e-05, 8.559977140976116e-05, 9.111003600992262e-05, 9.66203078860417e-05, 0.00010213057976216078, 0.00010764085163827986, 0.00011315112351439893, 0.0001186613881145604, 0.0001241716672666371, 0.00012968192459084094, 0.00013519219646696, 0.0001407024683430791, 0.00014621274021919817]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 3.0, 2.0, 1.0, 5.0, 13.0, 11.0, 15.0, 11.0, 27.0, 10.0, 21.0, 36.0, 21.0, 25.0, 25.0, 25.0, 43.0, 29.0, 42.0, 41.0, 36.0, 29.0, 32.0, 35.0, 37.0, 46.0, 37.0, 43.0, 39.0, 26.0, 23.0, 32.0, 22.0, 16.0, 26.0, 16.0, 13.0, 15.0, 11.0, 13.0, 11.0, 9.0, 9.0, 8.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00013573053001891822, -0.0001316455309279263, -0.00012756051728501916, -0.00012347551819402725, -0.00011939051910303533, -0.0001153055127360858, -0.00011122050636913627, -0.00010713550727814436, -0.00010305050091119483, -9.89654945442453e-05, -9.488049545325339e-05, -9.079548908630386e-05, -8.671048271935433e-05, -8.262548362836242e-05, -7.854047726141289e-05, -7.445547089446336e-05, -7.037047180347145e-05, -6.628546543652192e-05, -6.220046634553e-05, -5.8115459978580475e-05, -5.4030457249609753e-05, -4.994545452063903e-05, -4.5860448153689504e-05, -4.177544542471878e-05, -3.769044269574806e-05, -3.360543996677734e-05, -2.9520435418817215e-05, -2.543543087085709e-05, -2.135042814188637e-05, -1.7265425412915647e-05, -1.3180420864955522e-05, -9.095416316995397e-06, -5.010428139939904e-06, -9.254245014744811e-07, 3.159579136990942e-06, 7.244582775456365e-06, 1.1329586413921788e-05, 1.541458914289251e-05, 1.9499593690852635e-05, 2.358459823881276e-05, 2.766960096778348e-05, 3.17546036967542e-05, 3.5839606425724924e-05, 3.992461279267445e-05, 4.4009615521645173e-05, 4.8094618250615895e-05, 5.217962461756542e-05, 5.6264627346536145e-05, 6.0349630075506866e-05, 6.44346364424564e-05, 6.851963553344831e-05, 7.260464190039784e-05, 7.668964099138975e-05, 8.077464735833928e-05, 8.485965372528881e-05, 8.894465281628072e-05, 9.302965918323025e-05, 9.711466555017978e-05, 0.0001011996646411717, 0.00010528467100812122, 0.00010936967737507075, 0.00011345467646606266, 0.0001175396828330122, 0.00012162468919996172, 0.00012570968829095364]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 10.0, 11.0, 24.0, 26.0, 37.0, 63.0, 78.0, 109.0, 176.0, 232.0, 402.0, 507.0, 755.0, 1157.0, 1803.0, 2663.0, 4248.0, 6503.0, 10066.0, 16250.0, 25526.0, 41279.0, 66340.0, 106496.0, 168104.0, 199094.0, 147659.0, 93098.0, 58326.0, 35523.0, 21961.0, 14363.0, 9078.0, 5779.0, 3696.0, 2393.0, 1620.0, 1023.0, 688.0, 480.0, 254.0, 201.0, 151.0, 104.0, 70.0, 44.0, 30.0, 22.0, 15.0, 8.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0], "bins": [-0.00021314620971679688, -0.00020675547420978546, -0.00020036473870277405, -0.00019397400319576263, -0.00018758326768875122, -0.0001811925321817398, -0.0001748017966747284, -0.00016841106116771698, -0.00016202032566070557, -0.00015562959015369415, -0.00014923885464668274, -0.00014284811913967133, -0.0001364573836326599, -0.0001300666481256485, -0.00012367591261863708, -0.00011728517711162567, -0.00011089444160461426, -0.00010450370609760284, -9.811297059059143e-05, -9.172223508358002e-05, -8.53314995765686e-05, -7.894076406955719e-05, -7.255002856254578e-05, -6.615929305553436e-05, -5.976855754852295e-05, -5.3377822041511536e-05, -4.698708653450012e-05, -4.059635102748871e-05, -3.4205615520477295e-05, -2.781488001346588e-05, -2.1424144506454468e-05, -1.5033408999443054e-05, -8.64267349243164e-06, -2.251937985420227e-06, 4.1387975215911865e-06, 1.05295330286026e-05, 1.6920268535614014e-05, 2.3311004042625427e-05, 2.970173954963684e-05, 3.6092475056648254e-05, 4.248321056365967e-05, 4.887394607067108e-05, 5.5264681577682495e-05, 6.165541708469391e-05, 6.804615259170532e-05, 7.443688809871674e-05, 8.082762360572815e-05, 8.721835911273956e-05, 9.360909461975098e-05, 9.999983012676239e-05, 0.0001063905656337738, 0.00011278130114078522, 0.00011917203664779663, 0.00012556277215480804, 0.00013195350766181946, 0.00013834424316883087, 0.00014473497867584229, 0.0001511257141828537, 0.0001575164496898651, 0.00016390718519687653, 0.00017029792070388794, 0.00017668865621089935, 0.00018307939171791077, 0.00018947012722492218, 0.0001958608627319336]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 1.0, 5.0, 5.0, 3.0, 5.0, 6.0, 11.0, 11.0, 20.0, 23.0, 20.0, 29.0, 21.0, 19.0, 27.0, 25.0, 37.0, 30.0, 28.0, 35.0, 30.0, 39.0, 37.0, 25.0, 29.0, 46.0, 46.0, 39.0, 43.0, 39.0, 38.0, 23.0, 24.0, 26.0, 26.0, 22.0, 22.0, 11.0, 13.0, 15.0, 6.0, 12.0, 13.0, 10.0, 1.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.00011938810348510742, -0.00011594314128160477, -0.00011249817907810211, -0.00010905321687459946, -0.0001056082546710968, -0.00010216329246759415, -9.871833026409149e-05, -9.527336806058884e-05, -9.182840585708618e-05, -8.838344365358353e-05, -8.493848145008087e-05, -8.149351924657822e-05, -7.804855704307556e-05, -7.46035948395729e-05, -7.115863263607025e-05, -6.77136704325676e-05, -6.426870822906494e-05, -6.0823746025562286e-05, -5.737878382205963e-05, -5.3933821618556976e-05, -5.048885941505432e-05, -4.7043897211551666e-05, -4.359893500804901e-05, -4.0153972804546356e-05, -3.67090106010437e-05, -3.3264048397541046e-05, -2.981908619403839e-05, -2.6374123990535736e-05, -2.292916178703308e-05, -1.9484199583530426e-05, -1.603923738002777e-05, -1.2594275176525116e-05, -9.149312973022461e-06, -5.704350769519806e-06, -2.259388566017151e-06, 1.1855736374855042e-06, 4.630535840988159e-06, 8.075498044490814e-06, 1.152046024799347e-05, 1.4965422451496124e-05, 1.841038465499878e-05, 2.1855346858501434e-05, 2.530030906200409e-05, 2.8745271265506744e-05, 3.21902334690094e-05, 3.5635195672512054e-05, 3.908015787601471e-05, 4.2525120079517365e-05, 4.597008228302002e-05, 4.9415044486522675e-05, 5.286000669002533e-05, 5.6304968893527985e-05, 5.974993109703064e-05, 6.31948933005333e-05, 6.663985550403595e-05, 7.00848177075386e-05, 7.352977991104126e-05, 7.697474211454391e-05, 8.041970431804657e-05, 8.386466652154922e-05, 8.730962872505188e-05, 9.075459092855453e-05, 9.419955313205719e-05, 9.764451533555984e-05, 0.0001010894775390625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 10.0, 7.0, 10.0, 26.0, 34.0, 56.0, 87.0, 146.0, 216.0, 323.0, 492.0, 845.0, 1381.0, 2404.0, 4314.0, 8626.0, 18867.0, 52660.0, 271766.0, 541612.0, 92389.0, 27401.0, 11524.0, 5808.0, 3082.0, 1779.0, 1005.0, 597.0, 378.0, 251.0, 160.0, 109.0, 61.0, 40.0, 17.0, 17.0, 8.0, 13.0, 10.0, 2.0, 9.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003447532653808594, -0.0003310739994049072, -0.0003173947334289551, -0.00030371546745300293, -0.0002900362014770508, -0.00027635693550109863, -0.0002626776695251465, -0.00024899840354919434, -0.0002353191375732422, -0.00022163987159729004, -0.0002079606056213379, -0.00019428133964538574, -0.0001806020736694336, -0.00016692280769348145, -0.0001532435417175293, -0.00013956427574157715, -0.000125885009765625, -0.00011220574378967285, -9.85264778137207e-05, -8.484721183776855e-05, -7.11679458618164e-05, -5.748867988586426e-05, -4.380941390991211e-05, -3.013014793395996e-05, -1.6450881958007812e-05, -2.771615982055664e-06, 1.0907649993896484e-05, 2.4586915969848633e-05, 3.826618194580078e-05, 5.194544792175293e-05, 6.562471389770508e-05, 7.930397987365723e-05, 9.298324584960938e-05, 0.00010666251182556152, 0.00012034177780151367, 0.00013402104377746582, 0.00014770030975341797, 0.00016137957572937012, 0.00017505884170532227, 0.00018873810768127441, 0.00020241737365722656, 0.0002160966396331787, 0.00022977590560913086, 0.000243455171585083, 0.00025713443756103516, 0.0002708137035369873, 0.00028449296951293945, 0.0002981722354888916, 0.00031185150146484375, 0.0003255307674407959, 0.00033921003341674805, 0.0003528892993927002, 0.00036656856536865234, 0.0003802478313446045, 0.00039392709732055664, 0.0004076063632965088, 0.00042128562927246094, 0.0004349648952484131, 0.00044864416122436523, 0.0004623234272003174, 0.00047600269317626953, 0.0004896819591522217, 0.0005033612251281738, 0.000517040491104126, 0.0005307197570800781]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 2.0, 4.0, 9.0, 6.0, 9.0, 10.0, 20.0, 11.0, 21.0, 24.0, 16.0, 24.0, 23.0, 29.0, 28.0, 30.0, 33.0, 41.0, 42.0, 48.0, 37.0, 41.0, 38.0, 52.0, 36.0, 45.0, 37.0, 23.0, 34.0, 25.0, 28.0, 22.0, 24.0, 27.0, 14.0, 14.0, 12.0, 16.0, 12.0, 5.0, 8.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.514787673950195e-05, -6.292946636676788e-05, -6.0711055994033813e-05, -5.8492645621299744e-05, -5.6274235248565674e-05, -5.4055824875831604e-05, -5.1837414503097534e-05, -4.9619004130363464e-05, -4.7400593757629395e-05, -4.5182183384895325e-05, -4.2963773012161255e-05, -4.0745362639427185e-05, -3.8526952266693115e-05, -3.6308541893959045e-05, -3.4090131521224976e-05, -3.1871721148490906e-05, -2.9653310775756836e-05, -2.7434900403022766e-05, -2.5216490030288696e-05, -2.2998079657554626e-05, -2.0779669284820557e-05, -1.8561258912086487e-05, -1.6342848539352417e-05, -1.4124438166618347e-05, -1.1906027793884277e-05, -9.687617421150208e-06, -7.469207048416138e-06, -5.250796675682068e-06, -3.032386302947998e-06, -8.139759302139282e-07, 1.4044344425201416e-06, 3.6228448152542114e-06, 5.841255187988281e-06, 8.059665560722351e-06, 1.0278075933456421e-05, 1.249648630619049e-05, 1.471489667892456e-05, 1.693330705165863e-05, 1.91517174243927e-05, 2.137012779712677e-05, 2.358853816986084e-05, 2.580694854259491e-05, 2.802535891532898e-05, 3.024376928806305e-05, 3.246217966079712e-05, 3.468059003353119e-05, 3.689900040626526e-05, 3.911741077899933e-05, 4.13358211517334e-05, 4.355423152446747e-05, 4.577264189720154e-05, 4.799105226993561e-05, 5.020946264266968e-05, 5.242787301540375e-05, 5.464628338813782e-05, 5.686469376087189e-05, 5.908310413360596e-05, 6.130151450634003e-05, 6.35199248790741e-05, 6.573833525180817e-05, 6.795674562454224e-05, 7.01751559972763e-05, 7.239356637001038e-05, 7.461197674274445e-05, 7.683038711547852e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 8.0, 5.0, 7.0, 22.0, 22.0, 34.0, 52.0, 77.0, 106.0, 175.0, 267.0, 412.0, 720.0, 1070.0, 2055.0, 3864.0, 8797.0, 26136.0, 154172.0, 744522.0, 74652.0, 17431.0, 6601.0, 3120.0, 1664.0, 937.0, 547.0, 369.0, 246.0, 144.0, 112.0, 66.0, 44.0, 33.0, 15.0, 12.0, 14.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.0001652240753173828, -0.00016079843044281006, -0.0001563727855682373, -0.00015194714069366455, -0.0001475214958190918, -0.00014309585094451904, -0.0001386702060699463, -0.00013424456119537354, -0.00012981891632080078, -0.00012539327144622803, -0.00012096762657165527, -0.00011654198169708252, -0.00011211633682250977, -0.00010769069194793701, -0.00010326504707336426, -9.88394021987915e-05, -9.441375732421875e-05, -8.9988112449646e-05, -8.556246757507324e-05, -8.113682270050049e-05, -7.671117782592773e-05, -7.228553295135498e-05, -6.785988807678223e-05, -6.343424320220947e-05, -5.900859832763672e-05, -5.4582953453063965e-05, -5.015730857849121e-05, -4.573166370391846e-05, -4.13060188293457e-05, -3.688037395477295e-05, -3.2454729080200195e-05, -2.802908420562744e-05, -2.3603439331054688e-05, -1.9177794456481934e-05, -1.475214958190918e-05, -1.0326504707336426e-05, -5.900859832763672e-06, -1.475214958190918e-06, 2.950429916381836e-06, 7.37607479095459e-06, 1.1801719665527344e-05, 1.6227364540100098e-05, 2.065300941467285e-05, 2.5078654289245605e-05, 2.950429916381836e-05, 3.392994403839111e-05, 3.835558891296387e-05, 4.278123378753662e-05, 4.7206878662109375e-05, 5.163252353668213e-05, 5.605816841125488e-05, 6.048381328582764e-05, 6.490945816040039e-05, 6.933510303497314e-05, 7.37607479095459e-05, 7.818639278411865e-05, 8.26120376586914e-05, 8.703768253326416e-05, 9.146332740783691e-05, 9.588897228240967e-05, 0.00010031461715698242, 0.00010474026203155518, 0.00010916590690612793, 0.00011359155178070068, 0.00011801719665527344]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 3.0, 2.0, 2.0, 7.0, 5.0, 2.0, 10.0, 6.0, 11.0, 16.0, 13.0, 21.0, 16.0, 25.0, 39.0, 50.0, 57.0, 92.0, 98.0, 147.0, 95.0, 56.0, 31.0, 37.0, 36.0, 19.0, 17.0, 10.0, 11.0, 14.0, 9.0, 7.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.496906280517578e-06, -6.305985152721405e-06, -6.115064024925232e-06, -5.924142897129059e-06, -5.733221769332886e-06, -5.542300641536713e-06, -5.3513795137405396e-06, -5.1604583859443665e-06, -4.969537258148193e-06, -4.77861613035202e-06, -4.587695002555847e-06, -4.396773874759674e-06, -4.205852746963501e-06, -4.014931619167328e-06, -3.824010491371155e-06, -3.6330893635749817e-06, -3.4421682357788086e-06, -3.2512471079826355e-06, -3.0603259801864624e-06, -2.8694048523902893e-06, -2.678483724594116e-06, -2.487562596797943e-06, -2.29664146900177e-06, -2.105720341205597e-06, -1.914799213409424e-06, -1.7238780856132507e-06, -1.5329569578170776e-06, -1.3420358300209045e-06, -1.1511147022247314e-06, -9.601935744285583e-07, -7.692724466323853e-07, -5.783513188362122e-07, -3.8743019104003906e-07, -1.9650906324386597e-07, -5.587935447692871e-09, 1.8533319234848022e-07, 3.762543201446533e-07, 5.671754479408264e-07, 7.580965757369995e-07, 9.490177035331726e-07, 1.1399388313293457e-06, 1.3308599591255188e-06, 1.521781086921692e-06, 1.712702214717865e-06, 1.903623342514038e-06, 2.094544470310211e-06, 2.2854655981063843e-06, 2.4763867259025574e-06, 2.6673078536987305e-06, 2.8582289814949036e-06, 3.0491501092910767e-06, 3.2400712370872498e-06, 3.430992364883423e-06, 3.621913492679596e-06, 3.812834620475769e-06, 4.003755748271942e-06, 4.194676876068115e-06, 4.385598003864288e-06, 4.5765191316604614e-06, 4.7674402594566345e-06, 4.958361387252808e-06, 5.149282515048981e-06, 5.340203642845154e-06, 5.531124770641327e-06, 5.7220458984375e-06]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 9.0, 8.0, 25.0, 27.0, 33.0, 45.0, 72.0, 98.0, 144.0, 157.0, 306.0, 390.0, 614.0, 820.0, 1193.0, 1924.0, 2672.0, 4293.0, 7299.0, 12138.0, 22276.0, 44072.0, 107047.0, 307508.0, 321510.0, 112182.0, 45593.0, 22982.0, 12422.0, 7576.0, 4403.0, 2860.0, 1831.0, 1164.0, 826.0, 630.0, 425.0, 278.0, 204.0, 133.0, 108.0, 74.0, 51.0, 40.0, 31.0, 19.0, 12.0, 5.0, 9.0, 4.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.0650367736816406e-05, -3.938097506761551e-05, -3.811158239841461e-05, -3.6842189729213715e-05, -3.557279706001282e-05, -3.430340439081192e-05, -3.303401172161102e-05, -3.1764619052410126e-05, -3.049522638320923e-05, -2.922583371400833e-05, -2.7956441044807434e-05, -2.6687048375606537e-05, -2.541765570640564e-05, -2.4148263037204742e-05, -2.2878870368003845e-05, -2.1609477698802948e-05, -2.034008502960205e-05, -1.9070692360401154e-05, -1.7801299691200256e-05, -1.653190702199936e-05, -1.5262514352798462e-05, -1.3993121683597565e-05, -1.2723729014396667e-05, -1.145433634519577e-05, -1.0184943675994873e-05, -8.915551006793976e-06, -7.646158337593079e-06, -6.376765668392181e-06, -5.107372999191284e-06, -3.837980329990387e-06, -2.5685876607894897e-06, -1.2991949915885925e-06, -2.9802322387695312e-08, 1.239590346813202e-06, 2.508983016014099e-06, 3.7783756852149963e-06, 5.0477683544158936e-06, 6.317161023616791e-06, 7.586553692817688e-06, 8.855946362018585e-06, 1.0125339031219482e-05, 1.139473170042038e-05, 1.2664124369621277e-05, 1.3933517038822174e-05, 1.5202909708023071e-05, 1.647230237722397e-05, 1.7741695046424866e-05, 1.9011087715625763e-05, 2.028048038482666e-05, 2.1549873054027557e-05, 2.2819265723228455e-05, 2.4088658392429352e-05, 2.535805106163025e-05, 2.6627443730831146e-05, 2.7896836400032043e-05, 2.916622906923294e-05, 3.0435621738433838e-05, 3.1705014407634735e-05, 3.297440707683563e-05, 3.424379974603653e-05, 3.551319241523743e-05, 3.6782585084438324e-05, 3.805197775363922e-05, 3.932137042284012e-05, 4.0590763092041016e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 10.0, 6.0, 4.0, 6.0, 9.0, 2.0, 12.0, 11.0, 19.0, 28.0, 27.0, 35.0, 26.0, 48.0, 54.0, 49.0, 64.0, 54.0, 68.0, 69.0, 50.0, 62.0, 48.0, 43.0, 36.0, 22.0, 28.0, 20.0, 18.0, 8.0, 11.0, 12.0, 7.0, 5.0, 5.0, 4.0, 7.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0192394256591797e-05, -9.858980774879456e-06, -9.525567293167114e-06, -9.192153811454773e-06, -8.858740329742432e-06, -8.52532684803009e-06, -8.191913366317749e-06, -7.858499884605408e-06, -7.525086402893066e-06, -7.191672921180725e-06, -6.858259439468384e-06, -6.5248459577560425e-06, -6.191432476043701e-06, -5.85801899433136e-06, -5.5246055126190186e-06, -5.191192030906677e-06, -4.857778549194336e-06, -4.524365067481995e-06, -4.190951585769653e-06, -3.857538104057312e-06, -3.5241246223449707e-06, -3.1907111406326294e-06, -2.857297658920288e-06, -2.5238841772079468e-06, -2.1904706954956055e-06, -1.8570572137832642e-06, -1.5236437320709229e-06, -1.1902302503585815e-06, -8.568167686462402e-07, -5.234032869338989e-07, -1.8998980522155762e-07, 1.434236764907837e-07, 4.76837158203125e-07, 8.102506399154663e-07, 1.1436641216278076e-06, 1.477077603340149e-06, 1.8104910850524902e-06, 2.1439045667648315e-06, 2.477318048477173e-06, 2.810731530189514e-06, 3.1441450119018555e-06, 3.4775584936141968e-06, 3.810971975326538e-06, 4.144385457038879e-06, 4.477798938751221e-06, 4.811212420463562e-06, 5.144625902175903e-06, 5.478039383888245e-06, 5.811452865600586e-06, 6.144866347312927e-06, 6.4782798290252686e-06, 6.81169331073761e-06, 7.145106792449951e-06, 7.4785202741622925e-06, 7.811933755874634e-06, 8.145347237586975e-06, 8.478760719299316e-06, 8.812174201011658e-06, 9.145587682723999e-06, 9.47900116443634e-06, 9.812414646148682e-06, 1.0145828127861023e-05, 1.0479241609573364e-05, 1.0812655091285706e-05, 1.1146068572998047e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 7.0, 11.0, 6.0, 22.0, 29.0, 24.0, 44.0, 38.0, 59.0, 65.0, 110.0, 97.0, 85.0, 77.0, 55.0, 57.0, 46.0, 25.0, 24.0, 18.0, 20.0, 11.0, 7.0, 9.0, 9.0, 4.0, 4.0, 4.0, 6.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018325835117138922, -0.00017826180555857718, -0.00017326525994576514, -0.00016826872888486832, -0.00016327218327205628, -0.00015827563765924424, -0.00015327910659834743, -0.00014828256098553538, -0.00014328601537272334, -0.0001382894697599113, -0.00013329292414709926, -0.00012829639308620244, -0.0001232998474733904, -0.00011830330186057836, -0.00011330676352372393, -0.0001083102251868695, -0.00010331367957405746, -9.831713396124542e-05, -9.332059562439099e-05, -8.832405728753656e-05, -8.332751167472452e-05, -7.833096606191248e-05, -7.333442772505805e-05, -6.833788938820362e-05, -6.334134377539158e-05, -5.8344801800558344e-05, -5.334825982572511e-05, -4.835171785089187e-05, -4.335517587605864e-05, -3.83586339012254e-05, -3.336209192639217e-05, -2.8365549951558933e-05, -2.336899342481047e-05, -1.8372451449977234e-05, -1.3375909475143999e-05, -8.379367500310764e-06, -3.3828255254775286e-06, 1.6137164493557066e-06, 6.610258424188942e-06, 1.1606800399022177e-05, 1.6603342373855412e-05, 2.1599884348688647e-05, 2.6596426323521882e-05, 3.159296829835512e-05, 3.658951027318835e-05, 4.158605224802159e-05, 4.658259422285482e-05, 5.157913619768806e-05, 5.657567817252129e-05, 6.157222378533334e-05, 6.656876212218776e-05, 7.156530045904219e-05, 7.656184607185423e-05, 8.155839168466628e-05, 8.65549300215207e-05, 9.155146835837513e-05, 9.654801397118717e-05, 0.00010154455958399922, 0.00010654109792085364, 0.00011153763625770807, 0.00011653418187052011, 0.00012153072748333216, 0.0001265272730961442, 0.000131523804157041, 0.00013652034976985306]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 4.0, 11.0, 13.0, 18.0, 16.0, 26.0, 18.0, 28.0, 23.0, 24.0, 25.0, 24.0, 44.0, 35.0, 36.0, 45.0, 39.0, 26.0, 28.0, 39.0, 41.0, 45.0, 39.0, 47.0, 39.0, 28.0, 29.0, 22.0, 28.0, 24.0, 14.0, 16.0, 22.0, 12.0, 10.0, 12.0, 14.0, 11.0, 7.0, 4.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001153466000687331, -0.0001119141816161573, -0.0001084817704395391, -0.0001050493519869633, -0.0001016169335343875, -9.818452235776931e-05, -9.475210390519351e-05, -9.13196854526177e-05, -8.78872670000419e-05, -8.44548485474661e-05, -8.102243737084791e-05, -7.759001891827211e-05, -7.41576004656963e-05, -7.072518928907812e-05, -6.729277083650231e-05, -6.386035238392651e-05, -6.0427937569329515e-05, -5.699552275473252e-05, -5.3563104302156717e-05, -5.013068948755972e-05, -4.669827103498392e-05, -4.326585622038692e-05, -3.983343776781112e-05, -3.6401022953214124e-05, -3.296860813861713e-05, -2.953619150503073e-05, -2.610377487144433e-05, -2.2671360056847334e-05, -1.923894160427153e-05, -1.5806526789674535e-05, -1.2374110156088136e-05, -8.941693522501737e-06, -5.509275069925934e-06, -2.0768586637132103e-06, 1.3555577424995136e-06, 4.787973921338562e-06, 8.220390554924961e-06, 1.1652806279016659e-05, 1.5085222912603058e-05, 1.8517639546189457e-05, 2.1950056179775856e-05, 2.5382472813362256e-05, 2.8814889446948655e-05, 3.2247306080535054e-05, 3.567972089513205e-05, 3.9112135709729046e-05, 4.254455416230485e-05, 4.597697261488065e-05, 4.940938742947765e-05, 5.284180224407464e-05, 5.6274220696650445e-05, 5.970663551124744e-05, 6.313905032584444e-05, 6.657146877842024e-05, 7.000388723099604e-05, 7.343629840761423e-05, 7.686871686019003e-05, 8.030113531276584e-05, 8.373354648938403e-05, 8.716596494195983e-05, 9.059838339453563e-05, 9.403079457115382e-05, 9.746321302372962e-05, 0.00010089563147630543, 0.00010432804992888123]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 9.0, 8.0, 9.0, 21.0, 28.0, 42.0, 56.0, 93.0, 106.0, 174.0, 240.0, 336.0, 461.0, 670.0, 913.0, 1231.0, 1754.0, 2547.0, 3458.0, 4993.0, 7266.0, 10607.0, 15761.0, 23774.0, 36322.0, 57349.0, 92725.0, 154794.0, 206365.0, 159073.0, 95782.0, 58381.0, 37398.0, 23964.0, 16346.0, 10776.0, 7453.0, 5029.0, 3547.0, 2494.0, 1776.0, 1287.0, 936.0, 641.0, 434.0, 344.0, 261.0, 157.0, 113.0, 86.0, 57.0, 36.0, 27.0, 27.0, 7.0, 11.0, 5.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.00017762184143066406, -0.00017198733985424042, -0.00016635283827781677, -0.00016071833670139313, -0.00015508383512496948, -0.00014944933354854584, -0.0001438148319721222, -0.00013818033039569855, -0.0001325458288192749, -0.00012691132724285126, -0.00012127682566642761, -0.00011564232409000397, -0.00011000782251358032, -0.00010437332093715668, -9.873881936073303e-05, -9.310431778430939e-05, -8.746981620788574e-05, -8.18353146314621e-05, -7.620081305503845e-05, -7.056631147861481e-05, -6.493180990219116e-05, -5.929730832576752e-05, -5.366280674934387e-05, -4.802830517292023e-05, -4.239380359649658e-05, -3.675930202007294e-05, -3.112480044364929e-05, -2.5490298867225647e-05, -1.9855797290802002e-05, -1.4221295714378357e-05, -8.586794137954712e-06, -2.952292561531067e-06, 2.682209014892578e-06, 8.316710591316223e-06, 1.3951212167739868e-05, 1.9585713744163513e-05, 2.5220215320587158e-05, 3.08547168970108e-05, 3.648921847343445e-05, 4.212372004985809e-05, 4.775822162628174e-05, 5.339272320270538e-05, 5.902722477912903e-05, 6.466172635555267e-05, 7.029622793197632e-05, 7.593072950839996e-05, 8.156523108482361e-05, 8.719973266124725e-05, 9.28342342376709e-05, 9.846873581409454e-05, 0.00010410323739051819, 0.00010973773896694183, 0.00011537224054336548, 0.00012100674211978912, 0.00012664124369621277, 0.00013227574527263641, 0.00013791024684906006, 0.0001435447484254837, 0.00014917925000190735, 0.000154813751578331, 0.00016044825315475464, 0.00016608275473117828, 0.00017171725630760193, 0.00017735175788402557, 0.00018298625946044922]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 3.0, 6.0, 7.0, 9.0, 5.0, 10.0, 19.0, 28.0, 13.0, 21.0, 22.0, 32.0, 24.0, 30.0, 29.0, 28.0, 37.0, 37.0, 38.0, 43.0, 31.0, 40.0, 37.0, 36.0, 38.0, 38.0, 43.0, 28.0, 42.0, 29.0, 14.0, 23.0, 30.0, 22.0, 22.0, 11.0, 12.0, 11.0, 13.0, 11.0, 5.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 5.0], "bins": [-0.00010061264038085938, -9.786803275346756e-05, -9.512342512607574e-05, -9.237881749868393e-05, -8.963420987129211e-05, -8.68896022439003e-05, -8.414499461650848e-05, -8.140038698911667e-05, -7.865577936172485e-05, -7.591117173433304e-05, -7.316656410694122e-05, -7.042195647954941e-05, -6.767734885215759e-05, -6.493274122476578e-05, -6.218813359737396e-05, -5.944352596998215e-05, -5.669891834259033e-05, -5.395431071519852e-05, -5.12097030878067e-05, -4.8465095460414886e-05, -4.572048783302307e-05, -4.2975880205631256e-05, -4.023127257823944e-05, -3.7486664950847626e-05, -3.474205732345581e-05, -3.1997449696063995e-05, -2.925284206867218e-05, -2.6508234441280365e-05, -2.376362681388855e-05, -2.1019019186496735e-05, -1.827441155910492e-05, -1.5529803931713104e-05, -1.2785196304321289e-05, -1.0040588676929474e-05, -7.295981049537659e-06, -4.5513734221458435e-06, -1.8067657947540283e-06, 9.378418326377869e-07, 3.682449460029602e-06, 6.427057087421417e-06, 9.171664714813232e-06, 1.1916272342205048e-05, 1.4660879969596863e-05, 1.7405487596988678e-05, 2.0150095224380493e-05, 2.289470285177231e-05, 2.5639310479164124e-05, 2.838391810655594e-05, 3.1128525733947754e-05, 3.387313336133957e-05, 3.6617740988731384e-05, 3.93623486161232e-05, 4.2106956243515015e-05, 4.485156387090683e-05, 4.7596171498298645e-05, 5.034077912569046e-05, 5.3085386753082275e-05, 5.582999438047409e-05, 5.8574602007865906e-05, 6.131920963525772e-05, 6.406381726264954e-05, 6.680842489004135e-05, 6.955303251743317e-05, 7.229764014482498e-05, 7.50422477722168e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 1.0, 13.0, 10.0, 15.0, 31.0, 39.0, 69.0, 85.0, 137.0, 178.0, 267.0, 422.0, 616.0, 850.0, 1254.0, 2016.0, 3010.0, 4503.0, 7285.0, 11207.0, 17937.0, 28947.0, 48321.0, 80771.0, 141551.0, 226418.0, 194051.0, 110301.0, 64490.0, 38978.0, 23500.0, 14703.0, 9288.0, 5966.0, 3779.0, 2465.0, 1626.0, 1087.0, 777.0, 482.0, 367.0, 237.0, 149.0, 116.0, 83.0, 57.0, 34.0, 14.0, 19.0, 8.0, 10.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.00018525123596191406, -0.0001794230192899704, -0.00017359480261802673, -0.00016776658594608307, -0.0001619383692741394, -0.00015611015260219574, -0.00015028193593025208, -0.0001444537192583084, -0.00013862550258636475, -0.00013279728591442108, -0.00012696906924247742, -0.00012114085257053375, -0.00011531263589859009, -0.00010948441922664642, -0.00010365620255470276, -9.78279858827591e-05, -9.199976921081543e-05, -8.617155253887177e-05, -8.03433358669281e-05, -7.451511919498444e-05, -6.868690252304077e-05, -6.285868585109711e-05, -5.703046917915344e-05, -5.120225250720978e-05, -4.537403583526611e-05, -3.954581916332245e-05, -3.3717602491378784e-05, -2.788938581943512e-05, -2.2061169147491455e-05, -1.623295247554779e-05, -1.0404735803604126e-05, -4.5765191316604614e-06, 1.2516975402832031e-06, 7.079914212226868e-06, 1.2908130884170532e-05, 1.8736347556114197e-05, 2.456456422805786e-05, 3.0392780900001526e-05, 3.622099757194519e-05, 4.2049214243888855e-05, 4.787743091583252e-05, 5.3705647587776184e-05, 5.953386425971985e-05, 6.536208093166351e-05, 7.119029760360718e-05, 7.701851427555084e-05, 8.284673094749451e-05, 8.867494761943817e-05, 9.450316429138184e-05, 0.0001003313809633255, 0.00010615959763526917, 0.00011198781430721283, 0.0001178160309791565, 0.00012364424765110016, 0.00012947246432304382, 0.0001353006809949875, 0.00014112889766693115, 0.00014695711433887482, 0.00015278533101081848, 0.00015861354768276215, 0.0001644417643547058, 0.00017026998102664948, 0.00017609819769859314, 0.0001819264143705368, 0.00018775463104248047]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 5.0, 6.0, 8.0, 6.0, 10.0, 12.0, 15.0, 17.0, 18.0, 25.0, 17.0, 26.0, 19.0, 37.0, 34.0, 27.0, 36.0, 37.0, 32.0, 35.0, 43.0, 44.0, 52.0, 38.0, 49.0, 39.0, 35.0, 31.0, 26.0, 27.0, 22.0, 16.0, 29.0, 15.0, 9.0, 13.0, 14.0, 14.0, 3.0, 11.0, 11.0, 2.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0], "bins": [-5.704164505004883e-05, -5.539972335100174e-05, -5.375780165195465e-05, -5.211587995290756e-05, -5.0473958253860474e-05, -4.8832036554813385e-05, -4.7190114855766296e-05, -4.554819315671921e-05, -4.390627145767212e-05, -4.226434975862503e-05, -4.062242805957794e-05, -3.898050636053085e-05, -3.7338584661483765e-05, -3.5696662962436676e-05, -3.405474126338959e-05, -3.24128195643425e-05, -3.077089786529541e-05, -2.912897616624832e-05, -2.7487054467201233e-05, -2.5845132768154144e-05, -2.4203211069107056e-05, -2.2561289370059967e-05, -2.091936767101288e-05, -1.927744597196579e-05, -1.76355242729187e-05, -1.5993602573871613e-05, -1.4351680874824524e-05, -1.2709759175777435e-05, -1.1067837476730347e-05, -9.425915777683258e-06, -7.78399407863617e-06, -6.142072379589081e-06, -4.500150680541992e-06, -2.8582289814949036e-06, -1.216307282447815e-06, 4.256144165992737e-07, 2.0675361156463623e-06, 3.709457814693451e-06, 5.3513795137405396e-06, 6.993301212787628e-06, 8.635222911834717e-06, 1.0277144610881805e-05, 1.1919066309928894e-05, 1.3560988008975983e-05, 1.5202909708023071e-05, 1.684483140707016e-05, 1.848675310611725e-05, 2.0128674805164337e-05, 2.1770596504211426e-05, 2.3412518203258514e-05, 2.5054439902305603e-05, 2.669636160135269e-05, 2.833828330039978e-05, 2.998020499944687e-05, 3.162212669849396e-05, 3.3264048397541046e-05, 3.4905970096588135e-05, 3.6547891795635223e-05, 3.818981349468231e-05, 3.98317351937294e-05, 4.147365689277649e-05, 4.311557859182358e-05, 4.4757500290870667e-05, 4.6399421989917755e-05, 4.8041343688964844e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 9.0, 7.0, 13.0, 22.0, 22.0, 22.0, 53.0, 56.0, 61.0, 101.0, 124.0, 161.0, 227.0, 322.0, 432.0, 623.0, 927.0, 1503.0, 2458.0, 4500.0, 11471.0, 70354.0, 919330.0, 20653.0, 6447.0, 3133.0, 1759.0, 1154.0, 707.0, 554.0, 364.0, 245.0, 181.0, 136.0, 102.0, 79.0, 58.0, 43.0, 29.0, 30.0, 24.0, 14.0, 9.0, 9.0, 13.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.412101745605469e-05, -5.2440911531448364e-05, -5.076080560684204e-05, -4.908069968223572e-05, -4.7400593757629395e-05, -4.572048783302307e-05, -4.404038190841675e-05, -4.2360275983810425e-05, -4.06801700592041e-05, -3.900006413459778e-05, -3.7319958209991455e-05, -3.563985228538513e-05, -3.395974636077881e-05, -3.2279640436172485e-05, -3.059953451156616e-05, -2.891942858695984e-05, -2.7239322662353516e-05, -2.5559216737747192e-05, -2.387911081314087e-05, -2.2199004888534546e-05, -2.0518898963928223e-05, -1.88387930393219e-05, -1.7158687114715576e-05, -1.5478581190109253e-05, -1.379847526550293e-05, -1.2118369340896606e-05, -1.0438263416290283e-05, -8.75815749168396e-06, -7.078051567077637e-06, -5.3979456424713135e-06, -3.7178397178649902e-06, -2.037733793258667e-06, -3.5762786865234375e-07, 1.3224780559539795e-06, 3.0025839805603027e-06, 4.682689905166626e-06, 6.362795829772949e-06, 8.042901754379272e-06, 9.723007678985596e-06, 1.1403113603591919e-05, 1.3083219528198242e-05, 1.4763325452804565e-05, 1.644343137741089e-05, 1.8123537302017212e-05, 1.9803643226623535e-05, 2.148374915122986e-05, 2.316385507583618e-05, 2.4843961000442505e-05, 2.6524066925048828e-05, 2.820417284965515e-05, 2.9884278774261475e-05, 3.15643846988678e-05, 3.324449062347412e-05, 3.4924596548080444e-05, 3.660470247268677e-05, 3.828480839729309e-05, 3.9964914321899414e-05, 4.164502024650574e-05, 4.332512617111206e-05, 4.5005232095718384e-05, 4.668533802032471e-05, 4.836544394493103e-05, 5.0045549869537354e-05, 5.172565579414368e-05, 5.340576171875e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 0.0, 34.0, 0.0, 0.0, 41.0, 0.0, 0.0, 79.0, 0.0, 0.0, 0.0, 178.0, 0.0, 0.0, 330.0, 0.0, 0.0, 166.0, 0.0, 0.0, 85.0, 0.0, 0.0, 42.0, 0.0, 0.0, 0.0, 33.0, 0.0, 0.0, 15.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.370246410369873e-07, -6.183981895446777e-07, -5.997717380523682e-07, -5.811452865600586e-07, -5.62518835067749e-07, -5.438923835754395e-07, -5.252659320831299e-07, -5.066394805908203e-07, -4.880130290985107e-07, -4.6938657760620117e-07, -4.507601261138916e-07, -4.3213367462158203e-07, -4.1350722312927246e-07, -3.948807716369629e-07, -3.762543201446533e-07, -3.5762786865234375e-07, -3.390014171600342e-07, -3.203749656677246e-07, -3.0174851417541504e-07, -2.8312206268310547e-07, -2.644956111907959e-07, -2.4586915969848633e-07, -2.2724270820617676e-07, -2.086162567138672e-07, -1.8998980522155762e-07, -1.7136335372924805e-07, -1.5273690223693848e-07, -1.341104507446289e-07, -1.1548399925231934e-07, -9.685754776000977e-08, -7.82310962677002e-08, -5.960464477539063e-08, -4.0978193283081055e-08, -2.2351741790771484e-08, -3.725290298461914e-09, 1.4901161193847656e-08, 3.3527612686157227e-08, 5.21540641784668e-08, 7.078051567077637e-08, 8.940696716308594e-08, 1.0803341865539551e-07, 1.2665987014770508e-07, 1.4528632164001465e-07, 1.6391277313232422e-07, 1.825392246246338e-07, 2.0116567611694336e-07, 2.1979212760925293e-07, 2.384185791015625e-07, 2.5704503059387207e-07, 2.7567148208618164e-07, 2.942979335784912e-07, 3.129243850708008e-07, 3.3155083656311035e-07, 3.501772880554199e-07, 3.688037395477295e-07, 3.8743019104003906e-07, 4.0605664253234863e-07, 4.246830940246582e-07, 4.4330954551696777e-07, 4.6193599700927734e-07, 4.805624485015869e-07, 4.991888999938965e-07, 5.178153514862061e-07, 5.364418029785156e-07]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 7.0, 5.0, 13.0, 19.0, 16.0, 18.0, 28.0, 40.0, 73.0, 80.0, 87.0, 132.0, 230.0, 282.0, 392.0, 548.0, 827.0, 1171.0, 1740.0, 2388.0, 3520.0, 6334.0, 26153.0, 958920.0, 27348.0, 6408.0, 3693.0, 2427.0, 1661.0, 1176.0, 791.0, 582.0, 392.0, 290.0, 212.0, 156.0, 115.0, 74.0, 55.0, 40.0, 32.0, 27.0, 20.0, 10.0, 4.0, 6.0, 3.0, 7.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.071826934814453e-05, -8.774455636739731e-05, -8.477084338665009e-05, -8.179713040590286e-05, -7.882341742515564e-05, -7.584970444440842e-05, -7.28759914636612e-05, -6.990227848291397e-05, -6.692856550216675e-05, -6.395485252141953e-05, -6.09811395406723e-05, -5.800742655992508e-05, -5.5033713579177856e-05, -5.2060000598430634e-05, -4.908628761768341e-05, -4.611257463693619e-05, -4.3138861656188965e-05, -4.016514867544174e-05, -3.719143569469452e-05, -3.4217722713947296e-05, -3.124400973320007e-05, -2.827029675245285e-05, -2.5296583771705627e-05, -2.2322870790958405e-05, -1.934915781021118e-05, -1.637544482946396e-05, -1.3401731848716736e-05, -1.0428018867969513e-05, -7.45430588722229e-06, -4.480592906475067e-06, -1.5068799257278442e-06, 1.4668330550193787e-06, 4.4405460357666016e-06, 7.4142590165138245e-06, 1.0387971997261047e-05, 1.336168497800827e-05, 1.6335397958755493e-05, 1.9309110939502716e-05, 2.228282392024994e-05, 2.5256536900997162e-05, 2.8230249881744385e-05, 3.120396286249161e-05, 3.417767584323883e-05, 3.7151388823986053e-05, 4.0125101804733276e-05, 4.30988147854805e-05, 4.607252776622772e-05, 4.9046240746974945e-05, 5.201995372772217e-05, 5.499366670846939e-05, 5.7967379689216614e-05, 6.094109266996384e-05, 6.391480565071106e-05, 6.688851863145828e-05, 6.98622316122055e-05, 7.283594459295273e-05, 7.580965757369995e-05, 7.878337055444717e-05, 8.17570835351944e-05, 8.473079651594162e-05, 8.770450949668884e-05, 9.067822247743607e-05, 9.365193545818329e-05, 9.662564843893051e-05, 9.959936141967773e-05]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 12.0, 23.0, 63.0, 777.0, 55.0, 20.0, 15.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.045797348022461e-05, -2.960115671157837e-05, -2.874433994293213e-05, -2.788752317428589e-05, -2.703070640563965e-05, -2.6173889636993408e-05, -2.5317072868347168e-05, -2.4460256099700928e-05, -2.3603439331054688e-05, -2.2746622562408447e-05, -2.1889805793762207e-05, -2.1032989025115967e-05, -2.0176172256469727e-05, -1.9319355487823486e-05, -1.8462538719177246e-05, -1.7605721950531006e-05, -1.6748905181884766e-05, -1.5892088413238525e-05, -1.5035271644592285e-05, -1.4178454875946045e-05, -1.3321638107299805e-05, -1.2464821338653564e-05, -1.1608004570007324e-05, -1.0751187801361084e-05, -9.894371032714844e-06, -9.037554264068604e-06, -8.180737495422363e-06, -7.323920726776123e-06, -6.467103958129883e-06, -5.610287189483643e-06, -4.753470420837402e-06, -3.896653652191162e-06, -3.039836883544922e-06, -2.1830201148986816e-06, -1.3262033462524414e-06, -4.6938657760620117e-07, 3.8743019104003906e-07, 1.2442469596862793e-06, 2.1010637283325195e-06, 2.9578804969787598e-06, 3.814697265625e-06, 4.67151403427124e-06, 5.5283308029174805e-06, 6.385147571563721e-06, 7.241964340209961e-06, 8.098781108856201e-06, 8.955597877502441e-06, 9.812414646148682e-06, 1.0669231414794922e-05, 1.1526048183441162e-05, 1.2382864952087402e-05, 1.3239681720733643e-05, 1.4096498489379883e-05, 1.4953315258026123e-05, 1.5810132026672363e-05, 1.6666948795318604e-05, 1.7523765563964844e-05, 1.8380582332611084e-05, 1.9237399101257324e-05, 2.0094215869903564e-05, 2.0951032638549805e-05, 2.1807849407196045e-05, 2.2664666175842285e-05, 2.3521482944488525e-05, 2.4378299713134766e-05]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 5.0, 11.0, 5.0, 6.0, 7.0, 12.0, 13.0, 20.0, 20.0, 22.0, 30.0, 34.0, 48.0, 55.0, 78.0, 80.0, 80.0, 79.0, 66.0, 45.0, 44.0, 37.0, 33.0, 34.0, 19.0, 16.0, 21.0, 15.0, 8.0, 6.0, 6.0, 7.0, 4.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00012496898125391454, -0.0001214294316014275, -0.00011788987467298284, -0.00011435031774453819, -0.00011081076809205115, -0.00010727121843956411, -0.00010373166151111946, -0.0001001921045826748, -9.665255493018776e-05, -9.311300527770072e-05, -8.957344834925607e-05, -8.603389142081141e-05, -8.249434176832438e-05, -7.895479211583734e-05, -7.541523518739268e-05, -7.187567825894803e-05, -6.833612860646099e-05, -6.479657895397395e-05, -6.12570220255293e-05, -5.771746873506345e-05, -5.41779154445976e-05, -5.0638362154131755e-05, -4.709880886366591e-05, -4.355925557320006e-05, -4.0019702282734215e-05, -3.648014899226837e-05, -3.294059570180252e-05, -2.9401042411336675e-05, -2.586148912087083e-05, -2.2321935830404982e-05, -1.8782382539939135e-05, -1.5242829249473289e-05, -1.1703268683049828e-05, -8.163715392583981e-06, -4.6241621021181345e-06, -1.0846088116522878e-06, 2.454944478813559e-06, 5.9944977692794055e-06, 9.534051059745252e-06, 1.3073604350211099e-05, 1.6613157640676945e-05, 2.0152710931142792e-05, 2.369226422160864e-05, 2.7231817512074485e-05, 3.077137080254033e-05, 3.431092409300618e-05, 3.7850477383472025e-05, 4.139003067393787e-05, 4.492958396440372e-05, 4.8469137254869565e-05, 5.200869054533541e-05, 5.554824383580126e-05, 5.9087797126267105e-05, 6.262735405471176e-05, 6.61669037071988e-05, 6.970645335968584e-05, 7.324601028813049e-05, 7.678556721657515e-05, 8.032511686906219e-05, 8.386466652154922e-05, 8.740422344999388e-05, 9.094378037843853e-05, 9.448333003092557e-05, 9.802287968341261e-05, 0.00010156243661185727]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 7.0, 8.0, 10.0, 14.0, 13.0, 12.0, 14.0, 17.0, 28.0, 21.0, 27.0, 33.0, 32.0, 31.0, 43.0, 39.0, 31.0, 32.0, 34.0, 37.0, 41.0, 45.0, 49.0, 46.0, 40.0, 42.0, 29.0, 35.0, 27.0, 22.0, 26.0, 11.0, 10.0, 17.0, 15.0, 14.0, 14.0, 4.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.777162631507963e-05, -9.47269654716365e-05, -9.168231190415099e-05, -8.863765106070787e-05, -8.559299021726474e-05, -8.254832937382162e-05, -7.95036758063361e-05, -7.645901496289298e-05, -7.341435411944985e-05, -7.036969327600673e-05, -6.732503970852122e-05, -6.428037886507809e-05, -6.123571802163497e-05, -5.819106081617065e-05, -5.514640361070633e-05, -5.2101742767263204e-05, -4.905708919977769e-05, -4.6012431994313374e-05, -4.296777115087025e-05, -3.992311394540593e-05, -3.6878453101962805e-05, -3.3833795896498486e-05, -3.078913869103417e-05, -2.7744479666580446e-05, -2.4699820642126724e-05, -2.1655161617673002e-05, -1.861050259321928e-05, -1.5565845387754962e-05, -1.252118636330124e-05, -9.476527338847518e-06, -6.4318701333831996e-06, -3.3872111089294776e-06, -3.425593604333699e-07, 2.702099209273001e-06, 5.746757778979372e-06, 8.791415893938392e-06, 1.1836074918392114e-05, 1.4880733942845836e-05, 1.7925391148310155e-05, 2.0970050172763877e-05, 2.40147091972176e-05, 2.705936822167132e-05, 3.0104027246125042e-05, 3.314868445158936e-05, 3.619334165705368e-05, 3.9238002500496805e-05, 4.228265970596112e-05, 4.532731691142544e-05, 4.837197775486857e-05, 5.1416634960332885e-05, 5.446129580377601e-05, 5.750595300924033e-05, 6.0550613852683455e-05, 6.359527469612658e-05, 6.663992826361209e-05, 6.968458910705522e-05, 7.272924995049834e-05, 7.577391079394147e-05, 7.881856436142698e-05, 8.18632252048701e-05, 8.490788604831323e-05, 8.795254689175636e-05, 9.099720045924187e-05, 9.404186130268499e-05, 9.70865148701705e-05]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [2.0, 6.0, 2.0, 6.0, 8.0, 22.0, 31.0, 46.0, 51.0, 101.0, 113.0, 185.0, 292.0, 527.0, 779.0, 1200.0, 2011.0, 3146.0, 5257.0, 8683.0, 14960.0, 25937.0, 47633.0, 93130.0, 201264.0, 562645.0, 1765120.0, 932110.0, 277785.0, 119536.0, 59012.0, 30790.0, 17244.0, 9708.0, 5663.0, 3407.0, 2153.0, 1295.0, 815.0, 504.0, 362.0, 215.0, 168.0, 107.0, 68.0, 56.0, 28.0, 28.0, 22.0, 17.0, 14.0, 7.0, 9.0, 5.0, 5.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.00012069940567016602, -0.0001161741092801094, -0.0001116488128900528, -0.00010712351649999619, -0.00010259822010993958, -9.807292371988297e-05, -9.354762732982635e-05, -8.902233093976974e-05, -8.449703454971313e-05, -7.997173815965652e-05, -7.544644176959991e-05, -7.09211453795433e-05, -6.63958489894867e-05, -6.187055259943008e-05, -5.7345256209373474e-05, -5.2819959819316864e-05, -4.8294663429260254e-05, -4.3769367039203644e-05, -3.9244070649147034e-05, -3.4718774259090424e-05, -3.0193477869033813e-05, -2.5668181478977203e-05, -2.1142885088920593e-05, -1.6617588698863983e-05, -1.2092292308807373e-05, -7.566995918750763e-06, -3.041699528694153e-06, 1.4835968613624573e-06, 6.008893251419067e-06, 1.0534189641475677e-05, 1.5059486031532288e-05, 1.9584782421588898e-05, 2.4110078811645508e-05, 2.8635375201702118e-05, 3.316067159175873e-05, 3.768596798181534e-05, 4.221126437187195e-05, 4.673656076192856e-05, 5.126185715198517e-05, 5.578715354204178e-05, 6.031244993209839e-05, 6.4837746322155e-05, 6.936304271221161e-05, 7.388833910226822e-05, 7.841363549232483e-05, 8.293893188238144e-05, 8.746422827243805e-05, 9.198952466249466e-05, 9.651482105255127e-05, 0.00010104011744260788, 0.00010556541383266449, 0.0001100907102227211, 0.00011461600661277771, 0.00011914130300283432, 0.00012366659939289093, 0.00012819189578294754, 0.00013271719217300415, 0.00013724248856306076, 0.00014176778495311737, 0.00014629308134317398, 0.0001508183777332306, 0.0001553436741232872, 0.0001598689705133438, 0.00016439426690340042, 0.00016891956329345703]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 5.0, 8.0, 8.0, 18.0, 8.0, 16.0, 10.0, 16.0, 30.0, 26.0, 25.0, 33.0, 37.0, 37.0, 45.0, 31.0, 45.0, 31.0, 35.0, 46.0, 52.0, 44.0, 38.0, 35.0, 46.0, 35.0, 42.0, 27.0, 31.0, 24.0, 17.0, 12.0, 21.0, 12.0, 11.0, 11.0, 6.0, 8.0, 9.0, 4.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.079673767089844e-05, -5.8867037296295166e-05, -5.6937336921691895e-05, -5.500763654708862e-05, -5.307793617248535e-05, -5.114823579788208e-05, -4.921853542327881e-05, -4.728883504867554e-05, -4.5359134674072266e-05, -4.3429434299468994e-05, -4.149973392486572e-05, -3.957003355026245e-05, -3.764033317565918e-05, -3.571063280105591e-05, -3.378093242645264e-05, -3.1851232051849365e-05, -2.9921531677246094e-05, -2.7991831302642822e-05, -2.606213092803955e-05, -2.413243055343628e-05, -2.2202730178833008e-05, -2.0273029804229736e-05, -1.8343329429626465e-05, -1.6413629055023193e-05, -1.4483928680419922e-05, -1.255422830581665e-05, -1.0624527931213379e-05, -8.694827556610107e-06, -6.765127182006836e-06, -4.8354268074035645e-06, -2.905726432800293e-06, -9.760260581970215e-07, 9.5367431640625e-07, 2.8833746910095215e-06, 4.813075065612793e-06, 6.7427754402160645e-06, 8.672475814819336e-06, 1.0602176189422607e-05, 1.2531876564025879e-05, 1.446157693862915e-05, 1.6391277313232422e-05, 1.8320977687835693e-05, 2.0250678062438965e-05, 2.2180378437042236e-05, 2.4110078811645508e-05, 2.603977918624878e-05, 2.796947956085205e-05, 2.9899179935455322e-05, 3.1828880310058594e-05, 3.3758580684661865e-05, 3.568828105926514e-05, 3.761798143386841e-05, 3.954768180847168e-05, 4.147738218307495e-05, 4.340708255767822e-05, 4.5336782932281494e-05, 4.7266483306884766e-05, 4.919618368148804e-05, 5.112588405609131e-05, 5.305558443069458e-05, 5.498528480529785e-05, 5.691498517990112e-05, 5.8844685554504395e-05, 6.0774385929107666e-05, 6.270408630371094e-05]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 12.0, 14.0, 26.0, 36.0, 39.0, 64.0, 92.0, 125.0, 211.0, 308.0, 432.0, 671.0, 941.0, 1561.0, 2246.0, 3301.0, 5314.0, 7887.0, 12489.0, 20105.0, 31472.0, 52158.0, 88877.0, 153873.0, 294876.0, 613988.0, 1289866.0, 807840.0, 353883.0, 187660.0, 104594.0, 59739.0, 36593.0, 22256.0, 14305.0, 9108.0, 5772.0, 3845.0, 2594.0, 1682.0, 1136.0, 758.0, 490.0, 333.0, 226.0, 160.0, 124.0, 74.0, 48.0, 25.0, 19.0, 16.0, 7.0, 8.0, 6.0, 3.0, 0.0, 4.0], "bins": [-9.655952453613281e-05, -9.360164403915405e-05, -9.064376354217529e-05, -8.768588304519653e-05, -8.472800254821777e-05, -8.177012205123901e-05, -7.881224155426025e-05, -7.58543610572815e-05, -7.289648056030273e-05, -6.993860006332397e-05, -6.698071956634521e-05, -6.402283906936646e-05, -6.10649585723877e-05, -5.8107078075408936e-05, -5.5149197578430176e-05, -5.2191317081451416e-05, -4.9233436584472656e-05, -4.6275556087493896e-05, -4.331767559051514e-05, -4.035979509353638e-05, -3.740191459655762e-05, -3.444403409957886e-05, -3.14861536026001e-05, -2.8528273105621338e-05, -2.5570392608642578e-05, -2.261251211166382e-05, -1.965463161468506e-05, -1.66967511177063e-05, -1.3738870620727539e-05, -1.078099012374878e-05, -7.82310962677002e-06, -4.86522912979126e-06, -1.9073486328125e-06, 1.0505318641662598e-06, 4.0084123611450195e-06, 6.966292858123779e-06, 9.924173355102539e-06, 1.2882053852081299e-05, 1.583993434906006e-05, 1.879781484603882e-05, 2.1755695343017578e-05, 2.4713575839996338e-05, 2.7671456336975098e-05, 3.062933683395386e-05, 3.358721733093262e-05, 3.654509782791138e-05, 3.950297832489014e-05, 4.2460858821868896e-05, 4.5418739318847656e-05, 4.8376619815826416e-05, 5.1334500312805176e-05, 5.4292380809783936e-05, 5.7250261306762695e-05, 6.0208141803741455e-05, 6.316602230072021e-05, 6.612390279769897e-05, 6.908178329467773e-05, 7.20396637916565e-05, 7.499754428863525e-05, 7.795542478561401e-05, 8.091330528259277e-05, 8.387118577957153e-05, 8.682906627655029e-05, 8.978694677352905e-05, 9.274482727050781e-05]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 6.0, 7.0, 7.0, 11.0, 14.0, 17.0, 17.0, 19.0, 20.0, 34.0, 36.0, 60.0, 50.0, 71.0, 64.0, 87.0, 104.0, 135.0, 179.0, 177.0, 203.0, 227.0, 250.0, 274.0, 218.0, 242.0, 206.0, 194.0, 168.0, 146.0, 146.0, 108.0, 79.0, 73.0, 77.0, 58.0, 54.0, 32.0, 45.0, 36.0, 23.0, 22.0, 13.0, 8.0, 10.0, 11.0, 6.0, 8.0, 8.0, 3.0, 1.0, 4.0, 2.0, 3.0], "bins": [-3.1113624572753906e-05, -3.019627183675766e-05, -2.9278919100761414e-05, -2.8361566364765167e-05, -2.744421362876892e-05, -2.6526860892772675e-05, -2.5609508156776428e-05, -2.4692155420780182e-05, -2.3774802684783936e-05, -2.285744994878769e-05, -2.1940097212791443e-05, -2.1022744476795197e-05, -2.010539174079895e-05, -1.9188039004802704e-05, -1.8270686268806458e-05, -1.735333353281021e-05, -1.6435980796813965e-05, -1.551862806081772e-05, -1.4601275324821472e-05, -1.3683922588825226e-05, -1.276656985282898e-05, -1.1849217116832733e-05, -1.0931864380836487e-05, -1.001451164484024e-05, -9.097158908843994e-06, -8.179806172847748e-06, -7.2624534368515015e-06, -6.345100700855255e-06, -5.427747964859009e-06, -4.5103952288627625e-06, -3.593042492866516e-06, -2.6756897568702698e-06, -1.7583370208740234e-06, -8.409842848777771e-07, 7.636845111846924e-08, 9.937211871147156e-07, 1.911073923110962e-06, 2.8284266591072083e-06, 3.7457793951034546e-06, 4.663132131099701e-06, 5.580484867095947e-06, 6.497837603092194e-06, 7.41519033908844e-06, 8.332543075084686e-06, 9.249895811080933e-06, 1.0167248547077179e-05, 1.1084601283073425e-05, 1.2001954019069672e-05, 1.2919306755065918e-05, 1.3836659491062164e-05, 1.475401222705841e-05, 1.5671364963054657e-05, 1.6588717699050903e-05, 1.750607043504715e-05, 1.8423423171043396e-05, 1.9340775907039642e-05, 2.025812864303589e-05, 2.1175481379032135e-05, 2.209283411502838e-05, 2.3010186851024628e-05, 2.3927539587020874e-05, 2.484489232301712e-05, 2.5762245059013367e-05, 2.6679597795009613e-05, 2.759695053100586e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 6.0, 1.0, 5.0, 6.0, 6.0, 16.0, 14.0, 24.0, 19.0, 37.0, 36.0, 45.0, 61.0, 75.0, 84.0, 111.0, 91.0, 81.0, 66.0, 48.0, 26.0, 32.0, 21.0, 25.0, 16.0, 15.0, 8.0, 8.0, 4.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00011047763109672815, -0.00010744790779426694, -0.00010441818449180573, -0.00010138846118934453, -9.835873788688332e-05, -9.532901458442211e-05, -9.22992912819609e-05, -8.92695679794997e-05, -8.623984467703849e-05, -8.321012137457728e-05, -8.018039807211608e-05, -7.715067476965487e-05, -7.412095146719366e-05, -7.109122816473246e-05, -6.806150486227125e-05, -6.503178155981004e-05, -6.200205098139122e-05, -5.8972327678930014e-05, -5.594260437646881e-05, -5.29128810740076e-05, -4.9883157771546394e-05, -4.685343446908519e-05, -4.382370752864517e-05, -4.0793984226183966e-05, -3.776426092372276e-05, -3.473453762126155e-05, -3.1704814318800345e-05, -2.8675089197349735e-05, -2.5645365894888528e-05, -2.261564259242732e-05, -1.958591747097671e-05, -1.6556194168515503e-05, -1.3526463590096682e-05, -1.0496740287635475e-05, -7.467016075679567e-06, -4.437291863723658e-06, -1.4075685612624511e-06, 1.6221547411987558e-06, 4.651879862649366e-06, 7.681603165110573e-06, 1.071132646757178e-05, 1.3741049770032987e-05, 1.6770773072494194e-05, 1.9800498193944804e-05, 2.283022149640601e-05, 2.5859944798867218e-05, 2.888966992031783e-05, 3.1919393222779036e-05, 3.494911652524024e-05, 3.797883982770145e-05, 4.1008563130162656e-05, 4.403828643262386e-05, 4.706800973508507e-05, 5.009773303754628e-05, 5.312745997798629e-05, 5.61571832804475e-05, 5.9186906582908705e-05, 6.221663352334872e-05, 6.524635682580993e-05, 6.827608012827113e-05, 7.130580343073234e-05, 7.433552673319355e-05, 7.736525003565475e-05, 8.039497333811596e-05, 8.342469664057717e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 6.0, 8.0, 7.0, 6.0, 10.0, 11.0, 15.0, 20.0, 20.0, 22.0, 21.0, 28.0, 43.0, 21.0, 38.0, 44.0, 34.0, 35.0, 29.0, 50.0, 50.0, 48.0, 40.0, 36.0, 41.0, 35.0, 36.0, 29.0, 24.0, 30.0, 25.0, 13.0, 22.0, 14.0, 18.0, 6.0, 15.0, 15.0, 6.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.92493049427867e-05, -6.719132943544537e-05, -6.513334665214643e-05, -6.30753711448051e-05, -6.1017388361506164e-05, -5.895941285416484e-05, -5.6901433708844706e-05, -5.4843454563524574e-05, -5.278547541820444e-05, -5.072749627288431e-05, -4.866951712756418e-05, -4.6611537982244045e-05, -4.455356247490272e-05, -4.249557969160378e-05, -4.0437604184262455e-05, -3.837962503894232e-05, -3.632164589362219e-05, -3.426366674830206e-05, -3.2205687602981925e-05, -3.0147710276651196e-05, -2.8089731131331064e-05, -2.603175198601093e-05, -2.3973774659680203e-05, -2.191579551436007e-05, -1.9857816369039938e-05, -1.7799837223719805e-05, -1.5741858078399673e-05, -1.3683880752068944e-05, -1.1625901606748812e-05, -9.56792246142868e-06, -7.509944225603249e-06, -5.451965989777818e-06, -3.3939795685000718e-06, -1.3360008779272903e-06, 7.219778126454912e-07, 2.7799565032182727e-06, 4.837935193791054e-06, 6.8959143391111866e-06, 8.953892574936617e-06, 1.1011870810762048e-05, 1.306984995608218e-05, 1.5127829101402313e-05, 1.7185808246722445e-05, 1.9243785573053174e-05, 2.1301764718373306e-05, 2.335974386369344e-05, 2.5417721190024167e-05, 2.74757003353443e-05, 2.9533679480664432e-05, 3.1591658625984564e-05, 3.36496377713047e-05, 3.570761691662483e-05, 3.776559606194496e-05, 3.982357156928629e-05, 4.188155071460642e-05, 4.393952985992655e-05, 4.5997509005246684e-05, 4.8055488150566816e-05, 5.011346729588695e-05, 5.217144644120708e-05, 5.4229421948548406e-05, 5.6287404731847346e-05, 5.834538023918867e-05, 6.0403359384508803e-05, 6.246133852982894e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 12.0, 7.0, 10.0, 22.0, 18.0, 38.0, 49.0, 67.0, 100.0, 150.0, 196.0, 288.0, 384.0, 663.0, 1028.0, 1466.0, 2282.0, 3462.0, 5240.0, 8235.0, 12836.0, 20758.0, 33668.0, 54085.0, 88517.0, 147074.0, 208749.0, 175194.0, 108210.0, 66443.0, 40435.0, 25015.0, 15311.0, 9984.0, 6478.0, 4082.0, 2626.0, 1783.0, 1178.0, 762.0, 515.0, 359.0, 220.0, 164.0, 124.0, 87.0, 56.0, 44.0, 28.0, 21.0, 11.0, 9.0, 5.0, 9.0, 2.0, 0.0, 2.0], "bins": [-0.00010395050048828125, -0.00010086596012115479, -9.778141975402832e-05, -9.469687938690186e-05, -9.161233901977539e-05, -8.852779865264893e-05, -8.544325828552246e-05, -8.2358717918396e-05, -7.927417755126953e-05, -7.618963718414307e-05, -7.31050968170166e-05, -7.002055644989014e-05, -6.693601608276367e-05, -6.385147571563721e-05, -6.076693534851074e-05, -5.768239498138428e-05, -5.459785461425781e-05, -5.151331424713135e-05, -4.842877388000488e-05, -4.534423351287842e-05, -4.225969314575195e-05, -3.917515277862549e-05, -3.6090612411499023e-05, -3.300607204437256e-05, -2.9921531677246094e-05, -2.683699131011963e-05, -2.3752450942993164e-05, -2.06679105758667e-05, -1.7583370208740234e-05, -1.449882984161377e-05, -1.1414289474487305e-05, -8.32974910736084e-06, -5.245208740234375e-06, -2.16066837310791e-06, 9.238719940185547e-07, 4.0084123611450195e-06, 7.092952728271484e-06, 1.017749309539795e-05, 1.3262033462524414e-05, 1.634657382965088e-05, 1.9431114196777344e-05, 2.251565456390381e-05, 2.5600194931030273e-05, 2.8684735298156738e-05, 3.17692756652832e-05, 3.485381603240967e-05, 3.793835639953613e-05, 4.10228967666626e-05, 4.410743713378906e-05, 4.719197750091553e-05, 5.027651786804199e-05, 5.336105823516846e-05, 5.644559860229492e-05, 5.953013896942139e-05, 6.261467933654785e-05, 6.569921970367432e-05, 6.878376007080078e-05, 7.186830043792725e-05, 7.495284080505371e-05, 7.803738117218018e-05, 8.112192153930664e-05, 8.42064619064331e-05, 8.729100227355957e-05, 9.037554264068604e-05, 9.34600830078125e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 9.0, 9.0, 14.0, 11.0, 11.0, 16.0, 15.0, 26.0, 18.0, 20.0, 15.0, 25.0, 35.0, 29.0, 26.0, 30.0, 41.0, 40.0, 34.0, 36.0, 39.0, 35.0, 33.0, 37.0, 56.0, 22.0, 28.0, 41.0, 21.0, 19.0, 23.0, 27.0, 15.0, 24.0, 17.0, 12.0, 9.0, 12.0, 10.0, 12.0, 9.0, 5.0, 7.0, 1.0, 3.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.364418029785156e-05, -5.2036717534065247e-05, -5.042925477027893e-05, -4.8821792006492615e-05, -4.72143292427063e-05, -4.560686647891998e-05, -4.399940371513367e-05, -4.239194095134735e-05, -4.0784478187561035e-05, -3.917701542377472e-05, -3.75695526599884e-05, -3.596208989620209e-05, -3.435462713241577e-05, -3.2747164368629456e-05, -3.113970160484314e-05, -2.9532238841056824e-05, -2.7924776077270508e-05, -2.6317313313484192e-05, -2.4709850549697876e-05, -2.310238778591156e-05, -2.1494925022125244e-05, -1.9887462258338928e-05, -1.8279999494552612e-05, -1.6672536730766296e-05, -1.506507396697998e-05, -1.3457611203193665e-05, -1.1850148439407349e-05, -1.0242685675621033e-05, -8.635222911834717e-06, -7.027760148048401e-06, -5.420297384262085e-06, -3.812834620475769e-06, -2.205371856689453e-06, -5.979090929031372e-07, 1.0095536708831787e-06, 2.6170164346694946e-06, 4.2244791984558105e-06, 5.8319419622421265e-06, 7.439404726028442e-06, 9.046867489814758e-06, 1.0654330253601074e-05, 1.226179301738739e-05, 1.3869255781173706e-05, 1.5476718544960022e-05, 1.7084181308746338e-05, 1.8691644072532654e-05, 2.029910683631897e-05, 2.1906569600105286e-05, 2.35140323638916e-05, 2.5121495127677917e-05, 2.6728957891464233e-05, 2.833642065525055e-05, 2.9943883419036865e-05, 3.155134618282318e-05, 3.31588089466095e-05, 3.476627171039581e-05, 3.637373447418213e-05, 3.7981197237968445e-05, 3.958866000175476e-05, 4.119612276554108e-05, 4.280358552932739e-05, 4.441104829311371e-05, 4.6018511056900024e-05, 4.762597382068634e-05, 4.9233436584472656e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 7.0, 3.0, 13.0, 11.0, 13.0, 32.0, 30.0, 51.0, 84.0, 155.0, 253.0, 391.0, 624.0, 1070.0, 1986.0, 3498.0, 6685.0, 13549.0, 33817.0, 133602.0, 638637.0, 148077.0, 35970.0, 14525.0, 6936.0, 3652.0, 1981.0, 1149.0, 710.0, 382.0, 237.0, 162.0, 84.0, 54.0, 38.0, 27.0, 22.0, 13.0, 10.0, 9.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019228458404541016, -0.00018577277660369873, -0.0001792609691619873, -0.00017274916172027588, -0.00016623735427856445, -0.00015972554683685303, -0.0001532137393951416, -0.00014670193195343018, -0.00014019012451171875, -0.00013367831707000732, -0.0001271665096282959, -0.00012065470218658447, -0.00011414289474487305, -0.00010763108730316162, -0.0001011192798614502, -9.460747241973877e-05, -8.809566497802734e-05, -8.158385753631592e-05, -7.507205009460449e-05, -6.856024265289307e-05, -6.204843521118164e-05, -5.5536627769470215e-05, -4.902482032775879e-05, -4.251301288604736e-05, -3.600120544433594e-05, -2.9489398002624512e-05, -2.2977590560913086e-05, -1.646578311920166e-05, -9.953975677490234e-06, -3.4421682357788086e-06, 3.069639205932617e-06, 9.581446647644043e-06, 1.609325408935547e-05, 2.2605061531066895e-05, 2.911686897277832e-05, 3.5628676414489746e-05, 4.214048385620117e-05, 4.86522912979126e-05, 5.5164098739624023e-05, 6.167590618133545e-05, 6.818771362304688e-05, 7.46995210647583e-05, 8.121132850646973e-05, 8.772313594818115e-05, 9.423494338989258e-05, 0.000100746750831604, 0.00010725855827331543, 0.00011377036571502686, 0.00012028217315673828, 0.0001267939805984497, 0.00013330578804016113, 0.00013981759548187256, 0.00014632940292358398, 0.0001528412103652954, 0.00015935301780700684, 0.00016586482524871826, 0.0001723766326904297, 0.0001788884401321411, 0.00018540024757385254, 0.00019191205501556396, 0.0001984238624572754, 0.00020493566989898682, 0.00021144747734069824, 0.00021795928478240967, 0.0002244710922241211]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 6.0, 4.0, 10.0, 8.0, 11.0, 13.0, 13.0, 18.0, 22.0, 23.0, 19.0, 25.0, 40.0, 37.0, 41.0, 36.0, 35.0, 45.0, 40.0, 41.0, 59.0, 43.0, 46.0, 40.0, 32.0, 33.0, 41.0, 32.0, 24.0, 27.0, 18.0, 29.0, 11.0, 14.0, 18.0, 7.0, 8.0, 7.0, 3.0, 6.0, 7.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.987550735473633e-05, -3.8702040910720825e-05, -3.752857446670532e-05, -3.635510802268982e-05, -3.5181641578674316e-05, -3.4008175134658813e-05, -3.283470869064331e-05, -3.166124224662781e-05, -3.0487775802612305e-05, -2.9314309358596802e-05, -2.81408429145813e-05, -2.6967376470565796e-05, -2.5793910026550293e-05, -2.462044358253479e-05, -2.3446977138519287e-05, -2.2273510694503784e-05, -2.110004425048828e-05, -1.992657780647278e-05, -1.8753111362457275e-05, -1.7579644918441772e-05, -1.640617847442627e-05, -1.5232712030410767e-05, -1.4059245586395264e-05, -1.288577914237976e-05, -1.1712312698364258e-05, -1.0538846254348755e-05, -9.365379810333252e-06, -8.191913366317749e-06, -7.018446922302246e-06, -5.844980478286743e-06, -4.67151403427124e-06, -3.4980475902557373e-06, -2.3245811462402344e-06, -1.1511147022247314e-06, 2.2351741790771484e-08, 1.1958181858062744e-06, 2.3692846298217773e-06, 3.5427510738372803e-06, 4.716217517852783e-06, 5.889683961868286e-06, 7.063150405883789e-06, 8.236616849899292e-06, 9.410083293914795e-06, 1.0583549737930298e-05, 1.17570161819458e-05, 1.2930482625961304e-05, 1.4103949069976807e-05, 1.527741551399231e-05, 1.6450881958007812e-05, 1.7624348402023315e-05, 1.879781484603882e-05, 1.997128129005432e-05, 2.1144747734069824e-05, 2.2318214178085327e-05, 2.349168062210083e-05, 2.4665147066116333e-05, 2.5838613510131836e-05, 2.701207995414734e-05, 2.8185546398162842e-05, 2.9359012842178345e-05, 3.053247928619385e-05, 3.170594573020935e-05, 3.2879412174224854e-05, 3.4052878618240356e-05, 3.522634506225586e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 8.0, 4.0, 15.0, 21.0, 37.0, 51.0, 88.0, 121.0, 173.0, 271.0, 402.0, 599.0, 933.0, 1455.0, 2407.0, 4175.0, 7947.0, 17517.0, 48107.0, 244390.0, 594602.0, 77553.0, 24245.0, 10505.0, 5142.0, 2873.0, 1749.0, 1043.0, 715.0, 474.0, 298.0, 216.0, 139.0, 77.0, 53.0, 53.0, 21.0, 19.0, 22.0, 14.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8100948333740234e-05, -4.660617560148239e-05, -4.511140286922455e-05, -4.3616630136966705e-05, -4.212185740470886e-05, -4.062708467245102e-05, -3.9132311940193176e-05, -3.763753920793533e-05, -3.614276647567749e-05, -3.464799374341965e-05, -3.3153221011161804e-05, -3.165844827890396e-05, -3.0163675546646118e-05, -2.8668902814388275e-05, -2.7174130082130432e-05, -2.567935734987259e-05, -2.4184584617614746e-05, -2.2689811885356903e-05, -2.119503915309906e-05, -1.9700266420841217e-05, -1.8205493688583374e-05, -1.671072095632553e-05, -1.5215948224067688e-05, -1.3721175491809845e-05, -1.2226402759552002e-05, -1.0731630027294159e-05, -9.236857295036316e-06, -7.742084562778473e-06, -6.24731183052063e-06, -4.752539098262787e-06, -3.257766366004944e-06, -1.7629936337471008e-06, -2.682209014892578e-07, 1.2265518307685852e-06, 2.7213245630264282e-06, 4.216097295284271e-06, 5.710870027542114e-06, 7.205642759799957e-06, 8.7004154920578e-06, 1.0195188224315643e-05, 1.1689960956573486e-05, 1.318473368883133e-05, 1.4679506421089172e-05, 1.6174279153347015e-05, 1.766905188560486e-05, 1.91638246178627e-05, 2.0658597350120544e-05, 2.2153370082378387e-05, 2.364814281463623e-05, 2.5142915546894073e-05, 2.6637688279151917e-05, 2.813246101140976e-05, 2.9627233743667603e-05, 3.1122006475925446e-05, 3.261677920818329e-05, 3.411155194044113e-05, 3.5606324672698975e-05, 3.710109740495682e-05, 3.859587013721466e-05, 4.0090642869472504e-05, 4.158541560173035e-05, 4.308018833398819e-05, 4.457496106624603e-05, 4.6069733798503876e-05, 4.756450653076172e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 15.0, 8.0, 12.0, 8.0, 10.0, 18.0, 12.0, 25.0, 19.0, 23.0, 94.0, 50.0, 57.0, 60.0, 141.0, 89.0, 58.0, 46.0, 25.0, 48.0, 26.0, 14.0, 17.0, 30.0, 15.0, 9.0, 7.0, 10.0, 11.0, 5.0, 4.0, 0.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.6226043701171875e-06, -2.54996120929718e-06, -2.477318048477173e-06, -2.4046748876571655e-06, -2.332031726837158e-06, -2.259388566017151e-06, -2.1867454051971436e-06, -2.1141022443771362e-06, -2.041459083557129e-06, -1.9688159227371216e-06, -1.8961727619171143e-06, -1.823529601097107e-06, -1.7508864402770996e-06, -1.6782432794570923e-06, -1.605600118637085e-06, -1.5329569578170776e-06, -1.4603137969970703e-06, -1.387670636177063e-06, -1.3150274753570557e-06, -1.2423843145370483e-06, -1.169741153717041e-06, -1.0970979928970337e-06, -1.0244548320770264e-06, -9.51811671257019e-07, -8.791685104370117e-07, -8.065253496170044e-07, -7.338821887969971e-07, -6.612390279769897e-07, -5.885958671569824e-07, -5.159527063369751e-07, -4.4330954551696777e-07, -3.7066638469696045e-07, -2.980232238769531e-07, -2.253800630569458e-07, -1.5273690223693848e-07, -8.009374141693115e-08, -7.450580596923828e-09, 6.51925802230835e-08, 1.3783574104309082e-07, 2.1047890186309814e-07, 2.8312206268310547e-07, 3.557652235031128e-07, 4.284083843231201e-07, 5.010515451431274e-07, 5.736947059631348e-07, 6.463378667831421e-07, 7.189810276031494e-07, 7.916241884231567e-07, 8.642673492431641e-07, 9.369105100631714e-07, 1.0095536708831787e-06, 1.082196831703186e-06, 1.1548399925231934e-06, 1.2274831533432007e-06, 1.300126314163208e-06, 1.3727694749832153e-06, 1.4454126358032227e-06, 1.51805579662323e-06, 1.5906989574432373e-06, 1.6633421182632446e-06, 1.735985279083252e-06, 1.8086284399032593e-06, 1.8812716007232666e-06, 1.953914761543274e-06, 2.0265579223632812e-06]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 7.0, 10.0, 20.0, 18.0, 26.0, 42.0, 49.0, 69.0, 121.0, 164.0, 270.0, 443.0, 767.0, 1328.0, 2468.0, 4667.0, 10858.0, 27850.0, 86573.0, 412678.0, 364394.0, 86615.0, 27684.0, 10988.0, 4864.0, 2368.0, 1205.0, 729.0, 459.0, 288.0, 184.0, 110.0, 70.0, 54.0, 34.0, 22.0, 20.0, 11.0, 8.0, 9.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2067298889160156e-05, -3.1123869121074677e-05, -3.0180439352989197e-05, -2.9237009584903717e-05, -2.8293579816818237e-05, -2.7350150048732758e-05, -2.6406720280647278e-05, -2.5463290512561798e-05, -2.451986074447632e-05, -2.357643097639084e-05, -2.263300120830536e-05, -2.168957144021988e-05, -2.07461416721344e-05, -1.980271190404892e-05, -1.885928213596344e-05, -1.791585236787796e-05, -1.697242259979248e-05, -1.6028992831707e-05, -1.5085563063621521e-05, -1.4142133295536041e-05, -1.3198703527450562e-05, -1.2255273759365082e-05, -1.1311843991279602e-05, -1.0368414223194122e-05, -9.424984455108643e-06, -8.481554687023163e-06, -7.538124918937683e-06, -6.594695150852203e-06, -5.651265382766724e-06, -4.707835614681244e-06, -3.764405846595764e-06, -2.8209760785102844e-06, -1.8775463104248047e-06, -9.34116542339325e-07, 9.313225746154785e-09, 9.527429938316345e-07, 1.8961727619171143e-06, 2.839602530002594e-06, 3.7830322980880737e-06, 4.7264620661735535e-06, 5.669891834259033e-06, 6.613321602344513e-06, 7.556751370429993e-06, 8.500181138515472e-06, 9.443610906600952e-06, 1.0387040674686432e-05, 1.1330470442771912e-05, 1.2273900210857391e-05, 1.3217329978942871e-05, 1.416075974702835e-05, 1.510418951511383e-05, 1.604761928319931e-05, 1.699104905128479e-05, 1.793447881937027e-05, 1.887790858745575e-05, 1.982133835554123e-05, 2.076476812362671e-05, 2.170819789171219e-05, 2.265162765979767e-05, 2.3595057427883148e-05, 2.4538487195968628e-05, 2.5481916964054108e-05, 2.6425346732139587e-05, 2.7368776500225067e-05, 2.8312206268310547e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 4.0, 7.0, 4.0, 8.0, 8.0, 13.0, 7.0, 12.0, 29.0, 31.0, 47.0, 42.0, 56.0, 63.0, 69.0, 77.0, 65.0, 71.0, 73.0, 56.0, 59.0, 49.0, 22.0, 33.0, 21.0, 21.0, 12.0, 10.0, 8.0, 3.0, 2.0, 7.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.470348358154297e-06, -4.295259714126587e-06, -4.120171070098877e-06, -3.945082426071167e-06, -3.769993782043457e-06, -3.594905138015747e-06, -3.419816493988037e-06, -3.244727849960327e-06, -3.069639205932617e-06, -2.8945505619049072e-06, -2.7194619178771973e-06, -2.5443732738494873e-06, -2.3692846298217773e-06, -2.1941959857940674e-06, -2.0191073417663574e-06, -1.8440186977386475e-06, -1.6689300537109375e-06, -1.4938414096832275e-06, -1.3187527656555176e-06, -1.1436641216278076e-06, -9.685754776000977e-07, -7.934868335723877e-07, -6.183981895446777e-07, -4.4330954551696777e-07, -2.682209014892578e-07, -9.313225746154785e-08, 8.195638656616211e-08, 2.5704503059387207e-07, 4.3213367462158203e-07, 6.07222318649292e-07, 7.82310962677002e-07, 9.57399606704712e-07, 1.1324882507324219e-06, 1.3075768947601318e-06, 1.4826655387878418e-06, 1.6577541828155518e-06, 1.8328428268432617e-06, 2.0079314708709717e-06, 2.1830201148986816e-06, 2.3581087589263916e-06, 2.5331974029541016e-06, 2.7082860469818115e-06, 2.8833746910095215e-06, 3.0584633350372314e-06, 3.2335519790649414e-06, 3.4086406230926514e-06, 3.5837292671203613e-06, 3.7588179111480713e-06, 3.933906555175781e-06, 4.108995199203491e-06, 4.284083843231201e-06, 4.459172487258911e-06, 4.634261131286621e-06, 4.809349775314331e-06, 4.984438419342041e-06, 5.159527063369751e-06, 5.334615707397461e-06, 5.509704351425171e-06, 5.684792995452881e-06, 5.859881639480591e-06, 6.034970283508301e-06, 6.210058927536011e-06, 6.385147571563721e-06, 6.560236215591431e-06, 6.735324859619141e-06]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 4.0, 4.0, 8.0, 10.0, 25.0, 17.0, 15.0, 28.0, 29.0, 49.0, 55.0, 74.0, 92.0, 105.0, 84.0, 89.0, 53.0, 47.0, 42.0, 32.0, 28.0, 25.0, 11.0, 10.0, 18.0, 7.0, 6.0, 9.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-9.297375800088048e-05, -9.051169763552025e-05, -8.80496299942024e-05, -8.558756962884218e-05, -8.312550198752433e-05, -8.06634416221641e-05, -7.820138125680387e-05, -7.573931361548603e-05, -7.32772532501258e-05, -7.081519288476557e-05, -6.835312524344772e-05, -6.589106487808749e-05, -6.342900451272726e-05, -6.0966936871409416e-05, -5.8504876506049186e-05, -5.604281250271015e-05, -5.358074849937111e-05, -5.1118684496032074e-05, -4.865662049269304e-05, -4.6194560127332807e-05, -4.373249612399377e-05, -4.127043212065473e-05, -3.88083717552945e-05, -3.6346307751955464e-05, -3.388424374861643e-05, -3.142217974527739e-05, -2.8960117560927756e-05, -2.6498055376578122e-05, -2.4035991373239085e-05, -2.1573927369900048e-05, -1.9111865185550414e-05, -1.664980300120078e-05, -1.4187738997861743e-05, -1.1725675904017407e-05, -9.263612810173072e-06, -6.801549716328736e-06, -4.339486622484401e-06, -1.8774235286400653e-06, 5.846395652042702e-07, 3.046701749553904e-06, 5.508765752892941e-06, 7.970828846737277e-06, 1.0432891940581612e-05, 1.2894955034425948e-05, 1.5357018128270283e-05, 1.781908213160932e-05, 2.0281144315958954e-05, 2.2743206500308588e-05, 2.5205270503647625e-05, 2.7667334506986663e-05, 3.0129396691336296e-05, 3.259145887568593e-05, 3.505352287902497e-05, 3.7515586882364005e-05, 3.9977647247724235e-05, 4.243971125106327e-05, 4.490177525440231e-05, 4.736383925774135e-05, 4.9825903261080384e-05, 5.2287963626440614e-05, 5.475002762977965e-05, 5.721209163311869e-05, 5.967415199847892e-05, 6.213621236383915e-05, 6.4598280005157e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 0.0, 5.0, 9.0, 6.0, 5.0, 9.0, 12.0, 16.0, 14.0, 14.0, 20.0, 27.0, 17.0, 32.0, 32.0, 33.0, 31.0, 50.0, 29.0, 35.0, 39.0, 41.0, 58.0, 44.0, 33.0, 46.0, 36.0, 38.0, 30.0, 31.0, 28.0, 27.0, 21.0, 13.0, 23.0, 19.0, 16.0, 9.0, 12.0, 11.0, 8.0, 5.0, 9.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-5.965093441773206e-05, -5.791201692773029e-05, -5.6173099437728524e-05, -5.4434181947726756e-05, -5.269526081974618e-05, -5.0956343329744413e-05, -4.9217425839742646e-05, -4.747850834974088e-05, -4.573959085973911e-05, -4.400067336973734e-05, -4.2261755879735574e-05, -4.0522834751755e-05, -3.878391726175323e-05, -3.7044999771751463e-05, -3.5306082281749696e-05, -3.356716479174793e-05, -3.182824730174616e-05, -3.0089329811744392e-05, -2.835041050275322e-05, -2.6611493012751453e-05, -2.4872575522749685e-05, -2.3133656213758513e-05, -2.1394738723756745e-05, -1.9655821233754978e-05, -1.7916900105774403e-05, -1.6177982615772635e-05, -1.4439064216276165e-05, -1.2700145816779695e-05, -1.0961228326777928e-05, -9.222309927281458e-06, -7.483391527784988e-06, -5.74447403778322e-06, -4.0055565477814525e-06, -2.2666386030323338e-06, -5.277204309095396e-07, 1.2111977412132546e-06, 2.9501156859623734e-06, 4.689033630711492e-06, 6.427952030207962e-06, 8.16686952020973e-06, 9.9057879197062e-06, 1.1644706319202669e-05, 1.3383623809204437e-05, 1.5122542208700906e-05, 1.6861460608197376e-05, 1.8600378098199144e-05, 2.0339295588200912e-05, 2.207821307820268e-05, 2.381713238719385e-05, 2.555604987719562e-05, 2.729496918618679e-05, 2.903388667618856e-05, 3.0772804166190326e-05, 3.2511721656192094e-05, 3.425063914619386e-05, 3.598955663619563e-05, 3.7728477764176205e-05, 3.946739525417797e-05, 4.120631274417974e-05, 4.2945233872160316e-05, 4.468415136216208e-05, 4.642306885216385e-05, 4.816198634216562e-05, 4.990090383216739e-05, 5.1639821322169155e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 3.0, 9.0, 5.0, 14.0, 12.0, 21.0, 36.0, 54.0, 78.0, 127.0, 187.0, 274.0, 426.0, 722.0, 1115.0, 1792.0, 3041.0, 4988.0, 8322.0, 14610.0, 24507.0, 45748.0, 87927.0, 181081.0, 277023.0, 191041.0, 93442.0, 48833.0, 25953.0, 15047.0, 8711.0, 5179.0, 3110.0, 1914.0, 1169.0, 733.0, 433.0, 315.0, 176.0, 117.0, 85.0, 46.0, 43.0, 28.0, 20.0, 14.0, 13.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001099705696105957, -0.00010648369789123535, -0.000102996826171875, -9.950995445251465e-05, -9.60230827331543e-05, -9.253621101379395e-05, -8.90493392944336e-05, -8.556246757507324e-05, -8.207559585571289e-05, -7.858872413635254e-05, -7.510185241699219e-05, -7.161498069763184e-05, -6.812810897827148e-05, -6.464123725891113e-05, -6.115436553955078e-05, -5.766749382019043e-05, -5.418062210083008e-05, -5.0693750381469727e-05, -4.7206878662109375e-05, -4.3720006942749023e-05, -4.023313522338867e-05, -3.674626350402832e-05, -3.325939178466797e-05, -2.9772520065307617e-05, -2.6285648345947266e-05, -2.2798776626586914e-05, -1.9311904907226562e-05, -1.582503318786621e-05, -1.233816146850586e-05, -8.851289749145508e-06, -5.364418029785156e-06, -1.8775463104248047e-06, 1.6093254089355469e-06, 5.0961971282958984e-06, 8.58306884765625e-06, 1.2069940567016602e-05, 1.5556812286376953e-05, 1.9043684005737305e-05, 2.2530555725097656e-05, 2.6017427444458008e-05, 2.950429916381836e-05, 3.299117088317871e-05, 3.647804260253906e-05, 3.9964914321899414e-05, 4.3451786041259766e-05, 4.693865776062012e-05, 5.042552947998047e-05, 5.391240119934082e-05, 5.739927291870117e-05, 6.0886144638061523e-05, 6.437301635742188e-05, 6.785988807678223e-05, 7.134675979614258e-05, 7.483363151550293e-05, 7.832050323486328e-05, 8.180737495422363e-05, 8.529424667358398e-05, 8.878111839294434e-05, 9.226799011230469e-05, 9.575486183166504e-05, 9.924173355102539e-05, 0.00010272860527038574, 0.0001062154769897461, 0.00010970234870910645, 0.0001131892204284668]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 10.0, 3.0, 7.0, 8.0, 12.0, 14.0, 17.0, 15.0, 21.0, 22.0, 36.0, 34.0, 34.0, 45.0, 32.0, 33.0, 46.0, 44.0, 41.0, 51.0, 47.0, 37.0, 45.0, 35.0, 45.0, 39.0, 33.0, 31.0, 16.0, 20.0, 18.0, 25.0, 16.0, 14.0, 10.0, 8.0, 12.0, 9.0, 2.0, 5.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.46574592590332e-05, -5.302019417285919e-05, -5.138292908668518e-05, -4.974566400051117e-05, -4.810839891433716e-05, -4.647113382816315e-05, -4.4833868741989136e-05, -4.3196603655815125e-05, -4.155933856964111e-05, -3.99220734834671e-05, -3.828480839729309e-05, -3.664754331111908e-05, -3.501027822494507e-05, -3.337301313877106e-05, -3.1735748052597046e-05, -3.0098482966423035e-05, -2.8461217880249023e-05, -2.6823952794075012e-05, -2.5186687707901e-05, -2.354942262172699e-05, -2.191215753555298e-05, -2.0274892449378967e-05, -1.8637627363204956e-05, -1.7000362277030945e-05, -1.5363097190856934e-05, -1.3725832104682922e-05, -1.2088567018508911e-05, -1.04513019323349e-05, -8.814036846160889e-06, -7.1767717599868774e-06, -5.539506673812866e-06, -3.902241587638855e-06, -2.2649765014648438e-06, -6.277114152908325e-07, 1.0095536708831787e-06, 2.64681875705719e-06, 4.284083843231201e-06, 5.921348929405212e-06, 7.558614015579224e-06, 9.195879101753235e-06, 1.0833144187927246e-05, 1.2470409274101257e-05, 1.4107674360275269e-05, 1.574493944644928e-05, 1.738220453262329e-05, 1.9019469618797302e-05, 2.0656734704971313e-05, 2.2293999791145325e-05, 2.3931264877319336e-05, 2.5568529963493347e-05, 2.720579504966736e-05, 2.884306013584137e-05, 3.048032522201538e-05, 3.211759030818939e-05, 3.37548553943634e-05, 3.5392120480537415e-05, 3.7029385566711426e-05, 3.866665065288544e-05, 4.030391573905945e-05, 4.194118082523346e-05, 4.357844591140747e-05, 4.521571099758148e-05, 4.685297608375549e-05, 4.8490241169929504e-05, 5.0127506256103516e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 4.0, 10.0, 9.0, 10.0, 15.0, 30.0, 43.0, 72.0, 102.0, 140.0, 237.0, 310.0, 541.0, 765.0, 1091.0, 1704.0, 2643.0, 3897.0, 6134.0, 9281.0, 14347.0, 22249.0, 37046.0, 59850.0, 106360.0, 182853.0, 235029.0, 149170.0, 82442.0, 49410.0, 29272.0, 18682.0, 11984.0, 7793.0, 5071.0, 3326.0, 2164.0, 1509.0, 1008.0, 700.0, 422.0, 271.0, 195.0, 142.0, 68.0, 59.0, 39.0, 20.0, 15.0, 15.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.863210678100586e-05, -8.579995483160019e-05, -8.296780288219452e-05, -8.013565093278885e-05, -7.730349898338318e-05, -7.447134703397751e-05, -7.163919508457184e-05, -6.880704313516617e-05, -6.59748911857605e-05, -6.314273923635483e-05, -6.031058728694916e-05, -5.747843533754349e-05, -5.464628338813782e-05, -5.181413143873215e-05, -4.898197948932648e-05, -4.614982753992081e-05, -4.331767559051514e-05, -4.0485523641109467e-05, -3.7653371691703796e-05, -3.4821219742298126e-05, -3.1989067792892456e-05, -2.9156915843486786e-05, -2.6324763894081116e-05, -2.3492611944675446e-05, -2.0660459995269775e-05, -1.7828308045864105e-05, -1.4996156096458435e-05, -1.2164004147052765e-05, -9.331852197647095e-06, -6.4997002482414246e-06, -3.6675482988357544e-06, -8.353963494300842e-07, 1.996755599975586e-06, 4.828907549381256e-06, 7.661059498786926e-06, 1.0493211448192596e-05, 1.3325363397598267e-05, 1.6157515347003937e-05, 1.8989667296409607e-05, 2.1821819245815277e-05, 2.4653971195220947e-05, 2.7486123144626617e-05, 3.0318275094032288e-05, 3.315042704343796e-05, 3.598257899284363e-05, 3.88147309422493e-05, 4.164688289165497e-05, 4.447903484106064e-05, 4.731118679046631e-05, 5.014333873987198e-05, 5.297549068927765e-05, 5.580764263868332e-05, 5.863979458808899e-05, 6.147194653749466e-05, 6.430409848690033e-05, 6.7136250436306e-05, 6.996840238571167e-05, 7.280055433511734e-05, 7.563270628452301e-05, 7.846485823392868e-05, 8.129701018333435e-05, 8.412916213274002e-05, 8.696131408214569e-05, 8.979346603155136e-05, 9.262561798095703e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 7.0, 3.0, 2.0, 6.0, 7.0, 4.0, 5.0, 12.0, 12.0, 12.0, 13.0, 18.0, 27.0, 32.0, 20.0, 19.0, 32.0, 43.0, 43.0, 30.0, 35.0, 39.0, 52.0, 40.0, 37.0, 32.0, 44.0, 40.0, 43.0, 33.0, 30.0, 33.0, 35.0, 25.0, 26.0, 11.0, 22.0, 22.0, 13.0, 16.0, 7.0, 5.0, 5.0, 6.0, 7.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.2842159271240234e-05, -3.184843808412552e-05, -3.08547168970108e-05, -2.9860995709896088e-05, -2.8867274522781372e-05, -2.7873553335666656e-05, -2.687983214855194e-05, -2.5886110961437225e-05, -2.489238977432251e-05, -2.3898668587207794e-05, -2.290494740009308e-05, -2.1911226212978363e-05, -2.0917505025863647e-05, -1.9923783838748932e-05, -1.8930062651634216e-05, -1.79363414645195e-05, -1.6942620277404785e-05, -1.594889909029007e-05, -1.4955177903175354e-05, -1.3961456716060638e-05, -1.2967735528945923e-05, -1.1974014341831207e-05, -1.0980293154716492e-05, -9.986571967601776e-06, -8.99285078048706e-06, -7.999129593372345e-06, -7.005408406257629e-06, -6.011687219142914e-06, -5.017966032028198e-06, -4.024244844913483e-06, -3.030523657798767e-06, -2.0368024706840515e-06, -1.043081283569336e-06, -4.936009645462036e-08, 9.443610906600952e-07, 1.938082277774811e-06, 2.9318034648895264e-06, 3.925524652004242e-06, 4.9192458391189575e-06, 5.912967026233673e-06, 6.906688213348389e-06, 7.900409400463104e-06, 8.89413058757782e-06, 9.887851774692535e-06, 1.0881572961807251e-05, 1.1875294148921967e-05, 1.2869015336036682e-05, 1.3862736523151398e-05, 1.4856457710266113e-05, 1.585017889738083e-05, 1.6843900084495544e-05, 1.783762127161026e-05, 1.8831342458724976e-05, 1.982506364583969e-05, 2.0818784832954407e-05, 2.1812506020069122e-05, 2.2806227207183838e-05, 2.3799948394298553e-05, 2.479366958141327e-05, 2.5787390768527985e-05, 2.67811119556427e-05, 2.7774833142757416e-05, 2.876855432987213e-05, 2.9762275516986847e-05, 3.075599670410156e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 13.0, 6.0, 32.0, 23.0, 38.0, 46.0, 70.0, 115.0, 156.0, 225.0, 354.0, 506.0, 852.0, 1288.0, 2085.0, 3055.0, 4721.0, 8105.0, 13746.0, 24863.0, 48599.0, 711188.0, 134144.0, 42081.0, 21303.0, 11486.0, 7130.0, 4346.0, 2857.0, 1774.0, 1117.0, 774.0, 472.0, 318.0, 192.0, 141.0, 99.0, 73.0, 49.0, 23.0, 31.0, 16.0, 15.0, 5.0, 10.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.464387893676758e-05, -4.328601062297821e-05, -4.192814230918884e-05, -4.0570273995399475e-05, -3.921240568161011e-05, -3.785453736782074e-05, -3.649666905403137e-05, -3.5138800740242004e-05, -3.378093242645264e-05, -3.242306411266327e-05, -3.10651957988739e-05, -2.9707327485084534e-05, -2.8349459171295166e-05, -2.69915908575058e-05, -2.563372254371643e-05, -2.4275854229927063e-05, -2.2917985916137695e-05, -2.1560117602348328e-05, -2.020224928855896e-05, -1.8844380974769592e-05, -1.7486512660980225e-05, -1.6128644347190857e-05, -1.477077603340149e-05, -1.3412907719612122e-05, -1.2055039405822754e-05, -1.0697171092033386e-05, -9.339302778244019e-06, -7.981434464454651e-06, -6.623566150665283e-06, -5.2656978368759155e-06, -3.907829523086548e-06, -2.54996120929718e-06, -1.1920928955078125e-06, 1.6577541828155518e-07, 1.5236437320709229e-06, 2.8815120458602905e-06, 4.239380359649658e-06, 5.597248673439026e-06, 6.9551169872283936e-06, 8.312985301017761e-06, 9.670853614807129e-06, 1.1028721928596497e-05, 1.2386590242385864e-05, 1.3744458556175232e-05, 1.51023268699646e-05, 1.6460195183753967e-05, 1.7818063497543335e-05, 1.9175931811332703e-05, 2.053380012512207e-05, 2.1891668438911438e-05, 2.3249536752700806e-05, 2.4607405066490173e-05, 2.596527338027954e-05, 2.732314169406891e-05, 2.8681010007858276e-05, 3.0038878321647644e-05, 3.139674663543701e-05, 3.275461494922638e-05, 3.411248326301575e-05, 3.5470351576805115e-05, 3.682821989059448e-05, 3.818608820438385e-05, 3.954395651817322e-05, 4.0901824831962585e-05, 4.225969314575195e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 0.0, 0.0, 9.0, 0.0, 7.0, 0.0, 0.0, 22.0, 0.0, 0.0, 25.0, 0.0, 23.0, 0.0, 0.0, 73.0, 0.0, 92.0, 0.0, 0.0, 485.0, 0.0, 101.0, 0.0, 0.0, 69.0, 0.0, 43.0, 0.0, 0.0, 31.0, 0.0, 0.0, 14.0, 0.0, 7.0, 0.0, 0.0, 6.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.748603820800781e-07, -7.515773177146912e-07, -7.282942533493042e-07, -7.050111889839172e-07, -6.817281246185303e-07, -6.584450602531433e-07, -6.351619958877563e-07, -6.118789315223694e-07, -5.885958671569824e-07, -5.653128027915955e-07, -5.420297384262085e-07, -5.187466740608215e-07, -4.954636096954346e-07, -4.721805453300476e-07, -4.4889748096466064e-07, -4.256144165992737e-07, -4.023313522338867e-07, -3.7904828786849976e-07, -3.557652235031128e-07, -3.3248215913772583e-07, -3.0919909477233887e-07, -2.859160304069519e-07, -2.6263296604156494e-07, -2.39349901676178e-07, -2.1606683731079102e-07, -1.9278377294540405e-07, -1.695007085800171e-07, -1.4621764421463013e-07, -1.2293457984924316e-07, -9.96515154838562e-08, -7.636845111846924e-08, -5.3085386753082275e-08, -2.9802322387695312e-08, -6.51925802230835e-09, 1.6763806343078613e-08, 4.0046870708465576e-08, 6.332993507385254e-08, 8.66129994392395e-08, 1.0989606380462646e-07, 1.3317912817001343e-07, 1.564621925354004e-07, 1.7974525690078735e-07, 2.0302832126617432e-07, 2.2631138563156128e-07, 2.4959444999694824e-07, 2.728775143623352e-07, 2.9616057872772217e-07, 3.1944364309310913e-07, 3.427267074584961e-07, 3.6600977182388306e-07, 3.8929283618927e-07, 4.12575900554657e-07, 4.3585896492004395e-07, 4.591420292854309e-07, 4.824250936508179e-07, 5.057081580162048e-07, 5.289912223815918e-07, 5.522742867469788e-07, 5.755573511123657e-07, 5.988404154777527e-07, 6.221234798431396e-07, 6.454065442085266e-07, 6.686896085739136e-07, 6.919726729393005e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 10.0, 8.0, 10.0, 18.0, 27.0, 42.0, 51.0, 63.0, 98.0, 135.0, 180.0, 320.0, 440.0, 650.0, 1000.0, 1440.0, 2268.0, 3511.0, 5626.0, 9367.0, 14119.0, 25005.0, 40645.0, 102077.0, 717289.0, 49802.0, 28595.0, 17105.0, 10552.0, 6228.0, 4089.0, 2712.0, 1698.0, 1083.0, 676.0, 507.0, 348.0, 223.0, 163.0, 109.0, 79.0, 45.0, 46.0, 33.0, 16.0, 15.0, 10.0, 8.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.060434341430664e-05, -4.903040826320648e-05, -4.745647311210632e-05, -4.5882537961006165e-05, -4.4308602809906006e-05, -4.273466765880585e-05, -4.116073250770569e-05, -3.958679735660553e-05, -3.801286220550537e-05, -3.643892705440521e-05, -3.4864991903305054e-05, -3.3291056752204895e-05, -3.1717121601104736e-05, -3.0143186450004578e-05, -2.856925129890442e-05, -2.699531614780426e-05, -2.54213809967041e-05, -2.3847445845603943e-05, -2.2273510694503784e-05, -2.0699575543403625e-05, -1.9125640392303467e-05, -1.7551705241203308e-05, -1.597777009010315e-05, -1.440383493900299e-05, -1.2829899787902832e-05, -1.1255964636802673e-05, -9.682029485702515e-06, -8.108094334602356e-06, -6.534159183502197e-06, -4.9602240324020386e-06, -3.38628888130188e-06, -1.8123537302017212e-06, -2.384185791015625e-07, 1.3355165719985962e-06, 2.909451723098755e-06, 4.4833868741989136e-06, 6.057322025299072e-06, 7.631257176399231e-06, 9.20519232749939e-06, 1.0779127478599548e-05, 1.2353062629699707e-05, 1.3926997780799866e-05, 1.5500932931900024e-05, 1.7074868083000183e-05, 1.8648803234100342e-05, 2.02227383852005e-05, 2.179667353630066e-05, 2.3370608687400818e-05, 2.4944543838500977e-05, 2.6518478989601135e-05, 2.8092414140701294e-05, 2.9666349291801453e-05, 3.124028444290161e-05, 3.281421959400177e-05, 3.438815474510193e-05, 3.596208989620209e-05, 3.7536025047302246e-05, 3.9109960198402405e-05, 4.0683895349502563e-05, 4.225783050060272e-05, 4.383176565170288e-05, 4.540570080280304e-05, 4.69796359539032e-05, 4.855357110500336e-05, 5.0127506256103516e-05]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 7.0, 5.0, 5.0, 7.0, 13.0, 12.0, 21.0, 14.0, 11.0, 11.0, 21.0, 17.0, 29.0, 501.0, 119.0, 20.0, 25.0, 15.0, 22.0, 20.0, 15.0, 11.0, 13.0, 13.0, 11.0, 7.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5914440155029297e-05, -1.54152512550354e-05, -1.4916062355041504e-05, -1.4416873455047607e-05, -1.3917684555053711e-05, -1.3418495655059814e-05, -1.2919306755065918e-05, -1.2420117855072021e-05, -1.1920928955078125e-05, -1.1421740055084229e-05, -1.0922551155090332e-05, -1.0423362255096436e-05, -9.924173355102539e-06, -9.424984455108643e-06, -8.925795555114746e-06, -8.42660665512085e-06, -7.927417755126953e-06, -7.428228855133057e-06, -6.92903995513916e-06, -6.429851055145264e-06, -5.930662155151367e-06, -5.431473255157471e-06, -4.932284355163574e-06, -4.433095455169678e-06, -3.933906555175781e-06, -3.4347176551818848e-06, -2.9355287551879883e-06, -2.436339855194092e-06, -1.9371509552001953e-06, -1.4379620552062988e-06, -9.387731552124023e-07, -4.3958425521850586e-07, 5.960464477539063e-08, 5.587935447692871e-07, 1.0579824447631836e-06, 1.55717134475708e-06, 2.0563602447509766e-06, 2.555549144744873e-06, 3.0547380447387695e-06, 3.553926944732666e-06, 4.0531158447265625e-06, 4.552304744720459e-06, 5.0514936447143555e-06, 5.550682544708252e-06, 6.0498714447021484e-06, 6.549060344696045e-06, 7.048249244689941e-06, 7.547438144683838e-06, 8.046627044677734e-06, 8.545815944671631e-06, 9.045004844665527e-06, 9.544193744659424e-06, 1.004338264465332e-05, 1.0542571544647217e-05, 1.1041760444641113e-05, 1.154094934463501e-05, 1.2040138244628906e-05, 1.2539327144622803e-05, 1.30385160446167e-05, 1.3537704944610596e-05, 1.4036893844604492e-05, 1.4536082744598389e-05, 1.5035271644592285e-05, 1.553446054458618e-05, 1.6033649444580078e-05]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 3.0, 8.0, 7.0, 9.0, 15.0, 10.0, 12.0, 34.0, 19.0, 45.0, 39.0, 51.0, 70.0, 93.0, 96.0, 103.0, 81.0, 62.0, 49.0, 34.0, 28.0, 24.0, 24.0, 11.0, 17.0, 8.0, 8.0, 3.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.371454557869583e-05, -7.13950939825736e-05, -6.907564238645136e-05, -6.675619079032913e-05, -6.44367391942069e-05, -6.211728032212704e-05, -5.979782872600481e-05, -5.7478377129882574e-05, -5.515892553376034e-05, -5.2839473937638104e-05, -5.052002234151587e-05, -4.820056710741483e-05, -4.588111551129259e-05, -4.356166391517036e-05, -4.1242208681069314e-05, -3.892275708494708e-05, -3.6603305488824844e-05, -3.428385389270261e-05, -3.1964402296580374e-05, -2.9644947062479332e-05, -2.7325495466357097e-05, -2.5006043870234862e-05, -2.2686590455123223e-05, -2.0367137040011585e-05, -1.804768544388935e-05, -1.5728233847767115e-05, -1.3408780432655476e-05, -1.108932792703854e-05, -8.769875421421602e-06, -6.4504229158046655e-06, -4.130970410187729e-06, -1.81151699507609e-06, 5.079418770037591e-07, 2.827394382620696e-06, 5.146846888237633e-06, 7.46629939385457e-06, 9.785751899471506e-06, 1.2105204405088443e-05, 1.442465691070538e-05, 1.674411032581702e-05, 1.9063561921939254e-05, 2.138301351806149e-05, 2.3702466933173127e-05, 2.6021920348284766e-05, 2.8341371944407e-05, 3.0660823540529236e-05, 3.298027877463028e-05, 3.5299730370752513e-05, 3.761918196687475e-05, 3.9938633562996984e-05, 4.225808515911922e-05, 4.457754039322026e-05, 4.6896991989342496e-05, 4.921644358546473e-05, 5.153589881956577e-05, 5.385535041568801e-05, 5.617480201181024e-05, 5.849425360793248e-05, 6.081370520405471e-05, 6.313315680017695e-05, 6.545260839629918e-05, 6.777206726837903e-05, 7.009151886450127e-05, 7.24109704606235e-05, 7.473042205674574e-05]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 6.0, 2.0, 7.0, 6.0, 11.0, 13.0, 23.0, 21.0, 19.0, 33.0, 35.0, 30.0, 36.0, 23.0, 38.0, 42.0, 50.0, 37.0, 43.0, 42.0, 39.0, 38.0, 36.0, 38.0, 43.0, 34.0, 42.0, 39.0, 29.0, 22.0, 18.0, 22.0, 14.0, 13.0, 12.0, 9.0, 6.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.786535646417178e-05, -4.6159148041624576e-05, -4.445293961907737e-05, -4.274673119653016e-05, -4.104052277398296e-05, -3.933431435143575e-05, -3.762810956686735e-05, -3.592189750634134e-05, -3.421569272177294e-05, -3.250948429922573e-05, -3.0803275876678526e-05, -2.909706745413132e-05, -2.7390859031584114e-05, -2.5684650609036908e-05, -2.3978444005479105e-05, -2.22722355829319e-05, -2.056602534139529e-05, -1.8859816918848082e-05, -1.7153608496300876e-05, -1.544740007375367e-05, -1.3741192560701165e-05, -1.2034984138153959e-05, -1.0328776625101455e-05, -8.622568202554248e-06, -6.916359780007042e-06, -5.210151357459836e-06, -3.5039433896599803e-06, -1.797735421860125e-06, -9.152699931291863e-08, 1.6146814232342876e-06, 3.320888936286792e-06, 5.0270973588339984e-06, 6.733302143402398e-06, 8.439510565949604e-06, 1.014571898849681e-05, 1.1851926501549315e-05, 1.3558134924096521e-05, 1.526434425613843e-05, 1.6970550859696232e-05, 1.8676759282243438e-05, 2.0382967704790644e-05, 2.208917612733785e-05, 2.3795384549885057e-05, 2.550159115344286e-05, 2.7207799575990066e-05, 2.8914007998537272e-05, 3.062021642108448e-05, 3.2326424843631685e-05, 3.403263326617889e-05, 3.57388416887261e-05, 3.7445050111273304e-05, 3.915125853382051e-05, 4.0857466956367716e-05, 4.256367537891492e-05, 4.426988016348332e-05, 4.5976092224009335e-05, 4.7682297008577734e-05, 4.938850543112494e-05, 5.109471385367215e-05, 5.280092227621935e-05, 5.450713069876656e-05, 5.6213339121313766e-05, 5.791954754386097e-05, 5.962575232842937e-05, 6.133196438895538e-05]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 9.0, 24.0, 18.0, 41.0, 51.0, 68.0, 81.0, 97.0, 158.0, 204.0, 261.0, 362.0, 529.0, 716.0, 922.0, 1235.0, 1695.0, 2557.0, 3385.0, 4839.0, 7377.0, 10520.0, 15529.0, 24669.0, 37985.0, 61462.0, 105845.0, 207905.0, 467538.0, 1224320.0, 1150603.0, 415739.0, 188022.0, 99411.0, 58874.0, 34422.0, 21937.0, 14667.0, 9325.0, 6327.0, 4373.0, 2979.0, 1992.0, 1501.0, 1051.0, 720.0, 580.0, 412.0, 250.0, 219.0, 165.0, 90.0, 82.0, 50.0, 42.0, 20.0, 14.0, 15.0, 3.0, 5.0, 2.0], "bins": [-5.751848220825195e-05, -5.577225238084793e-05, -5.402602255344391e-05, -5.2279792726039886e-05, -5.0533562898635864e-05, -4.878733307123184e-05, -4.704110324382782e-05, -4.52948734164238e-05, -4.3548643589019775e-05, -4.180241376161575e-05, -4.005618393421173e-05, -3.830995410680771e-05, -3.6563724279403687e-05, -3.4817494451999664e-05, -3.307126462459564e-05, -3.132503479719162e-05, -2.9578804969787598e-05, -2.7832575142383575e-05, -2.6086345314979553e-05, -2.434011548757553e-05, -2.259388566017151e-05, -2.0847655832767487e-05, -1.9101426005363464e-05, -1.7355196177959442e-05, -1.560896635055542e-05, -1.3862736523151398e-05, -1.2116506695747375e-05, -1.0370276868343353e-05, -8.624047040939331e-06, -6.877817213535309e-06, -5.131587386131287e-06, -3.3853575587272644e-06, -1.6391277313232422e-06, 1.0710209608078003e-07, 1.8533319234848022e-06, 3.5995617508888245e-06, 5.345791578292847e-06, 7.092021405696869e-06, 8.838251233100891e-06, 1.0584481060504913e-05, 1.2330710887908936e-05, 1.4076940715312958e-05, 1.582317054271698e-05, 1.7569400370121002e-05, 1.9315630197525024e-05, 2.1061860024929047e-05, 2.280808985233307e-05, 2.455431967973709e-05, 2.6300549507141113e-05, 2.8046779334545135e-05, 2.9793009161949158e-05, 3.153923898935318e-05, 3.32854688167572e-05, 3.5031698644161224e-05, 3.6777928471565247e-05, 3.852415829896927e-05, 4.027038812637329e-05, 4.201661795377731e-05, 4.3762847781181335e-05, 4.550907760858536e-05, 4.725530743598938e-05, 4.90015372633934e-05, 5.0747767090797424e-05, 5.2493996918201447e-05, 5.424022674560547e-05]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 2.0, 7.0, 8.0, 4.0, 3.0, 9.0, 7.0, 7.0, 13.0, 16.0, 14.0, 24.0, 28.0, 28.0, 26.0, 29.0, 29.0, 26.0, 38.0, 31.0, 45.0, 45.0, 22.0, 36.0, 38.0, 34.0, 41.0, 29.0, 35.0, 44.0, 30.0, 29.0, 30.0, 29.0, 21.0, 23.0, 20.0, 18.0, 9.0, 16.0, 12.0, 3.0, 10.0, 9.0, 9.0, 5.0, 0.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.8073787689208984e-05, -2.7192756533622742e-05, -2.63117253780365e-05, -2.5430694222450256e-05, -2.4549663066864014e-05, -2.366863191127777e-05, -2.278760075569153e-05, -2.1906569600105286e-05, -2.1025538444519043e-05, -2.01445072889328e-05, -1.9263476133346558e-05, -1.8382444977760315e-05, -1.7501413822174072e-05, -1.662038266658783e-05, -1.5739351511001587e-05, -1.4858320355415344e-05, -1.3977289199829102e-05, -1.3096258044242859e-05, -1.2215226888656616e-05, -1.1334195733070374e-05, -1.0453164577484131e-05, -9.572133421897888e-06, -8.691102266311646e-06, -7.810071110725403e-06, -6.92903995513916e-06, -6.0480087995529175e-06, -5.166977643966675e-06, -4.285946488380432e-06, -3.4049153327941895e-06, -2.5238841772079468e-06, -1.642853021621704e-06, -7.618218660354614e-07, 1.1920928955078125e-07, 1.000240445137024e-06, 1.8812716007232666e-06, 2.7623027563095093e-06, 3.643333911895752e-06, 4.524365067481995e-06, 5.405396223068237e-06, 6.28642737865448e-06, 7.167458534240723e-06, 8.048489689826965e-06, 8.929520845413208e-06, 9.81055200099945e-06, 1.0691583156585693e-05, 1.1572614312171936e-05, 1.2453645467758179e-05, 1.3334676623344421e-05, 1.4215707778930664e-05, 1.5096738934516907e-05, 1.597777009010315e-05, 1.6858801245689392e-05, 1.7739832401275635e-05, 1.8620863556861877e-05, 1.950189471244812e-05, 2.0382925868034363e-05, 2.1263957023620605e-05, 2.2144988179206848e-05, 2.302601933479309e-05, 2.3907050490379333e-05, 2.4788081645965576e-05, 2.566911280155182e-05, 2.655014395713806e-05, 2.7431175112724304e-05, 2.8312206268310547e-05]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 3.0, 11.0, 17.0, 21.0, 36.0, 50.0, 68.0, 108.0, 189.0, 275.0, 421.0, 730.0, 1099.0, 1604.0, 2620.0, 4056.0, 6557.0, 10616.0, 17910.0, 29770.0, 48684.0, 89235.0, 164465.0, 334428.0, 800351.0, 1402656.0, 657052.0, 279523.0, 147266.0, 80268.0, 45636.0, 26638.0, 15846.0, 9657.0, 5971.0, 3821.0, 2405.0, 1498.0, 958.0, 621.0, 394.0, 261.0, 178.0, 104.0, 66.0, 61.0, 31.0, 18.0, 11.0, 12.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.745887756347656e-05, -5.5738724768161774e-05, -5.4018571972846985e-05, -5.2298419177532196e-05, -5.057826638221741e-05, -4.885811358690262e-05, -4.713796079158783e-05, -4.541780799627304e-05, -4.369765520095825e-05, -4.197750240564346e-05, -4.0257349610328674e-05, -3.8537196815013885e-05, -3.68170440196991e-05, -3.509689122438431e-05, -3.337673842906952e-05, -3.165658563375473e-05, -2.993643283843994e-05, -2.8216280043125153e-05, -2.6496127247810364e-05, -2.4775974452495575e-05, -2.3055821657180786e-05, -2.1335668861865997e-05, -1.961551606655121e-05, -1.789536327123642e-05, -1.617521047592163e-05, -1.4455057680606842e-05, -1.2734904885292053e-05, -1.1014752089977264e-05, -9.294599294662476e-06, -7.574446499347687e-06, -5.854293704032898e-06, -4.134140908718109e-06, -2.4139881134033203e-06, -6.938353180885315e-07, 1.0263174772262573e-06, 2.746470272541046e-06, 4.466623067855835e-06, 6.186775863170624e-06, 7.906928658485413e-06, 9.627081453800201e-06, 1.134723424911499e-05, 1.3067387044429779e-05, 1.4787539839744568e-05, 1.6507692635059357e-05, 1.8227845430374146e-05, 1.9947998225688934e-05, 2.1668151021003723e-05, 2.3388303816318512e-05, 2.51084566116333e-05, 2.682860940694809e-05, 2.854876220226288e-05, 3.0268914997577667e-05, 3.1989067792892456e-05, 3.3709220588207245e-05, 3.5429373383522034e-05, 3.714952617883682e-05, 3.886967897415161e-05, 4.05898317694664e-05, 4.230998456478119e-05, 4.403013736009598e-05, 4.5750290155410767e-05, 4.7470442950725555e-05, 4.9190595746040344e-05, 5.091074854135513e-05, 5.263090133666992e-05]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 8.0, 10.0, 2.0, 17.0, 8.0, 7.0, 27.0, 30.0, 26.0, 39.0, 47.0, 55.0, 75.0, 115.0, 115.0, 128.0, 137.0, 201.0, 206.0, 235.0, 276.0, 268.0, 283.0, 238.0, 224.0, 213.0, 207.0, 157.0, 131.0, 112.0, 86.0, 69.0, 70.0, 47.0, 26.0, 43.0, 32.0, 23.0, 18.0, 17.0, 17.0, 10.0, 6.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.537799835205078e-05, -1.484900712966919e-05, -1.4320015907287598e-05, -1.3791024684906006e-05, -1.3262033462524414e-05, -1.2733042240142822e-05, -1.220405101776123e-05, -1.1675059795379639e-05, -1.1146068572998047e-05, -1.0617077350616455e-05, -1.0088086128234863e-05, -9.559094905853271e-06, -9.03010368347168e-06, -8.501112461090088e-06, -7.972121238708496e-06, -7.443130016326904e-06, -6.9141387939453125e-06, -6.385147571563721e-06, -5.856156349182129e-06, -5.327165126800537e-06, -4.798173904418945e-06, -4.2691826820373535e-06, -3.7401914596557617e-06, -3.21120023727417e-06, -2.682209014892578e-06, -2.1532177925109863e-06, -1.6242265701293945e-06, -1.0952353477478027e-06, -5.662441253662109e-07, -3.725290298461914e-08, 4.917383193969727e-07, 1.0207295417785645e-06, 1.5497207641601562e-06, 2.078711986541748e-06, 2.60770320892334e-06, 3.1366944313049316e-06, 3.6656856536865234e-06, 4.194676876068115e-06, 4.723668098449707e-06, 5.252659320831299e-06, 5.781650543212891e-06, 6.310641765594482e-06, 6.839632987976074e-06, 7.368624210357666e-06, 7.897615432739258e-06, 8.42660665512085e-06, 8.955597877502441e-06, 9.484589099884033e-06, 1.0013580322265625e-05, 1.0542571544647217e-05, 1.1071562767028809e-05, 1.16005539894104e-05, 1.2129545211791992e-05, 1.2658536434173584e-05, 1.3187527656555176e-05, 1.3716518878936768e-05, 1.424551010131836e-05, 1.4774501323699951e-05, 1.5303492546081543e-05, 1.5832483768463135e-05, 1.6361474990844727e-05, 1.689046621322632e-05, 1.741945743560791e-05, 1.7948448657989502e-05, 1.8477439880371094e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 7.0, 10.0, 9.0, 9.0, 21.0, 28.0, 24.0, 31.0, 38.0, 63.0, 73.0, 82.0, 115.0, 84.0, 83.0, 66.0, 55.0, 36.0, 36.0, 32.0, 16.0, 6.0, 10.0, 11.0, 6.0, 15.0, 7.0, 2.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.281666381051764e-05, -5.1207873184466735e-05, -4.959908619639464e-05, -4.799029557034373e-05, -4.638150494429283e-05, -4.4772714318241924e-05, -4.316392733016983e-05, -4.155513670411892e-05, -3.994634607806802e-05, -3.8337555452017114e-05, -3.6728768463945016e-05, -3.511997783789411e-05, -3.351118721184321e-05, -3.19023965857923e-05, -3.0293609597720206e-05, -2.86848189716693e-05, -2.70760301646078e-05, -2.54672413575463e-05, -2.3858450731495395e-05, -2.2249661924433894e-05, -2.064087129838299e-05, -1.903208249132149e-05, -1.7423291865270585e-05, -1.5814503058209084e-05, -1.4205713341652881e-05, -1.2596923625096679e-05, -1.0988133908540476e-05, -9.379344191984273e-06, -7.770555384922773e-06, -6.16176566836657e-06, -4.552975951810367e-06, -2.9441862352541648e-06, -1.3353965186979622e-06, 2.7339308417140273e-07, 1.8821826870407676e-06, 3.490972176223295e-06, 5.0997618927794974e-06, 6.708551154588349e-06, 8.317340871144552e-06, 9.926130587700754e-06, 1.1534920304256957e-05, 1.314371002081316e-05, 1.4752499737369362e-05, 1.6361289453925565e-05, 1.7970078260987066e-05, 1.9578867068048567e-05, 2.118765769409947e-05, 2.2796448320150375e-05, 2.4405237127211876e-05, 2.6014025934273377e-05, 2.762281656032428e-05, 2.9231605367385782e-05, 3.084039417444728e-05, 3.244918480049819e-05, 3.405797542654909e-05, 3.5666766052599996e-05, 3.7275553040672094e-05, 3.8884343666723e-05, 4.0493130654795095e-05, 4.2101921280846e-05, 4.3710711906896904e-05, 4.531950253294781e-05, 4.6928289521019906e-05, 4.853708014707081e-05, 5.0145870773121715e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 12.0, 11.0, 20.0, 14.0, 16.0, 22.0, 22.0, 31.0, 38.0, 30.0, 34.0, 39.0, 36.0, 44.0, 44.0, 54.0, 40.0, 41.0, 45.0, 46.0, 37.0, 41.0, 30.0, 34.0, 40.0, 32.0, 28.0, 18.0, 23.0, 15.0, 13.0, 11.0, 5.0, 8.0, 3.0, 9.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.7627090932801366e-05, -3.642652518465184e-05, -3.52259557985235e-05, -3.402539005037397e-05, -3.2824820664245635e-05, -3.1624254916096106e-05, -3.0423689167946577e-05, -2.9223121600807644e-05, -2.8022554033668712e-05, -2.682198646652978e-05, -2.5621418899390846e-05, -2.4420853151241317e-05, -2.3220285584102385e-05, -2.2019718016963452e-05, -2.0819152268813923e-05, -1.961858470167499e-05, -1.8418017134536058e-05, -1.7217449567397125e-05, -1.6016882000258192e-05, -1.4816316252108663e-05, -1.361574868496973e-05, -1.2415181117830798e-05, -1.1214614460186567e-05, -1.0014047802542336e-05, -8.813480235403404e-06, -7.612913123011822e-06, -6.41234601062024e-06, -5.211778898228658e-06, -4.011211785837077e-06, -2.810644673445495e-06, -1.610077561053913e-06, -4.095109034096822e-07, 7.910603017080575e-07, 1.9916274140996393e-06, 3.192194526491221e-06, 4.392761638882803e-06, 5.5933287512743846e-06, 6.793895863665966e-06, 7.994462976057548e-06, 9.195029633701779e-06, 1.0395597200840712e-05, 1.1596164767979644e-05, 1.2796731425623875e-05, 1.3997298083268106e-05, 1.5197865650407039e-05, 1.639843321754597e-05, 1.75989989656955e-05, 1.8799566532834433e-05, 2.0000134099973366e-05, 2.12007016671123e-05, 2.240126923425123e-05, 2.360183498240076e-05, 2.4802402549539693e-05, 2.6002970116678625e-05, 2.7203535864828154e-05, 2.8404103431967087e-05, 2.960467099910602e-05, 3.080523674725555e-05, 3.2005806133383885e-05, 3.3206371881533414e-05, 3.440694126766175e-05, 3.560750701581128e-05, 3.680807276396081e-05, 3.8008642150089145e-05, 3.9209207898238674e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 12.0, 16.0, 20.0, 27.0, 43.0, 73.0, 121.0, 182.0, 270.0, 428.0, 590.0, 1006.0, 1523.0, 2489.0, 3773.0, 5954.0, 9899.0, 15412.0, 24616.0, 42086.0, 65961.0, 108068.0, 168712.0, 209830.0, 147233.0, 91476.0, 57446.0, 34031.0, 21123.0, 13127.0, 8579.0, 5238.0, 3263.0, 2133.0, 1360.0, 866.0, 589.0, 314.0, 239.0, 135.0, 83.0, 71.0, 38.0, 37.0, 13.0, 16.0, 10.0, 9.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.392862319946289e-05, -4.248041659593582e-05, -4.103220999240875e-05, -3.958400338888168e-05, -3.8135796785354614e-05, -3.6687590181827545e-05, -3.5239383578300476e-05, -3.379117697477341e-05, -3.234297037124634e-05, -3.089476376771927e-05, -2.94465571641922e-05, -2.799835056066513e-05, -2.655014395713806e-05, -2.5101937353610992e-05, -2.3653730750083923e-05, -2.2205524146556854e-05, -2.0757317543029785e-05, -1.9309110939502716e-05, -1.7860904335975647e-05, -1.6412697732448578e-05, -1.4964491128921509e-05, -1.351628452539444e-05, -1.206807792186737e-05, -1.0619871318340302e-05, -9.171664714813232e-06, -7.723458111286163e-06, -6.275251507759094e-06, -4.827044904232025e-06, -3.378838300704956e-06, -1.930631697177887e-06, -4.824250936508179e-07, 9.657815098762512e-07, 2.4139881134033203e-06, 3.862194716930389e-06, 5.3104013204574585e-06, 6.758607923984528e-06, 8.206814527511597e-06, 9.655021131038666e-06, 1.1103227734565735e-05, 1.2551434338092804e-05, 1.3999640941619873e-05, 1.5447847545146942e-05, 1.689605414867401e-05, 1.834426075220108e-05, 1.979246735572815e-05, 2.124067395925522e-05, 2.2688880562782288e-05, 2.4137087166309357e-05, 2.5585293769836426e-05, 2.7033500373363495e-05, 2.8481706976890564e-05, 2.9929913580417633e-05, 3.13781201839447e-05, 3.282632678747177e-05, 3.427453339099884e-05, 3.572273999452591e-05, 3.717094659805298e-05, 3.861915320158005e-05, 4.006735980510712e-05, 4.1515566408634186e-05, 4.2963773012161255e-05, 4.4411979615688324e-05, 4.586018621921539e-05, 4.730839282274246e-05, 4.875659942626953e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 8.0, 10.0, 12.0, 9.0, 18.0, 22.0, 7.0, 28.0, 31.0, 39.0, 33.0, 39.0, 35.0, 33.0, 45.0, 53.0, 46.0, 46.0, 41.0, 37.0, 49.0, 34.0, 45.0, 36.0, 34.0, 43.0, 31.0, 30.0, 20.0, 16.0, 15.0, 11.0, 16.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.272294998168945e-05, -3.168173134326935e-05, -3.064051270484924e-05, -2.9599294066429138e-05, -2.8558075428009033e-05, -2.7516856789588928e-05, -2.6475638151168823e-05, -2.5434419512748718e-05, -2.4393200874328613e-05, -2.3351982235908508e-05, -2.2310763597488403e-05, -2.12695449590683e-05, -2.0228326320648193e-05, -1.918710768222809e-05, -1.8145889043807983e-05, -1.710467040538788e-05, -1.6063451766967773e-05, -1.5022233128547668e-05, -1.3981014490127563e-05, -1.2939795851707458e-05, -1.1898577213287354e-05, -1.0857358574867249e-05, -9.816139936447144e-06, -8.774921298027039e-06, -7.733702659606934e-06, -6.692484021186829e-06, -5.651265382766724e-06, -4.610046744346619e-06, -3.5688281059265137e-06, -2.5276094675064087e-06, -1.4863908290863037e-06, -4.4517219066619873e-07, 5.960464477539062e-07, 1.6372650861740112e-06, 2.678483724594116e-06, 3.719702363014221e-06, 4.760921001434326e-06, 5.802139639854431e-06, 6.843358278274536e-06, 7.884576916694641e-06, 8.925795555114746e-06, 9.967014193534851e-06, 1.1008232831954956e-05, 1.2049451470375061e-05, 1.3090670108795166e-05, 1.4131888747215271e-05, 1.5173107385635376e-05, 1.621432602405548e-05, 1.7255544662475586e-05, 1.829676330089569e-05, 1.9337981939315796e-05, 2.03792005777359e-05, 2.1420419216156006e-05, 2.246163785457611e-05, 2.3502856492996216e-05, 2.454407513141632e-05, 2.5585293769836426e-05, 2.662651240825653e-05, 2.7667731046676636e-05, 2.870894968509674e-05, 2.9750168323516846e-05, 3.079138696193695e-05, 3.1832605600357056e-05, 3.287382423877716e-05, 3.3915042877197266e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 2.0, 7.0, 9.0, 8.0, 14.0, 29.0, 44.0, 62.0, 81.0, 147.0, 263.0, 397.0, 647.0, 946.0, 1464.0, 2497.0, 4007.0, 6966.0, 12780.0, 28314.0, 92998.0, 506871.0, 287918.0, 56366.0, 20995.0, 10301.0, 5530.0, 3342.0, 2023.0, 1292.0, 832.0, 514.0, 302.0, 210.0, 147.0, 89.0, 48.0, 35.0, 25.0, 7.0, 9.0, 6.0, 2.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.456541061401367e-05, -7.197819650173187e-05, -6.939098238945007e-05, -6.680376827716827e-05, -6.421655416488647e-05, -6.162934005260468e-05, -5.9042125940322876e-05, -5.645491182804108e-05, -5.386769771575928e-05, -5.128048360347748e-05, -4.869326949119568e-05, -4.610605537891388e-05, -4.351884126663208e-05, -4.093162715435028e-05, -3.834441304206848e-05, -3.575719892978668e-05, -3.316998481750488e-05, -3.0582770705223083e-05, -2.7995556592941284e-05, -2.5408342480659485e-05, -2.2821128368377686e-05, -2.0233914256095886e-05, -1.7646700143814087e-05, -1.5059486031532288e-05, -1.2472271919250488e-05, -9.885057806968689e-06, -7.29784369468689e-06, -4.71062958240509e-06, -2.123415470123291e-06, 4.637986421585083e-07, 3.0510127544403076e-06, 5.638226866722107e-06, 8.225440979003906e-06, 1.0812655091285706e-05, 1.3399869203567505e-05, 1.5987083315849304e-05, 1.8574297428131104e-05, 2.1161511540412903e-05, 2.3748725652694702e-05, 2.63359397649765e-05, 2.89231538772583e-05, 3.15103679895401e-05, 3.40975821018219e-05, 3.66847962141037e-05, 3.92720103263855e-05, 4.18592244386673e-05, 4.44464385509491e-05, 4.7033652663230896e-05, 4.9620866775512695e-05, 5.2208080887794495e-05, 5.4795295000076294e-05, 5.738250911235809e-05, 5.996972322463989e-05, 6.255693733692169e-05, 6.514415144920349e-05, 6.773136556148529e-05, 7.031857967376709e-05, 7.290579378604889e-05, 7.549300789833069e-05, 7.808022201061249e-05, 8.066743612289429e-05, 8.325465023517609e-05, 8.584186434745789e-05, 8.842907845973969e-05, 9.101629257202148e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 9.0, 4.0, 7.0, 7.0, 10.0, 6.0, 7.0, 7.0, 15.0, 18.0, 20.0, 19.0, 26.0, 29.0, 39.0, 50.0, 32.0, 40.0, 36.0, 45.0, 37.0, 48.0, 34.0, 54.0, 37.0, 32.0, 34.0, 37.0, 31.0, 26.0, 31.0, 17.0, 23.0, 20.0, 19.0, 17.0, 11.0, 6.0, 11.0, 6.0, 12.0, 6.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-1.6868114471435547e-05, -1.6351230442523956e-05, -1.5834346413612366e-05, -1.5317462384700775e-05, -1.4800578355789185e-05, -1.4283694326877594e-05, -1.3766810297966003e-05, -1.3249926269054413e-05, -1.2733042240142822e-05, -1.2216158211231232e-05, -1.1699274182319641e-05, -1.118239015340805e-05, -1.066550612449646e-05, -1.014862209558487e-05, -9.631738066673279e-06, -9.114854037761688e-06, -8.597970008850098e-06, -8.081085979938507e-06, -7.5642019510269165e-06, -7.047317922115326e-06, -6.530433893203735e-06, -6.013549864292145e-06, -5.496665835380554e-06, -4.979781806468964e-06, -4.462897777557373e-06, -3.9460137486457825e-06, -3.429129719734192e-06, -2.9122456908226013e-06, -2.3953616619110107e-06, -1.8784776329994202e-06, -1.3615936040878296e-06, -8.44709575176239e-07, -3.2782554626464844e-07, 1.8905848264694214e-07, 7.059425115585327e-07, 1.2228265404701233e-06, 1.7397105693817139e-06, 2.2565945982933044e-06, 2.773478627204895e-06, 3.2903626561164856e-06, 3.807246685028076e-06, 4.324130713939667e-06, 4.841014742851257e-06, 5.357898771762848e-06, 5.8747828006744385e-06, 6.391666829586029e-06, 6.90855085849762e-06, 7.42543488740921e-06, 7.9423189163208e-06, 8.459202945232391e-06, 8.976086974143982e-06, 9.492971003055573e-06, 1.0009855031967163e-05, 1.0526739060878754e-05, 1.1043623089790344e-05, 1.1560507118701935e-05, 1.2077391147613525e-05, 1.2594275176525116e-05, 1.3111159205436707e-05, 1.3628043234348297e-05, 1.4144927263259888e-05, 1.4661811292171478e-05, 1.5178695321083069e-05, 1.569557934999466e-05, 1.621246337890625e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 4.0, 3.0, 9.0, 14.0, 13.0, 31.0, 37.0, 52.0, 78.0, 82.0, 154.0, 200.0, 308.0, 536.0, 866.0, 1361.0, 2396.0, 4256.0, 10062.0, 26558.0, 148652.0, 728765.0, 85305.0, 21789.0, 7699.0, 3875.0, 2068.0, 1251.0, 733.0, 474.0, 282.0, 206.0, 121.0, 91.0, 70.0, 53.0, 48.0, 17.0, 8.0, 13.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.8967857360839844e-05, -2.8044916689395905e-05, -2.7121976017951965e-05, -2.6199035346508026e-05, -2.5276094675064087e-05, -2.4353154003620148e-05, -2.343021333217621e-05, -2.250727266073227e-05, -2.158433198928833e-05, -2.066139131784439e-05, -1.973845064640045e-05, -1.8815509974956512e-05, -1.7892569303512573e-05, -1.6969628632068634e-05, -1.6046687960624695e-05, -1.5123747289180756e-05, -1.4200806617736816e-05, -1.3277865946292877e-05, -1.2354925274848938e-05, -1.1431984603404999e-05, -1.050904393196106e-05, -9.58610326051712e-06, -8.663162589073181e-06, -7.740221917629242e-06, -6.817281246185303e-06, -5.8943405747413635e-06, -4.971399903297424e-06, -4.048459231853485e-06, -3.125518560409546e-06, -2.2025778889656067e-06, -1.2796372175216675e-06, -3.5669654607772827e-07, 5.662441253662109e-07, 1.4891847968101501e-06, 2.4121254682540894e-06, 3.3350661396980286e-06, 4.258006811141968e-06, 5.180947482585907e-06, 6.103888154029846e-06, 7.026828825473785e-06, 7.949769496917725e-06, 8.872710168361664e-06, 9.795650839805603e-06, 1.0718591511249542e-05, 1.1641532182693481e-05, 1.256447285413742e-05, 1.348741352558136e-05, 1.4410354197025299e-05, 1.5333294868469238e-05, 1.6256235539913177e-05, 1.7179176211357117e-05, 1.8102116882801056e-05, 1.9025057554244995e-05, 1.9947998225688934e-05, 2.0870938897132874e-05, 2.1793879568576813e-05, 2.2716820240020752e-05, 2.363976091146469e-05, 2.456270158290863e-05, 2.548564225435257e-05, 2.640858292579651e-05, 2.7331523597240448e-05, 2.8254464268684387e-05, 2.9177404940128326e-05, 3.0100345611572266e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 3.0, 2.0, 10.0, 3.0, 10.0, 10.0, 29.0, 17.0, 33.0, 19.0, 67.0, 29.0, 74.0, 72.0, 155.0, 73.0, 116.0, 38.0, 68.0, 30.0, 62.0, 17.0, 21.0, 21.0, 5.0, 7.0, 5.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.9206275939941406e-06, -2.8312206268310547e-06, -2.7418136596679688e-06, -2.652406692504883e-06, -2.562999725341797e-06, -2.473592758178711e-06, -2.384185791015625e-06, -2.294778823852539e-06, -2.205371856689453e-06, -2.115964889526367e-06, -2.0265579223632812e-06, -1.9371509552001953e-06, -1.8477439880371094e-06, -1.7583370208740234e-06, -1.6689300537109375e-06, -1.5795230865478516e-06, -1.4901161193847656e-06, -1.4007091522216797e-06, -1.3113021850585938e-06, -1.2218952178955078e-06, -1.1324882507324219e-06, -1.043081283569336e-06, -9.5367431640625e-07, -8.642673492431641e-07, -7.748603820800781e-07, -6.854534149169922e-07, -5.960464477539062e-07, -5.066394805908203e-07, -4.172325134277344e-07, -3.2782554626464844e-07, -2.384185791015625e-07, -1.4901161193847656e-07, -5.960464477539063e-08, 2.9802322387695312e-08, 1.1920928955078125e-07, 2.086162567138672e-07, 2.980232238769531e-07, 3.8743019104003906e-07, 4.76837158203125e-07, 5.662441253662109e-07, 6.556510925292969e-07, 7.450580596923828e-07, 8.344650268554688e-07, 9.238719940185547e-07, 1.0132789611816406e-06, 1.1026859283447266e-06, 1.1920928955078125e-06, 1.2814998626708984e-06, 1.3709068298339844e-06, 1.4603137969970703e-06, 1.5497207641601562e-06, 1.6391277313232422e-06, 1.7285346984863281e-06, 1.817941665649414e-06, 1.9073486328125e-06, 1.996755599975586e-06, 2.086162567138672e-06, 2.175569534301758e-06, 2.2649765014648438e-06, 2.3543834686279297e-06, 2.4437904357910156e-06, 2.5331974029541016e-06, 2.6226043701171875e-06, 2.7120113372802734e-06, 2.8014183044433594e-06]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 4.0, 7.0, 9.0, 10.0, 15.0, 22.0, 24.0, 39.0, 62.0, 87.0, 132.0, 247.0, 352.0, 605.0, 1076.0, 2051.0, 4169.0, 9269.0, 18968.0, 59388.0, 235265.0, 516556.0, 134443.0, 36034.0, 16070.0, 6664.0, 3072.0, 1574.0, 905.0, 474.0, 333.0, 227.0, 122.0, 92.0, 49.0, 22.0, 27.0, 24.0, 7.0, 9.0, 8.0, 2.0, 2.0, 6.0, 5.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.5079975128173828e-05, -1.4613382518291473e-05, -1.4146789908409119e-05, -1.3680197298526764e-05, -1.321360468864441e-05, -1.2747012078762054e-05, -1.22804194688797e-05, -1.1813826858997345e-05, -1.134723424911499e-05, -1.0880641639232635e-05, -1.041404902935028e-05, -9.947456419467926e-06, -9.480863809585571e-06, -9.014271199703217e-06, -8.547678589820862e-06, -8.081085979938507e-06, -7.614493370056152e-06, -7.147900760173798e-06, -6.681308150291443e-06, -6.214715540409088e-06, -5.748122930526733e-06, -5.281530320644379e-06, -4.814937710762024e-06, -4.348345100879669e-06, -3.8817524909973145e-06, -3.4151598811149597e-06, -2.948567271232605e-06, -2.4819746613502502e-06, -2.0153820514678955e-06, -1.5487894415855408e-06, -1.082196831703186e-06, -6.156042218208313e-07, -1.4901161193847656e-07, 3.175809979438782e-07, 7.841736078262329e-07, 1.2507662177085876e-06, 1.7173588275909424e-06, 2.183951437473297e-06, 2.650544047355652e-06, 3.1171366572380066e-06, 3.5837292671203613e-06, 4.050321877002716e-06, 4.516914486885071e-06, 4.9835070967674255e-06, 5.45009970664978e-06, 5.916692316532135e-06, 6.38328492641449e-06, 6.8498775362968445e-06, 7.316470146179199e-06, 7.783062756061554e-06, 8.249655365943909e-06, 8.716247975826263e-06, 9.182840585708618e-06, 9.649433195590973e-06, 1.0116025805473328e-05, 1.0582618415355682e-05, 1.1049211025238037e-05, 1.1515803635120392e-05, 1.1982396245002747e-05, 1.2448988854885101e-05, 1.2915581464767456e-05, 1.338217407464981e-05, 1.3848766684532166e-05, 1.431535929441452e-05, 1.4781951904296875e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 3.0, 6.0, 13.0, 8.0, 9.0, 18.0, 40.0, 53.0, 47.0, 72.0, 80.0, 94.0, 87.0, 130.0, 84.0, 71.0, 58.0, 32.0, 20.0, 20.0, 21.0, 6.0, 8.0, 5.0, 4.0, 7.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4570693969726562e-06, -3.3294782042503357e-06, -3.201887011528015e-06, -3.0742958188056946e-06, -2.946704626083374e-06, -2.8191134333610535e-06, -2.691522240638733e-06, -2.5639310479164124e-06, -2.436339855194092e-06, -2.3087486624717712e-06, -2.1811574697494507e-06, -2.05356627702713e-06, -1.9259750843048096e-06, -1.798383891582489e-06, -1.6707926988601685e-06, -1.543201506137848e-06, -1.4156103134155273e-06, -1.2880191206932068e-06, -1.1604279279708862e-06, -1.0328367352485657e-06, -9.052455425262451e-07, -7.776543498039246e-07, -6.50063157081604e-07, -5.224719643592834e-07, -3.948807716369629e-07, -2.6728957891464233e-07, -1.3969838619232178e-07, -1.210719347000122e-08, 1.1548399925231934e-07, 2.430751919746399e-07, 3.7066638469696045e-07, 4.98257577419281e-07, 6.258487701416016e-07, 7.534399628639221e-07, 8.810311555862427e-07, 1.0086223483085632e-06, 1.1362135410308838e-06, 1.2638047337532043e-06, 1.391395926475525e-06, 1.5189871191978455e-06, 1.646578311920166e-06, 1.7741695046424866e-06, 1.9017606973648071e-06, 2.0293518900871277e-06, 2.1569430828094482e-06, 2.284534275531769e-06, 2.4121254682540894e-06, 2.53971666097641e-06, 2.6673078536987305e-06, 2.794899046421051e-06, 2.9224902391433716e-06, 3.050081431865692e-06, 3.1776726245880127e-06, 3.3052638173103333e-06, 3.432855010032654e-06, 3.5604462027549744e-06, 3.688037395477295e-06, 3.8156285881996155e-06, 3.943219780921936e-06, 4.070810973644257e-06, 4.198402166366577e-06, 4.325993359088898e-06, 4.453584551811218e-06, 4.581175744533539e-06, 4.708766937255859e-06]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 15.0, 6.0, 9.0, 17.0, 21.0, 17.0, 38.0, 54.0, 55.0, 76.0, 106.0, 121.0, 110.0, 85.0, 58.0, 52.0, 28.0, 29.0, 31.0, 14.0, 6.0, 11.0, 5.0, 10.0, 6.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.824843199457973e-05, -4.671978240367025e-05, -4.519113281276077e-05, -4.366248322185129e-05, -4.213383363094181e-05, -4.060518404003233e-05, -3.9076534449122846e-05, -3.7547884858213365e-05, -3.6019235267303884e-05, -3.44905856763944e-05, -3.296193608548492e-05, -3.143328649457544e-05, -2.990463690366596e-05, -2.837598731275648e-05, -2.6847335902857594e-05, -2.5318686311948113e-05, -2.379003490204923e-05, -2.2261385311139748e-05, -2.0732735720230266e-05, -1.9204086129320785e-05, -1.7675436538411304e-05, -1.6146786947501823e-05, -1.4618135537602939e-05, -1.3089485946693458e-05, -1.1560836355783977e-05, -1.0032186764874496e-05, -8.503537173965015e-06, -6.974886673560832e-06, -5.446237082651351e-06, -3.91758749174187e-06, -2.3889369913376868e-06, -8.602874004282057e-07, 6.683621904812753e-07, 2.197012008764432e-06, 3.7256618270475883e-06, 5.25431187270442e-06, 6.782961463613901e-06, 8.311611054523382e-06, 9.840261554927565e-06, 1.1368911145837046e-05, 1.2897560736746527e-05, 1.4426210327656008e-05, 1.595485991856549e-05, 1.7483511328464374e-05, 1.9012160919373855e-05, 2.0540810510283336e-05, 2.2069460101192817e-05, 2.3598109692102298e-05, 2.512675928301178e-05, 2.665540887392126e-05, 2.818405846483074e-05, 2.9712708055740222e-05, 3.12413576466497e-05, 3.2770007237559184e-05, 3.429866046644747e-05, 3.5827310057356954e-05, 3.7355959648266435e-05, 3.8884609239175916e-05, 4.04132588300854e-05, 4.194190842099488e-05, 4.347055801190436e-05, 4.499920760281384e-05, 4.652785719372332e-05, 4.80565067846328e-05, 4.958515637554228e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 0.0, 5.0, 7.0, 6.0, 11.0, 15.0, 18.0, 17.0, 21.0, 19.0, 23.0, 32.0, 37.0, 37.0, 31.0, 36.0, 48.0, 37.0, 49.0, 50.0, 45.0, 43.0, 46.0, 35.0, 39.0, 34.0, 48.0, 30.0, 36.0, 30.0, 26.0, 19.0, 14.0, 16.0, 8.0, 10.0, 6.0, 9.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.128805474261753e-05, -3.0275081371655688e-05, -2.9262109819683246e-05, -2.82491364487214e-05, -2.723616489674896e-05, -2.6223191525787115e-05, -2.521021815482527e-05, -2.419724660285283e-05, -2.3184275050880387e-05, -2.2171301679918543e-05, -2.11583301279461e-05, -2.0145356756984256e-05, -1.9132385205011815e-05, -1.811941183404997e-05, -1.7106438463088125e-05, -1.6093466911115684e-05, -1.5080493540153839e-05, -1.4067521078686696e-05, -1.3054548617219552e-05, -1.2041575246257707e-05, -1.1028603694285266e-05, -1.0015630323323421e-05, -9.002657861856278e-06, -7.989685400389135e-06, -6.976712938921992e-06, -5.963740477454849e-06, -4.9507680159877054e-06, -3.937795099773211e-06, -2.9248226383060683e-06, -1.911850176838925e-06, -8.988772606244311e-07, 1.1409520084271207e-07, 1.1270676623098552e-06, 2.1400401237769984e-06, 3.153012812617817e-06, 4.1659855014586356e-06, 5.178957962925779e-06, 6.191930424392922e-06, 7.204903340607416e-06, 8.217875802074559e-06, 9.230848263541702e-06, 1.0243820725008845e-05, 1.1256793186475988e-05, 1.2269765647943132e-05, 1.3282739018904977e-05, 1.4295710570877418e-05, 1.5308683941839263e-05, 1.6321657312801108e-05, 1.733462886477355e-05, 1.8347602235735394e-05, 1.9360573787707835e-05, 2.037354715866968e-05, 2.1386518710642122e-05, 2.2399492081603967e-05, 2.3412463633576408e-05, 2.4425437004538253e-05, 2.5438410375500098e-05, 2.6451383746461943e-05, 2.7464355298434384e-05, 2.847732866939623e-05, 2.949030022136867e-05, 3.0503273592330515e-05, 3.151624696329236e-05, 3.2529220334254205e-05, 3.354219006723724e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 3.0, 9.0, 4.0, 6.0, 7.0, 21.0, 23.0, 36.0, 79.0, 106.0, 142.0, 239.0, 324.0, 499.0, 772.0, 1155.0, 1590.0, 2363.0, 3610.0, 5724.0, 8588.0, 14238.0, 23511.0, 38211.0, 69388.0, 124405.0, 234629.0, 223908.0, 127781.0, 67965.0, 37351.0, 23263.0, 13361.0, 8697.0, 5618.0, 3545.0, 2470.0, 1565.0, 1095.0, 723.0, 495.0, 342.0, 236.0, 153.0, 116.0, 70.0, 46.0, 30.0, 21.0, 13.0, 8.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9114227294921875e-05, -4.752911627292633e-05, -4.5944005250930786e-05, -4.435889422893524e-05, -4.27737832069397e-05, -4.118867218494415e-05, -3.960356116294861e-05, -3.8018450140953064e-05, -3.643333911895752e-05, -3.4848228096961975e-05, -3.326311707496643e-05, -3.1678006052970886e-05, -3.0092895030975342e-05, -2.8507784008979797e-05, -2.6922672986984253e-05, -2.533756196498871e-05, -2.3752450942993164e-05, -2.216733992099762e-05, -2.0582228899002075e-05, -1.899711787700653e-05, -1.7412006855010986e-05, -1.5826895833015442e-05, -1.4241784811019897e-05, -1.2656673789024353e-05, -1.1071562767028809e-05, -9.486451745033264e-06, -7.90134072303772e-06, -6.316229701042175e-06, -4.731118679046631e-06, -3.1460076570510864e-06, -1.560896635055542e-06, 2.421438694000244e-08, 1.6093254089355469e-06, 3.1944364309310913e-06, 4.779547452926636e-06, 6.36465847492218e-06, 7.949769496917725e-06, 9.534880518913269e-06, 1.1119991540908813e-05, 1.2705102562904358e-05, 1.4290213584899902e-05, 1.5875324606895447e-05, 1.746043562889099e-05, 1.9045546650886536e-05, 2.063065767288208e-05, 2.2215768694877625e-05, 2.380087971687317e-05, 2.5385990738868713e-05, 2.6971101760864258e-05, 2.8556212782859802e-05, 3.0141323804855347e-05, 3.172643482685089e-05, 3.3311545848846436e-05, 3.489665687084198e-05, 3.6481767892837524e-05, 3.806687891483307e-05, 3.965198993682861e-05, 4.123710095882416e-05, 4.28222119808197e-05, 4.4407323002815247e-05, 4.599243402481079e-05, 4.7577545046806335e-05, 4.916265606880188e-05, 5.0747767090797424e-05, 5.233287811279297e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 6.0, 2.0, 1.0, 4.0, 4.0, 2.0, 7.0, 8.0, 9.0, 9.0, 10.0, 19.0, 14.0, 12.0, 27.0, 20.0, 30.0, 25.0, 31.0, 42.0, 42.0, 30.0, 33.0, 43.0, 43.0, 53.0, 40.0, 40.0, 46.0, 26.0, 50.0, 30.0, 30.0, 38.0, 25.0, 33.0, 25.0, 22.0, 15.0, 17.0, 8.0, 9.0, 10.0, 8.0, 6.0, 1.0, 8.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.187490463256836e-05, -2.105720341205597e-05, -2.023950219154358e-05, -1.942180097103119e-05, -1.86040997505188e-05, -1.778639853000641e-05, -1.696869730949402e-05, -1.615099608898163e-05, -1.5333294868469238e-05, -1.4515593647956848e-05, -1.3697892427444458e-05, -1.2880191206932068e-05, -1.2062489986419678e-05, -1.1244788765907288e-05, -1.0427087545394897e-05, -9.609386324882507e-06, -8.791685104370117e-06, -7.973983883857727e-06, -7.156282663345337e-06, -6.338581442832947e-06, -5.520880222320557e-06, -4.7031790018081665e-06, -3.885477781295776e-06, -3.0677765607833862e-06, -2.250075340270996e-06, -1.432374119758606e-06, -6.146728992462158e-07, 2.0302832126617432e-07, 1.0207295417785645e-06, 1.8384307622909546e-06, 2.6561319828033447e-06, 3.473833203315735e-06, 4.291534423828125e-06, 5.109235644340515e-06, 5.926936864852905e-06, 6.744638085365295e-06, 7.5623393058776855e-06, 8.380040526390076e-06, 9.197741746902466e-06, 1.0015442967414856e-05, 1.0833144187927246e-05, 1.1650845408439636e-05, 1.2468546628952026e-05, 1.3286247849464417e-05, 1.4103949069976807e-05, 1.4921650290489197e-05, 1.5739351511001587e-05, 1.6557052731513977e-05, 1.7374753952026367e-05, 1.8192455172538757e-05, 1.9010156393051147e-05, 1.9827857613563538e-05, 2.0645558834075928e-05, 2.1463260054588318e-05, 2.2280961275100708e-05, 2.3098662495613098e-05, 2.3916363716125488e-05, 2.473406493663788e-05, 2.555176615715027e-05, 2.636946737766266e-05, 2.718716859817505e-05, 2.800486981868744e-05, 2.882257103919983e-05, 2.964027225971222e-05, 3.045797348022461e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 5.0, 9.0, 15.0, 21.0, 22.0, 42.0, 55.0, 88.0, 97.0, 122.0, 210.0, 320.0, 439.0, 630.0, 943.0, 1267.0, 1813.0, 2661.0, 3934.0, 5955.0, 8855.0, 13833.0, 21776.0, 35961.0, 60551.0, 105699.0, 184174.0, 214663.0, 154649.0, 90221.0, 52445.0, 31033.0, 19047.0, 12083.0, 7858.0, 5354.0, 3569.0, 2397.0, 1732.0, 1177.0, 870.0, 566.0, 440.0, 289.0, 195.0, 158.0, 91.0, 67.0, 45.0, 36.0, 23.0, 21.0, 10.0, 6.0, 5.0, 6.0, 7.0, 3.0], "bins": [-4.38690185546875e-05, -4.2553991079330444e-05, -4.123896360397339e-05, -3.992393612861633e-05, -3.860890865325928e-05, -3.729388117790222e-05, -3.5978853702545166e-05, -3.466382622718811e-05, -3.3348798751831055e-05, -3.2033771276474e-05, -3.071874380111694e-05, -2.9403716325759888e-05, -2.8088688850402832e-05, -2.6773661375045776e-05, -2.545863389968872e-05, -2.4143606424331665e-05, -2.282857894897461e-05, -2.1513551473617554e-05, -2.0198523998260498e-05, -1.8883496522903442e-05, -1.7568469047546387e-05, -1.625344157218933e-05, -1.4938414096832275e-05, -1.362338662147522e-05, -1.2308359146118164e-05, -1.0993331670761108e-05, -9.678304195404053e-06, -8.363276720046997e-06, -7.048249244689941e-06, -5.733221769332886e-06, -4.41819429397583e-06, -3.1031668186187744e-06, -1.7881393432617188e-06, -4.731118679046631e-07, 8.419156074523926e-07, 2.1569430828094482e-06, 3.471970558166504e-06, 4.7869980335235596e-06, 6.102025508880615e-06, 7.417052984237671e-06, 8.732080459594727e-06, 1.0047107934951782e-05, 1.1362135410308838e-05, 1.2677162885665894e-05, 1.399219036102295e-05, 1.5307217836380005e-05, 1.662224531173706e-05, 1.7937272787094116e-05, 1.9252300262451172e-05, 2.0567327737808228e-05, 2.1882355213165283e-05, 2.319738268852234e-05, 2.4512410163879395e-05, 2.582743763923645e-05, 2.7142465114593506e-05, 2.845749258995056e-05, 2.9772520065307617e-05, 3.108754754066467e-05, 3.240257501602173e-05, 3.3717602491378784e-05, 3.503262996673584e-05, 3.6347657442092896e-05, 3.766268491744995e-05, 3.897771239280701e-05, 4.029273986816406e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 7.0, 12.0, 9.0, 10.0, 9.0, 18.0, 14.0, 21.0, 32.0, 26.0, 40.0, 29.0, 45.0, 50.0, 42.0, 39.0, 38.0, 43.0, 51.0, 46.0, 43.0, 37.0, 33.0, 39.0, 35.0, 36.0, 26.0, 29.0, 23.0, 15.0, 15.0, 18.0, 11.0, 20.0, 10.0, 9.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8537044525146484e-05, -1.7977319657802582e-05, -1.741759479045868e-05, -1.6857869923114777e-05, -1.6298145055770874e-05, -1.573842018842697e-05, -1.5178695321083069e-05, -1.4618970453739166e-05, -1.4059245586395264e-05, -1.3499520719051361e-05, -1.2939795851707458e-05, -1.2380070984363556e-05, -1.1820346117019653e-05, -1.126062124967575e-05, -1.0700896382331848e-05, -1.0141171514987946e-05, -9.581446647644043e-06, -9.02172178030014e-06, -8.461996912956238e-06, -7.902272045612335e-06, -7.342547178268433e-06, -6.78282231092453e-06, -6.2230974435806274e-06, -5.663372576236725e-06, -5.103647708892822e-06, -4.54392284154892e-06, -3.984197974205017e-06, -3.4244731068611145e-06, -2.864748239517212e-06, -2.3050233721733093e-06, -1.7452985048294067e-06, -1.1855736374855042e-06, -6.258487701416016e-07, -6.612390279769897e-08, 4.936009645462036e-07, 1.0533258318901062e-06, 1.6130506992340088e-06, 2.1727755665779114e-06, 2.732500433921814e-06, 3.2922253012657166e-06, 3.851950168609619e-06, 4.411675035953522e-06, 4.971399903297424e-06, 5.531124770641327e-06, 6.0908496379852295e-06, 6.650574505329132e-06, 7.210299372673035e-06, 7.770024240016937e-06, 8.32974910736084e-06, 8.889473974704742e-06, 9.449198842048645e-06, 1.0008923709392548e-05, 1.056864857673645e-05, 1.1128373444080353e-05, 1.1688098311424255e-05, 1.2247823178768158e-05, 1.280754804611206e-05, 1.3367272913455963e-05, 1.3926997780799866e-05, 1.4486722648143768e-05, 1.5046447515487671e-05, 1.5606172382831573e-05, 1.6165897250175476e-05, 1.672562211751938e-05, 1.728534698486328e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 13.0, 16.0, 25.0, 32.0, 52.0, 72.0, 80.0, 101.0, 115.0, 212.0, 274.0, 362.0, 538.0, 641.0, 914.0, 1216.0, 1669.0, 2295.0, 3594.0, 4890.0, 7220.0, 11399.0, 21261.0, 38268.0, 92675.0, 658884.0, 101729.0, 42761.0, 20046.0, 11962.0, 7578.0, 5306.0, 3431.0, 2451.0, 1631.0, 1326.0, 944.0, 692.0, 477.0, 374.0, 256.0, 203.0, 152.0, 119.0, 94.0, 56.0, 38.0, 39.0, 22.0, 16.0, 12.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0], "bins": [-2.372264862060547e-05, -2.299342304468155e-05, -2.226419746875763e-05, -2.153497189283371e-05, -2.080574631690979e-05, -2.007652074098587e-05, -1.934729516506195e-05, -1.861806958913803e-05, -1.788884401321411e-05, -1.715961843729019e-05, -1.6430392861366272e-05, -1.5701167285442352e-05, -1.4971941709518433e-05, -1.4242716133594513e-05, -1.3513490557670593e-05, -1.2784264981746674e-05, -1.2055039405822754e-05, -1.1325813829898834e-05, -1.0596588253974915e-05, -9.867362678050995e-06, -9.138137102127075e-06, -8.408911526203156e-06, -7.679685950279236e-06, -6.950460374355316e-06, -6.2212347984313965e-06, -5.492009222507477e-06, -4.762783646583557e-06, -4.0335580706596375e-06, -3.3043324947357178e-06, -2.575106918811798e-06, -1.8458813428878784e-06, -1.1166557669639587e-06, -3.8743019104003906e-07, 3.417953848838806e-07, 1.0710209608078003e-06, 1.80024653673172e-06, 2.5294721126556396e-06, 3.2586976885795593e-06, 3.987923264503479e-06, 4.717148840427399e-06, 5.446374416351318e-06, 6.175599992275238e-06, 6.904825568199158e-06, 7.634051144123077e-06, 8.363276720046997e-06, 9.092502295970917e-06, 9.821727871894836e-06, 1.0550953447818756e-05, 1.1280179023742676e-05, 1.2009404599666595e-05, 1.2738630175590515e-05, 1.3467855751514435e-05, 1.4197081327438354e-05, 1.4926306903362274e-05, 1.5655532479286194e-05, 1.6384758055210114e-05, 1.7113983631134033e-05, 1.7843209207057953e-05, 1.8572434782981873e-05, 1.9301660358905792e-05, 2.0030885934829712e-05, 2.076011151075363e-05, 2.148933708667755e-05, 2.221856266260147e-05, 2.294778823852539e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 40.0, 0.0, 0.0, 0.0, 0.0, 153.0, 0.0, 0.0, 0.0, 0.0, 587.0, 0.0, 0.0, 0.0, 133.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 11.0, 8.0, 12.0, 19.0, 27.0, 43.0, 70.0, 73.0, 120.0, 195.0, 234.0, 375.0, 512.0, 852.0, 1187.0, 1710.0, 2654.0, 3837.0, 6119.0, 9748.0, 16397.0, 34439.0, 86535.0, 710536.0, 91765.0, 34554.0, 18125.0, 9774.0, 6419.0, 3938.0, 2795.0, 1749.0, 1152.0, 795.0, 557.0, 407.0, 240.0, 161.0, 144.0, 83.0, 45.0, 47.0, 34.0, 20.0, 9.0, 10.0, 11.0, 2.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7670135498046875e-05, -3.639422357082367e-05, -3.5118311643600464e-05, -3.384239971637726e-05, -3.256648778915405e-05, -3.129057586193085e-05, -3.001466393470764e-05, -2.8738752007484436e-05, -2.746284008026123e-05, -2.6186928153038025e-05, -2.491101622581482e-05, -2.3635104298591614e-05, -2.2359192371368408e-05, -2.1083280444145203e-05, -1.9807368516921997e-05, -1.853145658969879e-05, -1.7255544662475586e-05, -1.597963273525238e-05, -1.4703720808029175e-05, -1.342780888080597e-05, -1.2151896953582764e-05, -1.0875985026359558e-05, -9.600073099136353e-06, -8.324161171913147e-06, -7.048249244689941e-06, -5.772337317466736e-06, -4.49642539024353e-06, -3.2205134630203247e-06, -1.944601535797119e-06, -6.686896085739136e-07, 6.07222318649292e-07, 1.8831342458724976e-06, 3.159046173095703e-06, 4.434958100318909e-06, 5.710870027542114e-06, 6.98678195476532e-06, 8.262693881988525e-06, 9.538605809211731e-06, 1.0814517736434937e-05, 1.2090429663658142e-05, 1.3366341590881348e-05, 1.4642253518104553e-05, 1.591816544532776e-05, 1.7194077372550964e-05, 1.846998929977417e-05, 1.9745901226997375e-05, 2.102181315422058e-05, 2.2297725081443787e-05, 2.3573637008666992e-05, 2.4849548935890198e-05, 2.6125460863113403e-05, 2.740137279033661e-05, 2.8677284717559814e-05, 2.995319664478302e-05, 3.1229108572006226e-05, 3.250502049922943e-05, 3.378093242645264e-05, 3.505684435367584e-05, 3.633275628089905e-05, 3.7608668208122253e-05, 3.888458013534546e-05, 4.0160492062568665e-05, 4.143640398979187e-05, 4.2712315917015076e-05, 4.398822784423828e-05]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 2.0, 3.0, 3.0, 3.0, 6.0, 6.0, 3.0, 9.0, 8.0, 22.0, 9.0, 22.0, 34.0, 38.0, 54.0, 119.0, 388.0, 60.0, 45.0, 39.0, 23.0, 16.0, 16.0, 13.0, 9.0, 7.0, 6.0, 7.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3828277587890625e-05, -1.3423152267932892e-05, -1.3018026947975159e-05, -1.2612901628017426e-05, -1.2207776308059692e-05, -1.180265098810196e-05, -1.1397525668144226e-05, -1.0992400348186493e-05, -1.058727502822876e-05, -1.0182149708271027e-05, -9.777024388313293e-06, -9.37189906835556e-06, -8.966773748397827e-06, -8.561648428440094e-06, -8.15652310848236e-06, -7.751397788524628e-06, -7.3462724685668945e-06, -6.941147148609161e-06, -6.536021828651428e-06, -6.130896508693695e-06, -5.725771188735962e-06, -5.320645868778229e-06, -4.915520548820496e-06, -4.5103952288627625e-06, -4.105269908905029e-06, -3.700144588947296e-06, -3.295019268989563e-06, -2.88989394903183e-06, -2.4847686290740967e-06, -2.0796433091163635e-06, -1.6745179891586304e-06, -1.2693926692008972e-06, -8.642673492431641e-07, -4.591420292854309e-07, -5.4016709327697754e-08, 3.511086106300354e-07, 7.562339305877686e-07, 1.1613592505455017e-06, 1.5664845705032349e-06, 1.971609890460968e-06, 2.376735210418701e-06, 2.7818605303764343e-06, 3.1869858503341675e-06, 3.5921111702919006e-06, 3.997236490249634e-06, 4.402361810207367e-06, 4.8074871301651e-06, 5.212612450122833e-06, 5.617737770080566e-06, 6.0228630900382996e-06, 6.427988409996033e-06, 6.833113729953766e-06, 7.238239049911499e-06, 7.643364369869232e-06, 8.048489689826965e-06, 8.453615009784698e-06, 8.858740329742432e-06, 9.263865649700165e-06, 9.668990969657898e-06, 1.0074116289615631e-05, 1.0479241609573364e-05, 1.0884366929531097e-05, 1.128949224948883e-05, 1.1694617569446564e-05, 1.2099742889404297e-05]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 7.0, 4.0, 9.0, 8.0, 15.0, 22.0, 17.0, 22.0, 31.0, 46.0, 62.0, 80.0, 109.0, 104.0, 98.0, 85.0, 67.0, 41.0, 26.0, 27.0, 15.0, 26.0, 17.0, 12.0, 11.0, 8.0, 6.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.858188938465901e-05, -3.728336378117092e-05, -3.598483817768283e-05, -3.4686312574194744e-05, -3.3387786970706657e-05, -3.208926136721857e-05, -3.0790732125751674e-05, -2.949220834125299e-05, -2.8193682737764902e-05, -2.6895157134276815e-05, -2.5596631530788727e-05, -2.4298104108311236e-05, -2.2999578504823148e-05, -2.170105290133506e-05, -2.0402527297846973e-05, -1.9104001694358885e-05, -1.7805476090870798e-05, -1.650695048738271e-05, -1.5208424883894622e-05, -1.3909898370911833e-05, -1.2611372767423745e-05, -1.1312847163935658e-05, -1.0014320650952868e-05, -8.71579504746478e-06, -7.417269443976693e-06, -6.118743840488605e-06, -4.820217782253167e-06, -3.521691724017728e-06, -2.2231661205296405e-06, -9.246405170415528e-07, 3.738859959412366e-07, 1.6724115994293243e-06, 2.970940840896219e-06, 4.269466444384307e-06, 5.567992502619745e-06, 6.866518560855184e-06, 8.165044164343271e-06, 9.463569767831359e-06, 1.0762096280814148e-05, 1.2060621884302236e-05, 1.3359147487790324e-05, 1.4657673091278411e-05, 1.59561986947665e-05, 1.725472611724399e-05, 1.8553251720732078e-05, 1.9851777324220166e-05, 2.1150302927708253e-05, 2.244882853119634e-05, 2.374735413468443e-05, 2.5045879738172516e-05, 2.6344405341660604e-05, 2.764293094514869e-05, 2.894145654863678e-05, 3.0239982152124867e-05, 3.153851139359176e-05, 3.283703699707985e-05, 3.413556260056794e-05, 3.5434088204056025e-05, 3.673261380754411e-05, 3.80311394110322e-05, 3.932966501452029e-05, 4.0628190618008375e-05, 4.192671622149646e-05, 4.322524182498455e-05, 4.452376742847264e-05]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 14.0, 18.0, 16.0, 15.0, 11.0, 16.0, 18.0, 29.0, 27.0, 31.0, 38.0, 41.0, 38.0, 37.0, 37.0, 49.0, 36.0, 45.0, 54.0, 41.0, 38.0, 41.0, 43.0, 38.0, 31.0, 32.0, 34.0, 28.0, 21.0, 19.0, 8.0, 21.0, 4.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.628840047691483e-05, -2.534960185585078e-05, -2.4410803234786727e-05, -2.347200279473327e-05, -2.253320417366922e-05, -2.1594405552605167e-05, -2.0655606931541115e-05, -1.9716808310477063e-05, -1.877800968941301e-05, -1.783921106834896e-05, -1.6900412447284907e-05, -1.5961613826220855e-05, -1.50228133861674e-05, -1.4084014765103348e-05, -1.3145216144039296e-05, -1.2206417522975244e-05, -1.1267617082921788e-05, -1.0328818461857736e-05, -9.390018931298982e-06, -8.45122031023493e-06, -7.5124212344235275e-06, -6.573622158612125e-06, -5.634823537548073e-06, -4.69602446173667e-06, -3.757225385925267e-06, -2.818426310113864e-06, -1.8796274616761366e-06, -9.408286132384092e-07, -2.0295374270062894e-09, 9.367695383843966e-07, 1.8755681594484486e-06, 2.8143672352598514e-06, 3.7531644920818508e-06, 4.691963567893254e-06, 5.6307626437046565e-06, 6.5695612647687085e-06, 7.508360340580111e-06, 8.447159416391514e-06, 9.385958037455566e-06, 1.0324756658519618e-05, 1.1263556189078372e-05, 1.2202354810142424e-05, 1.3141154340701178e-05, 1.407995296176523e-05, 1.5018751582829282e-05, 1.5957550203893334e-05, 1.6896348824957386e-05, 1.783514926501084e-05, 1.8773947886074893e-05, 1.9712746507138945e-05, 2.0651545128202997e-05, 2.1590345568256453e-05, 2.2529144189320505e-05, 2.3467942810384557e-05, 2.440674143144861e-05, 2.534554005251266e-05, 2.6284338673576713e-05, 2.7223137294640765e-05, 2.8161935915704817e-05, 2.910073453676887e-05, 3.0039534976822324e-05, 3.097833541687578e-05, 3.1917130399961025e-05, 3.2855932659003884e-05, 3.3794731280067936e-05]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 14.0, 25.0, 31.0, 65.0, 121.0, 182.0, 232.0, 425.0, 629.0, 883.0, 1377.0, 2153.0, 3554.0, 5777.0, 9184.0, 15144.0, 26534.0, 44451.0, 88216.0, 191944.0, 535385.0, 1719538.0, 988165.0, 288242.0, 124036.0, 62714.0, 34412.0, 19101.0, 11844.0, 7478.0, 4439.0, 2913.0, 1855.0, 1045.0, 690.0, 453.0, 309.0, 223.0, 138.0, 104.0, 68.0, 46.0, 27.0, 23.0, 19.0, 20.0, 11.0, 15.0, 16.0, 7.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.0517578125e-05, -2.933107316493988e-05, -2.814456820487976e-05, -2.695806324481964e-05, -2.577155828475952e-05, -2.4585053324699402e-05, -2.3398548364639282e-05, -2.2212043404579163e-05, -2.1025538444519043e-05, -1.9839033484458923e-05, -1.8652528524398804e-05, -1.7466023564338684e-05, -1.6279518604278564e-05, -1.5093013644218445e-05, -1.3906508684158325e-05, -1.2720003724098206e-05, -1.1533498764038086e-05, -1.0346993803977966e-05, -9.160488843917847e-06, -7.973983883857727e-06, -6.787478923797607e-06, -5.600973963737488e-06, -4.414469003677368e-06, -3.2279640436172485e-06, -2.041459083557129e-06, -8.549541234970093e-07, 3.3155083656311035e-07, 1.51805579662323e-06, 2.7045607566833496e-06, 3.891065716743469e-06, 5.077570676803589e-06, 6.2640756368637085e-06, 7.450580596923828e-06, 8.637085556983948e-06, 9.823590517044067e-06, 1.1010095477104187e-05, 1.2196600437164307e-05, 1.3383105397224426e-05, 1.4569610357284546e-05, 1.5756115317344666e-05, 1.6942620277404785e-05, 1.8129125237464905e-05, 1.9315630197525024e-05, 2.0502135157585144e-05, 2.1688640117645264e-05, 2.2875145077705383e-05, 2.4061650037765503e-05, 2.5248154997825623e-05, 2.6434659957885742e-05, 2.7621164917945862e-05, 2.880766987800598e-05, 2.99941748380661e-05, 3.118067979812622e-05, 3.236718475818634e-05, 3.355368971824646e-05, 3.474019467830658e-05, 3.59266996383667e-05, 3.711320459842682e-05, 3.829970955848694e-05, 3.948621451854706e-05, 4.067271947860718e-05, 4.18592244386673e-05, 4.304572939872742e-05, 4.423223435878754e-05, 4.5418739318847656e-05]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 13.0, 16.0, 12.0, 14.0, 14.0, 18.0, 23.0, 21.0, 37.0, 41.0, 33.0, 52.0, 51.0, 49.0, 44.0, 44.0, 38.0, 53.0, 46.0, 39.0, 39.0, 51.0, 38.0, 38.0, 43.0, 23.0, 30.0, 21.0, 12.0, 14.0, 11.0, 7.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5854835510253906e-05, -1.5251338481903076e-05, -1.4647841453552246e-05, -1.4044344425201416e-05, -1.3440847396850586e-05, -1.2837350368499756e-05, -1.2233853340148926e-05, -1.1630356311798096e-05, -1.1026859283447266e-05, -1.0423362255096436e-05, -9.819865226745605e-06, -9.216368198394775e-06, -8.612871170043945e-06, -8.009374141693115e-06, -7.405877113342285e-06, -6.802380084991455e-06, -6.198883056640625e-06, -5.595386028289795e-06, -4.991888999938965e-06, -4.388391971588135e-06, -3.7848949432373047e-06, -3.1813979148864746e-06, -2.5779008865356445e-06, -1.9744038581848145e-06, -1.3709068298339844e-06, -7.674098014831543e-07, -1.6391277313232422e-07, 4.3958425521850586e-07, 1.043081283569336e-06, 1.646578311920166e-06, 2.250075340270996e-06, 2.853572368621826e-06, 3.4570693969726562e-06, 4.060566425323486e-06, 4.664063453674316e-06, 5.2675604820251465e-06, 5.8710575103759766e-06, 6.474554538726807e-06, 7.078051567077637e-06, 7.681548595428467e-06, 8.285045623779297e-06, 8.888542652130127e-06, 9.492039680480957e-06, 1.0095536708831787e-05, 1.0699033737182617e-05, 1.1302530765533447e-05, 1.1906027793884277e-05, 1.2509524822235107e-05, 1.3113021850585938e-05, 1.3716518878936768e-05, 1.4320015907287598e-05, 1.4923512935638428e-05, 1.5527009963989258e-05, 1.6130506992340088e-05, 1.6734004020690918e-05, 1.7337501049041748e-05, 1.7940998077392578e-05, 1.8544495105743408e-05, 1.9147992134094238e-05, 1.975148916244507e-05, 2.03549861907959e-05, 2.095848321914673e-05, 2.156198024749756e-05, 2.216547727584839e-05, 2.276897430419922e-05]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 1.0, 0.0, 4.0, 5.0, 6.0, 18.0, 23.0, 35.0, 52.0, 71.0, 113.0, 188.0, 251.0, 353.0, 492.0, 733.0, 1033.0, 1804.0, 2688.0, 4237.0, 7439.0, 11706.0, 19524.0, 35878.0, 61995.0, 117496.0, 247413.0, 683074.0, 1573772.0, 806578.0, 317840.0, 135674.0, 69329.0, 37657.0, 22581.0, 12629.0, 7637.0, 5002.0, 2988.0, 2068.0, 1403.0, 851.0, 545.0, 367.0, 247.0, 163.0, 96.0, 55.0, 54.0, 37.0, 24.0, 30.0, 18.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.069639205932617e-05, -2.9725022614002228e-05, -2.8753653168678284e-05, -2.778228372335434e-05, -2.6810914278030396e-05, -2.583954483270645e-05, -2.4868175387382507e-05, -2.3896805942058563e-05, -2.292543649673462e-05, -2.1954067051410675e-05, -2.098269760608673e-05, -2.0011328160762787e-05, -1.9039958715438843e-05, -1.80685892701149e-05, -1.7097219824790955e-05, -1.612585037946701e-05, -1.5154480934143066e-05, -1.4183111488819122e-05, -1.3211742043495178e-05, -1.2240372598171234e-05, -1.126900315284729e-05, -1.0297633707523346e-05, -9.326264262199402e-06, -8.354894816875458e-06, -7.383525371551514e-06, -6.41215592622757e-06, -5.4407864809036255e-06, -4.469417035579681e-06, -3.4980475902557373e-06, -2.5266781449317932e-06, -1.5553086996078491e-06, -5.83939254283905e-07, 3.8743019104003906e-07, 1.3587996363639832e-06, 2.3301690816879272e-06, 3.3015385270118713e-06, 4.2729079723358154e-06, 5.2442774176597595e-06, 6.215646862983704e-06, 7.187016308307648e-06, 8.158385753631592e-06, 9.129755198955536e-06, 1.010112464427948e-05, 1.1072494089603424e-05, 1.2043863534927368e-05, 1.3015232980251312e-05, 1.3986602425575256e-05, 1.49579718708992e-05, 1.5929341316223145e-05, 1.690071076154709e-05, 1.7872080206871033e-05, 1.8843449652194977e-05, 1.981481909751892e-05, 2.0786188542842865e-05, 2.175755798816681e-05, 2.2728927433490753e-05, 2.3700296878814697e-05, 2.467166632413864e-05, 2.5643035769462585e-05, 2.661440521478653e-05, 2.7585774660110474e-05, 2.8557144105434418e-05, 2.9528513550758362e-05, 3.0499882996082306e-05, 3.147125244140625e-05]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 12.0, 6.0, 13.0, 19.0, 18.0, 16.0, 44.0, 35.0, 35.0, 65.0, 67.0, 81.0, 117.0, 125.0, 156.0, 196.0, 211.0, 218.0, 319.0, 295.0, 263.0, 276.0, 285.0, 181.0, 209.0, 157.0, 120.0, 118.0, 96.0, 48.0, 58.0, 37.0, 18.0, 34.0, 29.0, 10.0, 13.0, 14.0, 8.0, 5.0, 12.0, 4.0, 8.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-9.179115295410156e-06, -8.900649845600128e-06, -8.6221843957901e-06, -8.343718945980072e-06, -8.065253496170044e-06, -7.786788046360016e-06, -7.508322596549988e-06, -7.22985714673996e-06, -6.951391696929932e-06, -6.6729262471199036e-06, -6.3944607973098755e-06, -6.115995347499847e-06, -5.837529897689819e-06, -5.559064447879791e-06, -5.280598998069763e-06, -5.002133548259735e-06, -4.723668098449707e-06, -4.445202648639679e-06, -4.166737198829651e-06, -3.888271749019623e-06, -3.6098062992095947e-06, -3.3313408493995667e-06, -3.0528753995895386e-06, -2.7744099497795105e-06, -2.4959444999694824e-06, -2.2174790501594543e-06, -1.9390136003494263e-06, -1.6605481505393982e-06, -1.3820827007293701e-06, -1.103617250919342e-06, -8.25151801109314e-07, -5.466863512992859e-07, -2.682209014892578e-07, 1.0244548320770264e-08, 2.8870999813079834e-07, 5.671754479408264e-07, 8.456408977508545e-07, 1.1241063475608826e-06, 1.4025717973709106e-06, 1.6810372471809387e-06, 1.959502696990967e-06, 2.237968146800995e-06, 2.516433596611023e-06, 2.794899046421051e-06, 3.073364496231079e-06, 3.351829946041107e-06, 3.6302953958511353e-06, 3.908760845661163e-06, 4.187226295471191e-06, 4.4656917452812195e-06, 4.7441571950912476e-06, 5.022622644901276e-06, 5.301088094711304e-06, 5.579553544521332e-06, 5.85801899433136e-06, 6.136484444141388e-06, 6.414949893951416e-06, 6.693415343761444e-06, 6.971880793571472e-06, 7.2503462433815e-06, 7.528811693191528e-06, 7.807277143001556e-06, 8.085742592811584e-06, 8.364208042621613e-06, 8.64267349243164e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 5.0, 10.0, 7.0, 13.0, 15.0, 16.0, 28.0, 27.0, 41.0, 61.0, 85.0, 78.0, 119.0, 93.0, 93.0, 64.0, 48.0, 43.0, 22.0, 32.0, 22.0, 19.0, 16.0, 13.0, 9.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4628623577882536e-05, -2.3752902052365243e-05, -2.2877178707858548e-05, -2.2001457182341255e-05, -2.1125735656823963e-05, -2.0250012312317267e-05, -1.9374290786799975e-05, -1.8498569261282682e-05, -1.7622845916775987e-05, -1.6747124391258694e-05, -1.5871401046752e-05, -1.4995679521234706e-05, -1.4119957995717414e-05, -1.324423556070542e-05, -1.2368513125693426e-05, -1.1492791600176133e-05, -1.0617070074658841e-05, -9.741347639646847e-06, -8.865626114129554e-06, -7.98990367911756e-06, -7.114181698852917e-06, -6.238459718588274e-06, -5.36273728357628e-06, -4.487015303311637e-06, -3.6112933230469935e-06, -2.7355713427823503e-06, -1.8598491351440316e-06, -9.84126927505713e-07, -1.0840494724106975e-07, 7.673170330235735e-07, 1.6430394680355676e-06, 2.5187614483002108e-06, 3.3944852475542575e-06, 4.270207227818901e-06, 5.145929208083544e-06, 6.021651643095538e-06, 6.897373623360181e-06, 7.773095603624824e-06, 8.648818038636819e-06, 9.524539564154111e-06, 1.0400261999166105e-05, 1.1275984434178099e-05, 1.2151705959695391e-05, 1.3027428394707385e-05, 1.390315082971938e-05, 1.4778872355236672e-05, 1.5654593880753964e-05, 1.653031722526066e-05, 1.7406038750777952e-05, 1.8281760276295245e-05, 1.915748362080194e-05, 2.0033205146319233e-05, 2.0908926671836525e-05, 2.178465001634322e-05, 2.2660371541860513e-05, 2.3536093067377806e-05, 2.44118164118845e-05, 2.5287537937401794e-05, 2.616326128190849e-05, 2.7038982807425782e-05, 2.7914704332943074e-05, 2.8790425858460367e-05, 2.9666149202967063e-05, 3.054187254747376e-05, 3.141759225400165e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 9.0, 4.0, 7.0, 4.0, 12.0, 16.0, 12.0, 15.0, 28.0, 11.0, 26.0, 21.0, 26.0, 34.0, 33.0, 34.0, 45.0, 27.0, 39.0, 40.0, 33.0, 43.0, 47.0, 36.0, 37.0, 35.0, 31.0, 34.0, 43.0, 32.0, 28.0, 27.0, 26.0, 21.0, 18.0, 17.0, 8.0, 8.0, 10.0, 6.0, 9.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6537234841962345e-05, -1.5993147826520726e-05, -1.544906263006851e-05, -1.4904975614626892e-05, -1.4360889508679975e-05, -1.3816803402733058e-05, -1.3272716387291439e-05, -1.2728630281344522e-05, -1.2184544175397605e-05, -1.1640458069450688e-05, -1.109637196350377e-05, -1.0552284948062152e-05, -1.0008198842115235e-05, -9.464112736168317e-06, -8.920025720726699e-06, -8.375939614779782e-06, -7.831853508832864e-06, -7.287767402885947e-06, -6.743680842191679e-06, -6.1995942814974114e-06, -5.655508175550494e-06, -5.111422069603577e-06, -4.567335508909309e-06, -4.023248948215041e-06, -3.4791628422681242e-06, -2.9350765089475317e-06, -2.390990175626939e-06, -1.8469038423063466e-06, -1.302817508985754e-06, -7.587311756651616e-07, -2.1464484234456904e-07, 3.294414909760235e-07, 8.735296432860196e-07, 1.417615976606612e-06, 1.9617023099272046e-06, 2.505788643247797e-06, 3.0498749765683897e-06, 3.5939613098889822e-06, 4.138047643209575e-06, 4.682134203903843e-06, 5.22622030985076e-06, 5.770306415797677e-06, 6.314392976491945e-06, 6.858479537186213e-06, 7.40256564313313e-06, 7.946651749080047e-06, 8.490738764521666e-06, 9.034824870468583e-06, 9.5789109764155e-06, 1.0122997082362417e-05, 1.0667083188309334e-05, 1.1211170203750953e-05, 1.175525630969787e-05, 1.2299342415644787e-05, 1.2843429431086406e-05, 1.3387515537033323e-05, 1.393160164298024e-05, 1.4475687748927157e-05, 1.5019773854874074e-05, 1.5563860870315693e-05, 1.6107947885757312e-05, 1.6652033082209527e-05, 1.7196120097651146e-05, 1.774020529410336e-05, 1.828429230954498e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 19.0, 13.0, 38.0, 54.0, 86.0, 111.0, 180.0, 252.0, 428.0, 659.0, 875.0, 1649.0, 2378.0, 4022.0, 5888.0, 10667.0, 16235.0, 29081.0, 46631.0, 86411.0, 136760.0, 208006.0, 205043.0, 116602.0, 74123.0, 39673.0, 25075.0, 13906.0, 9138.0, 5211.0, 3456.0, 2007.0, 1362.0, 944.0, 507.0, 411.0, 234.0, 154.0, 93.0, 50.0, 42.0, 24.0, 16.0, 15.0, 9.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.6345252990722656e-05, -2.554338425397873e-05, -2.4741515517234802e-05, -2.3939646780490875e-05, -2.3137778043746948e-05, -2.233590930700302e-05, -2.1534040570259094e-05, -2.0732171833515167e-05, -1.993030309677124e-05, -1.9128434360027313e-05, -1.8326565623283386e-05, -1.752469688653946e-05, -1.6722828149795532e-05, -1.5920959413051605e-05, -1.5119090676307678e-05, -1.4317221939563751e-05, -1.3515353202819824e-05, -1.2713484466075897e-05, -1.191161572933197e-05, -1.1109746992588043e-05, -1.0307878255844116e-05, -9.50600951910019e-06, -8.704140782356262e-06, -7.902272045612335e-06, -7.100403308868408e-06, -6.298534572124481e-06, -5.496665835380554e-06, -4.694797098636627e-06, -3.8929283618927e-06, -3.091059625148773e-06, -2.289190888404846e-06, -1.4873221516609192e-06, -6.854534149169922e-07, 1.1641532182693481e-07, 9.182840585708618e-07, 1.7201527953147888e-06, 2.522021532058716e-06, 3.323890268802643e-06, 4.12575900554657e-06, 4.927627742290497e-06, 5.729496479034424e-06, 6.531365215778351e-06, 7.333233952522278e-06, 8.135102689266205e-06, 8.936971426010132e-06, 9.738840162754059e-06, 1.0540708899497986e-05, 1.1342577636241913e-05, 1.214444637298584e-05, 1.2946315109729767e-05, 1.3748183846473694e-05, 1.4550052583217621e-05, 1.5351921319961548e-05, 1.6153790056705475e-05, 1.6955658793449402e-05, 1.775752753019333e-05, 1.8559396266937256e-05, 1.9361265003681183e-05, 2.016313374042511e-05, 2.0965002477169037e-05, 2.1766871213912964e-05, 2.256873995065689e-05, 2.3370608687400818e-05, 2.4172477424144745e-05, 2.4974346160888672e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 8.0, 4.0, 4.0, 2.0, 5.0, 8.0, 9.0, 12.0, 19.0, 13.0, 18.0, 18.0, 22.0, 28.0, 32.0, 20.0, 29.0, 25.0, 35.0, 23.0, 40.0, 54.0, 42.0, 42.0, 45.0, 41.0, 31.0, 34.0, 40.0, 36.0, 24.0, 30.0, 25.0, 25.0, 28.0, 28.0, 24.0, 13.0, 7.0, 11.0, 8.0, 14.0, 8.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-1.5079975128173828e-05, -1.4619901776313782e-05, -1.4159828424453735e-05, -1.3699755072593689e-05, -1.3239681720733643e-05, -1.2779608368873596e-05, -1.231953501701355e-05, -1.1859461665153503e-05, -1.1399388313293457e-05, -1.093931496143341e-05, -1.0479241609573364e-05, -1.0019168257713318e-05, -9.559094905853271e-06, -9.099021553993225e-06, -8.638948202133179e-06, -8.178874850273132e-06, -7.718801498413086e-06, -7.2587281465530396e-06, -6.798654794692993e-06, -6.338581442832947e-06, -5.8785080909729e-06, -5.418434739112854e-06, -4.958361387252808e-06, -4.498288035392761e-06, -4.038214683532715e-06, -3.5781413316726685e-06, -3.118067979812622e-06, -2.6579946279525757e-06, -2.1979212760925293e-06, -1.737847924232483e-06, -1.2777745723724365e-06, -8.177012205123901e-07, -3.5762786865234375e-07, 1.0244548320770264e-07, 5.62518835067749e-07, 1.0225921869277954e-06, 1.4826655387878418e-06, 1.942738890647888e-06, 2.4028122425079346e-06, 2.862885594367981e-06, 3.3229589462280273e-06, 3.7830322980880737e-06, 4.24310564994812e-06, 4.7031790018081665e-06, 5.163252353668213e-06, 5.623325705528259e-06, 6.083399057388306e-06, 6.543472409248352e-06, 7.0035457611083984e-06, 7.463619112968445e-06, 7.923692464828491e-06, 8.383765816688538e-06, 8.843839168548584e-06, 9.30391252040863e-06, 9.763985872268677e-06, 1.0224059224128723e-05, 1.068413257598877e-05, 1.1144205927848816e-05, 1.1604279279708862e-05, 1.2064352631568909e-05, 1.2524425983428955e-05, 1.2984499335289001e-05, 1.3444572687149048e-05, 1.3904646039009094e-05, 1.436471939086914e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 7.0, 4.0, 7.0, 10.0, 15.0, 26.0, 34.0, 45.0, 69.0, 121.0, 144.0, 211.0, 390.0, 546.0, 876.0, 1385.0, 2306.0, 3601.0, 6266.0, 11513.0, 23713.0, 61198.0, 249049.0, 509453.0, 106345.0, 35271.0, 15658.0, 7814.0, 4710.0, 2874.0, 1744.0, 1117.0, 721.0, 449.0, 279.0, 175.0, 134.0, 94.0, 56.0, 39.0, 28.0, 22.0, 15.0, 5.0, 8.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.236532211303711e-05, -3.117695450782776e-05, -2.9988586902618408e-05, -2.8800219297409058e-05, -2.7611851692199707e-05, -2.6423484086990356e-05, -2.5235116481781006e-05, -2.4046748876571655e-05, -2.2858381271362305e-05, -2.1670013666152954e-05, -2.0481646060943604e-05, -1.9293278455734253e-05, -1.8104910850524902e-05, -1.6916543245315552e-05, -1.57281756401062e-05, -1.453980803489685e-05, -1.33514404296875e-05, -1.216307282447815e-05, -1.0974705219268799e-05, -9.786337614059448e-06, -8.597970008850098e-06, -7.409602403640747e-06, -6.2212347984313965e-06, -5.032867193222046e-06, -3.844499588012695e-06, -2.6561319828033447e-06, -1.4677643775939941e-06, -2.7939677238464355e-07, 9.08970832824707e-07, 2.0973384380340576e-06, 3.285706043243408e-06, 4.474073648452759e-06, 5.662441253662109e-06, 6.85080885887146e-06, 8.03917646408081e-06, 9.227544069290161e-06, 1.0415911674499512e-05, 1.1604279279708862e-05, 1.2792646884918213e-05, 1.3981014490127563e-05, 1.5169382095336914e-05, 1.6357749700546265e-05, 1.7546117305755615e-05, 1.8734484910964966e-05, 1.9922852516174316e-05, 2.1111220121383667e-05, 2.2299587726593018e-05, 2.3487955331802368e-05, 2.467632293701172e-05, 2.586469054222107e-05, 2.705305814743042e-05, 2.824142575263977e-05, 2.942979335784912e-05, 3.061816096305847e-05, 3.180652856826782e-05, 3.299489617347717e-05, 3.4183263778686523e-05, 3.5371631383895874e-05, 3.6559998989105225e-05, 3.7748366594314575e-05, 3.8936734199523926e-05, 4.0125101804733276e-05, 4.131346940994263e-05, 4.250183701515198e-05, 4.369020462036133e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 3.0, 2.0, 8.0, 4.0, 2.0, 12.0, 9.0, 10.0, 11.0, 11.0, 26.0, 17.0, 20.0, 22.0, 25.0, 26.0, 47.0, 36.0, 42.0, 43.0, 69.0, 53.0, 79.0, 41.0, 47.0, 34.0, 36.0, 36.0, 30.0, 27.0, 19.0, 19.0, 16.0, 20.0, 10.0, 23.0, 10.0, 14.0, 4.0, 10.0, 6.0, 2.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.046627044677734e-06, -7.776543498039246e-06, -7.506459951400757e-06, -7.236376404762268e-06, -6.966292858123779e-06, -6.6962093114852905e-06, -6.426125764846802e-06, -6.156042218208313e-06, -5.885958671569824e-06, -5.6158751249313354e-06, -5.345791578292847e-06, -5.075708031654358e-06, -4.805624485015869e-06, -4.53554093837738e-06, -4.265457391738892e-06, -3.995373845100403e-06, -3.725290298461914e-06, -3.4552067518234253e-06, -3.1851232051849365e-06, -2.9150396585464478e-06, -2.644956111907959e-06, -2.3748725652694702e-06, -2.1047890186309814e-06, -1.8347054719924927e-06, -1.564621925354004e-06, -1.2945383787155151e-06, -1.0244548320770264e-06, -7.543712854385376e-07, -4.842877388000488e-07, -2.1420419216156006e-07, 5.587935447692871e-08, 3.259629011154175e-07, 5.960464477539062e-07, 8.66129994392395e-07, 1.1362135410308838e-06, 1.4062970876693726e-06, 1.6763806343078613e-06, 1.94646418094635e-06, 2.216547727584839e-06, 2.4866312742233276e-06, 2.7567148208618164e-06, 3.026798367500305e-06, 3.296881914138794e-06, 3.5669654607772827e-06, 3.8370490074157715e-06, 4.10713255405426e-06, 4.377216100692749e-06, 4.647299647331238e-06, 4.9173831939697266e-06, 5.187466740608215e-06, 5.457550287246704e-06, 5.727633833885193e-06, 5.997717380523682e-06, 6.26780092716217e-06, 6.537884473800659e-06, 6.807968020439148e-06, 7.078051567077637e-06, 7.3481351137161255e-06, 7.618218660354614e-06, 7.888302206993103e-06, 8.158385753631592e-06, 8.42846930027008e-06, 8.69855284690857e-06, 8.968636393547058e-06, 9.238719940185547e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 6.0, 6.0, 7.0, 8.0, 9.0, 15.0, 20.0, 36.0, 38.0, 68.0, 56.0, 119.0, 139.0, 159.0, 290.0, 301.0, 480.0, 514.0, 989.0, 1202.0, 2366.0, 3141.0, 7388.0, 13032.0, 44013.0, 143998.0, 672857.0, 106734.0, 24437.0, 12489.0, 4639.0, 3196.0, 1586.0, 1323.0, 792.0, 580.0, 335.0, 353.0, 208.0, 187.0, 128.0, 99.0, 57.0, 43.0, 35.0, 23.0, 21.0, 17.0, 10.0, 6.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.344650268554688e-06, -8.07829201221466e-06, -7.811933755874634e-06, -7.545575499534607e-06, -7.27921724319458e-06, -7.012858986854553e-06, -6.746500730514526e-06, -6.4801424741744995e-06, -6.213784217834473e-06, -5.947425961494446e-06, -5.681067705154419e-06, -5.414709448814392e-06, -5.148351192474365e-06, -4.881992936134338e-06, -4.6156346797943115e-06, -4.349276423454285e-06, -4.082918167114258e-06, -3.816559910774231e-06, -3.550201654434204e-06, -3.2838433980941772e-06, -3.0174851417541504e-06, -2.7511268854141235e-06, -2.4847686290740967e-06, -2.21841037273407e-06, -1.952052116394043e-06, -1.6856938600540161e-06, -1.4193356037139893e-06, -1.1529773473739624e-06, -8.866190910339355e-07, -6.202608346939087e-07, -3.5390257835388184e-07, -8.754432201385498e-08, 1.7881393432617188e-07, 4.4517219066619873e-07, 7.115304470062256e-07, 9.778887033462524e-07, 1.2442469596862793e-06, 1.5106052160263062e-06, 1.776963472366333e-06, 2.04332172870636e-06, 2.3096799850463867e-06, 2.5760382413864136e-06, 2.8423964977264404e-06, 3.1087547540664673e-06, 3.375113010406494e-06, 3.641471266746521e-06, 3.907829523086548e-06, 4.174187779426575e-06, 4.4405460357666016e-06, 4.706904292106628e-06, 4.973262548446655e-06, 5.239620804786682e-06, 5.505979061126709e-06, 5.772337317466736e-06, 6.038695573806763e-06, 6.3050538301467896e-06, 6.571412086486816e-06, 6.837770342826843e-06, 7.10412859916687e-06, 7.370486855506897e-06, 7.636845111846924e-06, 7.90320336818695e-06, 8.169561624526978e-06, 8.435919880867004e-06, 8.702278137207031e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 4.0, 6.0, 0.0, 7.0, 0.0, 10.0, 0.0, 11.0, 0.0, 19.0, 0.0, 40.0, 58.0, 0.0, 92.0, 0.0, 109.0, 0.0, 264.0, 0.0, 128.0, 0.0, 96.0, 70.0, 0.0, 32.0, 0.0, 20.0, 0.0, 12.0, 0.0, 10.0, 0.0, 8.0, 8.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.2516975402832031e-06, -1.2191012501716614e-06, -1.1865049600601196e-06, -1.1539086699485779e-06, -1.1213123798370361e-06, -1.0887160897254944e-06, -1.0561197996139526e-06, -1.0235235095024109e-06, -9.909272193908691e-07, -9.583309292793274e-07, -9.257346391677856e-07, -8.931383490562439e-07, -8.605420589447021e-07, -8.279457688331604e-07, -7.953494787216187e-07, -7.627531886100769e-07, -7.301568984985352e-07, -6.975606083869934e-07, -6.649643182754517e-07, -6.323680281639099e-07, -5.997717380523682e-07, -5.671754479408264e-07, -5.345791578292847e-07, -5.019828677177429e-07, -4.6938657760620117e-07, -4.367902874946594e-07, -4.041939973831177e-07, -3.7159770727157593e-07, -3.390014171600342e-07, -3.0640512704849243e-07, -2.738088369369507e-07, -2.4121254682540894e-07, -2.086162567138672e-07, -1.7601996660232544e-07, -1.434236764907837e-07, -1.1082738637924194e-07, -7.82310962677002e-08, -4.563480615615845e-08, -1.30385160446167e-08, 1.955777406692505e-08, 5.21540641784668e-08, 8.475035429000854e-08, 1.1734664440155029e-07, 1.4994293451309204e-07, 1.825392246246338e-07, 2.1513551473617554e-07, 2.477318048477173e-07, 2.8032809495925903e-07, 3.129243850708008e-07, 3.4552067518234253e-07, 3.781169652938843e-07, 4.10713255405426e-07, 4.4330954551696777e-07, 4.759058356285095e-07, 5.085021257400513e-07, 5.41098415851593e-07, 5.736947059631348e-07, 6.062909960746765e-07, 6.388872861862183e-07, 6.7148357629776e-07, 7.040798664093018e-07, 7.366761565208435e-07, 7.692724466323853e-07, 8.01868736743927e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 9.0, 13.0, 23.0, 23.0, 37.0, 52.0, 63.0, 83.0, 117.0, 165.0, 204.0, 350.0, 536.0, 1365.0, 2131.0, 4000.0, 8129.0, 17927.0, 45624.0, 159385.0, 567741.0, 180381.0, 32851.0, 13616.0, 6306.0, 3191.0, 1650.0, 911.0, 543.0, 428.0, 181.0, 151.0, 90.0, 70.0, 50.0, 40.0, 34.0, 37.0, 14.0, 10.0, 12.0, 3.0, 1.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.841255187988281e-06, -5.6549906730651855e-06, -5.46872615814209e-06, -5.282461643218994e-06, -5.0961971282958984e-06, -4.909932613372803e-06, -4.723668098449707e-06, -4.537403583526611e-06, -4.351139068603516e-06, -4.16487455368042e-06, -3.978610038757324e-06, -3.7923455238342285e-06, -3.606081008911133e-06, -3.419816493988037e-06, -3.2335519790649414e-06, -3.0472874641418457e-06, -2.86102294921875e-06, -2.6747584342956543e-06, -2.4884939193725586e-06, -2.302229404449463e-06, -2.115964889526367e-06, -1.9297003746032715e-06, -1.7434358596801758e-06, -1.55717134475708e-06, -1.3709068298339844e-06, -1.1846423149108887e-06, -9.98377799987793e-07, -8.121132850646973e-07, -6.258487701416016e-07, -4.3958425521850586e-07, -2.5331974029541016e-07, -6.705522537231445e-08, 1.1920928955078125e-07, 3.0547380447387695e-07, 4.917383193969727e-07, 6.780028343200684e-07, 8.642673492431641e-07, 1.0505318641662598e-06, 1.2367963790893555e-06, 1.4230608940124512e-06, 1.6093254089355469e-06, 1.7955899238586426e-06, 1.9818544387817383e-06, 2.168118953704834e-06, 2.3543834686279297e-06, 2.5406479835510254e-06, 2.726912498474121e-06, 2.913177013397217e-06, 3.0994415283203125e-06, 3.285706043243408e-06, 3.471970558166504e-06, 3.6582350730895996e-06, 3.844499588012695e-06, 4.030764102935791e-06, 4.217028617858887e-06, 4.403293132781982e-06, 4.589557647705078e-06, 4.775822162628174e-06, 4.9620866775512695e-06, 5.148351192474365e-06, 5.334615707397461e-06, 5.520880222320557e-06, 5.707144737243652e-06, 5.893409252166748e-06, 6.079673767089844e-06]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 4.0, 16.0, 0.0, 20.0, 29.0, 51.0, 0.0, 62.0, 90.0, 138.0, 0.0, 163.0, 129.0, 0.0, 99.0, 69.0, 50.0, 0.0, 25.0, 26.0, 15.0, 0.0, 5.0, 3.0, 2.0, 0.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-06, -1.3271346688270569e-06, -1.2833625078201294e-06, -1.239590346813202e-06, -1.1958181858062744e-06, -1.152046024799347e-06, -1.1082738637924194e-06, -1.064501702785492e-06, -1.0207295417785645e-06, -9.76957380771637e-07, -9.331852197647095e-07, -8.89413058757782e-07, -8.456408977508545e-07, -8.01868736743927e-07, -7.580965757369995e-07, -7.14324414730072e-07, -6.705522537231445e-07, -6.26780092716217e-07, -5.830079317092896e-07, -5.392357707023621e-07, -4.954636096954346e-07, -4.516914486885071e-07, -4.079192876815796e-07, -3.641471266746521e-07, -3.203749656677246e-07, -2.766028046607971e-07, -2.3283064365386963e-07, -1.8905848264694214e-07, -1.4528632164001465e-07, -1.0151416063308716e-07, -5.774199962615967e-08, -1.3969838619232178e-08, 2.9802322387695312e-08, 7.35744833946228e-08, 1.1734664440155029e-07, 1.6111880540847778e-07, 2.0489096641540527e-07, 2.4866312742233276e-07, 2.9243528842926025e-07, 3.3620744943618774e-07, 3.7997961044311523e-07, 4.237517714500427e-07, 4.675239324569702e-07, 5.112960934638977e-07, 5.550682544708252e-07, 5.988404154777527e-07, 6.426125764846802e-07, 6.863847374916077e-07, 7.301568984985352e-07, 7.739290595054626e-07, 8.177012205123901e-07, 8.614733815193176e-07, 9.052455425262451e-07, 9.490177035331726e-07, 9.927898645401e-07, 1.0365620255470276e-06, 1.080334186553955e-06, 1.1241063475608826e-06, 1.16787850856781e-06, 1.2116506695747375e-06, 1.255422830581665e-06, 1.2991949915885925e-06, 1.34296715259552e-06, 1.3867393136024475e-06, 1.430511474609375e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 6.0, 5.0, 6.0, 8.0, 6.0, 17.0, 15.0, 19.0, 27.0, 31.0, 49.0, 59.0, 98.0, 117.0, 119.0, 103.0, 68.0, 57.0, 43.0, 40.0, 19.0, 21.0, 16.0, 13.0, 14.0, 12.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.040502477029804e-05, -1.960353802132886e-05, -1.8802051272359677e-05, -1.8000564523390494e-05, -1.7199079593410715e-05, -1.6397592844441533e-05, -1.559610609547235e-05, -1.4794619346503168e-05, -1.3993132597533986e-05, -1.3191645848564804e-05, -1.2390159099595621e-05, -1.158867326012114e-05, -1.0787186511151958e-05, -9.985699762182776e-06, -9.184213922708295e-06, -8.382727173739113e-06, -7.5812404247699305e-06, -6.779753675800748e-06, -5.978267381578917e-06, -5.176781087357085e-06, -4.375294338387903e-06, -3.5738075894187205e-06, -2.772321295196889e-06, -1.9708350009750575e-06, -1.1693482520058751e-06, -3.678617304103682e-07, 4.3362479118513875e-07, 1.2351113127806457e-06, 2.0365978343761526e-06, 2.838084583345335e-06, 3.6395708775671665e-06, 4.441057171788998e-06, 5.242542101768777e-06, 6.044028850737959e-06, 6.845515144959791e-06, 7.647001439181622e-06, 8.448488188150804e-06, 9.249974937119987e-06, 1.0051460776594467e-05, 1.085294752556365e-05, 1.1654434274532832e-05, 1.2455921023502015e-05, 1.3257407772471197e-05, 1.4058893611945678e-05, 1.486038036091486e-05, 1.566186620038934e-05, 1.6463352949358523e-05, 1.7264839698327705e-05, 1.8066326447296888e-05, 1.886781319626607e-05, 1.9669299945235252e-05, 2.0470786694204435e-05, 2.1272273443173617e-05, 2.20737601921428e-05, 2.287524512212258e-05, 2.367673187109176e-05, 2.4478218620060943e-05, 2.5279705369030125e-05, 2.6081192117999308e-05, 2.688267886696849e-05, 2.768416379694827e-05, 2.848565054591745e-05, 2.9287137294886634e-05, 3.0088624043855816e-05, 3.0890110792825e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 8.0, 4.0, 6.0, 8.0, 4.0, 9.0, 16.0, 10.0, 18.0, 17.0, 23.0, 19.0, 19.0, 25.0, 39.0, 31.0, 29.0, 38.0, 37.0, 29.0, 45.0, 41.0, 36.0, 42.0, 43.0, 36.0, 33.0, 29.0, 43.0, 27.0, 32.0, 31.0, 31.0, 22.0, 32.0, 14.0, 21.0, 12.0, 7.0, 7.0, 8.0, 10.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3696160749532282e-05, -1.3234711332188454e-05, -1.2773261914844625e-05, -1.2311812497500796e-05, -1.1850363080156967e-05, -1.1388913662813138e-05, -1.092746424546931e-05, -1.0466013918630779e-05, -1.0004565410781652e-05, -9.543115993437823e-06, -9.081666576093994e-06, -8.620217158750165e-06, -8.158767741406336e-06, -7.697318324062508e-06, -7.235868451971328e-06, -6.774419034627499e-06, -6.312969162536319e-06, -5.8515197451924905e-06, -5.390070327848662e-06, -4.928620910504833e-06, -4.467171493161004e-06, -4.005722075817175e-06, -3.5442722037259955e-06, -3.0828227863821667e-06, -2.621373369038338e-06, -2.159923951694509e-06, -1.6984744206638425e-06, -1.237024889633176e-06, -7.755754722893471e-07, -3.1412605494551826e-07, 1.47323589771986e-07, 6.087730071158148e-07, 1.0702224244596437e-06, 1.5316718418034725e-06, 1.9931212591473013e-06, 2.4545709038648056e-06, 2.9160203212086344e-06, 3.3774697385524632e-06, 3.8389193832699675e-06, 4.300368800613796e-06, 4.761818217957625e-06, 5.223267635301454e-06, 5.684717052645283e-06, 6.1461669247364625e-06, 6.607616342080291e-06, 7.06906575942412e-06, 7.530515176767949e-06, 7.991964594111778e-06, 8.453414011455607e-06, 8.914863428799435e-06, 9.376312846143264e-06, 9.837762263487093e-06, 1.0299211680830922e-05, 1.076066109817475e-05, 1.1222111425013281e-05, 1.1683559932862408e-05, 1.2145010259700939e-05, 1.2606459677044768e-05, 1.3067909094388597e-05, 1.3529358511732426e-05, 1.3990807929076254e-05, 1.4452257346420083e-05, 1.4913706763763912e-05, 1.5375157090602443e-05, 1.583660559845157e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 1.0, 6.0, 7.0, 10.0, 14.0, 16.0, 32.0, 45.0, 55.0, 88.0, 117.0, 157.0, 252.0, 373.0, 507.0, 784.0, 1073.0, 1700.0, 2671.0, 3771.0, 6207.0, 9388.0, 16496.0, 27792.0, 45380.0, 87877.0, 154773.0, 265550.0, 184334.0, 103954.0, 55780.0, 29562.0, 18770.0, 10635.0, 7261.0, 4507.0, 2726.0, 1977.0, 1187.0, 866.0, 595.0, 396.0, 275.0, 177.0, 149.0, 79.0, 63.0, 42.0, 25.0, 24.0, 10.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.664327621459961e-05, -2.5773420929908752e-05, -2.4903565645217896e-05, -2.403371036052704e-05, -2.316385507583618e-05, -2.2293999791145325e-05, -2.1424144506454468e-05, -2.055428922176361e-05, -1.9684433937072754e-05, -1.8814578652381897e-05, -1.794472336769104e-05, -1.7074868083000183e-05, -1.6205012798309326e-05, -1.533515751361847e-05, -1.4465302228927612e-05, -1.3595446944236755e-05, -1.2725591659545898e-05, -1.1855736374855042e-05, -1.0985881090164185e-05, -1.0116025805473328e-05, -9.24617052078247e-06, -8.376315236091614e-06, -7.506459951400757e-06, -6.6366046667099e-06, -5.766749382019043e-06, -4.896894097328186e-06, -4.027038812637329e-06, -3.157183527946472e-06, -2.2873282432556152e-06, -1.4174729585647583e-06, -5.476176738739014e-07, 3.2223761081695557e-07, 1.1920928955078125e-06, 2.0619481801986694e-06, 2.9318034648895264e-06, 3.8016587495803833e-06, 4.67151403427124e-06, 5.541369318962097e-06, 6.411224603652954e-06, 7.281079888343811e-06, 8.150935173034668e-06, 9.020790457725525e-06, 9.890645742416382e-06, 1.0760501027107239e-05, 1.1630356311798096e-05, 1.2500211596488953e-05, 1.337006688117981e-05, 1.4239922165870667e-05, 1.5109777450561523e-05, 1.597963273525238e-05, 1.6849488019943237e-05, 1.7719343304634094e-05, 1.858919858932495e-05, 1.9459053874015808e-05, 2.0328909158706665e-05, 2.1198764443397522e-05, 2.206861972808838e-05, 2.2938475012779236e-05, 2.3808330297470093e-05, 2.467818558216095e-05, 2.5548040866851807e-05, 2.6417896151542664e-05, 2.728775143623352e-05, 2.8157606720924377e-05, 2.9027462005615234e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 8.0, 5.0, 4.0, 7.0, 7.0, 8.0, 17.0, 21.0, 16.0, 19.0, 19.0, 19.0, 33.0, 32.0, 24.0, 39.0, 37.0, 37.0, 43.0, 36.0, 40.0, 45.0, 37.0, 33.0, 40.0, 43.0, 43.0, 28.0, 40.0, 29.0, 25.0, 24.0, 32.0, 17.0, 14.0, 16.0, 13.0, 9.0, 10.0, 10.0, 3.0, 7.0, 5.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.233816146850586e-05, -1.192186027765274e-05, -1.1505559086799622e-05, -1.1089257895946503e-05, -1.0672956705093384e-05, -1.0256655514240265e-05, -9.840354323387146e-06, -9.424053132534027e-06, -9.007751941680908e-06, -8.59145075082779e-06, -8.17514955997467e-06, -7.758848369121552e-06, -7.342547178268433e-06, -6.926245987415314e-06, -6.509944796562195e-06, -6.093643605709076e-06, -5.677342414855957e-06, -5.261041224002838e-06, -4.844740033149719e-06, -4.4284388422966e-06, -4.0121376514434814e-06, -3.5958364605903625e-06, -3.1795352697372437e-06, -2.7632340788841248e-06, -2.346932888031006e-06, -1.930631697177887e-06, -1.514330506324768e-06, -1.0980293154716492e-06, -6.817281246185303e-07, -2.654269337654114e-07, 1.5087425708770752e-07, 5.671754479408264e-07, 9.834766387939453e-07, 1.3997778296470642e-06, 1.816079020500183e-06, 2.232380211353302e-06, 2.648681402206421e-06, 3.06498259305954e-06, 3.4812837839126587e-06, 3.897584974765778e-06, 4.3138861656188965e-06, 4.730187356472015e-06, 5.146488547325134e-06, 5.562789738178253e-06, 5.979090929031372e-06, 6.395392119884491e-06, 6.81169331073761e-06, 7.227994501590729e-06, 7.644295692443848e-06, 8.060596883296967e-06, 8.476898074150085e-06, 8.893199265003204e-06, 9.309500455856323e-06, 9.725801646709442e-06, 1.0142102837562561e-05, 1.055840402841568e-05, 1.0974705219268799e-05, 1.1391006410121918e-05, 1.1807307600975037e-05, 1.2223608791828156e-05, 1.2639909982681274e-05, 1.3056211173534393e-05, 1.3472512364387512e-05, 1.3888813555240631e-05, 1.430511474609375e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 7.0, 4.0, 14.0, 28.0, 20.0, 29.0, 40.0, 85.0, 106.0, 163.0, 204.0, 298.0, 423.0, 675.0, 917.0, 1350.0, 2019.0, 2933.0, 4324.0, 6503.0, 10134.0, 15747.0, 24171.0, 38709.0, 64225.0, 97657.0, 183123.0, 230525.0, 144317.0, 83158.0, 49524.0, 30379.0, 19247.0, 12281.0, 8245.0, 5409.0, 3730.0, 2481.0, 1663.0, 1134.0, 817.0, 526.0, 391.0, 258.0, 195.0, 119.0, 82.0, 58.0, 43.0, 27.0, 16.0, 9.0, 2.0, 8.0, 6.0, 8.0, 2.0, 1.0], "bins": [-2.372264862060547e-05, -2.3009255528450012e-05, -2.2295862436294556e-05, -2.15824693441391e-05, -2.0869076251983643e-05, -2.0155683159828186e-05, -1.944229006767273e-05, -1.8728896975517273e-05, -1.8015503883361816e-05, -1.730211079120636e-05, -1.6588717699050903e-05, -1.5875324606895447e-05, -1.516193151473999e-05, -1.4448538422584534e-05, -1.3735145330429077e-05, -1.302175223827362e-05, -1.2308359146118164e-05, -1.1594966053962708e-05, -1.0881572961807251e-05, -1.0168179869651794e-05, -9.454786777496338e-06, -8.741393685340881e-06, -8.028000593185425e-06, -7.314607501029968e-06, -6.601214408874512e-06, -5.887821316719055e-06, -5.174428224563599e-06, -4.461035132408142e-06, -3.7476420402526855e-06, -3.034248948097229e-06, -2.3208558559417725e-06, -1.607462763786316e-06, -8.940696716308594e-07, -1.8067657947540283e-07, 5.327165126800537e-07, 1.2461096048355103e-06, 1.959502696990967e-06, 2.6728957891464233e-06, 3.38628888130188e-06, 4.0996819734573364e-06, 4.813075065612793e-06, 5.5264681577682495e-06, 6.239861249923706e-06, 6.953254342079163e-06, 7.666647434234619e-06, 8.380040526390076e-06, 9.093433618545532e-06, 9.806826710700989e-06, 1.0520219802856445e-05, 1.1233612895011902e-05, 1.1947005987167358e-05, 1.2660399079322815e-05, 1.3373792171478271e-05, 1.4087185263633728e-05, 1.4800578355789185e-05, 1.551397144794464e-05, 1.6227364540100098e-05, 1.6940757632255554e-05, 1.765415072441101e-05, 1.8367543816566467e-05, 1.9080936908721924e-05, 1.979433000087738e-05, 2.0507723093032837e-05, 2.1221116185188293e-05, 2.193450927734375e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 3.0, 3.0, 7.0, 5.0, 12.0, 19.0, 15.0, 23.0, 23.0, 19.0, 19.0, 35.0, 33.0, 33.0, 26.0, 32.0, 32.0, 33.0, 35.0, 55.0, 31.0, 35.0, 36.0, 58.0, 32.0, 38.0, 38.0, 46.0, 30.0, 26.0, 21.0, 22.0, 22.0, 16.0, 13.0, 19.0, 8.0, 11.0, 8.0, 9.0, 7.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.179115295410156e-06, -8.910894393920898e-06, -8.64267349243164e-06, -8.374452590942383e-06, -8.106231689453125e-06, -7.838010787963867e-06, -7.569789886474609e-06, -7.3015689849853516e-06, -7.033348083496094e-06, -6.765127182006836e-06, -6.496906280517578e-06, -6.22868537902832e-06, -5.9604644775390625e-06, -5.692243576049805e-06, -5.424022674560547e-06, -5.155801773071289e-06, -4.887580871582031e-06, -4.6193599700927734e-06, -4.351139068603516e-06, -4.082918167114258e-06, -3.814697265625e-06, -3.546476364135742e-06, -3.2782554626464844e-06, -3.0100345611572266e-06, -2.7418136596679688e-06, -2.473592758178711e-06, -2.205371856689453e-06, -1.9371509552001953e-06, -1.6689300537109375e-06, -1.4007091522216797e-06, -1.1324882507324219e-06, -8.642673492431641e-07, -5.960464477539062e-07, -3.2782554626464844e-07, -5.960464477539063e-08, 2.086162567138672e-07, 4.76837158203125e-07, 7.450580596923828e-07, 1.0132789611816406e-06, 1.2814998626708984e-06, 1.5497207641601562e-06, 1.817941665649414e-06, 2.086162567138672e-06, 2.3543834686279297e-06, 2.6226043701171875e-06, 2.8908252716064453e-06, 3.159046173095703e-06, 3.427267074584961e-06, 3.6954879760742188e-06, 3.9637088775634766e-06, 4.231929779052734e-06, 4.500150680541992e-06, 4.76837158203125e-06, 5.036592483520508e-06, 5.304813385009766e-06, 5.5730342864990234e-06, 5.841255187988281e-06, 6.109476089477539e-06, 6.377696990966797e-06, 6.645917892456055e-06, 6.9141387939453125e-06, 7.18235969543457e-06, 7.450580596923828e-06, 7.718801498413086e-06, 7.987022399902344e-06]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 2.0, 11.0, 6.0, 8.0, 10.0, 25.0, 18.0, 43.0, 49.0, 77.0, 93.0, 124.0, 231.0, 254.0, 410.0, 582.0, 953.0, 1359.0, 2492.0, 3719.0, 6046.0, 13092.0, 23439.0, 66083.0, 653638.0, 182930.0, 45350.0, 20563.0, 11833.0, 5497.0, 3835.0, 1899.0, 1418.0, 734.0, 570.0, 304.0, 225.0, 175.0, 137.0, 79.0, 56.0, 61.0, 27.0, 29.0, 30.0, 17.0, 10.0, 3.0, 6.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1086463928222656e-05, -1.0702759027481079e-05, -1.0319054126739502e-05, -9.935349225997925e-06, -9.551644325256348e-06, -9.16793942451477e-06, -8.784234523773193e-06, -8.400529623031616e-06, -8.016824722290039e-06, -7.633119821548462e-06, -7.249414920806885e-06, -6.865710020065308e-06, -6.4820051193237305e-06, -6.098300218582153e-06, -5.714595317840576e-06, -5.330890417098999e-06, -4.947185516357422e-06, -4.563480615615845e-06, -4.179775714874268e-06, -3.7960708141326904e-06, -3.4123659133911133e-06, -3.028661012649536e-06, -2.644956111907959e-06, -2.261251211166382e-06, -1.8775463104248047e-06, -1.4938414096832275e-06, -1.1101365089416504e-06, -7.264316082000732e-07, -3.427267074584961e-07, 4.0978193283081055e-08, 4.246830940246582e-07, 8.083879947662354e-07, 1.1920928955078125e-06, 1.5757977962493896e-06, 1.959502696990967e-06, 2.343207597732544e-06, 2.726912498474121e-06, 3.1106173992156982e-06, 3.4943222999572754e-06, 3.8780272006988525e-06, 4.26173210144043e-06, 4.645437002182007e-06, 5.029141902923584e-06, 5.412846803665161e-06, 5.796551704406738e-06, 6.1802566051483154e-06, 6.563961505889893e-06, 6.94766640663147e-06, 7.331371307373047e-06, 7.715076208114624e-06, 8.098781108856201e-06, 8.482486009597778e-06, 8.866190910339355e-06, 9.249895811080933e-06, 9.63360071182251e-06, 1.0017305612564087e-05, 1.0401010513305664e-05, 1.0784715414047241e-05, 1.1168420314788818e-05, 1.1552125215530396e-05, 1.1935830116271973e-05, 1.231953501701355e-05, 1.2703239917755127e-05, 1.3086944818496704e-05, 1.3470649719238281e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 71.0, 0.0, 0.0, 0.0, 0.0, 796.0, 0.0, 0.0, 0.0, 0.0, 73.0, 0.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.172325134277344e-07, -4.0512531995773315e-07, -3.9301812648773193e-07, -3.809109330177307e-07, -3.688037395477295e-07, -3.5669654607772827e-07, -3.4458935260772705e-07, -3.3248215913772583e-07, -3.203749656677246e-07, -3.082677721977234e-07, -2.9616057872772217e-07, -2.8405338525772095e-07, -2.7194619178771973e-07, -2.598389983177185e-07, -2.477318048477173e-07, -2.3562461137771606e-07, -2.2351741790771484e-07, -2.1141022443771362e-07, -1.993030309677124e-07, -1.8719583749771118e-07, -1.7508864402770996e-07, -1.6298145055770874e-07, -1.5087425708770752e-07, -1.387670636177063e-07, -1.2665987014770508e-07, -1.1455267667770386e-07, -1.0244548320770264e-07, -9.033828973770142e-08, -7.82310962677002e-08, -6.612390279769897e-08, -5.4016709327697754e-08, -4.190951585769653e-08, -2.9802322387695312e-08, -1.7695128917694092e-08, -5.587935447692871e-09, 6.51925802230835e-09, 1.862645149230957e-08, 3.073364496231079e-08, 4.284083843231201e-08, 5.494803190231323e-08, 6.705522537231445e-08, 7.916241884231567e-08, 9.12696123123169e-08, 1.0337680578231812e-07, 1.1548399925231934e-07, 1.2759119272232056e-07, 1.3969838619232178e-07, 1.51805579662323e-07, 1.6391277313232422e-07, 1.7601996660232544e-07, 1.8812716007232666e-07, 2.0023435354232788e-07, 2.123415470123291e-07, 2.2444874048233032e-07, 2.3655593395233154e-07, 2.4866312742233276e-07, 2.60770320892334e-07, 2.728775143623352e-07, 2.849847078323364e-07, 2.9709190130233765e-07, 3.0919909477233887e-07, 3.213062882423401e-07, 3.334134817123413e-07, 3.4552067518234253e-07, 3.5762786865234375e-07]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 5.0, 15.0, 7.0, 12.0, 36.0, 24.0, 35.0, 60.0, 91.0, 121.0, 214.0, 260.0, 365.0, 599.0, 765.0, 1088.0, 1855.0, 2463.0, 4290.0, 5936.0, 9882.0, 19907.0, 38841.0, 121056.0, 720820.0, 58409.0, 24899.0, 14330.0, 7476.0, 5248.0, 2863.0, 2033.0, 1479.0, 943.0, 658.0, 468.0, 300.0, 209.0, 134.0, 102.0, 82.0, 59.0, 32.0, 44.0, 19.0, 6.0, 4.0, 4.0, 5.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.8537044525146484e-05, -1.7979182302951813e-05, -1.742132008075714e-05, -1.686345785856247e-05, -1.6305595636367798e-05, -1.5747733414173126e-05, -1.5189871191978455e-05, -1.4632008969783783e-05, -1.4074146747589111e-05, -1.351628452539444e-05, -1.2958422303199768e-05, -1.2400560081005096e-05, -1.1842697858810425e-05, -1.1284835636615753e-05, -1.0726973414421082e-05, -1.016911119222641e-05, -9.611248970031738e-06, -9.053386747837067e-06, -8.495524525642395e-06, -7.937662303447723e-06, -7.379800081253052e-06, -6.82193785905838e-06, -6.2640756368637085e-06, -5.706213414669037e-06, -5.148351192474365e-06, -4.590488970279694e-06, -4.032626748085022e-06, -3.4747645258903503e-06, -2.9169023036956787e-06, -2.359040081501007e-06, -1.8011778593063354e-06, -1.2433156371116638e-06, -6.854534149169922e-07, -1.2759119272232056e-07, 4.302710294723511e-07, 9.881332516670227e-07, 1.5459954738616943e-06, 2.103857696056366e-06, 2.6617199182510376e-06, 3.2195821404457092e-06, 3.777444362640381e-06, 4.3353065848350525e-06, 4.893168807029724e-06, 5.451031029224396e-06, 6.008893251419067e-06, 6.566755473613739e-06, 7.124617695808411e-06, 7.682479918003082e-06, 8.240342140197754e-06, 8.798204362392426e-06, 9.356066584587097e-06, 9.913928806781769e-06, 1.047179102897644e-05, 1.1029653251171112e-05, 1.1587515473365784e-05, 1.2145377695560455e-05, 1.2703239917755127e-05, 1.3261102139949799e-05, 1.381896436214447e-05, 1.4376826584339142e-05, 1.4934688806533813e-05, 1.5492551028728485e-05, 1.6050413250923157e-05, 1.660827547311783e-05, 1.71661376953125e-05]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 2.0, 4.0, 9.0, 5.0, 6.0, 6.0, 13.0, 8.0, 22.0, 37.0, 39.0, 56.0, 57.0, 444.0, 88.0, 40.0, 28.0, 18.0, 16.0, 20.0, 19.0, 11.0, 5.0, 5.0, 3.0, 3.0, 6.0, 8.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.9604644775390625e-06, -5.791895091533661e-06, -5.623325705528259e-06, -5.454756319522858e-06, -5.286186933517456e-06, -5.1176175475120544e-06, -4.949048161506653e-06, -4.780478775501251e-06, -4.61190938949585e-06, -4.443340003490448e-06, -4.274770617485046e-06, -4.106201231479645e-06, -3.937631845474243e-06, -3.7690624594688416e-06, -3.60049307346344e-06, -3.4319236874580383e-06, -3.2633543014526367e-06, -3.094784915447235e-06, -2.9262155294418335e-06, -2.757646143436432e-06, -2.5890767574310303e-06, -2.4205073714256287e-06, -2.251937985420227e-06, -2.0833685994148254e-06, -1.914799213409424e-06, -1.7462298274040222e-06, -1.5776604413986206e-06, -1.409091055393219e-06, -1.2405216693878174e-06, -1.0719522833824158e-06, -9.033828973770142e-07, -7.348135113716125e-07, -5.662441253662109e-07, -3.976747393608093e-07, -2.2910535335540771e-07, -6.05359673500061e-08, 1.0803341865539551e-07, 2.766028046607971e-07, 4.4517219066619873e-07, 6.137415766716003e-07, 7.82310962677002e-07, 9.508803486824036e-07, 1.1194497346878052e-06, 1.2880191206932068e-06, 1.4565885066986084e-06, 1.62515789270401e-06, 1.7937272787094116e-06, 1.9622966647148132e-06, 2.130866050720215e-06, 2.2994354367256165e-06, 2.468004822731018e-06, 2.6365742087364197e-06, 2.8051435947418213e-06, 2.973712980747223e-06, 3.1422823667526245e-06, 3.310851752758026e-06, 3.4794211387634277e-06, 3.6479905247688293e-06, 3.816559910774231e-06, 3.9851292967796326e-06, 4.153698682785034e-06, 4.322268068790436e-06, 4.490837454795837e-06, 4.659406840801239e-06, 4.827976226806641e-06]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 14.0, 14.0, 7.0, 18.0, 26.0, 37.0, 45.0, 60.0, 78.0, 132.0, 128.0, 107.0, 78.0, 50.0, 46.0, 32.0, 25.0, 22.0, 13.0, 12.0, 15.0, 5.0, 6.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1122672478668392e-05, -2.0349685655673966e-05, -1.957669883267954e-05, -1.8803712009685114e-05, -1.8030725186690688e-05, -1.7257738363696262e-05, -1.6484751540701836e-05, -1.571176471770741e-05, -1.4938776985218283e-05, -1.4165790162223857e-05, -1.3392803339229431e-05, -1.2619815606740303e-05, -1.1846828783745877e-05, -1.1073841960751452e-05, -1.0300855137757026e-05, -9.5278683147626e-06, -8.754881491768174e-06, -7.981894668773748e-06, -7.208907845779322e-06, -6.435920568037545e-06, -5.662933745043119e-06, -4.8899469220486935e-06, -4.116959644306917e-06, -3.343972821312491e-06, -2.570985998318065e-06, -1.7979990616368013e-06, -1.0250121249555377e-06, -2.520250745874364e-07, 5.209617484069895e-07, 1.2939485714014154e-06, 2.066935849143192e-06, 2.839922672137618e-06, 3.612909495132044e-06, 4.38589631812647e-06, 5.158883141120896e-06, 5.9318704188626725e-06, 6.704857241857098e-06, 7.477844064851524e-06, 8.250831342593301e-06, 9.023818165587727e-06, 9.796804988582153e-06, 1.0569791811576579e-05, 1.1342778634571005e-05, 1.2115766367060132e-05, 1.2888753190054558e-05, 1.3661740013048984e-05, 1.443472683604341e-05, 1.5207713659037836e-05, 1.5980700482032262e-05, 1.6753687305026688e-05, 1.7526674128021114e-05, 1.829966095101554e-05, 1.9072647774009965e-05, 1.984563459700439e-05, 2.061862323898822e-05, 2.1391610061982647e-05, 2.2164596884977072e-05, 2.29375837079715e-05, 2.3710570530965924e-05, 2.448355735396035e-05, 2.5256544176954776e-05, 2.6029530999949202e-05, 2.6802517822943628e-05, 2.7575504645938054e-05, 2.834849146893248e-05]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 3.0, 10.0, 7.0, 8.0, 9.0, 12.0, 12.0, 17.0, 16.0, 21.0, 26.0, 30.0, 28.0, 29.0, 39.0, 28.0, 25.0, 35.0, 38.0, 36.0, 33.0, 37.0, 37.0, 40.0, 45.0, 44.0, 35.0, 36.0, 29.0, 27.0, 20.0, 34.0, 18.0, 23.0, 22.0, 16.0, 17.0, 11.0, 8.0, 11.0, 5.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1791449651354924e-05, -1.1374974747013766e-05, -1.0958499842672609e-05, -1.0542024938331451e-05, -1.0125550033990294e-05, -9.709076039143838e-06, -9.29260113480268e-06, -8.876126230461523e-06, -8.459651326120365e-06, -8.043176421779208e-06, -7.62670151743805e-06, -7.210227067844244e-06, -6.793752163503086e-06, -6.377277259161929e-06, -5.960802809568122e-06, -5.5443279052269645e-06, -5.127853000885807e-06, -4.7113780965446495e-06, -4.294903192203492e-06, -3.878428742609685e-06, -3.4619538382685278e-06, -3.0454789339273702e-06, -2.629004256959888e-06, -2.212529579992406e-06, -1.7960546756512485e-06, -1.3795798849969287e-06, -9.63105094342609e-07, -5.466303036882891e-07, -1.3015551303396933e-07, 2.863193913071882e-07, 7.027940682746703e-07, 1.1192687452421524e-06, 1.5357445590780117e-06, 1.952219463419169e-06, 2.3686941403866513e-06, 2.7851688173541334e-06, 3.201643721695291e-06, 3.6181186260364484e-06, 4.034593075630255e-06, 4.4510679799714126e-06, 4.86754288431257e-06, 5.284017788653728e-06, 5.700492692994885e-06, 6.116967142588692e-06, 6.533442046929849e-06, 6.949916951271007e-06, 7.3663914008648135e-06, 7.782866305205971e-06, 8.199341209547129e-06, 8.615816113888286e-06, 9.032291018229444e-06, 9.448765922570601e-06, 9.865239917417057e-06, 1.0281715731252916e-05, 1.0698189726099372e-05, 1.111466463044053e-05, 1.1531139534781687e-05, 1.1947614439122844e-05, 1.2364089343464002e-05, 1.278056424780516e-05, 1.3197039152146317e-05, 1.3613513146992773e-05, 1.402998805133393e-05, 1.4446462955675088e-05, 1.4862937860016245e-05]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 10.0, 11.0, 19.0, 32.0, 43.0, 85.0, 126.0, 222.0, 321.0, 418.0, 726.0, 1006.0, 1569.0, 2541.0, 3727.0, 6007.0, 9453.0, 15772.0, 26008.0, 45119.0, 93337.0, 175944.0, 453918.0, 1562150.0, 1147052.0, 334804.0, 143343.0, 72033.0, 38946.0, 22619.0, 13589.0, 8151.0, 5346.0, 3636.0, 2107.0, 1347.0, 878.0, 621.0, 382.0, 279.0, 188.0, 116.0, 91.0, 65.0, 33.0, 27.0, 25.0, 11.0, 9.0, 10.0, 6.0, 3.0, 8.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7344951629638672e-05, -1.6744248569011688e-05, -1.6143545508384705e-05, -1.554284244775772e-05, -1.4942139387130737e-05, -1.4341436326503754e-05, -1.374073326587677e-05, -1.3140030205249786e-05, -1.2539327144622803e-05, -1.1938624083995819e-05, -1.1337921023368835e-05, -1.0737217962741852e-05, -1.0136514902114868e-05, -9.535811841487885e-06, -8.935108780860901e-06, -8.334405720233917e-06, -7.733702659606934e-06, -7.13299959897995e-06, -6.532296538352966e-06, -5.931593477725983e-06, -5.330890417098999e-06, -4.730187356472015e-06, -4.129484295845032e-06, -3.528781235218048e-06, -2.9280781745910645e-06, -2.327375113964081e-06, -1.7266720533370972e-06, -1.1259689927101135e-06, -5.252659320831299e-07, 7.543712854385376e-08, 6.761401891708374e-07, 1.276843249797821e-06, 1.8775463104248047e-06, 2.4782493710517883e-06, 3.078952431678772e-06, 3.6796554923057556e-06, 4.280358552932739e-06, 4.881061613559723e-06, 5.4817646741867065e-06, 6.08246773481369e-06, 6.683170795440674e-06, 7.2838738560676575e-06, 7.884576916694641e-06, 8.485279977321625e-06, 9.085983037948608e-06, 9.686686098575592e-06, 1.0287389159202576e-05, 1.088809221982956e-05, 1.1488795280456543e-05, 1.2089498341083527e-05, 1.269020140171051e-05, 1.3290904462337494e-05, 1.3891607522964478e-05, 1.4492310583591461e-05, 1.5093013644218445e-05, 1.569371670484543e-05, 1.6294419765472412e-05, 1.6895122826099396e-05, 1.749582588672638e-05, 1.8096528947353363e-05, 1.8697232007980347e-05, 1.929793506860733e-05, 1.9898638129234314e-05, 2.0499341189861298e-05, 2.110004425048828e-05]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 6.0, 0.0, 6.0, 8.0, 15.0, 8.0, 20.0, 20.0, 25.0, 23.0, 21.0, 34.0, 30.0, 37.0, 14.0, 40.0, 45.0, 32.0, 38.0, 35.0, 43.0, 40.0, 48.0, 43.0, 37.0, 26.0, 27.0, 38.0, 38.0, 30.0, 28.0, 22.0, 25.0, 16.0, 16.0, 10.0, 9.0, 5.0, 14.0, 4.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.62939453125e-06, -7.379800081253052e-06, -7.1302056312561035e-06, -6.880611181259155e-06, -6.631016731262207e-06, -6.381422281265259e-06, -6.1318278312683105e-06, -5.882233381271362e-06, -5.632638931274414e-06, -5.383044481277466e-06, -5.133450031280518e-06, -4.883855581283569e-06, -4.634261131286621e-06, -4.384666681289673e-06, -4.135072231292725e-06, -3.885477781295776e-06, -3.635883331298828e-06, -3.38628888130188e-06, -3.1366944313049316e-06, -2.8870999813079834e-06, -2.637505531311035e-06, -2.387911081314087e-06, -2.1383166313171387e-06, -1.8887221813201904e-06, -1.6391277313232422e-06, -1.389533281326294e-06, -1.1399388313293457e-06, -8.903443813323975e-07, -6.407499313354492e-07, -3.91155481338501e-07, -1.4156103134155273e-07, 1.0803341865539551e-07, 3.5762786865234375e-07, 6.07222318649292e-07, 8.568167686462402e-07, 1.1064112186431885e-06, 1.3560056686401367e-06, 1.605600118637085e-06, 1.8551945686340332e-06, 2.1047890186309814e-06, 2.3543834686279297e-06, 2.603977918624878e-06, 2.853572368621826e-06, 3.1031668186187744e-06, 3.3527612686157227e-06, 3.602355718612671e-06, 3.851950168609619e-06, 4.101544618606567e-06, 4.351139068603516e-06, 4.600733518600464e-06, 4.850327968597412e-06, 5.09992241859436e-06, 5.349516868591309e-06, 5.599111318588257e-06, 5.848705768585205e-06, 6.098300218582153e-06, 6.3478946685791016e-06, 6.59748911857605e-06, 6.847083568572998e-06, 7.096678018569946e-06, 7.3462724685668945e-06, 7.595866918563843e-06, 7.845461368560791e-06, 8.09505581855774e-06, 8.344650268554688e-06]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 7.0, 12.0, 25.0, 26.0, 48.0, 73.0, 87.0, 151.0, 192.0, 254.0, 379.0, 634.0, 823.0, 1453.0, 1769.0, 3106.0, 4049.0, 7216.0, 9866.0, 17918.0, 25940.0, 49405.0, 75747.0, 161020.0, 283354.0, 629105.0, 1504193.0, 713200.0, 343076.0, 146892.0, 90347.0, 45061.0, 30699.0, 16317.0, 11582.0, 6486.0, 4829.0, 2728.0, 2031.0, 1232.0, 996.0, 577.0, 431.0, 310.0, 203.0, 156.0, 82.0, 74.0, 50.0, 20.0, 25.0, 15.0, 7.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.4483928680419922e-05, -1.4038756489753723e-05, -1.3593584299087524e-05, -1.3148412108421326e-05, -1.2703239917755127e-05, -1.2258067727088928e-05, -1.181289553642273e-05, -1.136772334575653e-05, -1.0922551155090332e-05, -1.0477378964424133e-05, -1.0032206773757935e-05, -9.587034583091736e-06, -9.141862392425537e-06, -8.696690201759338e-06, -8.25151801109314e-06, -7.806345820426941e-06, -7.361173629760742e-06, -6.9160014390945435e-06, -6.470829248428345e-06, -6.025657057762146e-06, -5.580484867095947e-06, -5.1353126764297485e-06, -4.69014048576355e-06, -4.244968295097351e-06, -3.7997961044311523e-06, -3.3546239137649536e-06, -2.909451723098755e-06, -2.464279532432556e-06, -2.0191073417663574e-06, -1.5739351511001587e-06, -1.12876296043396e-06, -6.835907697677612e-07, -2.384185791015625e-07, 2.0675361156463623e-07, 6.51925802230835e-07, 1.0970979928970337e-06, 1.5422701835632324e-06, 1.987442374229431e-06, 2.43261456489563e-06, 2.8777867555618286e-06, 3.3229589462280273e-06, 3.768131136894226e-06, 4.213303327560425e-06, 4.6584755182266235e-06, 5.103647708892822e-06, 5.548819899559021e-06, 5.99399209022522e-06, 6.4391642808914185e-06, 6.884336471557617e-06, 7.329508662223816e-06, 7.774680852890015e-06, 8.219853043556213e-06, 8.665025234222412e-06, 9.11019742488861e-06, 9.55536961555481e-06, 1.0000541806221008e-05, 1.0445713996887207e-05, 1.0890886187553406e-05, 1.1336058378219604e-05, 1.1781230568885803e-05, 1.2226402759552002e-05, 1.26715749502182e-05, 1.31167471408844e-05, 1.3561919331550598e-05, 1.4007091522216797e-05]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 2.0, 6.0, 3.0, 2.0, 10.0, 8.0, 10.0, 8.0, 17.0, 27.0, 23.0, 44.0, 68.0, 49.0, 75.0, 71.0, 132.0, 167.0, 139.0, 207.0, 165.0, 323.0, 233.0, 396.0, 339.0, 197.0, 259.0, 171.0, 220.0, 164.0, 92.0, 119.0, 55.0, 66.0, 46.0, 36.0, 32.0, 14.0, 24.0, 14.0, 7.0, 12.0, 8.0, 9.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.0067901611328125e-06, -4.852190613746643e-06, -4.697591066360474e-06, -4.542991518974304e-06, -4.388391971588135e-06, -4.233792424201965e-06, -4.079192876815796e-06, -3.9245933294296265e-06, -3.769993782043457e-06, -3.6153942346572876e-06, -3.460794687271118e-06, -3.3061951398849487e-06, -3.1515955924987793e-06, -2.99699604511261e-06, -2.8423964977264404e-06, -2.687796950340271e-06, -2.5331974029541016e-06, -2.378597855567932e-06, -2.2239983081817627e-06, -2.0693987607955933e-06, -1.914799213409424e-06, -1.7601996660232544e-06, -1.605600118637085e-06, -1.4510005712509155e-06, -1.296401023864746e-06, -1.1418014764785767e-06, -9.872019290924072e-07, -8.326023817062378e-07, -6.780028343200684e-07, -5.234032869338989e-07, -3.688037395477295e-07, -2.1420419216156006e-07, -5.960464477539063e-08, 9.499490261077881e-08, 2.4959444999694824e-07, 4.041939973831177e-07, 5.587935447692871e-07, 7.133930921554565e-07, 8.67992639541626e-07, 1.0225921869277954e-06, 1.1771917343139648e-06, 1.3317912817001343e-06, 1.4863908290863037e-06, 1.6409903764724731e-06, 1.7955899238586426e-06, 1.950189471244812e-06, 2.1047890186309814e-06, 2.259388566017151e-06, 2.4139881134033203e-06, 2.5685876607894897e-06, 2.723187208175659e-06, 2.8777867555618286e-06, 3.032386302947998e-06, 3.1869858503341675e-06, 3.341585397720337e-06, 3.4961849451065063e-06, 3.6507844924926758e-06, 3.8053840398788452e-06, 3.959983587265015e-06, 4.114583134651184e-06, 4.2691826820373535e-06, 4.423782229423523e-06, 4.578381776809692e-06, 4.732981324195862e-06, 4.887580871582031e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 5.0, 4.0, 9.0, 17.0, 15.0, 22.0, 26.0, 31.0, 54.0, 64.0, 74.0, 87.0, 122.0, 103.0, 93.0, 73.0, 43.0, 34.0, 27.0, 29.0, 16.0, 8.0, 10.0, 8.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3004626453039236e-05, -1.2517227332864422e-05, -1.2029828212689608e-05, -1.1542430002009496e-05, -1.1055030881834682e-05, -1.0567631761659868e-05, -1.0080233550979756e-05, -9.592834430804942e-06, -9.105435310630128e-06, -8.618036190455314e-06, -8.1306370702805e-06, -7.643238859600388e-06, -7.1558397394255735e-06, -6.6684406192507595e-06, -6.181041953823296e-06, -5.693643288395833e-06, -5.206244168221019e-06, -4.718845048046205e-06, -4.231446382618742e-06, -3.7440474898176035e-06, -3.256648597016465e-06, -2.7692497042153263e-06, -2.2818508114141878e-06, -1.7944519186130492e-06, -1.3070530258119106e-06, -8.196541330107721e-07, -3.322552402096335e-07, 1.551436525915051e-07, 6.425425453926437e-07, 1.1299414381937822e-06, 1.6173403309949208e-06, 2.1047392237960594e-06, 2.5921362976077944e-06, 3.079535190408933e-06, 3.5669340832100715e-06, 4.054332748637535e-06, 4.541731868812349e-06, 5.029130988987163e-06, 5.516529654414626e-06, 6.003928319842089e-06, 6.491327440016903e-06, 6.978726560191717e-06, 7.46612522561918e-06, 7.953523891046643e-06, 8.440923011221457e-06, 8.928322131396271e-06, 9.415720342076384e-06, 9.903119462251198e-06, 1.0390518582426012e-05, 1.0877917702600826e-05, 1.136531682277564e-05, 1.1852715033455752e-05, 1.2340114153630566e-05, 1.282751327380538e-05, 1.3314911484485492e-05, 1.3802310604660306e-05, 1.428970972483512e-05, 1.4777108845009934e-05, 1.5264507965184748e-05, 1.575190617586486e-05, 1.6239304386544973e-05, 1.672670441621449e-05, 1.72141026268946e-05, 1.7701502656564116e-05, 1.818890086724423e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 7.0, 4.0, 3.0, 3.0, 6.0, 6.0, 3.0, 11.0, 8.0, 10.0, 15.0, 13.0, 12.0, 28.0, 24.0, 24.0, 27.0, 21.0, 26.0, 32.0, 36.0, 24.0, 35.0, 25.0, 28.0, 35.0, 40.0, 40.0, 36.0, 40.0, 40.0, 33.0, 26.0, 21.0, 30.0, 31.0, 20.0, 19.0, 25.0, 21.0, 19.0, 15.0, 14.0, 10.0, 13.0, 10.0, 8.0, 8.0, 9.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-7.083381660777377e-06, -6.84416545482236e-06, -6.604949248867342e-06, -6.365733042912325e-06, -6.1265168369573075e-06, -5.88730063100229e-06, -5.648083970299922e-06, -5.4088677643449046e-06, -5.169651558389887e-06, -4.93043535243487e-06, -4.6912191464798525e-06, -4.452002940524835e-06, -4.212786734569818e-06, -3.9735705286148e-06, -3.7343540952861076e-06, -3.4951378893310903e-06, -3.2559219107497483e-06, -3.016705704794731e-06, -2.7774894988397136e-06, -2.5382732928846963e-06, -2.299057086929679e-06, -2.0598408809746616e-06, -1.8206244476459688e-06, -1.5814082416909514e-06, -1.342192035735934e-06, -1.1029758297809167e-06, -8.637595669824805e-07, -6.245433041840442e-07, -3.853270982290269e-07, -1.4611089227400953e-07, 9.310542736784555e-08, 3.323216333228629e-07, 5.715382940252312e-07, 8.107544999802485e-07, 1.0499707059352659e-06, 1.289187025577121e-06, 1.5284032315321383e-06, 1.7676194374871557e-06, 2.0068357571290107e-06, 2.246051963084028e-06, 2.4852681690390455e-06, 2.724484374994063e-06, 2.96370058094908e-06, 3.202917014277773e-06, 3.4421332202327903e-06, 3.6813494261878077e-06, 3.920565632142825e-06, 4.159781838097842e-06, 4.39899804405286e-06, 4.638214250007877e-06, 4.8774304559628945e-06, 5.116646661917912e-06, 5.355862867872929e-06, 5.5950790738279466e-06, 5.834295734530315e-06, 6.073511940485332e-06, 6.3127281464403495e-06, 6.551944352395367e-06, 6.791160558350384e-06, 7.030376764305402e-06, 7.269592970260419e-06, 7.508809176215436e-06, 7.748025382170454e-06, 7.987241588125471e-06, 8.226457794080488e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 9.0, 9.0, 14.0, 25.0, 41.0, 51.0, 89.0, 139.0, 142.0, 286.0, 434.0, 604.0, 1108.0, 1811.0, 2397.0, 4491.0, 7385.0, 10229.0, 19616.0, 27305.0, 54789.0, 98647.0, 145079.0, 235461.0, 188798.0, 96398.0, 64608.0, 36438.0, 18582.0, 13343.0, 6796.0, 5238.0, 3114.0, 1727.0, 1283.0, 757.0, 442.0, 307.0, 198.0, 106.0, 87.0, 56.0, 43.0, 23.0, 11.0, 16.0, 8.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2516975402832031e-05, -1.2121163308620453e-05, -1.1725351214408875e-05, -1.1329539120197296e-05, -1.0933727025985718e-05, -1.053791493177414e-05, -1.0142102837562561e-05, -9.746290743350983e-06, -9.350478649139404e-06, -8.954666554927826e-06, -8.558854460716248e-06, -8.16304236650467e-06, -7.76723027229309e-06, -7.3714181780815125e-06, -6.975606083869934e-06, -6.579793989658356e-06, -6.183981895446777e-06, -5.788169801235199e-06, -5.392357707023621e-06, -4.996545612812042e-06, -4.600733518600464e-06, -4.2049214243888855e-06, -3.809109330177307e-06, -3.4132972359657288e-06, -3.0174851417541504e-06, -2.621673047542572e-06, -2.2258609533309937e-06, -1.8300488591194153e-06, -1.434236764907837e-06, -1.0384246706962585e-06, -6.426125764846802e-07, -2.468004822731018e-07, 1.4901161193847656e-07, 5.448237061500549e-07, 9.406358003616333e-07, 1.3364478945732117e-06, 1.73225998878479e-06, 2.1280720829963684e-06, 2.5238841772079468e-06, 2.919696271419525e-06, 3.3155083656311035e-06, 3.711320459842682e-06, 4.10713255405426e-06, 4.502944648265839e-06, 4.898756742477417e-06, 5.294568836688995e-06, 5.690380930900574e-06, 6.086193025112152e-06, 6.4820051193237305e-06, 6.877817213535309e-06, 7.273629307746887e-06, 7.669441401958466e-06, 8.065253496170044e-06, 8.461065590381622e-06, 8.8568776845932e-06, 9.252689778804779e-06, 9.648501873016357e-06, 1.0044313967227936e-05, 1.0440126061439514e-05, 1.0835938155651093e-05, 1.1231750249862671e-05, 1.162756234407425e-05, 1.2023374438285828e-05, 1.2419186532497406e-05, 1.2814998626708984e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 6.0, 7.0, 5.0, 8.0, 7.0, 9.0, 10.0, 9.0, 14.0, 23.0, 20.0, 36.0, 23.0, 17.0, 26.0, 27.0, 29.0, 22.0, 26.0, 43.0, 44.0, 31.0, 36.0, 33.0, 47.0, 47.0, 46.0, 31.0, 26.0, 35.0, 19.0, 33.0, 21.0, 24.0, 14.0, 19.0, 12.0, 16.0, 21.0, 5.0, 11.0, 9.0, 15.0, 9.0, 5.0, 7.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-7.331371307373047e-06, -7.095746695995331e-06, -6.860122084617615e-06, -6.624497473239899e-06, -6.388872861862183e-06, -6.1532482504844666e-06, -5.9176236391067505e-06, -5.6819990277290344e-06, -5.446374416351318e-06, -5.210749804973602e-06, -4.975125193595886e-06, -4.73950058221817e-06, -4.503875970840454e-06, -4.268251359462738e-06, -4.032626748085022e-06, -3.797002136707306e-06, -3.56137752532959e-06, -3.3257529139518738e-06, -3.0901283025741577e-06, -2.8545036911964417e-06, -2.6188790798187256e-06, -2.3832544684410095e-06, -2.1476298570632935e-06, -1.9120052456855774e-06, -1.6763806343078613e-06, -1.4407560229301453e-06, -1.2051314115524292e-06, -9.695068001747131e-07, -7.338821887969971e-07, -4.98257577419281e-07, -2.6263296604156494e-07, -2.7008354663848877e-08, 2.086162567138672e-07, 4.4424086809158325e-07, 6.798654794692993e-07, 9.154900908470154e-07, 1.1511147022247314e-06, 1.3867393136024475e-06, 1.6223639249801636e-06, 1.8579885363578796e-06, 2.0936131477355957e-06, 2.3292377591133118e-06, 2.564862370491028e-06, 2.800486981868744e-06, 3.03611159324646e-06, 3.271736204624176e-06, 3.507360816001892e-06, 3.742985427379608e-06, 3.978610038757324e-06, 4.21423465013504e-06, 4.449859261512756e-06, 4.685483872890472e-06, 4.9211084842681885e-06, 5.1567330956459045e-06, 5.392357707023621e-06, 5.627982318401337e-06, 5.863606929779053e-06, 6.099231541156769e-06, 6.334856152534485e-06, 6.570480763912201e-06, 6.806105375289917e-06, 7.041729986667633e-06, 7.277354598045349e-06, 7.512979209423065e-06, 7.748603820800781e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 12.0, 16.0, 6.0, 21.0, 27.0, 40.0, 66.0, 98.0, 165.0, 240.0, 425.0, 632.0, 1118.0, 1708.0, 3545.0, 7321.0, 17710.0, 51995.0, 206307.0, 627110.0, 84056.0, 25506.0, 9585.0, 4916.0, 2467.0, 1369.0, 763.0, 475.0, 294.0, 183.0, 113.0, 87.0, 55.0, 45.0, 22.0, 17.0, 9.0, 8.0, 6.0, 2.0, 6.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2590160369873047e-05, -2.1948479115962982e-05, -2.1306797862052917e-05, -2.0665116608142853e-05, -2.0023435354232788e-05, -1.9381754100322723e-05, -1.874007284641266e-05, -1.8098391592502594e-05, -1.745671033859253e-05, -1.6815029084682465e-05, -1.61733478307724e-05, -1.5531666576862335e-05, -1.488998532295227e-05, -1.4248304069042206e-05, -1.3606622815132141e-05, -1.2964941561222076e-05, -1.2323260307312012e-05, -1.1681579053401947e-05, -1.1039897799491882e-05, -1.0398216545581818e-05, -9.756535291671753e-06, -9.114854037761688e-06, -8.473172783851624e-06, -7.831491529941559e-06, -7.189810276031494e-06, -6.5481290221214294e-06, -5.906447768211365e-06, -5.2647665143013e-06, -4.623085260391235e-06, -3.981404006481171e-06, -3.339722752571106e-06, -2.6980414986610413e-06, -2.0563602447509766e-06, -1.4146789908409119e-06, -7.729977369308472e-07, -1.3131648302078247e-07, 5.103647708892822e-07, 1.152046024799347e-06, 1.7937272787094116e-06, 2.4354085326194763e-06, 3.077089786529541e-06, 3.7187710404396057e-06, 4.36045229434967e-06, 5.002133548259735e-06, 5.6438148021698e-06, 6.2854960560798645e-06, 6.927177309989929e-06, 7.568858563899994e-06, 8.210539817810059e-06, 8.852221071720123e-06, 9.493902325630188e-06, 1.0135583579540253e-05, 1.0777264833450317e-05, 1.1418946087360382e-05, 1.2060627341270447e-05, 1.2702308595180511e-05, 1.3343989849090576e-05, 1.3985671103000641e-05, 1.4627352356910706e-05, 1.526903361082077e-05, 1.5910714864730835e-05, 1.65523961186409e-05, 1.7194077372550964e-05, 1.783575862646103e-05, 1.8477439880371094e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 13.0, 11.0, 12.0, 16.0, 17.0, 20.0, 28.0, 28.0, 28.0, 54.0, 56.0, 46.0, 87.0, 132.0, 105.0, 52.0, 65.0, 42.0, 37.0, 33.0, 17.0, 28.0, 7.0, 13.0, 12.0, 2.0, 6.0, 2.0, 6.0, 7.0, 0.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.410743713378906e-06, -4.257075488567352e-06, -4.103407263755798e-06, -3.949739038944244e-06, -3.7960708141326904e-06, -3.6424025893211365e-06, -3.4887343645095825e-06, -3.3350661396980286e-06, -3.1813979148864746e-06, -3.0277296900749207e-06, -2.8740614652633667e-06, -2.7203932404518127e-06, -2.566725015640259e-06, -2.413056790828705e-06, -2.259388566017151e-06, -2.105720341205597e-06, -1.952052116394043e-06, -1.798383891582489e-06, -1.644715666770935e-06, -1.491047441959381e-06, -1.3373792171478271e-06, -1.1837109923362732e-06, -1.0300427675247192e-06, -8.763745427131653e-07, -7.227063179016113e-07, -5.690380930900574e-07, -4.153698682785034e-07, -2.6170164346694946e-07, -1.0803341865539551e-07, 4.563480615615845e-08, 1.993030309677124e-07, 3.5297125577926636e-07, 5.066394805908203e-07, 6.603077054023743e-07, 8.139759302139282e-07, 9.676441550254822e-07, 1.1213123798370361e-06, 1.27498060464859e-06, 1.428648829460144e-06, 1.582317054271698e-06, 1.735985279083252e-06, 1.889653503894806e-06, 2.04332172870636e-06, 2.196989953517914e-06, 2.3506581783294678e-06, 2.5043264031410217e-06, 2.6579946279525757e-06, 2.8116628527641296e-06, 2.9653310775756836e-06, 3.1189993023872375e-06, 3.2726675271987915e-06, 3.4263357520103455e-06, 3.5800039768218994e-06, 3.7336722016334534e-06, 3.887340426445007e-06, 4.041008651256561e-06, 4.194676876068115e-06, 4.348345100879669e-06, 4.502013325691223e-06, 4.655681550502777e-06, 4.809349775314331e-06, 4.963018000125885e-06, 5.116686224937439e-06, 5.270354449748993e-06, 5.424022674560547e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 12.0, 14.0, 20.0, 43.0, 36.0, 52.0, 84.0, 158.0, 185.0, 417.0, 814.0, 1668.0, 2781.0, 6509.0, 17051.0, 62251.0, 863782.0, 62807.0, 17087.0, 6345.0, 2917.0, 1722.0, 574.0, 513.0, 256.0, 162.0, 84.0, 73.0, 36.0, 43.0, 24.0, 6.0, 8.0, 9.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5299530029296875e-06, -4.353001713752747e-06, -4.176050424575806e-06, -3.999099135398865e-06, -3.822147846221924e-06, -3.645196557044983e-06, -3.468245267868042e-06, -3.291293978691101e-06, -3.11434268951416e-06, -2.9373914003372192e-06, -2.7604401111602783e-06, -2.5834888219833374e-06, -2.4065375328063965e-06, -2.2295862436294556e-06, -2.0526349544525146e-06, -1.8756836652755737e-06, -1.6987323760986328e-06, -1.521781086921692e-06, -1.344829797744751e-06, -1.16787850856781e-06, -9.909272193908691e-07, -8.139759302139282e-07, -6.370246410369873e-07, -4.600733518600464e-07, -2.8312206268310547e-07, -1.0617077350616455e-07, 7.078051567077637e-08, 2.477318048477173e-07, 4.246830940246582e-07, 6.016343832015991e-07, 7.7858567237854e-07, 9.55536961555481e-07, 1.1324882507324219e-06, 1.3094395399093628e-06, 1.4863908290863037e-06, 1.6633421182632446e-06, 1.8402934074401855e-06, 2.0172446966171265e-06, 2.1941959857940674e-06, 2.3711472749710083e-06, 2.5480985641479492e-06, 2.72504985332489e-06, 2.902001142501831e-06, 3.078952431678772e-06, 3.255903720855713e-06, 3.432855010032654e-06, 3.6098062992095947e-06, 3.7867575883865356e-06, 3.9637088775634766e-06, 4.1406601667404175e-06, 4.317611455917358e-06, 4.494562745094299e-06, 4.67151403427124e-06, 4.848465323448181e-06, 5.025416612625122e-06, 5.202367901802063e-06, 5.379319190979004e-06, 5.556270480155945e-06, 5.733221769332886e-06, 5.910173058509827e-06, 6.087124347686768e-06, 6.2640756368637085e-06, 6.441026926040649e-06, 6.61797821521759e-06, 6.794929504394531e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 10.0, 0.0, 0.0, 10.0, 0.0, 0.0, 17.0, 0.0, 0.0, 24.0, 0.0, 0.0, 84.0, 0.0, 0.0, 116.0, 0.0, 506.0, 0.0, 0.0, 106.0, 0.0, 0.0, 76.0, 0.0, 0.0, 33.0, 0.0, 0.0, 13.0, 0.0, 0.0, 9.0, 0.0, 0.0, 10.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.152557373046875e-07, -6.94766640663147e-07, -6.742775440216064e-07, -6.537884473800659e-07, -6.332993507385254e-07, -6.128102540969849e-07, -5.923211574554443e-07, -5.718320608139038e-07, -5.513429641723633e-07, -5.308538675308228e-07, -5.103647708892822e-07, -4.898756742477417e-07, -4.6938657760620117e-07, -4.4889748096466064e-07, -4.284083843231201e-07, -4.079192876815796e-07, -3.8743019104003906e-07, -3.6694109439849854e-07, -3.46451997756958e-07, -3.259629011154175e-07, -3.0547380447387695e-07, -2.849847078323364e-07, -2.644956111907959e-07, -2.4400651454925537e-07, -2.2351741790771484e-07, -2.0302832126617432e-07, -1.825392246246338e-07, -1.6205012798309326e-07, -1.4156103134155273e-07, -1.210719347000122e-07, -1.0058283805847168e-07, -8.009374141693115e-08, -5.960464477539063e-08, -3.91155481338501e-08, -1.862645149230957e-08, 1.862645149230957e-09, 2.2351741790771484e-08, 4.284083843231201e-08, 6.332993507385254e-08, 8.381903171539307e-08, 1.043081283569336e-07, 1.2479722499847412e-07, 1.4528632164001465e-07, 1.6577541828155518e-07, 1.862645149230957e-07, 2.0675361156463623e-07, 2.2724270820617676e-07, 2.477318048477173e-07, 2.682209014892578e-07, 2.8870999813079834e-07, 3.0919909477233887e-07, 3.296881914138794e-07, 3.501772880554199e-07, 3.7066638469696045e-07, 3.91155481338501e-07, 4.116445779800415e-07, 4.3213367462158203e-07, 4.5262277126312256e-07, 4.731118679046631e-07, 4.936009645462036e-07, 5.140900611877441e-07, 5.345791578292847e-07, 5.550682544708252e-07, 5.755573511123657e-07, 5.960464477539062e-07]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 4.0, 10.0, 14.0, 17.0, 40.0, 26.0, 25.0, 62.0, 72.0, 78.0, 122.0, 353.0, 225.0, 360.0, 466.0, 627.0, 891.0, 3475.0, 3261.0, 5299.0, 8518.0, 14734.0, 25110.0, 51492.0, 710481.0, 107666.0, 51461.0, 25342.0, 14400.0, 8449.0, 8525.0, 1971.0, 1466.0, 957.0, 650.0, 492.0, 611.0, 198.0, 146.0, 113.0, 90.0, 59.0, 48.0, 57.0, 31.0, 18.0, 12.0, 8.0, 9.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-2.2649765014648438e-06, -2.1960586309432983e-06, -2.127140760421753e-06, -2.0582228899002075e-06, -1.989305019378662e-06, -1.9203871488571167e-06, -1.8514692783355713e-06, -1.7825514078140259e-06, -1.7136335372924805e-06, -1.644715666770935e-06, -1.5757977962493896e-06, -1.5068799257278442e-06, -1.4379620552062988e-06, -1.3690441846847534e-06, -1.300126314163208e-06, -1.2312084436416626e-06, -1.1622905731201172e-06, -1.0933727025985718e-06, -1.0244548320770264e-06, -9.55536961555481e-07, -8.866190910339355e-07, -8.177012205123901e-07, -7.487833499908447e-07, -6.798654794692993e-07, -6.109476089477539e-07, -5.420297384262085e-07, -4.731118679046631e-07, -4.041939973831177e-07, -3.3527612686157227e-07, -2.6635825634002686e-07, -1.9744038581848145e-07, -1.2852251529693604e-07, -5.960464477539063e-08, 9.313225746154785e-09, 7.82310962677002e-08, 1.471489667892456e-07, 2.1606683731079102e-07, 2.849847078323364e-07, 3.5390257835388184e-07, 4.2282044887542725e-07, 4.917383193969727e-07, 5.606561899185181e-07, 6.295740604400635e-07, 6.984919309616089e-07, 7.674098014831543e-07, 8.363276720046997e-07, 9.052455425262451e-07, 9.741634130477905e-07, 1.043081283569336e-06, 1.1119991540908813e-06, 1.1809170246124268e-06, 1.2498348951339722e-06, 1.3187527656555176e-06, 1.387670636177063e-06, 1.4565885066986084e-06, 1.5255063772201538e-06, 1.5944242477416992e-06, 1.6633421182632446e-06, 1.73225998878479e-06, 1.8011778593063354e-06, 1.8700957298278809e-06, 1.9390136003494263e-06, 2.0079314708709717e-06, 2.076849341392517e-06, 2.1457672119140625e-06]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 0.0, 11.0, 0.0, 0.0, 10.0, 0.0, 0.0, 18.0, 0.0, 0.0, 34.0, 0.0, 0.0, 77.0, 0.0, 118.0, 0.0, 0.0, 477.0, 0.0, 0.0, 118.0, 0.0, 0.0, 65.0, 0.0, 27.0, 0.0, 0.0, 24.0, 0.0, 0.0, 18.0, 0.0, 0.0, 8.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.342306733131409e-07, -6.128102540969849e-07, -5.913898348808289e-07, -5.699694156646729e-07, -5.485489964485168e-07, -5.271285772323608e-07, -5.057081580162048e-07, -4.842877388000488e-07, -4.628673195838928e-07, -4.414469003677368e-07, -4.200264811515808e-07, -3.986060619354248e-07, -3.771856427192688e-07, -3.557652235031128e-07, -3.343448042869568e-07, -3.129243850708008e-07, -2.915039658546448e-07, -2.7008354663848877e-07, -2.4866312742233276e-07, -2.2724270820617676e-07, -2.0582228899002075e-07, -1.8440186977386475e-07, -1.6298145055770874e-07, -1.4156103134155273e-07, -1.2014061212539673e-07, -9.872019290924072e-08, -7.729977369308472e-08, -5.587935447692871e-08, -3.4458935260772705e-08, -1.30385160446167e-08, 8.381903171539307e-09, 2.9802322387695312e-08, 5.122274160385132e-08, 7.264316082000732e-08, 9.406358003616333e-08, 1.1548399925231934e-07, 1.3690441846847534e-07, 1.5832483768463135e-07, 1.7974525690078735e-07, 2.0116567611694336e-07, 2.2258609533309937e-07, 2.4400651454925537e-07, 2.654269337654114e-07, 2.868473529815674e-07, 3.082677721977234e-07, 3.296881914138794e-07, 3.511086106300354e-07, 3.725290298461914e-07, 3.939494490623474e-07, 4.153698682785034e-07, 4.367902874946594e-07, 4.5821070671081543e-07, 4.796311259269714e-07, 5.010515451431274e-07, 5.224719643592834e-07, 5.438923835754395e-07, 5.653128027915955e-07, 5.867332220077515e-07, 6.081536412239075e-07, 6.295740604400635e-07, 6.509944796562195e-07, 6.724148988723755e-07, 6.938353180885315e-07, 7.152557373046875e-07]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 3.0, 8.0, 3.0, 9.0, 13.0, 15.0, 22.0, 31.0, 44.0, 40.0, 74.0, 96.0, 124.0, 128.0, 97.0, 77.0, 49.0, 45.0, 31.0, 20.0, 18.0, 8.0, 8.0, 11.0, 10.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2005237294943072e-05, -1.1527798051247373e-05, -1.1050358807551675e-05, -1.0572919563855976e-05, -1.0095480320160277e-05, -9.618041076464579e-06, -9.140602742263582e-06, -8.663163498567883e-06, -8.185724254872184e-06, -7.708285011176486e-06, -7.230845767480787e-06, -6.753406978532439e-06, -6.27596773483674e-06, -5.798528491141042e-06, -5.321089702192694e-06, -4.843650458496995e-06, -4.366211214801297e-06, -3.888771971105598e-06, -3.4113329547835747e-06, -2.9338939384615514e-06, -2.4564546947658528e-06, -1.979015451070154e-06, -1.5015764347481309e-06, -1.0241374184261076e-06, -5.466981747304089e-07, -6.925904472154798e-08, 4.08180085287313e-07, 8.856192152961739e-07, 1.3630583453050349e-06, 1.8404975890007336e-06, 2.317936605322757e-06, 2.79537562164478e-06, 3.2728166843298823e-06, 3.750255928025581e-06, 4.22769517172128e-06, 4.705133960669627e-06, 5.182573204365326e-06, 5.660012448061025e-06, 6.1374512370093726e-06, 6.614890480705071e-06, 7.09232972440077e-06, 7.569768968096469e-06, 8.047208211792167e-06, 8.524647455487866e-06, 9.002085789688863e-06, 9.479525033384562e-06, 9.95696427708026e-06, 1.0434403520775959e-05, 1.0911842764471658e-05, 1.1389282008167356e-05, 1.1866721251863055e-05, 1.2344160495558754e-05, 1.2821599739254452e-05, 1.3299038982950151e-05, 1.3776477317151148e-05, 1.4253916560846847e-05, 1.4731355804542545e-05, 1.5208795048238244e-05, 1.568623338243924e-05, 1.616367262613494e-05, 1.6641111869830638e-05, 1.7118551113526337e-05, 1.7595990357222036e-05, 1.8073429600917734e-05, 1.8550868844613433e-05]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 4.0, 8.0, 6.0, 3.0, 5.0, 2.0, 4.0, 6.0, 5.0, 13.0, 8.0, 14.0, 11.0, 13.0, 14.0, 24.0, 26.0, 30.0, 19.0, 24.0, 26.0, 38.0, 25.0, 37.0, 29.0, 24.0, 27.0, 46.0, 30.0, 37.0, 48.0, 39.0, 33.0, 31.0, 28.0, 20.0, 32.0, 25.0, 28.0, 16.0, 22.0, 18.0, 20.0, 19.0, 7.0, 14.0, 12.0, 7.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-6.648672297160374e-06, -6.422322258003987e-06, -6.195972218847601e-06, -5.969622179691214e-06, -5.7432721405348275e-06, -5.516922101378441e-06, -5.290572062222054e-06, -5.064222023065668e-06, -4.837871983909281e-06, -4.611521944752894e-06, -4.385171905596508e-06, -4.158821866440121e-06, -3.9324718272837345e-06, -3.706121788127348e-06, -3.479771748970961e-06, -3.2534217098145746e-06, -3.027071670658188e-06, -2.8007216315018013e-06, -2.5743715923454147e-06, -2.348021553189028e-06, -2.1216715140326414e-06, -1.8953214748762548e-06, -1.6689714357198682e-06, -1.4426213965634815e-06, -1.216271357407095e-06, -9.899213182507083e-07, -7.635712790943217e-07, -5.37221239937935e-07, -3.108712007815484e-07, -8.452116162516177e-08, 1.4182887753122486e-07, 3.681789166876115e-07, 5.945285010966472e-07, 8.208785402530339e-07, 1.0472285794094205e-06, 1.2735786185658071e-06, 1.4999286577221937e-06, 1.7262786968785804e-06, 1.952628736034967e-06, 2.1789787751913536e-06, 2.4053288143477403e-06, 2.631678853504127e-06, 2.8580288926605135e-06, 3.0843789318169e-06, 3.3107289709732868e-06, 3.5370790101296734e-06, 3.76342904928606e-06, 3.989779088442447e-06, 4.216129127598833e-06, 4.44247916675522e-06, 4.6688292059116066e-06, 4.895179245067993e-06, 5.12152928422438e-06, 5.3478793233807664e-06, 5.574229362537153e-06, 5.80057940169354e-06, 6.026929440849926e-06, 6.253279480006313e-06, 6.4796295191627e-06, 6.705979558319086e-06, 6.932329597475473e-06, 7.1586796366318595e-06, 7.385029675788246e-06, 7.611379714944633e-06, 7.83772975410102e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 6.0, 4.0, 5.0, 7.0, 9.0, 12.0, 17.0, 23.0, 37.0, 59.0, 77.0, 115.0, 182.0, 222.0, 335.0, 362.0, 657.0, 745.0, 1284.0, 1813.0, 2259.0, 3799.0, 4707.0, 8047.0, 12480.0, 17087.0, 31894.0, 47359.0, 100602.0, 169043.0, 272479.0, 170874.0, 76940.0, 48606.0, 25040.0, 17871.0, 10981.0, 6589.0, 4938.0, 3090.0, 2358.0, 1743.0, 1031.0, 841.0, 523.0, 418.0, 292.0, 191.0, 153.0, 88.0, 81.0, 52.0, 40.0, 33.0, 21.0, 20.0, 11.0, 6.0, 5.0, 4.0, 1.0, 1.0], "bins": [-1.4662742614746094e-05, -1.4210119843482971e-05, -1.3757497072219849e-05, -1.3304874300956726e-05, -1.2852251529693604e-05, -1.2399628758430481e-05, -1.1947005987167358e-05, -1.1494383215904236e-05, -1.1041760444641113e-05, -1.058913767337799e-05, -1.0136514902114868e-05, -9.683892130851746e-06, -9.231269359588623e-06, -8.7786465883255e-06, -8.326023817062378e-06, -7.873401045799255e-06, -7.420778274536133e-06, -6.96815550327301e-06, -6.515532732009888e-06, -6.062909960746765e-06, -5.610287189483643e-06, -5.15766441822052e-06, -4.7050416469573975e-06, -4.252418875694275e-06, -3.7997961044311523e-06, -3.3471733331680298e-06, -2.8945505619049072e-06, -2.4419277906417847e-06, -1.989305019378662e-06, -1.5366822481155396e-06, -1.084059476852417e-06, -6.314367055892944e-07, -1.7881393432617188e-07, 2.738088369369507e-07, 7.264316082000732e-07, 1.1790543794631958e-06, 1.6316771507263184e-06, 2.084299921989441e-06, 2.5369226932525635e-06, 2.989545464515686e-06, 3.4421682357788086e-06, 3.894791007041931e-06, 4.347413778305054e-06, 4.800036549568176e-06, 5.252659320831299e-06, 5.705282092094421e-06, 6.157904863357544e-06, 6.6105276346206665e-06, 7.063150405883789e-06, 7.515773177146912e-06, 7.968395948410034e-06, 8.421018719673157e-06, 8.87364149093628e-06, 9.326264262199402e-06, 9.778887033462524e-06, 1.0231509804725647e-05, 1.068413257598877e-05, 1.1136755347251892e-05, 1.1589378118515015e-05, 1.2042000889778137e-05, 1.249462366104126e-05, 1.2947246432304382e-05, 1.3399869203567505e-05, 1.3852491974830627e-05, 1.430511474609375e-05]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 3.0, 2.0, 7.0, 9.0, 3.0, 5.0, 12.0, 14.0, 13.0, 19.0, 29.0, 18.0, 36.0, 28.0, 34.0, 25.0, 32.0, 35.0, 38.0, 47.0, 39.0, 50.0, 43.0, 25.0, 49.0, 46.0, 37.0, 44.0, 34.0, 22.0, 26.0, 20.0, 24.0, 21.0, 19.0, 17.0, 11.0, 15.0, 14.0, 9.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.973743438720703e-06, -6.7427754402160645e-06, -6.511807441711426e-06, -6.280839443206787e-06, -6.0498714447021484e-06, -5.81890344619751e-06, -5.587935447692871e-06, -5.356967449188232e-06, -5.125999450683594e-06, -4.895031452178955e-06, -4.664063453674316e-06, -4.433095455169678e-06, -4.202127456665039e-06, -3.9711594581604e-06, -3.7401914596557617e-06, -3.509223461151123e-06, -3.2782554626464844e-06, -3.0472874641418457e-06, -2.816319465637207e-06, -2.5853514671325684e-06, -2.3543834686279297e-06, -2.123415470123291e-06, -1.8924474716186523e-06, -1.6614794731140137e-06, -1.430511474609375e-06, -1.1995434761047363e-06, -9.685754776000977e-07, -7.37607479095459e-07, -5.066394805908203e-07, -2.7567148208618164e-07, -4.470348358154297e-08, 1.862645149230957e-07, 4.172325134277344e-07, 6.48200511932373e-07, 8.791685104370117e-07, 1.1101365089416504e-06, 1.341104507446289e-06, 1.5720725059509277e-06, 1.8030405044555664e-06, 2.034008502960205e-06, 2.2649765014648438e-06, 2.4959444999694824e-06, 2.726912498474121e-06, 2.9578804969787598e-06, 3.1888484954833984e-06, 3.419816493988037e-06, 3.6507844924926758e-06, 3.8817524909973145e-06, 4.112720489501953e-06, 4.343688488006592e-06, 4.5746564865112305e-06, 4.805624485015869e-06, 5.036592483520508e-06, 5.2675604820251465e-06, 5.498528480529785e-06, 5.729496479034424e-06, 5.9604644775390625e-06, 6.191432476043701e-06, 6.42240047454834e-06, 6.6533684730529785e-06, 6.884336471557617e-06, 7.115304470062256e-06, 7.3462724685668945e-06, 7.577240467071533e-06, 7.808208465576172e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 10.0, 19.0, 23.0, 36.0, 46.0, 72.0, 136.0, 183.0, 272.0, 407.0, 572.0, 881.0, 1496.0, 1891.0, 3191.0, 5232.0, 6800.0, 12726.0, 21308.0, 31627.0, 65459.0, 131836.0, 221101.0, 259014.0, 132033.0, 59054.0, 37822.0, 21181.0, 11374.0, 8311.0, 5182.0, 2961.0, 2296.0, 1371.0, 784.0, 636.0, 403.0, 235.0, 194.0, 154.0, 77.0, 65.0, 33.0, 20.0, 14.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4185905456542969e-05, -1.3728626072406769e-05, -1.3271346688270569e-05, -1.2814067304134369e-05, -1.2356787919998169e-05, -1.1899508535861969e-05, -1.1442229151725769e-05, -1.0984949767589569e-05, -1.0527670383453369e-05, -1.007039099931717e-05, -9.61311161518097e-06, -9.15583223104477e-06, -8.69855284690857e-06, -8.24127346277237e-06, -7.78399407863617e-06, -7.3267146944999695e-06, -6.8694353103637695e-06, -6.41215592622757e-06, -5.95487654209137e-06, -5.49759715795517e-06, -5.04031777381897e-06, -4.58303838968277e-06, -4.12575900554657e-06, -3.66847962141037e-06, -3.21120023727417e-06, -2.75392085313797e-06, -2.29664146900177e-06, -1.83936208486557e-06, -1.3820827007293701e-06, -9.248033165931702e-07, -4.675239324569702e-07, -1.0244548320770264e-08, 4.470348358154297e-07, 9.043142199516296e-07, 1.3615936040878296e-06, 1.8188729882240295e-06, 2.2761523723602295e-06, 2.7334317564964294e-06, 3.1907111406326294e-06, 3.6479905247688293e-06, 4.105269908905029e-06, 4.562549293041229e-06, 5.019828677177429e-06, 5.477108061313629e-06, 5.934387445449829e-06, 6.391666829586029e-06, 6.848946213722229e-06, 7.306225597858429e-06, 7.763504981994629e-06, 8.220784366130829e-06, 8.678063750267029e-06, 9.135343134403229e-06, 9.592622518539429e-06, 1.0049901902675629e-05, 1.0507181286811829e-05, 1.0964460670948029e-05, 1.1421740055084229e-05, 1.1879019439220428e-05, 1.2336298823356628e-05, 1.2793578207492828e-05, 1.3250857591629028e-05, 1.3708136975765228e-05, 1.4165416359901428e-05, 1.4622695744037628e-05, 1.5079975128173828e-05]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 6.0, 6.0, 3.0, 2.0, 4.0, 5.0, 13.0, 15.0, 3.0, 17.0, 20.0, 21.0, 16.0, 32.0, 28.0, 39.0, 30.0, 50.0, 29.0, 45.0, 41.0, 42.0, 30.0, 34.0, 50.0, 28.0, 51.0, 30.0, 47.0, 22.0, 41.0, 22.0, 21.0, 28.0, 30.0, 13.0, 20.0, 10.0, 20.0, 13.0, 3.0, 8.0, 4.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.5299530029296875e-06, -4.382804036140442e-06, -4.235655069351196e-06, -4.088506102561951e-06, -3.941357135772705e-06, -3.7942081689834595e-06, -3.647059202194214e-06, -3.4999102354049683e-06, -3.3527612686157227e-06, -3.205612301826477e-06, -3.0584633350372314e-06, -2.911314368247986e-06, -2.7641654014587402e-06, -2.6170164346694946e-06, -2.469867467880249e-06, -2.3227185010910034e-06, -2.175569534301758e-06, -2.028420567512512e-06, -1.8812716007232666e-06, -1.734122633934021e-06, -1.5869736671447754e-06, -1.4398247003555298e-06, -1.2926757335662842e-06, -1.1455267667770386e-06, -9.98377799987793e-07, -8.512288331985474e-07, -7.040798664093018e-07, -5.569308996200562e-07, -4.0978193283081055e-07, -2.6263296604156494e-07, -1.1548399925231934e-07, 3.166496753692627e-08, 1.7881393432617188e-07, 3.259629011154175e-07, 4.731118679046631e-07, 6.202608346939087e-07, 7.674098014831543e-07, 9.145587682723999e-07, 1.0617077350616455e-06, 1.2088567018508911e-06, 1.3560056686401367e-06, 1.5031546354293823e-06, 1.650303602218628e-06, 1.7974525690078735e-06, 1.944601535797119e-06, 2.0917505025863647e-06, 2.2388994693756104e-06, 2.386048436164856e-06, 2.5331974029541016e-06, 2.680346369743347e-06, 2.8274953365325928e-06, 2.9746443033218384e-06, 3.121793270111084e-06, 3.2689422369003296e-06, 3.416091203689575e-06, 3.563240170478821e-06, 3.7103891372680664e-06, 3.857538104057312e-06, 4.004687070846558e-06, 4.151836037635803e-06, 4.298985004425049e-06, 4.4461339712142944e-06, 4.59328293800354e-06, 4.740431904792786e-06, 4.887580871582031e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 10.0, 21.0, 33.0, 22.0, 41.0, 74.0, 89.0, 141.0, 187.0, 275.0, 412.0, 583.0, 846.0, 1242.0, 1699.0, 3446.0, 4039.0, 5995.0, 9383.0, 16970.0, 38302.0, 134167.0, 720431.0, 55934.0, 21151.0, 11324.0, 6944.0, 4380.0, 4069.0, 1923.0, 1333.0, 935.0, 686.0, 434.0, 336.0, 211.0, 144.0, 105.0, 78.0, 58.0, 26.0, 38.0, 21.0, 11.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-5.900859832763672e-06, -5.717389285564423e-06, -5.533918738365173e-06, -5.350448191165924e-06, -5.166977643966675e-06, -4.9835070967674255e-06, -4.800036549568176e-06, -4.616566002368927e-06, -4.433095455169678e-06, -4.2496249079704285e-06, -4.066154360771179e-06, -3.88268381357193e-06, -3.6992132663726807e-06, -3.5157427191734314e-06, -3.332272171974182e-06, -3.148801624774933e-06, -2.9653310775756836e-06, -2.7818605303764343e-06, -2.598389983177185e-06, -2.414919435977936e-06, -2.2314488887786865e-06, -2.0479783415794373e-06, -1.864507794380188e-06, -1.6810372471809387e-06, -1.4975666999816895e-06, -1.3140961527824402e-06, -1.130625605583191e-06, -9.471550583839417e-07, -7.636845111846924e-07, -5.802139639854431e-07, -3.9674341678619385e-07, -2.1327286958694458e-07, -2.9802322387695312e-08, 1.5366822481155396e-07, 3.371387720108032e-07, 5.206093192100525e-07, 7.040798664093018e-07, 8.87550413608551e-07, 1.0710209608078003e-06, 1.2544915080070496e-06, 1.4379620552062988e-06, 1.621432602405548e-06, 1.8049031496047974e-06, 1.9883736968040466e-06, 2.171844244003296e-06, 2.355314791202545e-06, 2.5387853384017944e-06, 2.7222558856010437e-06, 2.905726432800293e-06, 3.0891969799995422e-06, 3.2726675271987915e-06, 3.4561380743980408e-06, 3.63960862159729e-06, 3.823079168796539e-06, 4.0065497159957886e-06, 4.190020263195038e-06, 4.373490810394287e-06, 4.556961357593536e-06, 4.740431904792786e-06, 4.923902451992035e-06, 5.107372999191284e-06, 5.2908435463905334e-06, 5.474314093589783e-06, 5.657784640789032e-06, 5.841255187988281e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 845.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 59.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 12.0, 7.0, 15.0, 14.0, 29.0, 39.0, 35.0, 64.0, 66.0, 131.0, 141.0, 199.0, 276.0, 455.0, 529.0, 694.0, 1051.0, 1975.0, 2281.0, 3227.0, 4689.0, 9530.0, 13046.0, 23829.0, 60461.0, 764878.0, 98552.0, 23746.0, 13070.0, 8232.0, 6154.0, 3208.0, 2224.0, 1525.0, 1350.0, 770.0, 538.0, 412.0, 335.0, 185.0, 146.0, 97.0, 82.0, 77.0, 41.0, 43.0, 28.0, 14.0, 18.0, 11.0, 10.0, 6.0, 4.0, 2.0, 1.0, 5.0], "bins": [-8.463859558105469e-06, -8.211471140384674e-06, -7.95908272266388e-06, -7.706694304943085e-06, -7.45430588722229e-06, -7.201917469501495e-06, -6.949529051780701e-06, -6.697140634059906e-06, -6.444752216339111e-06, -6.192363798618317e-06, -5.939975380897522e-06, -5.687586963176727e-06, -5.435198545455933e-06, -5.182810127735138e-06, -4.930421710014343e-06, -4.678033292293549e-06, -4.425644874572754e-06, -4.173256456851959e-06, -3.9208680391311646e-06, -3.66847962141037e-06, -3.416091203689575e-06, -3.1637027859687805e-06, -2.911314368247986e-06, -2.658925950527191e-06, -2.4065375328063965e-06, -2.154149115085602e-06, -1.9017606973648071e-06, -1.6493722796440125e-06, -1.3969838619232178e-06, -1.144595444202423e-06, -8.922070264816284e-07, -6.398186087608337e-07, -3.8743019104003906e-07, -1.3504177331924438e-07, 1.1734664440155029e-07, 3.6973506212234497e-07, 6.221234798431396e-07, 8.745118975639343e-07, 1.126900315284729e-06, 1.3792887330055237e-06, 1.6316771507263184e-06, 1.884065568447113e-06, 2.1364539861679077e-06, 2.3888424038887024e-06, 2.641230821609497e-06, 2.8936192393302917e-06, 3.1460076570510864e-06, 3.398396074771881e-06, 3.6507844924926758e-06, 3.9031729102134705e-06, 4.155561327934265e-06, 4.40794974565506e-06, 4.6603381633758545e-06, 4.912726581096649e-06, 5.165114998817444e-06, 5.4175034165382385e-06, 5.669891834259033e-06, 5.922280251979828e-06, 6.1746686697006226e-06, 6.427057087421417e-06, 6.679445505142212e-06, 6.931833922863007e-06, 7.184222340583801e-06, 7.436610758304596e-06, 7.68899917602539e-06]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 7.0, 4.0, 4.0, 8.0, 7.0, 7.0, 16.0, 5.0, 11.0, 29.0, 19.0, 37.0, 574.0, 70.0, 43.0, 26.0, 32.0, 13.0, 7.0, 19.0, 7.0, 12.0, 7.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.2649765014648438e-06, -2.1867454051971436e-06, -2.1085143089294434e-06, -2.030283212661743e-06, -1.952052116394043e-06, -1.8738210201263428e-06, -1.7955899238586426e-06, -1.7173588275909424e-06, -1.6391277313232422e-06, -1.560896635055542e-06, -1.4826655387878418e-06, -1.4044344425201416e-06, -1.3262033462524414e-06, -1.2479722499847412e-06, -1.169741153717041e-06, -1.0915100574493408e-06, -1.0132789611816406e-06, -9.350478649139404e-07, -8.568167686462402e-07, -7.7858567237854e-07, -7.003545761108398e-07, -6.221234798431396e-07, -5.438923835754395e-07, -4.6566128730773926e-07, -3.8743019104003906e-07, -3.0919909477233887e-07, -2.3096799850463867e-07, -1.5273690223693848e-07, -7.450580596923828e-08, 3.725290298461914e-09, 8.195638656616211e-08, 1.601874828338623e-07, 2.384185791015625e-07, 3.166496753692627e-07, 3.948807716369629e-07, 4.731118679046631e-07, 5.513429641723633e-07, 6.295740604400635e-07, 7.078051567077637e-07, 7.860362529754639e-07, 8.642673492431641e-07, 9.424984455108643e-07, 1.0207295417785645e-06, 1.0989606380462646e-06, 1.1771917343139648e-06, 1.255422830581665e-06, 1.3336539268493652e-06, 1.4118850231170654e-06, 1.4901161193847656e-06, 1.5683472156524658e-06, 1.646578311920166e-06, 1.7248094081878662e-06, 1.8030405044555664e-06, 1.8812716007232666e-06, 1.959502696990967e-06, 2.037733793258667e-06, 2.115964889526367e-06, 2.1941959857940674e-06, 2.2724270820617676e-06, 2.3506581783294678e-06, 2.428889274597168e-06, 2.507120370864868e-06, 2.5853514671325684e-06, 2.6635825634002686e-06, 2.7418136596679688e-06]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 7.0, 9.0, 14.0, 13.0, 26.0, 30.0, 40.0, 66.0, 79.0, 104.0, 124.0, 122.0, 91.0, 73.0, 47.0, 45.0, 28.0, 21.0, 12.0, 9.0, 5.0, 10.0, 6.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.109410459321225e-05, -1.0663046850822866e-05, -1.0231989108433481e-05, -9.800931366044097e-06, -9.369873623654712e-06, -8.938815881265327e-06, -8.507758138875943e-06, -8.076700396486558e-06, -7.645642654097173e-06, -7.214584911707789e-06, -6.783527169318404e-06, -6.352469426929019e-06, -5.921411684539635e-06, -5.49035394215025e-06, -5.059296199760865e-06, -4.628238457371481e-06, -4.197180714982096e-06, -3.7661229725927114e-06, -3.335065230203327e-06, -2.904007487813942e-06, -2.4729497454245575e-06, -2.041892003035173e-06, -1.6108342606457882e-06, -1.1797765182564035e-06, -7.487187758670188e-07, -3.176610334776342e-07, 1.1339670891175047e-07, 5.444544513011351e-07, 9.755121936905198e-07, 1.4065699360799044e-06, 1.837627678469289e-06, 2.2686854208586738e-06, 2.69974407274276e-06, 3.130801815132145e-06, 3.5618595575215295e-06, 3.992917299910914e-06, 4.423975042300299e-06, 4.8550327846896835e-06, 5.286090527079068e-06, 5.717148269468453e-06, 6.1482060118578374e-06, 6.579263754247222e-06, 7.010321496636607e-06, 7.441379239025991e-06, 7.872436981415376e-06, 8.30349472380476e-06, 8.734552466194145e-06, 9.16561020858353e-06, 9.596667950972915e-06, 1.00277256933623e-05, 1.0458783435751684e-05, 1.0889841178141069e-05, 1.1320898920530453e-05, 1.1751956662919838e-05, 1.2183014405309223e-05, 1.2614072147698607e-05, 1.3045129890087992e-05, 1.3476187632477377e-05, 1.3907245374866761e-05, 1.4338303117256146e-05, 1.476936085964553e-05, 1.5200418602034915e-05, 1.56314763444243e-05, 1.6062534996308386e-05, 1.649359182920307e-05]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 3.0, 7.0, 14.0, 6.0, 7.0, 11.0, 9.0, 16.0, 24.0, 26.0, 26.0, 37.0, 28.0, 26.0, 28.0, 43.0, 36.0, 35.0, 37.0, 35.0, 49.0, 38.0, 37.0, 34.0, 40.0, 45.0, 29.0, 29.0, 35.0, 23.0, 32.0, 25.0, 18.0, 21.0, 14.0, 11.0, 14.0, 14.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.045482107059797e-06, -6.80291623211815e-06, -6.560350357176503e-06, -6.317784936982207e-06, -6.07521906204056e-06, -5.832653187098913e-06, -5.590087312157266e-06, -5.347521437215619e-06, -5.104955562273972e-06, -4.862389687332325e-06, -4.619823812390678e-06, -4.377257937449031e-06, -4.134692517254734e-06, -3.892126642313087e-06, -3.6495607673714403e-06, -3.4069948924297933e-06, -3.164429472235497e-06, -2.92186359729385e-06, -2.6792979497258784e-06, -2.4367320747842314e-06, -2.1941664272162598e-06, -1.9516005522746127e-06, -1.7090346773329657e-06, -1.4664689160781563e-06, -1.223903154823347e-06, -9.813373935685377e-07, -7.387715754703095e-07, -4.962057573720813e-07, -2.5363999611727195e-07, -1.1074234862462617e-08, 2.3149164007918444e-07, 4.7405740133399377e-07, 7.166227078414522e-07, 9.591884690962615e-07, 1.2017542303510709e-06, 1.444320105292718e-06, 1.6868858665475273e-06, 1.9294516278023366e-06, 2.1720175027439836e-06, 2.4145833776856307e-06, 2.6571490252536023e-06, 2.8997149001952494e-06, 3.142280547763221e-06, 3.384846422704868e-06, 3.627412297646515e-06, 3.869978172588162e-06, 4.112544047529809e-06, 4.355109467724105e-06, 4.597675342665752e-06, 4.8402412176073994e-06, 5.0828070925490465e-06, 5.325372512743343e-06, 5.56793838768499e-06, 5.810504262626637e-06, 6.053070137568284e-06, 6.295636012509931e-06, 6.538201887451578e-06, 6.780767762393225e-06, 7.023333637334872e-06, 7.265899512276519e-06, 7.508464932470815e-06, 7.751030352665111e-06, 7.993596227606758e-06, 8.236162102548406e-06, 8.478727977490053e-06]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 6.0, 7.0, 9.0, 18.0, 28.0, 36.0, 67.0, 106.0, 136.0, 217.0, 315.0, 310.0, 556.0, 770.0, 1196.0, 1715.0, 2445.0, 3761.0, 5513.0, 8698.0, 13780.0, 22187.0, 37357.0, 66031.0, 124445.0, 261807.0, 721993.0, 1352812.0, 936899.0, 309103.0, 140609.0, 74275.0, 41325.0, 24167.0, 14940.0, 9126.0, 5912.0, 3884.0, 2522.0, 1647.0, 1157.0, 722.0, 548.0, 282.0, 277.0, 181.0, 132.0, 87.0, 66.0, 43.0, 21.0, 20.0, 20.0, 4.0, 2.0, 2.0, 6.0, 0.0, 0.0, 1.0], "bins": [-9.298324584960938e-06, -9.004026651382446e-06, -8.709728717803955e-06, -8.415430784225464e-06, -8.121132850646973e-06, -7.826834917068481e-06, -7.53253698348999e-06, -7.238239049911499e-06, -6.943941116333008e-06, -6.649643182754517e-06, -6.355345249176025e-06, -6.061047315597534e-06, -5.766749382019043e-06, -5.472451448440552e-06, -5.1781535148620605e-06, -4.883855581283569e-06, -4.589557647705078e-06, -4.295259714126587e-06, -4.000961780548096e-06, -3.7066638469696045e-06, -3.4123659133911133e-06, -3.118067979812622e-06, -2.823770046234131e-06, -2.5294721126556396e-06, -2.2351741790771484e-06, -1.9408762454986572e-06, -1.646578311920166e-06, -1.3522803783416748e-06, -1.0579824447631836e-06, -7.636845111846924e-07, -4.6938657760620117e-07, -1.7508864402770996e-07, 1.1920928955078125e-07, 4.1350722312927246e-07, 7.078051567077637e-07, 1.0021030902862549e-06, 1.296401023864746e-06, 1.5906989574432373e-06, 1.8849968910217285e-06, 2.1792948246002197e-06, 2.473592758178711e-06, 2.767890691757202e-06, 3.0621886253356934e-06, 3.3564865589141846e-06, 3.6507844924926758e-06, 3.945082426071167e-06, 4.239380359649658e-06, 4.533678293228149e-06, 4.827976226806641e-06, 5.122274160385132e-06, 5.416572093963623e-06, 5.710870027542114e-06, 6.0051679611206055e-06, 6.299465894699097e-06, 6.593763828277588e-06, 6.888061761856079e-06, 7.18235969543457e-06, 7.4766576290130615e-06, 7.770955562591553e-06, 8.065253496170044e-06, 8.359551429748535e-06, 8.653849363327026e-06, 8.948147296905518e-06, 9.242445230484009e-06, 9.5367431640625e-06]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 3.0, 6.0, 10.0, 8.0, 6.0, 19.0, 15.0, 22.0, 26.0, 19.0, 22.0, 44.0, 25.0, 29.0, 38.0, 30.0, 37.0, 48.0, 31.0, 43.0, 58.0, 34.0, 38.0, 47.0, 22.0, 48.0, 25.0, 24.0, 49.0, 19.0, 23.0, 31.0, 10.0, 12.0, 12.0, 8.0, 7.0, 10.0, 9.0, 9.0, 10.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.0531158447265625e-06, -3.913417458534241e-06, -3.773719072341919e-06, -3.634020686149597e-06, -3.4943222999572754e-06, -3.3546239137649536e-06, -3.214925527572632e-06, -3.07522714138031e-06, -2.9355287551879883e-06, -2.7958303689956665e-06, -2.6561319828033447e-06, -2.516433596611023e-06, -2.376735210418701e-06, -2.2370368242263794e-06, -2.0973384380340576e-06, -1.957640051841736e-06, -1.817941665649414e-06, -1.6782432794570923e-06, -1.5385448932647705e-06, -1.3988465070724487e-06, -1.259148120880127e-06, -1.1194497346878052e-06, -9.797513484954834e-07, -8.400529623031616e-07, -7.003545761108398e-07, -5.606561899185181e-07, -4.209578037261963e-07, -2.812594175338745e-07, -1.4156103134155273e-07, -1.862645149230957e-09, 1.3783574104309082e-07, 2.775341272354126e-07, 4.172325134277344e-07, 5.569308996200562e-07, 6.966292858123779e-07, 8.363276720046997e-07, 9.760260581970215e-07, 1.1157244443893433e-06, 1.255422830581665e-06, 1.3951212167739868e-06, 1.5348196029663086e-06, 1.6745179891586304e-06, 1.8142163753509521e-06, 1.953914761543274e-06, 2.0936131477355957e-06, 2.2333115339279175e-06, 2.3730099201202393e-06, 2.512708306312561e-06, 2.652406692504883e-06, 2.7921050786972046e-06, 2.9318034648895264e-06, 3.071501851081848e-06, 3.21120023727417e-06, 3.3508986234664917e-06, 3.4905970096588135e-06, 3.6302953958511353e-06, 3.769993782043457e-06, 3.909692168235779e-06, 4.049390554428101e-06, 4.189088940620422e-06, 4.328787326812744e-06, 4.468485713005066e-06, 4.608184099197388e-06, 4.7478824853897095e-06, 4.887580871582031e-06]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 0.0, 4.0, 10.0, 12.0, 22.0, 34.0, 39.0, 67.0, 85.0, 120.0, 175.0, 267.0, 404.0, 584.0, 1142.0, 1448.0, 2096.0, 3203.0, 4943.0, 7716.0, 12055.0, 19257.0, 31278.0, 71029.0, 106472.0, 201963.0, 427783.0, 1016186.0, 1217737.0, 525674.0, 241479.0, 123750.0, 81002.0, 35723.0, 22126.0, 13878.0, 8524.0, 5422.0, 3520.0, 2345.0, 1538.0, 1173.0, 632.0, 414.0, 292.0, 214.0, 159.0, 92.0, 54.0, 52.0, 42.0, 14.0, 21.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-7.867813110351562e-06, -7.622875273227692e-06, -7.377937436103821e-06, -7.13299959897995e-06, -6.888061761856079e-06, -6.643123924732208e-06, -6.398186087608337e-06, -6.1532482504844666e-06, -5.908310413360596e-06, -5.663372576236725e-06, -5.418434739112854e-06, -5.173496901988983e-06, -4.928559064865112e-06, -4.6836212277412415e-06, -4.438683390617371e-06, -4.1937455534935e-06, -3.948807716369629e-06, -3.703869879245758e-06, -3.458932042121887e-06, -3.2139942049980164e-06, -2.9690563678741455e-06, -2.7241185307502747e-06, -2.479180693626404e-06, -2.234242856502533e-06, -1.989305019378662e-06, -1.7443671822547913e-06, -1.4994293451309204e-06, -1.2544915080070496e-06, -1.0095536708831787e-06, -7.646158337593079e-07, -5.19677996635437e-07, -2.7474015951156616e-07, -2.9802322387695312e-08, 2.1513551473617554e-07, 4.600733518600464e-07, 7.050111889839172e-07, 9.499490261077881e-07, 1.194886863231659e-06, 1.4398247003555298e-06, 1.6847625374794006e-06, 1.9297003746032715e-06, 2.1746382117271423e-06, 2.419576048851013e-06, 2.664513885974884e-06, 2.909451723098755e-06, 3.1543895602226257e-06, 3.3993273973464966e-06, 3.6442652344703674e-06, 3.889203071594238e-06, 4.134140908718109e-06, 4.37907874584198e-06, 4.624016582965851e-06, 4.868954420089722e-06, 5.1138922572135925e-06, 5.358830094337463e-06, 5.603767931461334e-06, 5.848705768585205e-06, 6.093643605709076e-06, 6.338581442832947e-06, 6.583519279956818e-06, 6.8284571170806885e-06, 7.073394954204559e-06, 7.31833279132843e-06, 7.563270628452301e-06, 7.808208465576172e-06]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 9.0, 4.0, 8.0, 17.0, 12.0, 8.0, 16.0, 38.0, 28.0, 26.0, 64.0, 39.0, 40.0, 49.0, 125.0, 81.0, 93.0, 116.0, 274.0, 155.0, 171.0, 178.0, 435.0, 211.0, 200.0, 360.0, 193.0, 138.0, 128.0, 231.0, 77.0, 73.0, 56.0, 122.0, 58.0, 50.0, 29.0, 64.0, 16.0, 16.0, 22.0, 9.0, 5.0, 5.0, 10.0, 6.0, 3.0, 2.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.384185791015625e-06, -2.3087486624717712e-06, -2.2333115339279175e-06, -2.1578744053840637e-06, -2.08243727684021e-06, -2.007000148296356e-06, -1.9315630197525024e-06, -1.8561258912086487e-06, -1.780688762664795e-06, -1.7052516341209412e-06, -1.6298145055770874e-06, -1.5543773770332336e-06, -1.4789402484893799e-06, -1.4035031199455261e-06, -1.3280659914016724e-06, -1.2526288628578186e-06, -1.1771917343139648e-06, -1.101754605770111e-06, -1.0263174772262573e-06, -9.508803486824036e-07, -8.754432201385498e-07, -8.00006091594696e-07, -7.245689630508423e-07, -6.491318345069885e-07, -5.736947059631348e-07, -4.98257577419281e-07, -4.2282044887542725e-07, -3.473833203315735e-07, -2.7194619178771973e-07, -1.9650906324386597e-07, -1.210719347000122e-07, -4.563480615615845e-08, 2.9802322387695312e-08, 1.0523945093154907e-07, 1.8067657947540283e-07, 2.561137080192566e-07, 3.3155083656311035e-07, 4.069879651069641e-07, 4.824250936508179e-07, 5.578622221946716e-07, 6.332993507385254e-07, 7.087364792823792e-07, 7.841736078262329e-07, 8.596107363700867e-07, 9.350478649139404e-07, 1.0104849934577942e-06, 1.085922122001648e-06, 1.1613592505455017e-06, 1.2367963790893555e-06, 1.3122335076332092e-06, 1.387670636177063e-06, 1.4631077647209167e-06, 1.5385448932647705e-06, 1.6139820218086243e-06, 1.689419150352478e-06, 1.7648562788963318e-06, 1.8402934074401855e-06, 1.9157305359840393e-06, 1.991167664527893e-06, 2.066604793071747e-06, 2.1420419216156006e-06, 2.2174790501594543e-06, 2.292916178703308e-06, 2.368353307247162e-06, 2.4437904357910156e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 4.0, 8.0, 6.0, 4.0, 17.0, 14.0, 21.0, 28.0, 35.0, 55.0, 59.0, 78.0, 107.0, 120.0, 109.0, 68.0, 58.0, 43.0, 38.0, 21.0, 17.0, 13.0, 18.0, 14.0, 10.0, 8.0, 4.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.703766757709673e-06, -6.4593550632707775e-06, -6.214943368831882e-06, -5.970531674392987e-06, -5.726119525206741e-06, -5.481707830767846e-06, -5.2372961363289505e-06, -4.992884441890055e-06, -4.74847274745116e-06, -4.504061053012265e-06, -4.25964935857337e-06, -4.015237209387124e-06, -3.7708255149482284e-06, -3.526413820509333e-06, -3.282002126070438e-06, -3.0375904316315427e-06, -2.7931782824452966e-06, -2.5487665880064014e-06, -2.3043546661938308e-06, -2.0599429717549356e-06, -1.8155311636292026e-06, -1.5711193555034697e-06, -1.3267076610645745e-06, -1.0822958529388416e-06, -8.378840448131086e-07, -5.934722366873757e-07, -3.4906048540506163e-07, -1.0464873412274756e-07, 1.3976307400298538e-07, 3.841748821287183e-07, 6.285865765676135e-07, 8.729983846933465e-07, 1.1174097380717285e-06, 1.3618215461974614e-06, 1.6062333543231944e-06, 1.8506450487620896e-06, 2.0950569705746602e-06, 2.3394686650135554e-06, 2.5838803594524506e-06, 2.828292053891346e-06, 3.0727039757039165e-06, 3.3171156701428117e-06, 3.5615275919553824e-06, 3.8059392863942776e-06, 4.050350980833173e-06, 4.294763130019419e-06, 4.539174369710963e-06, 4.783586518897209e-06, 5.0279982133361045e-06, 5.272409907775e-06, 5.516821602213895e-06, 5.76123329665279e-06, 6.005645445839036e-06, 6.2500571402779315e-06, 6.494468834716827e-06, 6.738880529155722e-06, 6.983292223594617e-06, 7.227703918033512e-06, 7.4721156124724075e-06, 7.716527761658654e-06, 7.960939001350198e-06, 8.205351150536444e-06, 8.449762390227988e-06, 8.694174539414234e-06, 8.93858668860048e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 5.0, 9.0, 9.0, 15.0, 17.0, 18.0, 20.0, 21.0, 24.0, 33.0, 37.0, 36.0, 35.0, 35.0, 33.0, 43.0, 35.0, 43.0, 57.0, 48.0, 50.0, 40.0, 33.0, 29.0, 26.0, 31.0, 38.0, 30.0, 30.0, 17.0, 20.0, 11.0, 12.0, 12.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.673425337387016e-06, -4.511319275479764e-06, -4.3492132135725114e-06, -4.187107151665259e-06, -4.025001089758007e-06, -3.8628950278507546e-06, -3.7007889659435023e-06, -3.53868290403625e-06, -3.3765768421289977e-06, -3.2144707802217454e-06, -3.052364718314493e-06, -2.8902586564072408e-06, -2.7281525944999885e-06, -2.566046532592736e-06, -2.403940470685484e-06, -2.2418344087782316e-06, -2.0797283468709793e-06, -1.917622284963727e-06, -1.7555162230564747e-06, -1.5934101611492224e-06, -1.4313040992419701e-06, -1.2691980373347178e-06, -1.1070919754274655e-06, -9.449859135202132e-07, -7.828798516129609e-07, -6.207737897057086e-07, -4.586677277984563e-07, -2.9656166589120403e-07, -1.3445560398395173e-07, 2.7650457923300564e-08, 1.8975651983055286e-07, 3.5186258173780516e-07, 5.139686436450575e-07, 6.760747055523098e-07, 8.38180767459562e-07, 1.0002868293668143e-06, 1.1623928912740666e-06, 1.324498953181319e-06, 1.4866050150885712e-06, 1.6487110769958235e-06, 1.8108171389030758e-06, 1.972923200810328e-06, 2.1350292627175804e-06, 2.2971353246248327e-06, 2.459241386532085e-06, 2.6213474484393373e-06, 2.7834535103465896e-06, 2.945559572253842e-06, 3.107665634161094e-06, 3.2697716960683465e-06, 3.431877757975599e-06, 3.593983819882851e-06, 3.7560898817901034e-06, 3.918195943697356e-06, 4.080302005604608e-06, 4.24240806751186e-06, 4.404514129419113e-06, 4.566620191326365e-06, 4.728726253233617e-06, 4.8908323151408695e-06, 5.052938377048122e-06, 5.215044438955374e-06, 5.377150500862626e-06, 5.539256562769879e-06, 5.701362624677131e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 4.0, 5.0, 1.0, 8.0, 7.0, 10.0, 30.0, 41.0, 59.0, 86.0, 109.0, 167.0, 239.0, 322.0, 467.0, 551.0, 1013.0, 1599.0, 2549.0, 4093.0, 6812.0, 11040.0, 18711.0, 22443.0, 49633.0, 89031.0, 161962.0, 250324.0, 187067.0, 103151.0, 56663.0, 25828.0, 21284.0, 12601.0, 7457.0, 4704.0, 2965.0, 1887.0, 1217.0, 626.0, 622.0, 376.0, 249.0, 178.0, 117.0, 88.0, 41.0, 33.0, 25.0, 17.0, 16.0, 14.0, 6.0, 7.0, 2.0, 2.0], "bins": [-8.225440979003906e-06, -7.994472980499268e-06, -7.763504981994629e-06, -7.53253698348999e-06, -7.3015689849853516e-06, -7.070600986480713e-06, -6.839632987976074e-06, -6.6086649894714355e-06, -6.377696990966797e-06, -6.146728992462158e-06, -5.9157609939575195e-06, -5.684792995452881e-06, -5.453824996948242e-06, -5.2228569984436035e-06, -4.991888999938965e-06, -4.760921001434326e-06, -4.5299530029296875e-06, -4.298985004425049e-06, -4.06801700592041e-06, -3.8370490074157715e-06, -3.606081008911133e-06, -3.375113010406494e-06, -3.1441450119018555e-06, -2.913177013397217e-06, -2.682209014892578e-06, -2.4512410163879395e-06, -2.2202730178833008e-06, -1.989305019378662e-06, -1.7583370208740234e-06, -1.5273690223693848e-06, -1.296401023864746e-06, -1.0654330253601074e-06, -8.344650268554688e-07, -6.034970283508301e-07, -3.725290298461914e-07, -1.4156103134155273e-07, 8.940696716308594e-08, 3.203749656677246e-07, 5.513429641723633e-07, 7.82310962677002e-07, 1.0132789611816406e-06, 1.2442469596862793e-06, 1.475214958190918e-06, 1.7061829566955566e-06, 1.9371509552001953e-06, 2.168118953704834e-06, 2.3990869522094727e-06, 2.6300549507141113e-06, 2.86102294921875e-06, 3.0919909477233887e-06, 3.3229589462280273e-06, 3.553926944732666e-06, 3.7848949432373047e-06, 4.015862941741943e-06, 4.246830940246582e-06, 4.477798938751221e-06, 4.708766937255859e-06, 4.939734935760498e-06, 5.170702934265137e-06, 5.401670932769775e-06, 5.632638931274414e-06, 5.863606929779053e-06, 6.094574928283691e-06, 6.32554292678833e-06, 6.556510925292969e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 6.0, 11.0, 5.0, 8.0, 11.0, 13.0, 19.0, 12.0, 24.0, 12.0, 27.0, 25.0, 42.0, 26.0, 28.0, 46.0, 27.0, 38.0, 42.0, 44.0, 46.0, 33.0, 48.0, 48.0, 58.0, 42.0, 20.0, 35.0, 32.0, 26.0, 15.0, 22.0, 26.0, 14.0, 16.0, 7.0, 14.0, 8.0, 5.0, 7.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-4.231929779052734e-06, -4.07826155424118e-06, -3.9245933294296265e-06, -3.7709251046180725e-06, -3.6172568798065186e-06, -3.4635886549949646e-06, -3.3099204301834106e-06, -3.1562522053718567e-06, -3.0025839805603027e-06, -2.8489157557487488e-06, -2.695247530937195e-06, -2.541579306125641e-06, -2.387911081314087e-06, -2.234242856502533e-06, -2.080574631690979e-06, -1.926906406879425e-06, -1.773238182067871e-06, -1.6195699572563171e-06, -1.4659017324447632e-06, -1.3122335076332092e-06, -1.1585652828216553e-06, -1.0048970580101013e-06, -8.512288331985474e-07, -6.975606083869934e-07, -5.438923835754395e-07, -3.902241587638855e-07, -2.3655593395233154e-07, -8.288770914077759e-08, 7.078051567077637e-08, 2.2444874048233032e-07, 3.781169652938843e-07, 5.317851901054382e-07, 6.854534149169922e-07, 8.391216397285461e-07, 9.927898645401e-07, 1.146458089351654e-06, 1.300126314163208e-06, 1.453794538974762e-06, 1.607462763786316e-06, 1.7611309885978699e-06, 1.914799213409424e-06, 2.0684674382209778e-06, 2.2221356630325317e-06, 2.3758038878440857e-06, 2.5294721126556396e-06, 2.6831403374671936e-06, 2.8368085622787476e-06, 2.9904767870903015e-06, 3.1441450119018555e-06, 3.2978132367134094e-06, 3.4514814615249634e-06, 3.6051496863365173e-06, 3.7588179111480713e-06, 3.912486135959625e-06, 4.066154360771179e-06, 4.219822585582733e-06, 4.373490810394287e-06, 4.527159035205841e-06, 4.680827260017395e-06, 4.834495484828949e-06, 4.988163709640503e-06, 5.141831934452057e-06, 5.295500159263611e-06, 5.449168384075165e-06, 5.602836608886719e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 5.0, 9.0, 16.0, 25.0, 40.0, 43.0, 71.0, 106.0, 148.0, 259.0, 417.0, 751.0, 1213.0, 2696.0, 6386.0, 16099.0, 134737.0, 835608.0, 33557.0, 8373.0, 3922.0, 1811.0, 854.0, 557.0, 268.0, 196.0, 139.0, 69.0, 60.0, 33.0, 24.0, 17.0, 14.0, 10.0, 8.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.800060272216797e-05, -1.748930662870407e-05, -1.6978010535240173e-05, -1.6466714441776276e-05, -1.5955418348312378e-05, -1.544412225484848e-05, -1.4932826161384583e-05, -1.4421530067920685e-05, -1.3910233974456787e-05, -1.339893788099289e-05, -1.2887641787528992e-05, -1.2376345694065094e-05, -1.1865049600601196e-05, -1.1353753507137299e-05, -1.0842457413673401e-05, -1.0331161320209503e-05, -9.819865226745605e-06, -9.308569133281708e-06, -8.79727303981781e-06, -8.285976946353912e-06, -7.774680852890015e-06, -7.263384759426117e-06, -6.752088665962219e-06, -6.2407925724983215e-06, -5.729496479034424e-06, -5.218200385570526e-06, -4.706904292106628e-06, -4.195608198642731e-06, -3.684312105178833e-06, -3.1730160117149353e-06, -2.6617199182510376e-06, -2.15042382478714e-06, -1.6391277313232422e-06, -1.1278316378593445e-06, -6.165355443954468e-07, -1.0523945093154907e-07, 4.0605664253234863e-07, 9.173527359962463e-07, 1.428648829460144e-06, 1.9399449229240417e-06, 2.4512410163879395e-06, 2.962537109851837e-06, 3.473833203315735e-06, 3.9851292967796326e-06, 4.49642539024353e-06, 5.007721483707428e-06, 5.519017577171326e-06, 6.030313670635223e-06, 6.541609764099121e-06, 7.052905857563019e-06, 7.5642019510269165e-06, 8.075498044490814e-06, 8.586794137954712e-06, 9.09809023141861e-06, 9.609386324882507e-06, 1.0120682418346405e-05, 1.0631978511810303e-05, 1.11432746052742e-05, 1.1654570698738098e-05, 1.2165866792201996e-05, 1.2677162885665894e-05, 1.3188458979129791e-05, 1.3699755072593689e-05, 1.4211051166057587e-05, 1.4722347259521484e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 4.0, 7.0, 3.0, 6.0, 4.0, 0.0, 7.0, 11.0, 18.0, 15.0, 18.0, 16.0, 24.0, 31.0, 56.0, 77.0, 370.0, 66.0, 55.0, 51.0, 38.0, 24.0, 21.0, 14.0, 18.0, 12.0, 0.0, 8.0, 5.0, 9.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8477439880371094e-06, -1.7909333109855652e-06, -1.734122633934021e-06, -1.6773119568824768e-06, -1.6205012798309326e-06, -1.5636906027793884e-06, -1.5068799257278442e-06, -1.4500692486763e-06, -1.3932585716247559e-06, -1.3364478945732117e-06, -1.2796372175216675e-06, -1.2228265404701233e-06, -1.166015863418579e-06, -1.109205186367035e-06, -1.0523945093154907e-06, -9.955838322639465e-07, -9.387731552124023e-07, -8.819624781608582e-07, -8.25151801109314e-07, -7.683411240577698e-07, -7.115304470062256e-07, -6.547197699546814e-07, -5.979090929031372e-07, -5.41098415851593e-07, -4.842877388000488e-07, -4.2747706174850464e-07, -3.7066638469696045e-07, -3.1385570764541626e-07, -2.5704503059387207e-07, -2.0023435354232788e-07, -1.434236764907837e-07, -8.66129994392395e-08, -2.9802322387695312e-08, 2.7008354663848877e-08, 8.381903171539307e-08, 1.4062970876693726e-07, 1.9744038581848145e-07, 2.5425106287002563e-07, 3.110617399215698e-07, 3.67872416973114e-07, 4.246830940246582e-07, 4.814937710762024e-07, 5.383044481277466e-07, 5.951151251792908e-07, 6.51925802230835e-07, 7.087364792823792e-07, 7.655471563339233e-07, 8.223578333854675e-07, 8.791685104370117e-07, 9.359791874885559e-07, 9.927898645401e-07, 1.0496005415916443e-06, 1.1064112186431885e-06, 1.1632218956947327e-06, 1.2200325727462769e-06, 1.276843249797821e-06, 1.3336539268493652e-06, 1.3904646039009094e-06, 1.4472752809524536e-06, 1.5040859580039978e-06, 1.560896635055542e-06, 1.6177073121070862e-06, 1.6745179891586304e-06, 1.7313286662101746e-06, 1.7881393432617188e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 2.0, 6.0, 5.0, 10.0, 13.0, 20.0, 16.0, 35.0, 57.0, 102.0, 88.0, 225.0, 295.0, 733.0, 721.0, 1817.0, 4585.0, 13609.0, 72576.0, 902274.0, 35388.0, 9342.0, 3231.0, 1043.0, 1047.0, 526.0, 267.0, 148.0, 137.0, 80.0, 72.0, 15.0, 23.0, 18.0, 12.0, 6.0, 4.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.662441253662109e-06, -5.49759715795517e-06, -5.33275306224823e-06, -5.16790896654129e-06, -5.003064870834351e-06, -4.838220775127411e-06, -4.673376679420471e-06, -4.5085325837135315e-06, -4.343688488006592e-06, -4.178844392299652e-06, -4.014000296592712e-06, -3.849156200885773e-06, -3.684312105178833e-06, -3.5194680094718933e-06, -3.3546239137649536e-06, -3.189779818058014e-06, -3.0249357223510742e-06, -2.8600916266441345e-06, -2.695247530937195e-06, -2.530403435230255e-06, -2.3655593395233154e-06, -2.2007152438163757e-06, -2.035871148109436e-06, -1.8710270524024963e-06, -1.7061829566955566e-06, -1.541338860988617e-06, -1.3764947652816772e-06, -1.2116506695747375e-06, -1.0468065738677979e-06, -8.819624781608582e-07, -7.171183824539185e-07, -5.522742867469788e-07, -3.8743019104003906e-07, -2.2258609533309937e-07, -5.774199962615967e-08, 1.0710209608078003e-07, 2.7194619178771973e-07, 4.367902874946594e-07, 6.016343832015991e-07, 7.664784789085388e-07, 9.313225746154785e-07, 1.0961666703224182e-06, 1.261010766029358e-06, 1.4258548617362976e-06, 1.5906989574432373e-06, 1.755543053150177e-06, 1.9203871488571167e-06, 2.0852312445640564e-06, 2.250075340270996e-06, 2.414919435977936e-06, 2.5797635316848755e-06, 2.744607627391815e-06, 2.909451723098755e-06, 3.0742958188056946e-06, 3.2391399145126343e-06, 3.403984010219574e-06, 3.5688281059265137e-06, 3.7336722016334534e-06, 3.898516297340393e-06, 4.063360393047333e-06, 4.2282044887542725e-06, 4.393048584461212e-06, 4.557892680168152e-06, 4.7227367758750916e-06, 4.887580871582031e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 53.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 112.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 683.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 117.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-2.384185791015625e-07, -2.3096799850463867e-07, -2.2351741790771484e-07, -2.1606683731079102e-07, -2.086162567138672e-07, -2.0116567611694336e-07, -1.9371509552001953e-07, -1.862645149230957e-07, -1.7881393432617188e-07, -1.7136335372924805e-07, -1.6391277313232422e-07, -1.564621925354004e-07, -1.4901161193847656e-07, -1.4156103134155273e-07, -1.341104507446289e-07, -1.2665987014770508e-07, -1.1920928955078125e-07, -1.1175870895385742e-07, -1.043081283569336e-07, -9.685754776000977e-08, -8.940696716308594e-08, -8.195638656616211e-08, -7.450580596923828e-08, -6.705522537231445e-08, -5.960464477539063e-08, -5.21540641784668e-08, -4.470348358154297e-08, -3.725290298461914e-08, -2.9802322387695312e-08, -2.2351741790771484e-08, -1.4901161193847656e-08, -7.450580596923828e-09, 0.0, 7.450580596923828e-09, 1.4901161193847656e-08, 2.2351741790771484e-08, 2.9802322387695312e-08, 3.725290298461914e-08, 4.470348358154297e-08, 5.21540641784668e-08, 5.960464477539063e-08, 6.705522537231445e-08, 7.450580596923828e-08, 8.195638656616211e-08, 8.940696716308594e-08, 9.685754776000977e-08, 1.043081283569336e-07, 1.1175870895385742e-07, 1.1920928955078125e-07, 1.2665987014770508e-07, 1.341104507446289e-07, 1.4156103134155273e-07, 1.4901161193847656e-07, 1.564621925354004e-07, 1.6391277313232422e-07, 1.7136335372924805e-07, 1.7881393432617188e-07, 1.862645149230957e-07, 1.9371509552001953e-07, 2.0116567611694336e-07, 2.086162567138672e-07, 2.1606683731079102e-07, 2.2351741790771484e-07, 2.3096799850463867e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 8.0, 13.0, 23.0, 26.0, 44.0, 49.0, 88.0, 147.0, 176.0, 266.0, 416.0, 646.0, 0.0, 969.0, 1516.0, 2491.0, 4019.0, 7710.0, 13505.0, 30953.0, 79026.0, 764324.0, 78851.0, 31269.0, 13346.0, 0.0, 7794.0, 4058.0, 2463.0, 1492.0, 962.0, 629.0, 428.0, 278.0, 170.0, 136.0, 91.0, 57.0, 0.0, 44.0, 27.0, 20.0, 9.0, 9.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.9073486328125e-06, -1.8524006009101868e-06, -1.7974525690078735e-06, -1.7425045371055603e-06, -1.687556505203247e-06, -1.6326084733009338e-06, -1.5776604413986206e-06, -1.5227124094963074e-06, -1.4677643775939941e-06, -1.412816345691681e-06, -1.3578683137893677e-06, -1.3029202818870544e-06, -1.2479722499847412e-06, -1.193024218082428e-06, -1.1380761861801147e-06, -1.0831281542778015e-06, -1.0281801223754883e-06, -9.73232090473175e-07, -9.182840585708618e-07, -8.633360266685486e-07, -8.083879947662354e-07, -7.534399628639221e-07, -6.984919309616089e-07, -6.435438990592957e-07, -5.885958671569824e-07, -5.336478352546692e-07, -4.78699803352356e-07, -4.237517714500427e-07, -3.688037395477295e-07, -3.1385570764541626e-07, -2.5890767574310303e-07, -2.039596438407898e-07, -1.4901161193847656e-07, -9.406358003616333e-08, -3.91155481338501e-08, 1.5832483768463135e-08, 7.078051567077637e-08, 1.257285475730896e-07, 1.8067657947540283e-07, 2.3562461137771606e-07, 2.905726432800293e-07, 3.4552067518234253e-07, 4.0046870708465576e-07, 4.55416738986969e-07, 5.103647708892822e-07, 5.653128027915955e-07, 6.202608346939087e-07, 6.752088665962219e-07, 7.301568984985352e-07, 7.851049304008484e-07, 8.400529623031616e-07, 8.950009942054749e-07, 9.499490261077881e-07, 1.0048970580101013e-06, 1.0598450899124146e-06, 1.1147931218147278e-06, 1.169741153717041e-06, 1.2246891856193542e-06, 1.2796372175216675e-06, 1.3345852494239807e-06, 1.389533281326294e-06, 1.4444813132286072e-06, 1.4994293451309204e-06, 1.5543773770332336e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 0.0, 104.0, 0.0, 0.0, 0.0, 0.0, 643.0, 0.0, 0.0, 0.0, 113.0, 0.0, 0.0, 0.0, 0.0, 48.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 9.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.172325134277344e-07, -4.041939973831177e-07, -3.91155481338501e-07, -3.781169652938843e-07, -3.650784492492676e-07, -3.520399332046509e-07, -3.390014171600342e-07, -3.259629011154175e-07, -3.129243850708008e-07, -2.998858690261841e-07, -2.868473529815674e-07, -2.738088369369507e-07, -2.60770320892334e-07, -2.477318048477173e-07, -2.3469328880310059e-07, -2.2165477275848389e-07, -2.086162567138672e-07, -1.955777406692505e-07, -1.825392246246338e-07, -1.695007085800171e-07, -1.564621925354004e-07, -1.434236764907837e-07, -1.30385160446167e-07, -1.1734664440155029e-07, -1.043081283569336e-07, -9.12696123123169e-08, -7.82310962677002e-08, -6.51925802230835e-08, -5.21540641784668e-08, -3.91155481338501e-08, -2.60770320892334e-08, -1.30385160446167e-08, 0.0, 1.30385160446167e-08, 2.60770320892334e-08, 3.91155481338501e-08, 5.21540641784668e-08, 6.51925802230835e-08, 7.82310962677002e-08, 9.12696123123169e-08, 1.043081283569336e-07, 1.1734664440155029e-07, 1.30385160446167e-07, 1.434236764907837e-07, 1.564621925354004e-07, 1.695007085800171e-07, 1.825392246246338e-07, 1.955777406692505e-07, 2.086162567138672e-07, 2.2165477275848389e-07, 2.3469328880310059e-07, 2.477318048477173e-07, 2.60770320892334e-07, 2.738088369369507e-07, 2.868473529815674e-07, 2.998858690261841e-07, 3.129243850708008e-07, 3.259629011154175e-07, 3.390014171600342e-07, 3.520399332046509e-07, 3.650784492492676e-07, 3.781169652938843e-07, 3.91155481338501e-07, 4.041939973831177e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 2.0, 11.0, 2.0, 11.0, 14.0, 16.0, 18.0, 34.0, 39.0, 54.0, 56.0, 92.0, 123.0, 112.0, 89.0, 82.0, 57.0, 31.0, 34.0, 23.0, 18.0, 18.0, 9.0, 11.0, 14.0, 5.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6234288169653155e-06, -6.388960173353553e-06, -6.15449152974179e-06, -5.9200228861300275e-06, -5.685554697265616e-06, -5.451086053653853e-06, -5.21661741004209e-06, -4.982148766430328e-06, -4.747680577565916e-06, -4.513211933954153e-06, -4.2787432903423905e-06, -4.044274646730628e-06, -3.809806457866216e-06, -3.5753378142544534e-06, -3.3408691706426907e-06, -3.106400527030928e-06, -2.8719318834191654e-06, -2.6374632398074027e-06, -2.4029948235693155e-06, -2.168526179957553e-06, -1.9340577637194656e-06, -1.699589120107703e-06, -1.4651204764959402e-06, -1.2306519465710153e-06, -9.961834166460903e-07, -7.617148867211654e-07, -5.272462999528216e-07, -2.9277771318447776e-07, -5.830918325955281e-08, 1.7615934666537214e-07, 4.106279902771348e-07, 6.450965202020598e-07, 8.795650501269847e-07, 1.1140335800519097e-06, 1.3485021099768346e-06, 1.5829707535885973e-06, 1.8174392835135222e-06, 2.051907813438447e-06, 2.28637645705021e-06, 2.5208451006619725e-06, 2.7553135169000598e-06, 2.9897821605118224e-06, 3.2242505767499097e-06, 3.4587192203616723e-06, 3.693187863973435e-06, 3.927656507585198e-06, 4.16212515119696e-06, 4.396593340061372e-06, 4.631061983673135e-06, 4.8655306272848975e-06, 5.09999927089666e-06, 5.334467459761072e-06, 5.568936103372835e-06, 5.803404746984597e-06, 6.03787339059636e-06, 6.272342034208123e-06, 6.506810677819885e-06, 6.741279321431648e-06, 6.975747965043411e-06, 7.210216608655173e-06, 7.444684797519585e-06, 7.679152986383997e-06, 7.913622539490461e-06, 8.148090273607522e-06, 8.382558917219285e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 6.0, 11.0, 8.0, 16.0, 19.0, 22.0, 23.0, 21.0, 31.0, 35.0, 39.0, 29.0, 42.0, 40.0, 31.0, 34.0, 44.0, 56.0, 51.0, 55.0, 37.0, 37.0, 26.0, 28.0, 38.0, 32.0, 31.0, 31.0, 18.0, 19.0, 14.0, 9.0, 14.0, 9.0, 7.0, 4.0, 6.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.610154519468779e-06, -4.4534726839629e-06, -4.296790848457022e-06, -4.140109012951143e-06, -3.9834271774452645e-06, -3.826745341939386e-06, -3.670063733807183e-06, -3.5133818983013043e-06, -3.3567000627954258e-06, -3.2000182272895472e-06, -3.0433363917836687e-06, -2.88665455627779e-06, -2.729972948145587e-06, -2.5732911126397084e-06, -2.41660927713383e-06, -2.2599274416279513e-06, -2.1032456061220728e-06, -1.9465637706161942e-06, -1.7898819351103157e-06, -1.6332002132912748e-06, -1.4765183777853963e-06, -1.3198365422795177e-06, -1.163154820460477e-06, -1.0064729849545984e-06, -8.497911494487198e-07, -6.931093139428413e-07, -5.364275352803816e-07, -3.7974572819621244e-07, -2.2306392111204332e-07, -6.638208560616476e-08, 9.029969305629493e-08, 2.469814717187546e-07, 4.036628524772823e-07, 5.603446879831608e-07, 7.170264666456205e-07, 8.737082453080802e-07, 1.0303900808139588e-06, 1.1870719163198373e-06, 1.3437536381388782e-06, 1.5004354736447567e-06, 1.6571173091506353e-06, 1.8137991446565138e-06, 1.9704809801623924e-06, 2.127162815668271e-06, 2.283844423800474e-06, 2.4405262593063526e-06, 2.597208094812231e-06, 2.7538899303181097e-06, 2.9105717658239882e-06, 3.067253601329867e-06, 3.2239354368357453e-06, 3.380617272341624e-06, 3.5372991078475025e-06, 3.693980943353381e-06, 3.8506627788592596e-06, 4.007344614365138e-06, 4.164025995123666e-06, 4.320707830629544e-06, 4.477389666135423e-06, 4.6340715016413014e-06, 4.79075333714718e-06, 4.9474351726530585e-06, 5.104117008158937e-06, 5.260798388917465e-06, 5.417480679170694e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 6.0, 18.0, 22.0, 24.0, 49.0, 63.0, 132.0, 137.0, 321.0, 510.0, 643.0, 1366.0, 2099.0, 3417.0, 4251.0, 8211.0, 14053.0, 23608.0, 31679.0, 69043.0, 138340.0, 255752.0, 197650.0, 137869.0, 68849.0, 31356.0, 23851.0, 13771.0, 8567.0, 4205.0, 3413.0, 2114.0, 1297.0, 602.0, 499.0, 310.0, 150.0, 90.0, 81.0, 59.0, 27.0, 19.0, 11.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.463859558105469e-06, -8.181668817996979e-06, -7.899478077888489e-06, -7.617287337779999e-06, -7.335096597671509e-06, -7.052905857563019e-06, -6.770715117454529e-06, -6.488524377346039e-06, -6.206333637237549e-06, -5.924142897129059e-06, -5.641952157020569e-06, -5.359761416912079e-06, -5.077570676803589e-06, -4.795379936695099e-06, -4.513189196586609e-06, -4.230998456478119e-06, -3.948807716369629e-06, -3.666616976261139e-06, -3.384426236152649e-06, -3.102235496044159e-06, -2.820044755935669e-06, -2.537854015827179e-06, -2.255663275718689e-06, -1.973472535610199e-06, -1.691281795501709e-06, -1.409091055393219e-06, -1.126900315284729e-06, -8.44709575176239e-07, -5.62518835067749e-07, -2.8032809495925903e-07, 1.862645149230957e-09, 2.8405338525772095e-07, 5.662441253662109e-07, 8.484348654747009e-07, 1.130625605583191e-06, 1.412816345691681e-06, 1.695007085800171e-06, 1.977197825908661e-06, 2.259388566017151e-06, 2.541579306125641e-06, 2.823770046234131e-06, 3.105960786342621e-06, 3.388151526451111e-06, 3.670342266559601e-06, 3.952533006668091e-06, 4.234723746776581e-06, 4.516914486885071e-06, 4.799105226993561e-06, 5.081295967102051e-06, 5.363486707210541e-06, 5.645677447319031e-06, 5.927868187427521e-06, 6.210058927536011e-06, 6.492249667644501e-06, 6.774440407752991e-06, 7.056631147861481e-06, 7.338821887969971e-06, 7.621012628078461e-06, 7.90320336818695e-06, 8.18539410829544e-06, 8.46758484840393e-06, 8.74977558851242e-06, 9.03196632862091e-06, 9.3141570687294e-06, 9.59634780883789e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 5.0, 5.0, 16.0, 15.0, 17.0, 17.0, 14.0, 19.0, 22.0, 26.0, 33.0, 38.0, 58.0, 32.0, 43.0, 48.0, 32.0, 63.0, 40.0, 47.0, 45.0, 35.0, 55.0, 38.0, 24.0, 26.0, 30.0, 30.0, 18.0, 19.0, 18.0, 6.0, 19.0, 7.0, 3.0, 11.0, 6.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.933906555175781e-06, -3.8025900721549988e-06, -3.6712735891342163e-06, -3.539957106113434e-06, -3.4086406230926514e-06, -3.277324140071869e-06, -3.1460076570510864e-06, -3.014691174030304e-06, -2.8833746910095215e-06, -2.752058207988739e-06, -2.6207417249679565e-06, -2.489425241947174e-06, -2.3581087589263916e-06, -2.226792275905609e-06, -2.0954757928848267e-06, -1.964159309864044e-06, -1.8328428268432617e-06, -1.7015263438224792e-06, -1.5702098608016968e-06, -1.4388933777809143e-06, -1.3075768947601318e-06, -1.1762604117393494e-06, -1.044943928718567e-06, -9.136274456977844e-07, -7.82310962677002e-07, -6.509944796562195e-07, -5.19677996635437e-07, -3.8836151361465454e-07, -2.5704503059387207e-07, -1.257285475730896e-07, 5.587935447692871e-09, 1.3690441846847534e-07, 2.682209014892578e-07, 3.995373845100403e-07, 5.308538675308228e-07, 6.621703505516052e-07, 7.934868335723877e-07, 9.248033165931702e-07, 1.0561197996139526e-06, 1.1874362826347351e-06, 1.3187527656555176e-06, 1.4500692486763e-06, 1.5813857316970825e-06, 1.712702214717865e-06, 1.8440186977386475e-06, 1.97533518075943e-06, 2.1066516637802124e-06, 2.237968146800995e-06, 2.3692846298217773e-06, 2.50060111284256e-06, 2.6319175958633423e-06, 2.7632340788841248e-06, 2.8945505619049072e-06, 3.0258670449256897e-06, 3.157183527946472e-06, 3.2885000109672546e-06, 3.419816493988037e-06, 3.5511329770088196e-06, 3.682449460029602e-06, 3.8137659430503845e-06, 3.945082426071167e-06, 4.0763989090919495e-06, 4.207715392112732e-06, 4.339031875133514e-06, 4.470348358154297e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 0.0, 5.0, 9.0, 3.0, 27.0, 23.0, 36.0, 37.0, 91.0, 110.0, 135.0, 246.0, 267.0, 539.0, 546.0, 1176.0, 1731.0, 1969.0, 3966.0, 4471.0, 8888.0, 14562.0, 17473.0, 37615.0, 46217.0, 104669.0, 129997.0, 242306.0, 187208.0, 83463.0, 66765.0, 30176.0, 24778.0, 11779.0, 10163.0, 6201.0, 3102.0, 2773.0, 1377.0, 1280.0, 867.0, 397.0, 396.0, 199.0, 171.0, 80.0, 100.0, 67.0, 39.0, 35.0, 12.0, 6.0, 9.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-6.735324859619141e-06, -6.522051990032196e-06, -6.3087791204452515e-06, -6.095506250858307e-06, -5.882233381271362e-06, -5.668960511684418e-06, -5.455687642097473e-06, -5.2424147725105286e-06, -5.029141902923584e-06, -4.815869033336639e-06, -4.602596163749695e-06, -4.38932329416275e-06, -4.176050424575806e-06, -3.962777554988861e-06, -3.7495046854019165e-06, -3.536231815814972e-06, -3.3229589462280273e-06, -3.1096860766410828e-06, -2.896413207054138e-06, -2.6831403374671936e-06, -2.469867467880249e-06, -2.2565945982933044e-06, -2.04332172870636e-06, -1.8300488591194153e-06, -1.6167759895324707e-06, -1.4035031199455261e-06, -1.1902302503585815e-06, -9.76957380771637e-07, -7.636845111846924e-07, -5.504116415977478e-07, -3.371387720108032e-07, -1.2386590242385864e-07, 8.940696716308594e-08, 3.026798367500305e-07, 5.159527063369751e-07, 7.292255759239197e-07, 9.424984455108643e-07, 1.1557713150978088e-06, 1.3690441846847534e-06, 1.582317054271698e-06, 1.7955899238586426e-06, 2.008862793445587e-06, 2.2221356630325317e-06, 2.4354085326194763e-06, 2.648681402206421e-06, 2.8619542717933655e-06, 3.07522714138031e-06, 3.2885000109672546e-06, 3.5017728805541992e-06, 3.715045750141144e-06, 3.928318619728088e-06, 4.141591489315033e-06, 4.3548643589019775e-06, 4.568137228488922e-06, 4.781410098075867e-06, 4.994682967662811e-06, 5.207955837249756e-06, 5.4212287068367004e-06, 5.634501576423645e-06, 5.84777444601059e-06, 6.061047315597534e-06, 6.274320185184479e-06, 6.487593054771423e-06, 6.700865924358368e-06, 6.9141387939453125e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 4.0, 15.0, 7.0, 10.0, 26.0, 11.0, 44.0, 14.0, 42.0, 28.0, 46.0, 26.0, 57.0, 32.0, 59.0, 42.0, 57.0, 34.0, 42.0, 61.0, 38.0, 61.0, 18.0, 52.0, 19.0, 41.0, 13.0, 31.0, 9.0, 13.0, 4.0, 8.0, 2.0, 7.0, 2.0, 3.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5033950805664062e-06, -2.4158507585525513e-06, -2.3283064365386963e-06, -2.2407621145248413e-06, -2.1532177925109863e-06, -2.0656734704971313e-06, -1.9781291484832764e-06, -1.8905848264694214e-06, -1.8030405044555664e-06, -1.7154961824417114e-06, -1.6279518604278564e-06, -1.5404075384140015e-06, -1.4528632164001465e-06, -1.3653188943862915e-06, -1.2777745723724365e-06, -1.1902302503585815e-06, -1.1026859283447266e-06, -1.0151416063308716e-06, -9.275972843170166e-07, -8.400529623031616e-07, -7.525086402893066e-07, -6.649643182754517e-07, -5.774199962615967e-07, -4.898756742477417e-07, -4.023313522338867e-07, -3.1478703022003174e-07, -2.2724270820617676e-07, -1.3969838619232178e-07, -5.21540641784668e-08, 3.5390257835388184e-08, 1.2293457984924316e-07, 2.1047890186309814e-07, 2.980232238769531e-07, 3.855675458908081e-07, 4.731118679046631e-07, 5.606561899185181e-07, 6.48200511932373e-07, 7.35744833946228e-07, 8.23289155960083e-07, 9.10833477973938e-07, 9.98377799987793e-07, 1.085922122001648e-06, 1.173466444015503e-06, 1.261010766029358e-06, 1.3485550880432129e-06, 1.4360994100570679e-06, 1.5236437320709229e-06, 1.6111880540847778e-06, 1.6987323760986328e-06, 1.7862766981124878e-06, 1.8738210201263428e-06, 1.9613653421401978e-06, 2.0489096641540527e-06, 2.1364539861679077e-06, 2.2239983081817627e-06, 2.3115426301956177e-06, 2.3990869522094727e-06, 2.4866312742233276e-06, 2.5741755962371826e-06, 2.6617199182510376e-06, 2.7492642402648926e-06, 2.8368085622787476e-06, 2.9243528842926025e-06, 3.0118972063064575e-06, 3.0994415283203125e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 9.0, 0.0, 6.0, 18.0, 15.0, 0.0, 35.0, 43.0, 104.0, 140.0, 0.0, 270.0, 336.0, 652.0, 0.0, 1178.0, 1978.0, 3349.0, 0.0, 6717.0, 12400.0, 23181.0, 0.0, 38087.0, 871681.0, 38028.0, 23084.0, 0.0, 12404.0, 6695.0, 3295.0, 0.0, 1980.0, 1194.0, 709.0, 0.0, 349.0, 263.0, 148.0, 0.0, 85.0, 36.0, 31.0, 26.0, 0.0, 9.0, 12.0, 6.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.430511474609375e-06, -1.3848766684532166e-06, -1.339241862297058e-06, -1.2936070561408997e-06, -1.2479722499847412e-06, -1.2023374438285828e-06, -1.1567026376724243e-06, -1.1110678315162659e-06, -1.0654330253601074e-06, -1.019798219203949e-06, -9.741634130477905e-07, -9.285286068916321e-07, -8.828938007354736e-07, -8.372589945793152e-07, -7.916241884231567e-07, -7.459893822669983e-07, -7.003545761108398e-07, -6.547197699546814e-07, -6.09084963798523e-07, -5.634501576423645e-07, -5.178153514862061e-07, -4.721805453300476e-07, -4.2654573917388916e-07, -3.809109330177307e-07, -3.3527612686157227e-07, -2.896413207054138e-07, -2.4400651454925537e-07, -1.9837170839309692e-07, -1.5273690223693848e-07, -1.0710209608078003e-07, -6.146728992462158e-08, -1.5832483768463135e-08, 2.9802322387695312e-08, 7.543712854385376e-08, 1.210719347000122e-07, 1.6670674085617065e-07, 2.123415470123291e-07, 2.5797635316848755e-07, 3.03611159324646e-07, 3.4924596548080444e-07, 3.948807716369629e-07, 4.4051557779312134e-07, 4.861503839492798e-07, 5.317851901054382e-07, 5.774199962615967e-07, 6.230548024177551e-07, 6.686896085739136e-07, 7.14324414730072e-07, 7.599592208862305e-07, 8.055940270423889e-07, 8.512288331985474e-07, 8.968636393547058e-07, 9.424984455108643e-07, 9.881332516670227e-07, 1.0337680578231812e-06, 1.0794028639793396e-06, 1.125037670135498e-06, 1.1706724762916565e-06, 1.216307282447815e-06, 1.2619420886039734e-06, 1.3075768947601318e-06, 1.3532117009162903e-06, 1.3988465070724487e-06, 1.4444813132286072e-06, 1.4901161193847656e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 7.0, 2.0, 0.0, 0.0, 2.0, 8.0, 17.0, 0.0, 35.0, 44.0, 79.0, 0.0, 113.0, 180.0, 301.0, 0.0, 446.0, 793.0, 1240.0, 0.0, 1956.0, 3634.0, 6301.0, 0.0, 11484.0, 26430.0, 63141.0, 0.0, 816274.0, 62872.0, 26747.0, 0.0, 11317.0, 6189.0, 3669.0, 0.0, 2046.0, 1247.0, 773.0, 0.0, 423.0, 303.0, 179.0, 0.0, 130.0, 81.0, 31.0, 0.0, 30.0, 21.0, 11.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 0.0, 2.0, 2.0], "bins": [-1.430511474609375e-06, -1.385807991027832e-06, -1.341104507446289e-06, -1.296401023864746e-06, -1.2516975402832031e-06, -1.2069940567016602e-06, -1.1622905731201172e-06, -1.1175870895385742e-06, -1.0728836059570312e-06, -1.0281801223754883e-06, -9.834766387939453e-07, -9.387731552124023e-07, -8.940696716308594e-07, -8.493661880493164e-07, -8.046627044677734e-07, -7.599592208862305e-07, -7.152557373046875e-07, -6.705522537231445e-07, -6.258487701416016e-07, -5.811452865600586e-07, -5.364418029785156e-07, -4.917383193969727e-07, -4.470348358154297e-07, -4.023313522338867e-07, -3.5762786865234375e-07, -3.129243850708008e-07, -2.682209014892578e-07, -2.2351741790771484e-07, -1.7881393432617188e-07, -1.341104507446289e-07, -8.940696716308594e-08, -4.470348358154297e-08, 0.0, 4.470348358154297e-08, 8.940696716308594e-08, 1.341104507446289e-07, 1.7881393432617188e-07, 2.2351741790771484e-07, 2.682209014892578e-07, 3.129243850708008e-07, 3.5762786865234375e-07, 4.023313522338867e-07, 4.470348358154297e-07, 4.917383193969727e-07, 5.364418029785156e-07, 5.811452865600586e-07, 6.258487701416016e-07, 6.705522537231445e-07, 7.152557373046875e-07, 7.599592208862305e-07, 8.046627044677734e-07, 8.493661880493164e-07, 8.940696716308594e-07, 9.387731552124023e-07, 9.834766387939453e-07, 1.0281801223754883e-06, 1.0728836059570312e-06, 1.1175870895385742e-06, 1.1622905731201172e-06, 1.2069940567016602e-06, 1.2516975402832031e-06, 1.296401023864746e-06, 1.341104507446289e-06, 1.385807991027832e-06, 1.430511474609375e-06]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 0.0, 0.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 0.0, 85.0, 0.0, 0.0, 0.0, 0.0, 0.0, 723.0, 0.0, 0.0, 0.0, 0.0, 72.0, 0.0, 0.0, 0.0, 0.0, 47.0, 0.0, 0.0, 0.0, 0.0, 0.0, 17.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.5762786865234375e-07, -3.46451997756958e-07, -3.3527612686157227e-07, -3.241002559661865e-07, -3.129243850708008e-07, -3.0174851417541504e-07, -2.905726432800293e-07, -2.7939677238464355e-07, -2.682209014892578e-07, -2.5704503059387207e-07, -2.4586915969848633e-07, -2.3469328880310059e-07, -2.2351741790771484e-07, -2.123415470123291e-07, -2.0116567611694336e-07, -1.8998980522155762e-07, -1.7881393432617188e-07, -1.6763806343078613e-07, -1.564621925354004e-07, -1.4528632164001465e-07, -1.341104507446289e-07, -1.2293457984924316e-07, -1.1175870895385742e-07, -1.0058283805847168e-07, -8.940696716308594e-08, -7.82310962677002e-08, -6.705522537231445e-08, -5.587935447692871e-08, -4.470348358154297e-08, -3.3527612686157227e-08, -2.2351741790771484e-08, -1.1175870895385742e-08, 0.0, 1.1175870895385742e-08, 2.2351741790771484e-08, 3.3527612686157227e-08, 4.470348358154297e-08, 5.587935447692871e-08, 6.705522537231445e-08, 7.82310962677002e-08, 8.940696716308594e-08, 1.0058283805847168e-07, 1.1175870895385742e-07, 1.2293457984924316e-07, 1.341104507446289e-07, 1.4528632164001465e-07, 1.564621925354004e-07, 1.6763806343078613e-07, 1.7881393432617188e-07, 1.8998980522155762e-07, 2.0116567611694336e-07, 2.123415470123291e-07, 2.2351741790771484e-07, 2.3469328880310059e-07, 2.4586915969848633e-07, 2.5704503059387207e-07, 2.682209014892578e-07, 2.7939677238464355e-07, 2.905726432800293e-07, 3.0174851417541504e-07, 3.129243850708008e-07, 3.241002559661865e-07, 3.3527612686157227e-07, 3.46451997756958e-07, 3.5762786865234375e-07]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 8.0, 3.0, 5.0, 8.0, 5.0, 16.0, 14.0, 33.0, 29.0, 51.0, 74.0, 86.0, 107.0, 157.0, 110.0, 85.0, 60.0, 25.0, 32.0, 27.0, 21.0, 11.0, 9.0, 7.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.029113021417288e-06, -6.789800409023883e-06, -6.550488251377828e-06, -6.311175638984423e-06, -6.071863026591018e-06, -5.8325504141976126e-06, -5.593238256551558e-06, -5.353925644158153e-06, -5.1146134865120985e-06, -4.875300874118693e-06, -4.635988716472639e-06, -4.3966761040792335e-06, -4.157363491685828e-06, -3.918051334039774e-06, -3.6787387216463685e-06, -3.4394261092529632e-06, -3.200113496859558e-06, -2.960801111839828e-06, -2.721488499446423e-06, -2.482176114426693e-06, -2.2428635020332877e-06, -2.003551117013558e-06, -1.764238731993828e-06, -1.5249262332872604e-06, -1.2856137345806928e-06, -1.0463012358741253e-06, -8.069887940109766e-07, -5.676763521478279e-07, -3.283638534412603e-07, -8.905135473469272e-08, 1.5026103028503712e-07, 3.895735289916047e-07, 6.288855729508214e-07, 8.681980716573889e-07, 1.1075105703639565e-06, 1.3468229553836863e-06, 1.586135454090254e-06, 1.8254479527968215e-06, 2.0647603378165513e-06, 2.3040729502099566e-06, 2.5433853352296865e-06, 2.7826977202494163e-06, 3.0220103326428216e-06, 3.2613227176625514e-06, 3.5006351026822813e-06, 3.7399477150756866e-06, 3.979260327469092e-06, 4.218572485115146e-06, 4.4578850975085516e-06, 4.697197709901957e-06, 4.936509867548011e-06, 5.1758224799414165e-06, 5.415135092334822e-06, 5.654447704728227e-06, 5.8937598623742815e-06, 6.133072474767687e-06, 6.372384632413741e-06, 6.6116972448071465e-06, 6.851009402453201e-06, 7.090322014846606e-06, 7.3296346272400115e-06, 7.568946784886066e-06, 7.808259397279471e-06, 8.047572009672876e-06, 8.286884622066282e-06]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 9.0, 6.0, 6.0, 6.0, 11.0, 9.0, 8.0, 9.0, 20.0, 17.0, 22.0, 22.0, 19.0, 27.0, 22.0, 32.0, 37.0, 32.0, 39.0, 34.0, 35.0, 46.0, 48.0, 40.0, 30.0, 29.0, 37.0, 31.0, 34.0, 39.0, 29.0, 29.0, 29.0, 27.0, 13.0, 22.0, 18.0, 14.0, 15.0, 10.0, 9.0, 6.0, 6.0, 5.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.230051561331493e-06, -3.110239731540787e-06, -2.9904281291237567e-06, -2.870616299333051e-06, -2.750804469542345e-06, -2.6309926397516392e-06, -2.5111808099609334e-06, -2.391369207543903e-06, -2.2715573777531972e-06, -2.1517455479624914e-06, -2.031933945545461e-06, -1.9121221157547552e-06, -1.7923102859640494e-06, -1.6724984561733436e-06, -1.5526867400694755e-06, -1.4328750239656074e-06, -1.3130631941749016e-06, -1.1932513643841958e-06, -1.0734396482803277e-06, -9.536278753330407e-07, -8.338161023857538e-07, -7.140043294384668e-07, -5.941925564911799e-07, -4.743807835438929e-07, -3.5456901059660595e-07, -2.34757237649319e-07, -1.1494546470203204e-07, 4.866308245254913e-09, 1.2467808119254187e-07, 2.444898541398288e-07, 3.643016270871158e-07, 4.841134000344027e-07, 6.039249456080142e-07, 7.237367185553012e-07, 8.435484915025881e-07, 9.633602076064562e-07, 1.083172037397162e-06, 1.2029838671878679e-06, 1.322795583291736e-06, 1.442607299395604e-06, 1.5624191291863099e-06, 1.6822309589770157e-06, 1.8020426750808838e-06, 1.921854391184752e-06, 2.0416662209754577e-06, 2.1614780507661635e-06, 2.281289653183194e-06, 2.4011014829738997e-06, 2.5209133127646055e-06, 2.6407251425553113e-06, 2.760536972346017e-06, 2.8803485747630475e-06, 3.0001604045537533e-06, 3.119972234344459e-06, 3.2397838367614895e-06, 3.3595956665521953e-06, 3.479407496342901e-06, 3.599219326133607e-06, 3.7190311559243128e-06, 3.838842985715019e-06, 3.958654815505724e-06, 4.078466190549079e-06, 4.198278020339785e-06, 4.318089850130491e-06, 4.437901679921197e-06]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 11.0, 24.0, 16.0, 25.0, 48.0, 76.0, 166.0, 205.0, 315.0, 484.0, 1162.0, 1532.0, 2423.0, 3830.0, 5978.0, 14163.0, 19227.0, 34168.0, 64423.0, 134483.0, 555725.0, 1616359.0, 1124084.0, 324154.0, 164720.0, 54082.0, 29507.0, 16855.0, 10008.0, 7289.0, 3226.0, 1923.0, 1262.0, 994.0, 452.0, 328.0, 187.0, 109.0, 120.0, 46.0, 31.0, 24.0, 16.0, 9.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.496906280517578e-06, -6.3050538301467896e-06, -6.113201379776001e-06, -5.921348929405212e-06, -5.729496479034424e-06, -5.537644028663635e-06, -5.345791578292847e-06, -5.153939127922058e-06, -4.9620866775512695e-06, -4.770234227180481e-06, -4.578381776809692e-06, -4.386529326438904e-06, -4.194676876068115e-06, -4.002824425697327e-06, -3.810971975326538e-06, -3.6191195249557495e-06, -3.427267074584961e-06, -3.2354146242141724e-06, -3.043562173843384e-06, -2.8517097234725952e-06, -2.6598572731018066e-06, -2.468004822731018e-06, -2.2761523723602295e-06, -2.084299921989441e-06, -1.8924474716186523e-06, -1.7005950212478638e-06, -1.5087425708770752e-06, -1.3168901205062866e-06, -1.125037670135498e-06, -9.331852197647095e-07, -7.413327693939209e-07, -5.494803190231323e-07, -3.5762786865234375e-07, -1.6577541828155518e-07, 2.60770320892334e-08, 2.1792948246002197e-07, 4.0978193283081055e-07, 6.016343832015991e-07, 7.934868335723877e-07, 9.853392839431763e-07, 1.1771917343139648e-06, 1.3690441846847534e-06, 1.560896635055542e-06, 1.7527490854263306e-06, 1.944601535797119e-06, 2.1364539861679077e-06, 2.3283064365386963e-06, 2.520158886909485e-06, 2.7120113372802734e-06, 2.903863787651062e-06, 3.0957162380218506e-06, 3.287568688392639e-06, 3.4794211387634277e-06, 3.6712735891342163e-06, 3.863126039505005e-06, 4.0549784898757935e-06, 4.246830940246582e-06, 4.438683390617371e-06, 4.630535840988159e-06, 4.822388291358948e-06, 5.014240741729736e-06, 5.206093192100525e-06, 5.3979456424713135e-06, 5.589798092842102e-06, 5.781650543212891e-06]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 1.0, 6.0, 10.0, 4.0, 11.0, 4.0, 10.0, 22.0, 12.0, 14.0, 18.0, 16.0, 16.0, 38.0, 30.0, 22.0, 28.0, 21.0, 71.0, 32.0, 30.0, 44.0, 35.0, 58.0, 28.0, 42.0, 35.0, 33.0, 30.0, 50.0, 27.0, 22.0, 15.0, 8.0, 41.0, 21.0, 16.0, 10.0, 14.0, 21.0, 4.0, 8.0, 2.0, 3.0, 4.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.8477439880371094e-06, -1.776963472366333e-06, -1.7061829566955566e-06, -1.6354024410247803e-06, -1.564621925354004e-06, -1.4938414096832275e-06, -1.4230608940124512e-06, -1.3522803783416748e-06, -1.2814998626708984e-06, -1.210719347000122e-06, -1.1399388313293457e-06, -1.0691583156585693e-06, -9.98377799987793e-07, -9.275972843170166e-07, -8.568167686462402e-07, -7.860362529754639e-07, -7.152557373046875e-07, -6.444752216339111e-07, -5.736947059631348e-07, -5.029141902923584e-07, -4.3213367462158203e-07, -3.6135315895080566e-07, -2.905726432800293e-07, -2.1979212760925293e-07, -1.4901161193847656e-07, -7.82310962677002e-08, -7.450580596923828e-09, 6.332993507385254e-08, 1.341104507446289e-07, 2.0489096641540527e-07, 2.7567148208618164e-07, 3.46451997756958e-07, 4.172325134277344e-07, 4.880130290985107e-07, 5.587935447692871e-07, 6.295740604400635e-07, 7.003545761108398e-07, 7.711350917816162e-07, 8.419156074523926e-07, 9.126961231231689e-07, 9.834766387939453e-07, 1.0542571544647217e-06, 1.125037670135498e-06, 1.1958181858062744e-06, 1.2665987014770508e-06, 1.3373792171478271e-06, 1.4081597328186035e-06, 1.4789402484893799e-06, 1.5497207641601562e-06, 1.6205012798309326e-06, 1.691281795501709e-06, 1.7620623111724854e-06, 1.8328428268432617e-06, 1.903623342514038e-06, 1.9744038581848145e-06, 2.045184373855591e-06, 2.115964889526367e-06, 2.1867454051971436e-06, 2.25752592086792e-06, 2.3283064365386963e-06, 2.3990869522094727e-06, 2.469867467880249e-06, 2.5406479835510254e-06, 2.6114284992218018e-06, 2.682209014892578e-06]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 2.0, 21.0, 19.0, 38.0, 47.0, 48.0, 126.0, 157.0, 202.0, 477.0, 548.0, 1293.0, 1458.0, 2145.0, 5352.0, 5999.0, 9240.0, 24786.0, 29166.0, 83643.0, 109289.0, 200380.0, 745625.0, 1233239.0, 869551.0, 513302.0, 146653.0, 108985.0, 37645.0, 23130.0, 19746.0, 7431.0, 4876.0, 4461.0, 1571.0, 1596.0, 652.0, 432.0, 419.0, 169.0, 112.0, 98.0, 48.0, 48.0, 18.0, 11.0, 17.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.351139068603516e-06, -4.209578037261963e-06, -4.06801700592041e-06, -3.926455974578857e-06, -3.7848949432373047e-06, -3.643333911895752e-06, -3.5017728805541992e-06, -3.3602118492126465e-06, -3.2186508178710938e-06, -3.077089786529541e-06, -2.9355287551879883e-06, -2.7939677238464355e-06, -2.652406692504883e-06, -2.51084566116333e-06, -2.3692846298217773e-06, -2.2277235984802246e-06, -2.086162567138672e-06, -1.944601535797119e-06, -1.8030405044555664e-06, -1.6614794731140137e-06, -1.519918441772461e-06, -1.3783574104309082e-06, -1.2367963790893555e-06, -1.0952353477478027e-06, -9.5367431640625e-07, -8.121132850646973e-07, -6.705522537231445e-07, -5.289912223815918e-07, -3.8743019104003906e-07, -2.4586915969848633e-07, -1.043081283569336e-07, 3.725290298461914e-08, 1.7881393432617188e-07, 3.203749656677246e-07, 4.6193599700927734e-07, 6.034970283508301e-07, 7.450580596923828e-07, 8.866190910339355e-07, 1.0281801223754883e-06, 1.169741153717041e-06, 1.3113021850585938e-06, 1.4528632164001465e-06, 1.5944242477416992e-06, 1.735985279083252e-06, 1.8775463104248047e-06, 2.0191073417663574e-06, 2.16066837310791e-06, 2.302229404449463e-06, 2.4437904357910156e-06, 2.5853514671325684e-06, 2.726912498474121e-06, 2.868473529815674e-06, 3.0100345611572266e-06, 3.1515955924987793e-06, 3.293156623840332e-06, 3.4347176551818848e-06, 3.5762786865234375e-06, 3.7178397178649902e-06, 3.859400749206543e-06, 4.000961780548096e-06, 4.1425228118896484e-06, 4.284083843231201e-06, 4.425644874572754e-06, 4.567205905914307e-06, 4.708766937255859e-06]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 4.0, 8.0, 0.0, 16.0, 13.0, 0.0, 22.0, 0.0, 36.0, 30.0, 0.0, 37.0, 75.0, 0.0, 91.0, 158.0, 0.0, 160.0, 217.0, 0.0, 271.0, 0.0, 308.0, 364.0, 0.0, 432.0, 395.0, 0.0, 329.0, 282.0, 0.0, 203.0, 0.0, 155.0, 129.0, 0.0, 99.0, 63.0, 0.0, 63.0, 32.0, 0.0, 24.0, 23.0, 0.0, 12.0, 0.0, 16.0, 4.0, 0.0, 7.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.1920928955078125e-06, -1.1539086699485779e-06, -1.1157244443893433e-06, -1.0775402188301086e-06, -1.039355993270874e-06, -1.0011717677116394e-06, -9.629875421524048e-07, -9.248033165931702e-07, -8.866190910339355e-07, -8.484348654747009e-07, -8.102506399154663e-07, -7.720664143562317e-07, -7.338821887969971e-07, -6.956979632377625e-07, -6.575137376785278e-07, -6.193295121192932e-07, -5.811452865600586e-07, -5.42961061000824e-07, -5.047768354415894e-07, -4.6659260988235474e-07, -4.284083843231201e-07, -3.902241587638855e-07, -3.520399332046509e-07, -3.1385570764541626e-07, -2.7567148208618164e-07, -2.3748725652694702e-07, -1.993030309677124e-07, -1.6111880540847778e-07, -1.2293457984924316e-07, -8.475035429000854e-08, -4.6566128730773926e-08, -8.381903171539307e-09, 2.9802322387695312e-08, 6.798654794692993e-08, 1.0617077350616455e-07, 1.4435499906539917e-07, 1.825392246246338e-07, 2.207234501838684e-07, 2.5890767574310303e-07, 2.9709190130233765e-07, 3.3527612686157227e-07, 3.734603524208069e-07, 4.116445779800415e-07, 4.498288035392761e-07, 4.880130290985107e-07, 5.261972546577454e-07, 5.6438148021698e-07, 6.025657057762146e-07, 6.407499313354492e-07, 6.789341568946838e-07, 7.171183824539185e-07, 7.553026080131531e-07, 7.934868335723877e-07, 8.316710591316223e-07, 8.698552846908569e-07, 9.080395102500916e-07, 9.462237358093262e-07, 9.844079613685608e-07, 1.0225921869277954e-06, 1.06077641248703e-06, 1.0989606380462646e-06, 1.1371448636054993e-06, 1.1753290891647339e-06, 1.2135133147239685e-06, 1.2516975402832031e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 12.0, 7.0, 10.0, 16.0, 23.0, 24.0, 32.0, 54.0, 50.0, 68.0, 108.0, 118.0, 96.0, 83.0, 61.0, 53.0, 37.0, 29.0, 26.0, 23.0, 13.0, 8.0, 4.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1600937947805505e-06, -4.0243216972157825e-06, -3.888550054398365e-06, -3.7527779568335973e-06, -3.6170060866425047e-06, -3.481234216451412e-06, -3.345462118886644e-06, -3.2096902486955514e-06, -3.073918378504459e-06, -2.9381465083133662e-06, -2.8023746381222736e-06, -2.6666025405575056e-06, -2.530830670366413e-06, -2.3950588001753204e-06, -2.2592867026105523e-06, -2.1235148324194597e-06, -1.987742962228367e-06, -1.8519710920372745e-06, -1.7161991081593442e-06, -1.5804271242814139e-06, -1.4446552540903213e-06, -1.3088833838992286e-06, -1.1731114000212983e-06, -1.037339416143368e-06, -9.015675459522754e-07, -7.657956189177639e-07, -6.300236918832525e-07, -4.94251764848741e-07, -3.5847983781422954e-07, -2.2270791077971808e-07, -8.693598374520661e-08, 4.883594328930485e-08, 1.8460787032381631e-07, 3.203797973583278e-07, 4.5615172439283924e-07, 5.919236514273507e-07, 7.276955784618622e-07, 8.634675054963736e-07, 9.99239432530885e-07, 1.1350114164088154e-06, 1.270783286599908e-06, 1.4065551567910006e-06, 1.542327140668931e-06, 1.6780991245468613e-06, 1.8138709947379539e-06, 1.9496428649290465e-06, 2.0854149624938145e-06, 2.221186832684907e-06, 2.3569587028759997e-06, 2.4927305730670923e-06, 2.628502443258185e-06, 2.764274540822953e-06, 2.9000464110140456e-06, 3.035818281205138e-06, 3.1715903787699062e-06, 3.307362248960999e-06, 3.4431341191520914e-06, 3.578905989343184e-06, 3.7146778595342766e-06, 3.850449957099045e-06, 3.986221599916462e-06, 4.12199369748123e-06, 4.257765795045998e-06, 4.393537437863415e-06, 4.529309535428183e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 8.0, 3.0, 7.0, 4.0, 7.0, 18.0, 20.0, 22.0, 25.0, 19.0, 23.0, 33.0, 31.0, 29.0, 42.0, 34.0, 47.0, 48.0, 38.0, 46.0, 39.0, 47.0, 38.0, 43.0, 35.0, 34.0, 28.0, 17.0, 23.0, 25.0, 27.0, 23.0, 21.0, 14.0, 15.0, 12.0, 12.0, 10.0, 9.0, 4.0, 1.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.5216900212399196e-06, -2.4381249659199966e-06, -2.354560137973749e-06, -2.270995082653826e-06, -2.1874302547075786e-06, -2.1038651993876556e-06, -2.0203001440677326e-06, -1.936735316121485e-06, -1.8531703744883998e-06, -1.7696054328553146e-06, -1.6860404912222293e-06, -1.602475549589144e-06, -1.518910494269221e-06, -1.4353456663229736e-06, -1.3517806110030506e-06, -1.2682156693699653e-06, -1.18465072773688e-06, -1.1010857861037948e-06, -1.0175208444707096e-06, -9.339558459942054e-07, -8.503909043611202e-07, -7.668259627280349e-07, -6.832609642515308e-07, -5.996960226184456e-07, -5.161310809853603e-07, -4.3256613935227506e-07, -3.490011692974804e-07, -2.654361992426857e-07, -1.8187125760960043e-07, -9.830631597651518e-08, -1.4741317500011064e-08, 6.882362413307419e-08, 1.523887931398349e-07, 2.3595374898377486e-07, 3.1951870482771483e-07, 4.030836748825095e-07, 4.866486165155948e-07, 5.7021355814868e-07, 6.537785566251841e-07, 7.373434982582694e-07, 8.209084398913546e-07, 9.044733815244399e-07, 9.880383231575252e-07, 1.0716032647906104e-06, 1.1551683201105334e-06, 1.238733148056781e-06, 1.322298203376704e-06, 1.4058631450097892e-06, 1.4894280866428744e-06, 1.5729930282759597e-06, 1.656557969909045e-06, 1.7401230252289679e-06, 1.8236878531752154e-06, 1.9072529084951384e-06, 1.9908179638150614e-06, 2.074382791761309e-06, 2.1579476197075564e-06, 2.2415126750274794e-06, 2.325077502973727e-06, 2.40864255829365e-06, 2.4922073862398975e-06, 2.5757724415598204e-06, 2.6593374968797434e-06, 2.742902324825991e-06, 2.826467380145914e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 13.0, 12.0, 11.0, 47.0, 50.0, 42.0, 124.0, 133.0, 133.0, 364.0, 385.0, 590.0, 1349.0, 1462.0, 2114.0, 5178.0, 5753.0, 8995.0, 24371.0, 29510.0, 49133.0, 146766.0, 187487.0, 224959.0, 193772.0, 63780.0, 38341.0, 31081.0, 11336.0, 7040.0, 6151.0, 2442.0, 1679.0, 1669.0, 653.0, 453.0, 471.0, 189.0, 144.0, 157.0, 68.0, 41.0, 41.0, 15.0, 17.0, 15.0, 14.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.0531158447265625e-06, -3.914348781108856e-06, -3.77558171749115e-06, -3.6368146538734436e-06, -3.4980475902557373e-06, -3.359280526638031e-06, -3.2205134630203247e-06, -3.0817463994026184e-06, -2.942979335784912e-06, -2.804212272167206e-06, -2.6654452085494995e-06, -2.5266781449317932e-06, -2.387911081314087e-06, -2.2491440176963806e-06, -2.1103769540786743e-06, -1.971609890460968e-06, -1.8328428268432617e-06, -1.6940757632255554e-06, -1.5553086996078491e-06, -1.4165416359901428e-06, -1.2777745723724365e-06, -1.1390075087547302e-06, -1.000240445137024e-06, -8.614733815193176e-07, -7.227063179016113e-07, -5.83939254283905e-07, -4.4517219066619873e-07, -3.0640512704849243e-07, -1.6763806343078613e-07, -2.8870999813079834e-08, 1.0989606380462646e-07, 2.4866312742233276e-07, 3.8743019104003906e-07, 5.261972546577454e-07, 6.649643182754517e-07, 8.03731381893158e-07, 9.424984455108643e-07, 1.0812655091285706e-06, 1.2200325727462769e-06, 1.3587996363639832e-06, 1.4975666999816895e-06, 1.6363337635993958e-06, 1.775100827217102e-06, 1.9138678908348083e-06, 2.0526349544525146e-06, 2.191402018070221e-06, 2.3301690816879272e-06, 2.4689361453056335e-06, 2.60770320892334e-06, 2.746470272541046e-06, 2.8852373361587524e-06, 3.0240043997764587e-06, 3.162771463394165e-06, 3.3015385270118713e-06, 3.4403055906295776e-06, 3.579072654247284e-06, 3.7178397178649902e-06, 3.8566067814826965e-06, 3.995373845100403e-06, 4.134140908718109e-06, 4.2729079723358154e-06, 4.411675035953522e-06, 4.550442099571228e-06, 4.689209163188934e-06, 4.827976226806641e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 8.0, 10.0, 8.0, 6.0, 16.0, 16.0, 13.0, 43.0, 20.0, 17.0, 32.0, 32.0, 21.0, 51.0, 29.0, 41.0, 72.0, 34.0, 35.0, 62.0, 29.0, 30.0, 53.0, 32.0, 37.0, 17.0, 21.0, 47.0, 15.0, 17.0, 30.0, 9.0, 10.0, 25.0, 13.0, 8.0, 12.0, 3.0, 1.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.3245811462402344e-06, -2.2444874048233032e-06, -2.164393663406372e-06, -2.084299921989441e-06, -2.0042061805725098e-06, -1.9241124391555786e-06, -1.8440186977386475e-06, -1.7639249563217163e-06, -1.6838312149047852e-06, -1.603737473487854e-06, -1.5236437320709229e-06, -1.4435499906539917e-06, -1.3634562492370605e-06, -1.2833625078201294e-06, -1.2032687664031982e-06, -1.123175024986267e-06, -1.043081283569336e-06, -9.629875421524048e-07, -8.828938007354736e-07, -8.028000593185425e-07, -7.227063179016113e-07, -6.426125764846802e-07, -5.62518835067749e-07, -4.824250936508179e-07, -4.023313522338867e-07, -3.2223761081695557e-07, -2.421438694000244e-07, -1.6205012798309326e-07, -8.195638656616211e-08, -1.862645149230957e-09, 7.82310962677002e-08, 1.5832483768463135e-07, 2.384185791015625e-07, 3.1851232051849365e-07, 3.986060619354248e-07, 4.78699803352356e-07, 5.587935447692871e-07, 6.388872861862183e-07, 7.189810276031494e-07, 7.990747690200806e-07, 8.791685104370117e-07, 9.592622518539429e-07, 1.039355993270874e-06, 1.1194497346878052e-06, 1.1995434761047363e-06, 1.2796372175216675e-06, 1.3597309589385986e-06, 1.4398247003555298e-06, 1.519918441772461e-06, 1.600012183189392e-06, 1.6801059246063232e-06, 1.7601996660232544e-06, 1.8402934074401855e-06, 1.9203871488571167e-06, 2.000480890274048e-06, 2.080574631690979e-06, 2.16066837310791e-06, 2.2407621145248413e-06, 2.3208558559417725e-06, 2.4009495973587036e-06, 2.4810433387756348e-06, 2.561137080192566e-06, 2.641230821609497e-06, 2.7213245630264282e-06, 2.8014183044433594e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 6.0, 14.0, 17.0, 26.0, 33.0, 56.0, 76.0, 96.0, 174.0, 325.0, 476.0, 981.0, 2122.0, 4811.0, 16449.0, 127898.0, 859147.0, 24149.0, 6382.0, 2552.0, 1206.0, 628.0, 341.0, 207.0, 111.0, 94.0, 46.0, 38.0, 25.0, 23.0, 13.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3909759521484375e-06, -7.152557373046875e-06, -6.9141387939453125e-06, -6.67572021484375e-06, -6.4373016357421875e-06, -6.198883056640625e-06, -5.9604644775390625e-06, -5.7220458984375e-06, -5.4836273193359375e-06, -5.245208740234375e-06, -5.0067901611328125e-06, -4.76837158203125e-06, -4.5299530029296875e-06, -4.291534423828125e-06, -4.0531158447265625e-06, -3.814697265625e-06, -3.5762786865234375e-06, -3.337860107421875e-06, -3.0994415283203125e-06, -2.86102294921875e-06, -2.6226043701171875e-06, -2.384185791015625e-06, -2.1457672119140625e-06, -1.9073486328125e-06, -1.6689300537109375e-06, -1.430511474609375e-06, -1.1920928955078125e-06, -9.5367431640625e-07, -7.152557373046875e-07, -4.76837158203125e-07, -2.384185791015625e-07, 0.0, 2.384185791015625e-07, 4.76837158203125e-07, 7.152557373046875e-07, 9.5367431640625e-07, 1.1920928955078125e-06, 1.430511474609375e-06, 1.6689300537109375e-06, 1.9073486328125e-06, 2.1457672119140625e-06, 2.384185791015625e-06, 2.6226043701171875e-06, 2.86102294921875e-06, 3.0994415283203125e-06, 3.337860107421875e-06, 3.5762786865234375e-06, 3.814697265625e-06, 4.0531158447265625e-06, 4.291534423828125e-06, 4.5299530029296875e-06, 4.76837158203125e-06, 5.0067901611328125e-06, 5.245208740234375e-06, 5.4836273193359375e-06, 5.7220458984375e-06, 5.9604644775390625e-06, 6.198883056640625e-06, 6.4373016357421875e-06, 6.67572021484375e-06, 6.9141387939453125e-06, 7.152557373046875e-06, 7.3909759521484375e-06, 7.62939453125e-06, 7.867813110351562e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 0.0, 5.0, 0.0, 13.0, 0.0, 17.0, 0.0, 29.0, 49.0, 0.0, 130.0, 0.0, 534.0, 0.0, 109.0, 0.0, 47.0, 0.0, 29.0, 0.0, 16.0, 0.0, 7.0, 0.0, 5.0, 0.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1324882507324219e-06, -1.101754605770111e-06, -1.0710209608078003e-06, -1.0402873158454895e-06, -1.0095536708831787e-06, -9.78820025920868e-07, -9.480863809585571e-07, -9.173527359962463e-07, -8.866190910339355e-07, -8.558854460716248e-07, -8.25151801109314e-07, -7.944181561470032e-07, -7.636845111846924e-07, -7.329508662223816e-07, -7.022172212600708e-07, -6.7148357629776e-07, -6.407499313354492e-07, -6.100162863731384e-07, -5.792826414108276e-07, -5.485489964485168e-07, -5.178153514862061e-07, -4.870817065238953e-07, -4.5634806156158447e-07, -4.256144165992737e-07, -3.948807716369629e-07, -3.641471266746521e-07, -3.334134817123413e-07, -3.026798367500305e-07, -2.7194619178771973e-07, -2.4121254682540894e-07, -2.1047890186309814e-07, -1.7974525690078735e-07, -1.4901161193847656e-07, -1.1827796697616577e-07, -8.754432201385498e-08, -5.681067705154419e-08, -2.60770320892334e-08, 4.6566128730773926e-09, 3.5390257835388184e-08, 6.612390279769897e-08, 9.685754776000977e-08, 1.2759119272232056e-07, 1.5832483768463135e-07, 1.8905848264694214e-07, 2.1979212760925293e-07, 2.505257725715637e-07, 2.812594175338745e-07, 3.119930624961853e-07, 3.427267074584961e-07, 3.734603524208069e-07, 4.041939973831177e-07, 4.3492764234542847e-07, 4.6566128730773926e-07, 4.9639493227005e-07, 5.271285772323608e-07, 5.578622221946716e-07, 5.885958671569824e-07, 6.193295121192932e-07, 6.50063157081604e-07, 6.807968020439148e-07, 7.115304470062256e-07, 7.422640919685364e-07, 7.729977369308472e-07, 8.03731381893158e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 2.0, 5.0, 7.0, 4.0, 34.0, 6.0, 23.0, 43.0, 175.0, 66.0, 103.0, 375.0, 261.0, 496.0, 641.0, 2526.0, 2538.0, 4524.0, 12931.0, 1011845.0, 4618.0, 2562.0, 2475.0, 667.0, 511.0, 271.0, 359.0, 114.0, 61.0, 180.0, 46.0, 18.0, 4.0, 37.0, 4.0, 7.0, 5.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4437904357910156e-06, -2.3674219846725464e-06, -2.291053533554077e-06, -2.214685082435608e-06, -2.1383166313171387e-06, -2.0619481801986694e-06, -1.9855797290802e-06, -1.909211277961731e-06, -1.8328428268432617e-06, -1.7564743757247925e-06, -1.6801059246063232e-06, -1.603737473487854e-06, -1.5273690223693848e-06, -1.4510005712509155e-06, -1.3746321201324463e-06, -1.298263669013977e-06, -1.2218952178955078e-06, -1.1455267667770386e-06, -1.0691583156585693e-06, -9.927898645401e-07, -9.164214134216309e-07, -8.400529623031616e-07, -7.636845111846924e-07, -6.873160600662231e-07, -6.109476089477539e-07, -5.345791578292847e-07, -4.5821070671081543e-07, -3.818422555923462e-07, -3.0547380447387695e-07, -2.2910535335540771e-07, -1.5273690223693848e-07, -7.636845111846924e-08, 0.0, 7.636845111846924e-08, 1.5273690223693848e-07, 2.2910535335540771e-07, 3.0547380447387695e-07, 3.818422555923462e-07, 4.5821070671081543e-07, 5.345791578292847e-07, 6.109476089477539e-07, 6.873160600662231e-07, 7.636845111846924e-07, 8.400529623031616e-07, 9.164214134216309e-07, 9.927898645401e-07, 1.0691583156585693e-06, 1.1455267667770386e-06, 1.2218952178955078e-06, 1.298263669013977e-06, 1.3746321201324463e-06, 1.4510005712509155e-06, 1.5273690223693848e-06, 1.603737473487854e-06, 1.6801059246063232e-06, 1.7564743757247925e-06, 1.8328428268432617e-06, 1.909211277961731e-06, 1.9855797290802e-06, 2.0619481801986694e-06, 2.1383166313171387e-06, 2.214685082435608e-06, 2.291053533554077e-06, 2.3674219846725464e-06, 2.4437904357910156e-06]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 34.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 946.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0], "bins": [-1.7881393432617188e-07, -1.7415732145309448e-07, -1.695007085800171e-07, -1.648440957069397e-07, -1.601874828338623e-07, -1.555308699607849e-07, -1.5087425708770752e-07, -1.4621764421463013e-07, -1.4156103134155273e-07, -1.3690441846847534e-07, -1.3224780559539795e-07, -1.2759119272232056e-07, -1.2293457984924316e-07, -1.1827796697616577e-07, -1.1362135410308838e-07, -1.0896474123001099e-07, -1.043081283569336e-07, -9.96515154838562e-08, -9.499490261077881e-08, -9.033828973770142e-08, -8.568167686462402e-08, -8.102506399154663e-08, -7.636845111846924e-08, -7.171183824539185e-08, -6.705522537231445e-08, -6.239861249923706e-08, -5.774199962615967e-08, -5.3085386753082275e-08, -4.842877388000488e-08, -4.377216100692749e-08, -3.91155481338501e-08, -3.4458935260772705e-08, -2.9802322387695312e-08, -2.514570951461792e-08, -2.0489096641540527e-08, -1.5832483768463135e-08, -1.1175870895385742e-08, -6.51925802230835e-09, -1.862645149230957e-09, 2.7939677238464355e-09, 7.450580596923828e-09, 1.210719347000122e-08, 1.6763806343078613e-08, 2.1420419216156006e-08, 2.60770320892334e-08, 3.073364496231079e-08, 3.5390257835388184e-08, 4.0046870708465576e-08, 4.470348358154297e-08, 4.936009645462036e-08, 5.4016709327697754e-08, 5.8673322200775146e-08, 6.332993507385254e-08, 6.798654794692993e-08, 7.264316082000732e-08, 7.729977369308472e-08, 8.195638656616211e-08, 8.66129994392395e-08, 9.12696123123169e-08, 9.592622518539429e-08, 1.0058283805847168e-07, 1.0523945093154907e-07, 1.0989606380462646e-07, 1.1455267667770386e-07, 1.1920928955078125e-07]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 0.0, 0.0, 14.0, 0.0, 32.0, 0.0, 0.0, 117.0, 0.0, 221.0, 0.0, 0.0, 392.0, 0.0, 901.0, 0.0, 0.0, 1841.0, 0.0, 0.0, 3435.0, 0.0, 8347.0, 0.0, 0.0, 18786.0, 0.0, 980307.0, 0.0, 0.0, 18949.0, 0.0, 8220.0, 0.0, 0.0, 3440.0, 0.0, 1902.0, 0.0, 0.0, 874.0, 0.0, 0.0, 436.0, 0.0, 212.0, 0.0, 0.0, 95.0, 0.0, 25.0, 0.0, 0.0, 13.0, 0.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-7.152557373046875e-07, -6.919726729393005e-07, -6.686896085739136e-07, -6.454065442085266e-07, -6.221234798431396e-07, -5.988404154777527e-07, -5.755573511123657e-07, -5.522742867469788e-07, -5.289912223815918e-07, -5.057081580162048e-07, -4.824250936508179e-07, -4.591420292854309e-07, -4.3585896492004395e-07, -4.12575900554657e-07, -3.8929283618927e-07, -3.6600977182388306e-07, -3.427267074584961e-07, -3.1944364309310913e-07, -2.9616057872772217e-07, -2.728775143623352e-07, -2.4959444999694824e-07, -2.2631138563156128e-07, -2.0302832126617432e-07, -1.7974525690078735e-07, -1.564621925354004e-07, -1.3317912817001343e-07, -1.0989606380462646e-07, -8.66129994392395e-08, -6.332993507385254e-08, -4.0046870708465576e-08, -1.6763806343078613e-08, 6.51925802230835e-09, 2.9802322387695312e-08, 5.3085386753082275e-08, 7.636845111846924e-08, 9.96515154838562e-08, 1.2293457984924316e-07, 1.4621764421463013e-07, 1.695007085800171e-07, 1.9278377294540405e-07, 2.1606683731079102e-07, 2.39349901676178e-07, 2.6263296604156494e-07, 2.859160304069519e-07, 3.0919909477233887e-07, 3.3248215913772583e-07, 3.557652235031128e-07, 3.7904828786849976e-07, 4.023313522338867e-07, 4.256144165992737e-07, 4.4889748096466064e-07, 4.721805453300476e-07, 4.954636096954346e-07, 5.187466740608215e-07, 5.420297384262085e-07, 5.653128027915955e-07, 5.885958671569824e-07, 6.118789315223694e-07, 6.351619958877563e-07, 6.584450602531433e-07, 6.817281246185303e-07, 7.050111889839172e-07, 7.282942533493042e-07, 7.515773177146912e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 938.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0], "bins": [-2.384185791015625e-07, -2.3189932107925415e-07, -2.253800630569458e-07, -2.1886080503463745e-07, -2.123415470123291e-07, -2.0582228899002075e-07, -1.993030309677124e-07, -1.9278377294540405e-07, -1.862645149230957e-07, -1.7974525690078735e-07, -1.73225998878479e-07, -1.6670674085617065e-07, -1.601874828338623e-07, -1.5366822481155396e-07, -1.471489667892456e-07, -1.4062970876693726e-07, -1.341104507446289e-07, -1.2759119272232056e-07, -1.210719347000122e-07, -1.1455267667770386e-07, -1.0803341865539551e-07, -1.0151416063308716e-07, -9.499490261077881e-08, -8.847564458847046e-08, -8.195638656616211e-08, -7.543712854385376e-08, -6.891787052154541e-08, -6.239861249923706e-08, -5.587935447692871e-08, -4.936009645462036e-08, -4.284083843231201e-08, -3.632158041000366e-08, -2.9802322387695312e-08, -2.3283064365386963e-08, -1.6763806343078613e-08, -1.0244548320770264e-08, -3.725290298461914e-09, 2.7939677238464355e-09, 9.313225746154785e-09, 1.5832483768463135e-08, 2.2351741790771484e-08, 2.8870999813079834e-08, 3.5390257835388184e-08, 4.190951585769653e-08, 4.842877388000488e-08, 5.494803190231323e-08, 6.146728992462158e-08, 6.798654794692993e-08, 7.450580596923828e-08, 8.102506399154663e-08, 8.754432201385498e-08, 9.406358003616333e-08, 1.0058283805847168e-07, 1.0710209608078003e-07, 1.1362135410308838e-07, 1.2014061212539673e-07, 1.2665987014770508e-07, 1.3317912817001343e-07, 1.3969838619232178e-07, 1.4621764421463013e-07, 1.5273690223693848e-07, 1.5925616025924683e-07, 1.6577541828155518e-07, 1.7229467630386353e-07, 1.7881393432617188e-07]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 9.0, 8.0, 10.0, 18.0, 12.0, 25.0, 34.0, 42.0, 62.0, 64.0, 90.0, 124.0, 118.0, 77.0, 55.0, 56.0, 33.0, 36.0, 20.0, 23.0, 18.0, 11.0, 12.0, 13.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.906332040060079e-06, -3.780031420319574e-06, -3.6537310279527446e-06, -3.5274306355859153e-06, -3.4011300158454105e-06, -3.2748293961049058e-06, -3.1485290037380764e-06, -3.022228611371247e-06, -2.8959279916307423e-06, -2.7696273718902376e-06, -2.6433269795234082e-06, -2.517026587156579e-06, -2.390725967416074e-06, -2.2644253476755694e-06, -2.13812495530874e-06, -2.0118245629419107e-06, -1.885523943201406e-06, -1.7592234371477389e-06, -1.6329229310940718e-06, -1.5066224250404048e-06, -1.3803219189867377e-06, -1.2540214129330707e-06, -1.1277209068794036e-06, -1.0014204008257366e-06, -8.751198947720695e-07, -7.488193887184025e-07, -6.225188826647354e-07, -4.962183766110684e-07, -3.6991787055740133e-07, -2.436173645037343e-07, -1.1731685845006723e-07, 8.98364760359982e-09, 1.3528415365726687e-07, 2.615846597109339e-07, 3.8788516576460097e-07, 5.14185671818268e-07, 6.404861778719351e-07, 7.667866839256021e-07, 8.930871899792692e-07, 1.0193876960329362e-06, 1.1456882020866033e-06, 1.2719887081402703e-06, 1.3982892141939374e-06, 1.5245897202476044e-06, 1.6508902263012715e-06, 1.7771907323549385e-06, 1.9034912384086056e-06, 2.029791630775435e-06, 2.1560922505159397e-06, 2.2823928702564444e-06, 2.4086932626232738e-06, 2.534993654990103e-06, 2.661294274730608e-06, 2.7875948944711126e-06, 2.913895286837942e-06, 3.0401956792047713e-06, 3.166496298945276e-06, 3.292796918685781e-06, 3.41909731105261e-06, 3.5453977034194395e-06, 3.6716983231599443e-06, 3.797998942900449e-06, 3.924299562640954e-06, 4.050599727634108e-06, 4.1769003473746125e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 6.0, 5.0, 7.0, 3.0, 6.0, 13.0, 22.0, 18.0, 23.0, 24.0, 21.0, 35.0, 29.0, 33.0, 31.0, 40.0, 48.0, 39.0, 43.0, 48.0, 41.0, 39.0, 44.0, 37.0, 42.0, 31.0, 31.0, 18.0, 26.0, 25.0, 22.0, 31.0, 16.0, 16.0, 16.0, 14.0, 12.0, 11.0, 6.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.3932695967232576e-06, -2.314866378583247e-06, -2.2364629330695607e-06, -2.15805971492955e-06, -2.079656269415864e-06, -2.001253051275853e-06, -1.922849605762167e-06, -1.8444463876221562e-06, -1.7660431694821455e-06, -1.687639837655297e-06, -1.6092365058284486e-06, -1.5308332876884378e-06, -1.4524299558615894e-06, -1.374026624034741e-06, -1.2956232922078925e-06, -1.217219960381044e-06, -1.1388166285541956e-06, -1.0604132967273472e-06, -9.820099649004987e-07, -9.036066899170692e-07, -8.252034149336396e-07, -7.468000831067911e-07, -6.683967512799427e-07, -5.899934762965131e-07, -5.115901444696647e-07, -4.3318684106452565e-07, -3.5478353765938664e-07, -2.763802058325382e-07, -1.9797690242739918e-07, -1.1957359902226017e-07, -4.1170267195411725e-08, 3.723300778801786e-08, 1.156363396148663e-07, 1.9403964302000531e-07, 2.7244294642514433e-07, 3.5084627825199277e-07, 4.292495816571318e-07, 5.076528850622708e-07, 5.860562168891192e-07, 6.644594918725488e-07, 7.428628236993973e-07, 8.212661555262457e-07, 8.996694305096753e-07, 9.780727623365237e-07, 1.0564760941633722e-06, 1.134879312303383e-06, 1.213282757817069e-06, 1.2916859759570798e-06, 1.3700893077839282e-06, 1.4484926396107767e-06, 1.5268959714376251e-06, 1.6052993032644736e-06, 1.6837025214044843e-06, 1.7621058532313327e-06, 1.8405091850581812e-06, 1.918912403198192e-06, 1.997315848711878e-06, 2.0757190668518888e-06, 2.154122512365575e-06, 2.2325257305055857e-06, 2.310929176019272e-06, 2.3893323941592826e-06, 2.4677356122992933e-06, 2.5461390578129794e-06, 2.62454227595299e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 8.0, 14.0, 15.0, 30.0, 47.0, 59.0, 136.0, 142.0, 189.0, 452.0, 446.0, 1046.0, 1086.0, 2458.0, 2461.0, 5652.0, 5763.0, 8701.0, 21124.0, 24530.0, 67791.0, 85061.0, 243854.0, 206094.0, 144229.0, 113471.0, 39477.0, 33170.0, 12561.0, 11620.0, 4837.0, 4678.0, 2085.0, 1542.0, 1423.0, 644.0, 701.0, 281.0, 276.0, 113.0, 86.0, 73.0, 35.0, 37.0, 21.0, 9.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.410743713378906e-06, -4.265457391738892e-06, -4.120171070098877e-06, -3.974884748458862e-06, -3.829598426818848e-06, -3.684312105178833e-06, -3.5390257835388184e-06, -3.3937394618988037e-06, -3.248453140258789e-06, -3.1031668186187744e-06, -2.9578804969787598e-06, -2.812594175338745e-06, -2.6673078536987305e-06, -2.522021532058716e-06, -2.376735210418701e-06, -2.2314488887786865e-06, -2.086162567138672e-06, -1.9408762454986572e-06, -1.7955899238586426e-06, -1.650303602218628e-06, -1.5050172805786133e-06, -1.3597309589385986e-06, -1.214444637298584e-06, -1.0691583156585693e-06, -9.238719940185547e-07, -7.7858567237854e-07, -6.332993507385254e-07, -4.880130290985107e-07, -3.427267074584961e-07, -1.9744038581848145e-07, -5.21540641784668e-08, 9.313225746154785e-08, 2.384185791015625e-07, 3.8370490074157715e-07, 5.289912223815918e-07, 6.742775440216064e-07, 8.195638656616211e-07, 9.648501873016357e-07, 1.1101365089416504e-06, 1.255422830581665e-06, 1.4007091522216797e-06, 1.5459954738616943e-06, 1.691281795501709e-06, 1.8365681171417236e-06, 1.9818544387817383e-06, 2.127140760421753e-06, 2.2724270820617676e-06, 2.4177134037017822e-06, 2.562999725341797e-06, 2.7082860469818115e-06, 2.853572368621826e-06, 2.998858690261841e-06, 3.1441450119018555e-06, 3.28943133354187e-06, 3.4347176551818848e-06, 3.5800039768218994e-06, 3.725290298461914e-06, 3.870576620101929e-06, 4.015862941741943e-06, 4.161149263381958e-06, 4.306435585021973e-06, 4.451721906661987e-06, 4.597008228302002e-06, 4.742294549942017e-06, 4.887580871582031e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 8.0, 3.0, 7.0, 8.0, 11.0, 10.0, 15.0, 17.0, 48.0, 19.0, 24.0, 19.0, 31.0, 36.0, 32.0, 42.0, 41.0, 40.0, 42.0, 32.0, 45.0, 45.0, 39.0, 35.0, 38.0, 24.0, 40.0, 25.0, 26.0, 50.0, 23.0, 12.0, 13.0, 19.0, 11.0, 13.0, 5.0, 9.0, 6.0, 5.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0], "bins": [-2.086162567138672e-06, -2.023763954639435e-06, -1.9613653421401978e-06, -1.8989667296409607e-06, -1.8365681171417236e-06, -1.7741695046424866e-06, -1.7117708921432495e-06, -1.6493722796440125e-06, -1.5869736671447754e-06, -1.5245750546455383e-06, -1.4621764421463013e-06, -1.3997778296470642e-06, -1.3373792171478271e-06, -1.27498060464859e-06, -1.212581992149353e-06, -1.150183379650116e-06, -1.087784767150879e-06, -1.0253861546516418e-06, -9.629875421524048e-07, -9.005889296531677e-07, -8.381903171539307e-07, -7.757917046546936e-07, -7.133930921554565e-07, -6.509944796562195e-07, -5.885958671569824e-07, -5.261972546577454e-07, -4.637986421585083e-07, -4.0140002965927124e-07, -3.390014171600342e-07, -2.766028046607971e-07, -2.1420419216156006e-07, -1.51805579662323e-07, -8.940696716308594e-08, -2.7008354663848877e-08, 3.5390257835388184e-08, 9.778887033462524e-08, 1.601874828338623e-07, 2.2258609533309937e-07, 2.849847078323364e-07, 3.473833203315735e-07, 4.0978193283081055e-07, 4.721805453300476e-07, 5.345791578292847e-07, 5.969777703285217e-07, 6.593763828277588e-07, 7.217749953269958e-07, 7.841736078262329e-07, 8.4657222032547e-07, 9.08970832824707e-07, 9.71369445323944e-07, 1.0337680578231812e-06, 1.0961666703224182e-06, 1.1585652828216553e-06, 1.2209638953208923e-06, 1.2833625078201294e-06, 1.3457611203193665e-06, 1.4081597328186035e-06, 1.4705583453178406e-06, 1.5329569578170776e-06, 1.5953555703163147e-06, 1.6577541828155518e-06, 1.7201527953147888e-06, 1.7825514078140259e-06, 1.844950020313263e-06, 1.9073486328125e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 12.0, 7.0, 17.0, 13.0, 34.0, 48.0, 75.0, 64.0, 151.0, 210.0, 321.0, 257.0, 603.0, 905.0, 664.0, 1847.0, 2782.0, 4368.0, 2944.0, 8737.0, 14198.0, 23755.0, 17267.0, 51646.0, 88900.0, 148465.0, 100668.0, 211268.0, 148369.0, 50379.0, 67936.0, 39805.0, 23741.0, 7962.0, 11129.0, 6801.0, 4358.0, 1526.0, 2219.0, 1357.0, 948.0, 362.0, 502.0, 318.0, 118.0, 178.0, 111.0, 88.0, 23.0, 49.0, 20.0, 18.0, 4.0, 8.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-3.2186508178710938e-06, -3.1152740120887756e-06, -3.0118972063064575e-06, -2.9085204005241394e-06, -2.8051435947418213e-06, -2.701766788959503e-06, -2.598389983177185e-06, -2.495013177394867e-06, -2.391636371612549e-06, -2.2882595658302307e-06, -2.1848827600479126e-06, -2.0815059542655945e-06, -1.9781291484832764e-06, -1.8747523427009583e-06, -1.7713755369186401e-06, -1.667998731136322e-06, -1.564621925354004e-06, -1.4612451195716858e-06, -1.3578683137893677e-06, -1.2544915080070496e-06, -1.1511147022247314e-06, -1.0477378964424133e-06, -9.443610906600952e-07, -8.409842848777771e-07, -7.37607479095459e-07, -6.342306733131409e-07, -5.308538675308228e-07, -4.2747706174850464e-07, -3.241002559661865e-07, -2.207234501838684e-07, -1.1734664440155029e-07, -1.3969838619232178e-08, 8.940696716308594e-08, 1.9278377294540405e-07, 2.9616057872772217e-07, 3.995373845100403e-07, 5.029141902923584e-07, 6.062909960746765e-07, 7.096678018569946e-07, 8.130446076393127e-07, 9.164214134216309e-07, 1.019798219203949e-06, 1.123175024986267e-06, 1.2265518307685852e-06, 1.3299286365509033e-06, 1.4333054423332214e-06, 1.5366822481155396e-06, 1.6400590538978577e-06, 1.7434358596801758e-06, 1.846812665462494e-06, 1.950189471244812e-06, 2.05356627702713e-06, 2.1569430828094482e-06, 2.2603198885917664e-06, 2.3636966943740845e-06, 2.4670735001564026e-06, 2.5704503059387207e-06, 2.673827111721039e-06, 2.777203917503357e-06, 2.880580723285675e-06, 2.983957529067993e-06, 3.0873343348503113e-06, 3.1907111406326294e-06, 3.2940879464149475e-06, 3.3974647521972656e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 0.0, 6.0, 11.0, 0.0, 9.0, 0.0, 14.0, 24.0, 0.0, 29.0, 28.0, 0.0, 34.0, 40.0, 0.0, 40.0, 46.0, 0.0, 58.0, 0.0, 46.0, 54.0, 0.0, 74.0, 60.0, 0.0, 56.0, 57.0, 0.0, 59.0, 0.0, 43.0, 40.0, 0.0, 39.0, 36.0, 0.0, 26.0, 17.0, 0.0, 17.0, 15.0, 0.0, 8.0, 0.0, 4.0, 4.0, 0.0, 6.0, 7.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1920928955078125e-06, -1.1539086699485779e-06, -1.1157244443893433e-06, -1.0775402188301086e-06, -1.039355993270874e-06, -1.0011717677116394e-06, -9.629875421524048e-07, -9.248033165931702e-07, -8.866190910339355e-07, -8.484348654747009e-07, -8.102506399154663e-07, -7.720664143562317e-07, -7.338821887969971e-07, -6.956979632377625e-07, -6.575137376785278e-07, -6.193295121192932e-07, -5.811452865600586e-07, -5.42961061000824e-07, -5.047768354415894e-07, -4.6659260988235474e-07, -4.284083843231201e-07, -3.902241587638855e-07, -3.520399332046509e-07, -3.1385570764541626e-07, -2.7567148208618164e-07, -2.3748725652694702e-07, -1.993030309677124e-07, -1.6111880540847778e-07, -1.2293457984924316e-07, -8.475035429000854e-08, -4.6566128730773926e-08, -8.381903171539307e-09, 2.9802322387695312e-08, 6.798654794692993e-08, 1.0617077350616455e-07, 1.4435499906539917e-07, 1.825392246246338e-07, 2.207234501838684e-07, 2.5890767574310303e-07, 2.9709190130233765e-07, 3.3527612686157227e-07, 3.734603524208069e-07, 4.116445779800415e-07, 4.498288035392761e-07, 4.880130290985107e-07, 5.261972546577454e-07, 5.6438148021698e-07, 6.025657057762146e-07, 6.407499313354492e-07, 6.789341568946838e-07, 7.171183824539185e-07, 7.553026080131531e-07, 7.934868335723877e-07, 8.316710591316223e-07, 8.698552846908569e-07, 9.080395102500916e-07, 9.462237358093262e-07, 9.844079613685608e-07, 1.0225921869277954e-06, 1.06077641248703e-06, 1.0989606380462646e-06, 1.1371448636054993e-06, 1.1753290891647339e-06, 1.2135133147239685e-06, 1.2516975402832031e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 10.0, 5.0, 3.0, 2.0, 16.0, 8.0, 12.0, 18.0, 44.0, 36.0, 50.0, 64.0, 254.0, 223.0, 390.0, 473.0, 2443.0, 1845.0, 3254.0, 6932.0, 39792.0, 45628.0, 845471.0, 45878.0, 39612.0, 6938.0, 3203.0, 1892.0, 2415.0, 459.0, 403.0, 236.0, 266.0, 66.0, 48.0, 33.0, 40.0, 10.0, 21.0, 12.0, 11.0, 5.0, 4.0, 4.0, 15.0, 1.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2649765014648438e-06, -2.1904706954956055e-06, -2.115964889526367e-06, -2.041459083557129e-06, -1.9669532775878906e-06, -1.8924474716186523e-06, -1.817941665649414e-06, -1.7434358596801758e-06, -1.6689300537109375e-06, -1.5944242477416992e-06, -1.519918441772461e-06, -1.4454126358032227e-06, -1.3709068298339844e-06, -1.296401023864746e-06, -1.2218952178955078e-06, -1.1473894119262695e-06, -1.0728836059570312e-06, -9.98377799987793e-07, -9.238719940185547e-07, -8.493661880493164e-07, -7.748603820800781e-07, -7.003545761108398e-07, -6.258487701416016e-07, -5.513429641723633e-07, -4.76837158203125e-07, -4.023313522338867e-07, -3.2782554626464844e-07, -2.5331974029541016e-07, -1.7881393432617188e-07, -1.043081283569336e-07, -2.9802322387695312e-08, 4.470348358154297e-08, 1.1920928955078125e-07, 1.9371509552001953e-07, 2.682209014892578e-07, 3.427267074584961e-07, 4.172325134277344e-07, 4.917383193969727e-07, 5.662441253662109e-07, 6.407499313354492e-07, 7.152557373046875e-07, 7.897615432739258e-07, 8.642673492431641e-07, 9.387731552124023e-07, 1.0132789611816406e-06, 1.087784767150879e-06, 1.1622905731201172e-06, 1.2367963790893555e-06, 1.3113021850585938e-06, 1.385807991027832e-06, 1.4603137969970703e-06, 1.5348196029663086e-06, 1.6093254089355469e-06, 1.6838312149047852e-06, 1.7583370208740234e-06, 1.8328428268432617e-06, 1.9073486328125e-06, 1.9818544387817383e-06, 2.0563602447509766e-06, 2.130866050720215e-06, 2.205371856689453e-06, 2.2798776626586914e-06, 2.3543834686279297e-06, 2.428889274597168e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 0.0, 6.0, 14.0, 20.0, 25.0, 0.0, 42.0, 54.0, 95.0, 122.0, 0.0, 156.0, 246.0, 321.0, 459.0, 0.0, 710.0, 1004.0, 1633.0, 2501.0, 0.0, 4069.0, 6990.0, 11824.0, 28556.0, 0.0, 69955.0, 791042.0, 69877.0, 28612.0, 0.0, 11821.0, 6903.0, 4091.0, 2486.0, 0.0, 1639.0, 1011.0, 698.0, 464.0, 0.0, 309.0, 277.0, 152.0, 118.0, 0.0, 87.0, 62.0, 37.0, 33.0, 0.0, 16.0, 14.0, 9.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4426186680793762e-06, -1.3951212167739868e-06, -1.3476237654685974e-06, -1.300126314163208e-06, -1.2526288628578186e-06, -1.2051314115524292e-06, -1.1576339602470398e-06, -1.1101365089416504e-06, -1.062639057636261e-06, -1.0151416063308716e-06, -9.676441550254822e-07, -9.201467037200928e-07, -8.726492524147034e-07, -8.25151801109314e-07, -7.776543498039246e-07, -7.301568984985352e-07, -6.826594471931458e-07, -6.351619958877563e-07, -5.876645445823669e-07, -5.401670932769775e-07, -4.926696419715881e-07, -4.4517219066619873e-07, -3.976747393608093e-07, -3.501772880554199e-07, -3.026798367500305e-07, -2.551823854446411e-07, -2.076849341392517e-07, -1.601874828338623e-07, -1.126900315284729e-07, -6.51925802230835e-08, -1.7695128917694092e-08, 2.9802322387695312e-08, 7.729977369308472e-08, 1.2479722499847412e-07, 1.7229467630386353e-07, 2.1979212760925293e-07, 2.6728957891464233e-07, 3.1478703022003174e-07, 3.6228448152542114e-07, 4.0978193283081055e-07, 4.5727938413619995e-07, 5.047768354415894e-07, 5.522742867469788e-07, 5.997717380523682e-07, 6.472691893577576e-07, 6.94766640663147e-07, 7.422640919685364e-07, 7.897615432739258e-07, 8.372589945793152e-07, 8.847564458847046e-07, 9.32253897190094e-07, 9.797513484954834e-07, 1.0272487998008728e-06, 1.0747462511062622e-06, 1.1222437024116516e-06, 1.169741153717041e-06, 1.2172386050224304e-06, 1.2647360563278198e-06, 1.3122335076332092e-06, 1.3597309589385986e-06, 1.407228410243988e-06, 1.4547258615493774e-06, 1.5022233128547668e-06, 1.5497207641601562e-06]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 7.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 43.0, 0.0, 0.0, 0.0, 84.0, 0.0, 0.0, 0.0, 694.0, 0.0, 0.0, 0.0, 95.0, 0.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-07, -4.6193599700927734e-07, -4.470348358154297e-07, -4.3213367462158203e-07, -4.172325134277344e-07, -4.023313522338867e-07, -3.8743019104003906e-07, -3.725290298461914e-07, -3.5762786865234375e-07, -3.427267074584961e-07, -3.2782554626464844e-07, -3.129243850708008e-07, -2.980232238769531e-07, -2.8312206268310547e-07, -2.682209014892578e-07, -2.5331974029541016e-07, -2.384185791015625e-07, -2.2351741790771484e-07, -2.086162567138672e-07, -1.9371509552001953e-07, -1.7881393432617188e-07, -1.6391277313232422e-07, -1.4901161193847656e-07, -1.341104507446289e-07, -1.1920928955078125e-07, -1.043081283569336e-07, -8.940696716308594e-08, -7.450580596923828e-08, -5.960464477539063e-08, -4.470348358154297e-08, -2.9802322387695312e-08, -1.4901161193847656e-08, 0.0, 1.4901161193847656e-08, 2.9802322387695312e-08, 4.470348358154297e-08, 5.960464477539063e-08, 7.450580596923828e-08, 8.940696716308594e-08, 1.043081283569336e-07, 1.1920928955078125e-07, 1.341104507446289e-07, 1.4901161193847656e-07, 1.6391277313232422e-07, 1.7881393432617188e-07, 1.9371509552001953e-07, 2.086162567138672e-07, 2.2351741790771484e-07, 2.384185791015625e-07, 2.5331974029541016e-07, 2.682209014892578e-07, 2.8312206268310547e-07, 2.980232238769531e-07, 3.129243850708008e-07, 3.2782554626464844e-07, 3.427267074584961e-07, 3.5762786865234375e-07, 3.725290298461914e-07, 3.8743019104003906e-07, 4.023313522338867e-07, 4.172325134277344e-07, 4.3213367462158203e-07, 4.470348358154297e-07, 4.6193599700927734e-07, 4.76837158203125e-07]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 3.0, 7.0, 15.0, 6.0, 11.0, 19.0, 20.0, 34.0, 39.0, 54.0, 54.0, 87.0, 77.0, 94.0, 102.0, 88.0, 63.0, 42.0, 42.0, 32.0, 20.0, 11.0, 22.0, 12.0, 5.0, 9.0, 5.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.177887720084982e-06, -3.070116235903697e-06, -2.962344751722412e-06, -2.8545732675411273e-06, -2.7468017833598424e-06, -2.6390302991785575e-06, -2.5312588149972726e-06, -2.4234873308159877e-06, -2.3157158466347028e-06, -2.207944362453418e-06, -2.100172878272133e-06, -1.992401394090848e-06, -1.8846299099095631e-06, -1.7768584257282782e-06, -1.6690869415469933e-06, -1.5613154573657084e-06, -1.4535439731844235e-06, -1.3457724890031386e-06, -1.2380010048218537e-06, -1.1302295206405688e-06, -1.022458036459284e-06, -9.14686552277999e-07, -8.069150680967141e-07, -6.991435839154292e-07, -5.913720997341443e-07, -4.836006155528594e-07, -3.758291313715745e-07, -2.6805764719028957e-07, -1.6028616300900467e-07, -5.251467882771976e-08, 5.525680535356514e-08, 1.6302828953485005e-07, 2.7079977371613495e-07, 3.7857125789741985e-07, 4.863427420787048e-07, 5.941142262599897e-07, 7.018857104412746e-07, 8.096571946225595e-07, 9.174286788038444e-07, 1.0252001629851293e-06, 1.1329716471664142e-06, 1.240743131347699e-06, 1.348514615528984e-06, 1.456286099710269e-06, 1.5640575838915538e-06, 1.6718290680728387e-06, 1.7796005522541236e-06, 1.8873720364354085e-06, 1.9951435206166934e-06, 2.1029150047979783e-06, 2.2106864889792632e-06, 2.318457973160548e-06, 2.426229457341833e-06, 2.534000941523118e-06, 2.641772425704403e-06, 2.7495439098856878e-06, 2.8573153940669727e-06, 2.9650868782482576e-06, 3.0728583624295425e-06, 3.1806298466108274e-06, 3.2884013307921123e-06, 3.396172814973397e-06, 3.503944299154682e-06, 3.611715783335967e-06, 3.719487267517252e-06]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 3.0, 2.0, 10.0, 7.0, 11.0, 9.0, 13.0, 22.0, 24.0, 21.0, 33.0, 26.0, 20.0, 34.0, 33.0, 31.0, 38.0, 49.0, 41.0, 45.0, 24.0, 43.0, 40.0, 32.0, 30.0, 44.0, 24.0, 28.0, 38.0, 28.0, 19.0, 27.0, 21.0, 21.0, 12.0, 17.0, 11.0, 13.0, 8.0, 10.0, 11.0, 4.0, 3.0, 4.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.0494856016739504e-06, -1.983276888495311e-06, -1.9170679479429964e-06, -1.850859234764357e-06, -1.7846505215857178e-06, -1.7184418084070785e-06, -1.6522329815416015e-06, -1.5860241546761245e-06, -1.5198154414974852e-06, -1.4536067283188459e-06, -1.3873979014533688e-06, -1.3211890745878918e-06, -1.2549803614092525e-06, -1.1887716482306132e-06, -1.1225628213651362e-06, -1.0563539944996592e-06, -9.901452813210199e-07, -9.239365112989617e-07, -8.577277412769035e-07, -7.915189712548454e-07, -7.253102012327872e-07, -6.591014312107291e-07, -5.928926611886709e-07, -5.266838911666127e-07, -4.604751211445546e-07, -3.942663511224964e-07, -3.2805758110043826e-07, -2.618488110783801e-07, -1.9564004105632193e-07, -1.2943127103426377e-07, -6.322250101220561e-08, 2.986269009852549e-09, 6.919503903191071e-08, 1.3540380905396887e-07, 2.0161257907602703e-07, 2.678213490980852e-07, 3.3403011912014335e-07, 4.002388891422015e-07, 4.664476591642597e-07, 5.326564291863178e-07, 5.98865199208376e-07, 6.650739692304342e-07, 7.312827392524923e-07, 7.974915092745505e-07, 8.637002792966086e-07, 9.299090493186668e-07, 9.96117819340725e-07, 1.062326646206202e-06, 1.1285353593848413e-06, 1.1947440725634806e-06, 1.2609528994289576e-06, 1.3271617262944346e-06, 1.393370439473074e-06, 1.4595791526517132e-06, 1.5257879795171903e-06, 1.5919968063826673e-06, 1.6582055195613066e-06, 1.7244142327399459e-06, 1.790623059605423e-06, 1.8568318864709e-06, 1.9230405996495392e-06, 1.9892493128281785e-06, 2.055458026006818e-06, 2.1216669665591326e-06, 2.187875679737772e-06]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 9.0, 5.0, 18.0, 20.0, 24.0, 66.0, 32.0, 134.0, 99.0, 325.0, 255.0, 295.0, 1059.0, 821.0, 2584.0, 2001.0, 2645.0, 8549.0, 6858.0, 22502.0, 18699.0, 66718.0, 60876.0, 94642.0, 480601.0, 745955.0, 1905095.0, 317220.0, 255812.0, 61665.0, 41270.0, 47428.0, 13563.0, 16826.0, 4957.0, 3719.0, 4749.0, 1530.0, 2008.0, 666.0, 885.0, 269.0, 207.0, 291.0, 88.0, 95.0, 44.0, 54.0, 11.0, 17.0, 15.0, 4.0, 6.0, 3.0, 3.0], "bins": [-2.9802322387695312e-06, -2.8954818844795227e-06, -2.810731530189514e-06, -2.7259811758995056e-06, -2.641230821609497e-06, -2.5564804673194885e-06, -2.47173011302948e-06, -2.3869797587394714e-06, -2.302229404449463e-06, -2.2174790501594543e-06, -2.132728695869446e-06, -2.0479783415794373e-06, -1.9632279872894287e-06, -1.8784776329994202e-06, -1.7937272787094116e-06, -1.708976924419403e-06, -1.6242265701293945e-06, -1.539476215839386e-06, -1.4547258615493774e-06, -1.369975507259369e-06, -1.2852251529693604e-06, -1.2004747986793518e-06, -1.1157244443893433e-06, -1.0309740900993347e-06, -9.462237358093262e-07, -8.614733815193176e-07, -7.767230272293091e-07, -6.919726729393005e-07, -6.07222318649292e-07, -5.224719643592834e-07, -4.377216100692749e-07, -3.5297125577926636e-07, -2.682209014892578e-07, -1.8347054719924927e-07, -9.872019290924072e-08, -1.3969838619232178e-08, 7.078051567077637e-08, 1.555308699607849e-07, 2.4028122425079346e-07, 3.25031578540802e-07, 4.0978193283081055e-07, 4.945322871208191e-07, 5.792826414108276e-07, 6.640329957008362e-07, 7.487833499908447e-07, 8.335337042808533e-07, 9.182840585708618e-07, 1.0030344128608704e-06, 1.087784767150879e-06, 1.1725351214408875e-06, 1.257285475730896e-06, 1.3420358300209045e-06, 1.426786184310913e-06, 1.5115365386009216e-06, 1.5962868928909302e-06, 1.6810372471809387e-06, 1.7657876014709473e-06, 1.8505379557609558e-06, 1.9352883100509644e-06, 2.020038664340973e-06, 2.1047890186309814e-06, 2.18953937292099e-06, 2.2742897272109985e-06, 2.359040081501007e-06, 2.4437904357910156e-06]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 0.0, 5.0, 0.0, 6.0, 17.0, 0.0, 18.0, 0.0, 17.0, 24.0, 0.0, 31.0, 0.0, 22.0, 41.0, 0.0, 54.0, 0.0, 46.0, 63.0, 0.0, 71.0, 0.0, 78.0, 0.0, 60.0, 54.0, 0.0, 41.0, 0.0, 51.0, 52.0, 0.0, 46.0, 0.0, 43.0, 35.0, 0.0, 17.0, 0.0, 35.0, 21.0, 0.0, 12.0, 0.0, 9.0, 16.0, 0.0, 7.0, 0.0, 6.0, 5.0, 0.0, 4.0, 0.0, 0.0, 3.0], "bins": [-1.1324882507324219e-06, -1.0970979928970337e-06, -1.0617077350616455e-06, -1.0263174772262573e-06, -9.909272193908691e-07, -9.55536961555481e-07, -9.201467037200928e-07, -8.847564458847046e-07, -8.493661880493164e-07, -8.139759302139282e-07, -7.7858567237854e-07, -7.431954145431519e-07, -7.078051567077637e-07, -6.724148988723755e-07, -6.370246410369873e-07, -6.016343832015991e-07, -5.662441253662109e-07, -5.308538675308228e-07, -4.954636096954346e-07, -4.600733518600464e-07, -4.246830940246582e-07, -3.8929283618927e-07, -3.5390257835388184e-07, -3.1851232051849365e-07, -2.8312206268310547e-07, -2.477318048477173e-07, -2.123415470123291e-07, -1.7695128917694092e-07, -1.4156103134155273e-07, -1.0617077350616455e-07, -7.078051567077637e-08, -3.5390257835388184e-08, 0.0, 3.5390257835388184e-08, 7.078051567077637e-08, 1.0617077350616455e-07, 1.4156103134155273e-07, 1.7695128917694092e-07, 2.123415470123291e-07, 2.477318048477173e-07, 2.8312206268310547e-07, 3.1851232051849365e-07, 3.5390257835388184e-07, 3.8929283618927e-07, 4.246830940246582e-07, 4.600733518600464e-07, 4.954636096954346e-07, 5.308538675308228e-07, 5.662441253662109e-07, 6.016343832015991e-07, 6.370246410369873e-07, 6.724148988723755e-07, 7.078051567077637e-07, 7.431954145431519e-07, 7.7858567237854e-07, 8.139759302139282e-07, 8.493661880493164e-07, 8.847564458847046e-07, 9.201467037200928e-07, 9.55536961555481e-07, 9.909272193908691e-07, 1.0263174772262573e-06, 1.0617077350616455e-06, 1.0970979928970337e-06, 1.1324882507324219e-06]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 6.0, 17.0, 8.0, 23.0, 26.0, 46.0, 69.0, 194.0, 177.0, 223.0, 323.0, 460.0, 639.0, 905.0, 3124.0, 2591.0, 3903.0, 5386.0, 8354.0, 12324.0, 47398.0, 44720.0, 71611.0, 118009.0, 199458.0, 358045.0, 640072.0, 1797289.0, 358428.0, 200084.0, 118338.0, 71643.0, 44796.0, 46836.0, 12324.0, 8255.0, 5528.0, 3791.0, 2665.0, 3118.0, 866.0, 664.0, 452.0, 340.0, 231.0, 150.0, 195.0, 60.0, 35.0, 27.0, 26.0, 11.0, 15.0, 8.0, 5.0, 0.0, 2.0, 0.0, 3.0], "bins": [-2.205371856689453e-06, -2.1364539861679077e-06, -2.0675361156463623e-06, -1.998618245124817e-06, -1.9297003746032715e-06, -1.860782504081726e-06, -1.7918646335601807e-06, -1.7229467630386353e-06, -1.6540288925170898e-06, -1.5851110219955444e-06, -1.516193151473999e-06, -1.4472752809524536e-06, -1.3783574104309082e-06, -1.3094395399093628e-06, -1.2405216693878174e-06, -1.171603798866272e-06, -1.1026859283447266e-06, -1.0337680578231812e-06, -9.648501873016357e-07, -8.959323167800903e-07, -8.270144462585449e-07, -7.580965757369995e-07, -6.891787052154541e-07, -6.202608346939087e-07, -5.513429641723633e-07, -4.824250936508179e-07, -4.1350722312927246e-07, -3.4458935260772705e-07, -2.7567148208618164e-07, -2.0675361156463623e-07, -1.3783574104309082e-07, -6.891787052154541e-08, 0.0, 6.891787052154541e-08, 1.3783574104309082e-07, 2.0675361156463623e-07, 2.7567148208618164e-07, 3.4458935260772705e-07, 4.1350722312927246e-07, 4.824250936508179e-07, 5.513429641723633e-07, 6.202608346939087e-07, 6.891787052154541e-07, 7.580965757369995e-07, 8.270144462585449e-07, 8.959323167800903e-07, 9.648501873016357e-07, 1.0337680578231812e-06, 1.1026859283447266e-06, 1.171603798866272e-06, 1.2405216693878174e-06, 1.3094395399093628e-06, 1.3783574104309082e-06, 1.4472752809524536e-06, 1.516193151473999e-06, 1.5851110219955444e-06, 1.6540288925170898e-06, 1.7229467630386353e-06, 1.7918646335601807e-06, 1.860782504081726e-06, 1.9297003746032715e-06, 1.998618245124817e-06, 2.0675361156463623e-06, 2.1364539861679077e-06, 2.205371856689453e-06]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 0.0, 12.0, 0.0, 0.0, 18.0, 0.0, 25.0, 0.0, 62.0, 0.0, 0.0, 82.0, 0.0, 166.0, 0.0, 0.0, 291.0, 0.0, 419.0, 0.0, 563.0, 0.0, 0.0, 774.0, 0.0, 589.0, 0.0, 426.0, 0.0, 0.0, 279.0, 0.0, 158.0, 0.0, 0.0, 97.0, 0.0, 53.0, 0.0, 31.0, 0.0, 0.0, 17.0, 0.0, 13.0, 0.0, 4.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.093193173408508e-07, -7.841736078262329e-07, -7.59027898311615e-07, -7.338821887969971e-07, -7.087364792823792e-07, -6.835907697677612e-07, -6.584450602531433e-07, -6.332993507385254e-07, -6.081536412239075e-07, -5.830079317092896e-07, -5.578622221946716e-07, -5.327165126800537e-07, -5.075708031654358e-07, -4.824250936508179e-07, -4.5727938413619995e-07, -4.3213367462158203e-07, -4.069879651069641e-07, -3.818422555923462e-07, -3.5669654607772827e-07, -3.3155083656311035e-07, -3.0640512704849243e-07, -2.812594175338745e-07, -2.561137080192566e-07, -2.3096799850463867e-07, -2.0582228899002075e-07, -1.8067657947540283e-07, -1.555308699607849e-07, -1.30385160446167e-07, -1.0523945093154907e-07, -8.009374141693115e-08, -5.494803190231323e-08, -2.9802322387695312e-08, -4.6566128730773926e-09, 2.0489096641540527e-08, 4.563480615615845e-08, 7.078051567077637e-08, 9.592622518539429e-08, 1.210719347000122e-07, 1.4621764421463013e-07, 1.7136335372924805e-07, 1.9650906324386597e-07, 2.2165477275848389e-07, 2.468004822731018e-07, 2.7194619178771973e-07, 2.9709190130233765e-07, 3.2223761081695557e-07, 3.473833203315735e-07, 3.725290298461914e-07, 3.976747393608093e-07, 4.2282044887542725e-07, 4.4796615839004517e-07, 4.731118679046631e-07, 4.98257577419281e-07, 5.234032869338989e-07, 5.485489964485168e-07, 5.736947059631348e-07, 5.988404154777527e-07, 6.239861249923706e-07, 6.491318345069885e-07, 6.742775440216064e-07, 6.994232535362244e-07, 7.245689630508423e-07, 7.497146725654602e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 5.0, 8.0, 5.0, 12.0, 10.0, 21.0, 30.0, 34.0, 44.0, 54.0, 87.0, 74.0, 94.0, 74.0, 84.0, 62.0, 62.0, 56.0, 28.0, 32.0, 27.0, 12.0, 14.0, 9.0, 8.0, 8.0, 3.0, 9.0, 5.0, 1.0, 0.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0859433789155446e-06, -2.0166885406069923e-06, -1.94743370229844e-06, -1.8781786366162123e-06, -1.80892379830766e-06, -1.7396689599991078e-06, -1.6704140080037178e-06, -1.6011590560083278e-06, -1.5319042176997755e-06, -1.4626493793912232e-06, -1.3933944273958332e-06, -1.3241394754004432e-06, -1.254884637091891e-06, -1.1856297987833386e-06, -1.1163748467879486e-06, -1.0471198947925586e-06, -9.778650564840063e-07, -9.086101613320352e-07, -8.393552661800641e-07, -7.701003710280929e-07, -7.008454758761218e-07, -6.315905807241506e-07, -5.623356855721795e-07, -4.930807904202084e-07, -4.238258952682372e-07, -3.545710001162661e-07, -2.8531610496429494e-07, -2.160612098123238e-07, -1.4680631466035265e-07, -7.755141950838151e-08, -8.296524356410373e-09, 6.095837079556077e-08, 1.3021349332120735e-07, 1.994683884731785e-07, 2.6872328362514963e-07, 3.379781787771208e-07, 4.072330739290919e-07, 4.7648796908106306e-07, 5.457428642330342e-07, 6.149977593850053e-07, 6.842526545369765e-07, 7.535075496889476e-07, 8.227624448409188e-07, 8.920173399928899e-07, 9.61272235144861e-07, 1.0305270734534133e-06, 1.0997820254488033e-06, 1.1690369774441933e-06, 1.2382918157527456e-06, 1.3075466540612979e-06, 1.3768016060566879e-06, 1.4460565580520779e-06, 1.5153113963606302e-06, 1.5845662346691824e-06, 1.6538211866645725e-06, 1.7230761386599625e-06, 1.7923309769685147e-06, 1.861585815277067e-06, 1.9308408809592947e-06, 2.000095719267847e-06, 2.0693505575763993e-06, 2.1386053958849516e-06, 2.207860234193504e-06, 2.2771152998757316e-06, 2.346370138184284e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 9.0, 11.0, 9.0, 13.0, 13.0, 11.0, 22.0, 19.0, 13.0, 28.0, 24.0, 37.0, 28.0, 26.0, 29.0, 51.0, 37.0, 45.0, 40.0, 39.0, 41.0, 46.0, 40.0, 36.0, 32.0, 29.0, 27.0, 27.0, 26.0, 24.0, 23.0, 25.0, 34.0, 15.0, 9.0, 11.0, 13.0, 8.0, 7.0, 2.0, 2.0, 3.0, 4.0, 5.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.291862758989737e-06, -1.2454805755623966e-06, -1.1990983921350562e-06, -1.1527162087077159e-06, -1.1063340252803755e-06, -1.0599518418530351e-06, -1.0135696584256948e-06, -9.671874749983544e-07, -9.208052915710141e-07, -8.744231081436737e-07, -8.280409247163334e-07, -7.81658741288993e-07, -7.352765578616527e-07, -6.888943744343123e-07, -6.42512191006972e-07, -5.961300075796316e-07, -5.497478241522913e-07, -5.033656407249509e-07, -4.569834572976106e-07, -4.1060127387027023e-07, -3.642190904429299e-07, -3.1783690701558953e-07, -2.714547235882492e-07, -2.2507254016090883e-07, -1.7869035673356848e-07, -1.3230817330622813e-07, -8.592598987888778e-08, -3.9543806451547425e-08, 6.838376975792926e-09, 5.322056040313328e-08, 9.960274383047363e-08, 1.4598492725781398e-07, 1.923669969983166e-07, 2.3874918042565696e-07, 2.851313638529973e-07, 3.3151354728033766e-07, 3.77895730707678e-07, 4.2427791413501836e-07, 4.706600975623587e-07, 5.170422809896991e-07, 5.634244644170394e-07, 6.098066478443798e-07, 6.561888312717201e-07, 7.025710146990605e-07, 7.489531981264008e-07, 7.953353815537412e-07, 8.417175649810815e-07, 8.880997484084219e-07, 9.344819318357622e-07, 9.808641152631026e-07, 1.027246298690443e-06, 1.0736284821177833e-06, 1.1200106655451236e-06, 1.166392848972464e-06, 1.2127750323998043e-06, 1.2591572158271447e-06, 1.305539399254485e-06, 1.3519215826818254e-06, 1.3983037661091657e-06, 1.444685949536506e-06, 1.4910681329638464e-06, 1.5374503163911868e-06, 1.5838324998185271e-06, 1.6302146832458675e-06, 1.6765968666732078e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 4.0, 12.0, 15.0, 29.0, 22.0, 52.0, 73.0, 133.0, 233.0, 163.0, 463.0, 811.0, 1631.0, 1236.0, 4251.0, 8694.0, 18336.0, 15988.0, 60514.0, 150899.0, 365545.0, 156320.0, 150557.0, 60190.0, 26817.0, 12680.0, 3565.0, 4327.0, 2238.0, 1212.0, 337.0, 492.0, 275.0, 162.0, 63.0, 76.0, 60.0, 22.0, 12.0, 17.0, 14.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.039836883544922e-06, -2.934597432613373e-06, -2.8293579816818237e-06, -2.7241185307502747e-06, -2.6188790798187256e-06, -2.5136396288871765e-06, -2.4084001779556274e-06, -2.3031607270240784e-06, -2.1979212760925293e-06, -2.0926818251609802e-06, -1.987442374229431e-06, -1.882202923297882e-06, -1.776963472366333e-06, -1.671724021434784e-06, -1.5664845705032349e-06, -1.4612451195716858e-06, -1.3560056686401367e-06, -1.2507662177085876e-06, -1.1455267667770386e-06, -1.0402873158454895e-06, -9.350478649139404e-07, -8.298084139823914e-07, -7.245689630508423e-07, -6.193295121192932e-07, -5.140900611877441e-07, -4.0885061025619507e-07, -3.03611159324646e-07, -1.9837170839309692e-07, -9.313225746154785e-08, 1.210719347000122e-08, 1.1734664440155029e-07, 2.2258609533309937e-07, 3.2782554626464844e-07, 4.330649971961975e-07, 5.383044481277466e-07, 6.435438990592957e-07, 7.487833499908447e-07, 8.540228009223938e-07, 9.592622518539429e-07, 1.064501702785492e-06, 1.169741153717041e-06, 1.27498060464859e-06, 1.3802200555801392e-06, 1.4854595065116882e-06, 1.5906989574432373e-06, 1.6959384083747864e-06, 1.8011778593063354e-06, 1.9064173102378845e-06, 2.0116567611694336e-06, 2.1168962121009827e-06, 2.2221356630325317e-06, 2.327375113964081e-06, 2.43261456489563e-06, 2.537854015827179e-06, 2.643093466758728e-06, 2.748332917690277e-06, 2.853572368621826e-06, 2.9588118195533752e-06, 3.0640512704849243e-06, 3.1692907214164734e-06, 3.2745301723480225e-06, 3.3797696232795715e-06, 3.4850090742111206e-06, 3.5902485251426697e-06, 3.6954879760742188e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 3.0, 0.0, 7.0, 10.0, 9.0, 17.0, 0.0, 22.0, 29.0, 25.0, 20.0, 24.0, 0.0, 35.0, 50.0, 36.0, 60.0, 0.0, 53.0, 53.0, 61.0, 63.0, 0.0, 66.0, 40.0, 43.0, 47.0, 44.0, 0.0, 36.0, 39.0, 21.0, 16.0, 0.0, 25.0, 12.0, 16.0, 3.0, 0.0, 4.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.430511474609375e-06, -1.3820827007293701e-06, -1.3336539268493652e-06, -1.2852251529693604e-06, -1.2367963790893555e-06, -1.1883676052093506e-06, -1.1399388313293457e-06, -1.0915100574493408e-06, -1.043081283569336e-06, -9.94652509689331e-07, -9.462237358093262e-07, -8.977949619293213e-07, -8.493661880493164e-07, -8.009374141693115e-07, -7.525086402893066e-07, -7.040798664093018e-07, -6.556510925292969e-07, -6.07222318649292e-07, -5.587935447692871e-07, -5.103647708892822e-07, -4.6193599700927734e-07, -4.1350722312927246e-07, -3.650784492492676e-07, -3.166496753692627e-07, -2.682209014892578e-07, -2.1979212760925293e-07, -1.7136335372924805e-07, -1.2293457984924316e-07, -7.450580596923828e-08, -2.60770320892334e-08, 2.2351741790771484e-08, 7.078051567077637e-08, 1.1920928955078125e-07, 1.6763806343078613e-07, 2.1606683731079102e-07, 2.644956111907959e-07, 3.129243850708008e-07, 3.6135315895080566e-07, 4.0978193283081055e-07, 4.5821070671081543e-07, 5.066394805908203e-07, 5.550682544708252e-07, 6.034970283508301e-07, 6.51925802230835e-07, 7.003545761108398e-07, 7.487833499908447e-07, 7.972121238708496e-07, 8.456408977508545e-07, 8.940696716308594e-07, 9.424984455108643e-07, 9.909272193908691e-07, 1.039355993270874e-06, 1.087784767150879e-06, 1.1362135410308838e-06, 1.1846423149108887e-06, 1.2330710887908936e-06, 1.2814998626708984e-06, 1.3299286365509033e-06, 1.3783574104309082e-06, 1.426786184310913e-06, 1.475214958190918e-06, 1.5236437320709229e-06, 1.5720725059509277e-06, 1.6205012798309326e-06, 1.6689300537109375e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 15.0, 1.0, 9.0, 11.0, 12.0, 28.0, 45.0, 45.0, 69.0, 131.0, 194.0, 341.0, 467.0, 725.0, 1526.0, 2884.0, 15110.0, 58617.0, 931916.0, 22699.0, 7314.0, 2860.0, 1850.0, 582.0, 395.0, 270.0, 154.0, 81.0, 81.0, 36.0, 27.0, 15.0, 11.0, 11.0, 9.0, 7.0, 5.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.410743713378906e-06, -4.28222119808197e-06, -4.153698682785034e-06, -4.025176167488098e-06, -3.896653652191162e-06, -3.768131136894226e-06, -3.63960862159729e-06, -3.511086106300354e-06, -3.382563591003418e-06, -3.254041075706482e-06, -3.125518560409546e-06, -2.99699604511261e-06, -2.868473529815674e-06, -2.739951014518738e-06, -2.6114284992218018e-06, -2.4829059839248657e-06, -2.3543834686279297e-06, -2.2258609533309937e-06, -2.0973384380340576e-06, -1.9688159227371216e-06, -1.8402934074401855e-06, -1.7117708921432495e-06, -1.5832483768463135e-06, -1.4547258615493774e-06, -1.3262033462524414e-06, -1.1976808309555054e-06, -1.0691583156585693e-06, -9.406358003616333e-07, -8.121132850646973e-07, -6.835907697677612e-07, -5.550682544708252e-07, -4.2654573917388916e-07, -2.980232238769531e-07, -1.695007085800171e-07, -4.0978193283081055e-08, 8.754432201385498e-08, 2.1606683731079102e-07, 3.4458935260772705e-07, 4.731118679046631e-07, 6.016343832015991e-07, 7.301568984985352e-07, 8.586794137954712e-07, 9.872019290924072e-07, 1.1157244443893433e-06, 1.2442469596862793e-06, 1.3727694749832153e-06, 1.5012919902801514e-06, 1.6298145055770874e-06, 1.7583370208740234e-06, 1.8868595361709595e-06, 2.0153820514678955e-06, 2.1439045667648315e-06, 2.2724270820617676e-06, 2.4009495973587036e-06, 2.5294721126556396e-06, 2.6579946279525757e-06, 2.7865171432495117e-06, 2.9150396585464478e-06, 3.043562173843384e-06, 3.17208468914032e-06, 3.300607204437256e-06, 3.429129719734192e-06, 3.557652235031128e-06, 3.686174750328064e-06, 3.814697265625e-06]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 0.0, 21.0, 0.0, 0.0, 0.0, 0.0, 108.0, 0.0, 0.0, 0.0, 0.0, 694.0, 0.0, 0.0, 0.0, 0.0, 128.0, 0.0, 0.0, 0.0, 0.0, 36.0, 0.0, 0.0, 0.0, 0.0, 16.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5762786865234375e-07, -3.4552067518234253e-07, -3.334134817123413e-07, -3.213062882423401e-07, -3.0919909477233887e-07, -2.9709190130233765e-07, -2.849847078323364e-07, -2.728775143623352e-07, -2.60770320892334e-07, -2.4866312742233276e-07, -2.3655593395233154e-07, -2.2444874048233032e-07, -2.123415470123291e-07, -2.0023435354232788e-07, -1.8812716007232666e-07, -1.7601996660232544e-07, -1.6391277313232422e-07, -1.51805579662323e-07, -1.3969838619232178e-07, -1.2759119272232056e-07, -1.1548399925231934e-07, -1.0337680578231812e-07, -9.12696123123169e-08, -7.916241884231567e-08, -6.705522537231445e-08, -5.494803190231323e-08, -4.284083843231201e-08, -3.073364496231079e-08, -1.862645149230957e-08, -6.51925802230835e-09, 5.587935447692871e-09, 1.7695128917694092e-08, 2.9802322387695312e-08, 4.190951585769653e-08, 5.4016709327697754e-08, 6.612390279769897e-08, 7.82310962677002e-08, 9.033828973770142e-08, 1.0244548320770264e-07, 1.1455267667770386e-07, 1.2665987014770508e-07, 1.387670636177063e-07, 1.5087425708770752e-07, 1.6298145055770874e-07, 1.7508864402770996e-07, 1.8719583749771118e-07, 1.993030309677124e-07, 2.1141022443771362e-07, 2.2351741790771484e-07, 2.3562461137771606e-07, 2.477318048477173e-07, 2.598389983177185e-07, 2.7194619178771973e-07, 2.8405338525772095e-07, 2.9616057872772217e-07, 3.082677721977234e-07, 3.203749656677246e-07, 3.3248215913772583e-07, 3.4458935260772705e-07, 3.5669654607772827e-07, 3.688037395477295e-07, 3.809109330177307e-07, 3.9301812648773193e-07, 4.0512531995773315e-07, 4.172325134277344e-07]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 4.0, 5.0, 3.0, 2.0, 3.0, 5.0, 7.0, 11.0, 9.0, 12.0, 19.0, 14.0, 23.0, 25.0, 40.0, 42.0, 57.0, 79.0, 89.0, 74.0, 72.0, 77.0, 62.0, 58.0, 40.0, 33.0, 35.0, 22.0, 13.0, 15.0, 10.0, 10.0, 4.0, 5.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6453153648399166e-06, -1.5859395716688596e-06, -1.5265636648109648e-06, -1.46718775795307e-06, -1.407811964782013e-06, -1.348436171610956e-06, -1.2890602647530613e-06, -1.2296843578951666e-06, -1.1703085647241096e-06, -1.1109327715530526e-06, -1.0515568646951579e-06, -9.921809578372631e-07, -9.328051646662061e-07, -8.734293146517302e-07, -8.140534646372544e-07, -7.546776146227785e-07, -6.953017646083026e-07, -6.359259145938267e-07, -5.765500645793509e-07, -5.17174214564875e-07, -4.5779836455039913e-07, -3.9842251453592326e-07, -3.390466645214474e-07, -2.796708145069715e-07, -2.2029496449249564e-07, -1.6091911447801976e-07, -1.0154326446354389e-07, -4.216741444906802e-08, 1.7208435565407854e-08, 7.658428557988373e-08, 1.359601355943596e-07, 1.9533598560883547e-07, 2.5471194931014907e-07, 3.1408779932462494e-07, 3.734636493391008e-07, 4.328394993535767e-07, 4.922153493680526e-07, 5.515911993825284e-07, 6.109670493970043e-07, 6.703428994114802e-07, 7.29718749425956e-07, 7.890945994404319e-07, 8.484704494549078e-07, 9.078462994693837e-07, 9.672221494838595e-07, 1.0265980563417543e-06, 1.0859738495128113e-06, 1.1453496426838683e-06, 1.204725549541763e-06, 1.2641014563996578e-06, 1.3234772495707148e-06, 1.3828530427417718e-06, 1.4422289495996665e-06, 1.5016048564575613e-06, 1.5609806496286183e-06, 1.6203564427996753e-06, 1.67973234965757e-06, 1.7391082565154647e-06, 1.7984840496865218e-06, 1.8578598428575788e-06, 1.9172357497154735e-06, 1.9766116565733682e-06, 2.035987563431263e-06, 2.0953632429154823e-06, 2.154739149773377e-06]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 7.0, 8.0, 11.0, 14.0, 8.0, 17.0, 20.0, 17.0, 12.0, 20.0, 27.0, 39.0, 29.0, 25.0, 30.0, 46.0, 40.0, 42.0, 40.0, 37.0, 53.0, 38.0, 36.0, 42.0, 33.0, 31.0, 27.0, 25.0, 32.0, 21.0, 26.0, 22.0, 29.0, 21.0, 10.0, 10.0, 11.0, 13.0, 8.0, 2.0, 2.0, 2.0, 4.0, 6.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.229081817655242e-06, -1.185095925393398e-06, -1.1411100331315538e-06, -1.0971241408697097e-06, -1.0531381349210278e-06, -1.0091522426591837e-06, -9.651663503973396e-07, -9.211804581354954e-07, -8.771945658736513e-07, -8.332086736118072e-07, -7.892227245065442e-07, -7.452368322447001e-07, -7.012509399828559e-07, -6.572649908775929e-07, -6.132790986157488e-07, -5.692932063539047e-07, -5.253072572486417e-07, -4.813213649867976e-07, -4.37335444303244e-07, -3.9334952361969044e-07, -3.493636313578463e-07, -3.0537771067429276e-07, -2.613917899907392e-07, -2.1740589772889507e-07, -1.734199770453415e-07, -1.2943407057264267e-07, -8.544815699451647e-08, -4.1462243416390265e-08, 2.5236630563085782e-09, 4.650956952900742e-08, 9.049549021256098e-08, 1.344813824744051e-07, 1.7846730315795867e-07, 2.224532096306575e-07, 2.6643911610335635e-07, 3.104250367869099e-07, 3.5441092904875404e-07, 3.983968497323076e-07, 4.4238277041586116e-07, 4.863686626777053e-07, 5.303545549395494e-07, 5.743404472013935e-07, 6.183263963066565e-07, 6.623122885685007e-07, 7.062981808303448e-07, 7.502841299356078e-07, 7.942700221974519e-07, 8.38255914459296e-07, 8.82241863564559e-07, 9.262277558264032e-07, 9.702137049316661e-07, 1.0141995971935103e-06, 1.0581854894553544e-06, 1.1021713817171985e-06, 1.1461572739790427e-06, 1.1901431662408868e-06, 1.2341291721895686e-06, 1.2781150644514128e-06, 1.3221009567132569e-06, 1.3660869626619387e-06, 1.4100728549237829e-06, 1.454058747185627e-06, 1.4980446394474711e-06, 1.5420305317093153e-06, 1.5860164239711594e-06]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 13.0, 9.0, 16.0, 36.0, 36.0, 27.0, 48.0, 133.0, 99.0, 154.0, 497.0, 444.0, 606.0, 797.0, 2857.0, 2364.0, 3552.0, 13051.0, 11841.0, 17594.0, 27322.0, 107119.0, 100984.0, 148014.0, 174078.0, 247615.0, 65597.0, 42047.0, 45224.0, 11846.0, 7717.0, 5059.0, 6073.0, 1601.0, 1170.0, 1334.0, 436.0, 292.0, 216.0, 296.0, 98.0, 61.0, 87.0, 25.0, 19.0, 13.0, 19.0, 3.0, 4.0, 11.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.384185791015625e-06, -2.3078173398971558e-06, -2.2314488887786865e-06, -2.1550804376602173e-06, -2.078711986541748e-06, -2.002343535423279e-06, -1.9259750843048096e-06, -1.8496066331863403e-06, -1.773238182067871e-06, -1.6968697309494019e-06, -1.6205012798309326e-06, -1.5441328287124634e-06, -1.4677643775939941e-06, -1.391395926475525e-06, -1.3150274753570557e-06, -1.2386590242385864e-06, -1.1622905731201172e-06, -1.085922122001648e-06, -1.0095536708831787e-06, -9.331852197647095e-07, -8.568167686462402e-07, -7.80448317527771e-07, -7.040798664093018e-07, -6.277114152908325e-07, -5.513429641723633e-07, -4.7497451305389404e-07, -3.986060619354248e-07, -3.2223761081695557e-07, -2.4586915969848633e-07, -1.695007085800171e-07, -9.313225746154785e-08, -1.6763806343078613e-08, 5.960464477539063e-08, 1.3597309589385986e-07, 2.123415470123291e-07, 2.8870999813079834e-07, 3.650784492492676e-07, 4.414469003677368e-07, 5.178153514862061e-07, 5.941838026046753e-07, 6.705522537231445e-07, 7.469207048416138e-07, 8.23289155960083e-07, 8.996576070785522e-07, 9.760260581970215e-07, 1.0523945093154907e-06, 1.12876296043396e-06, 1.2051314115524292e-06, 1.2814998626708984e-06, 1.3578683137893677e-06, 1.434236764907837e-06, 1.5106052160263062e-06, 1.5869736671447754e-06, 1.6633421182632446e-06, 1.7397105693817139e-06, 1.816079020500183e-06, 1.8924474716186523e-06, 1.9688159227371216e-06, 2.045184373855591e-06, 2.12155282497406e-06, 2.1979212760925293e-06, 2.2742897272109985e-06, 2.3506581783294678e-06, 2.427026629447937e-06, 2.5033950805664062e-06]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 6.0, 0.0, 0.0, 0.0, 4.0, 21.0, 0.0, 10.0, 0.0, 19.0, 30.0, 0.0, 31.0, 0.0, 34.0, 53.0, 0.0, 47.0, 63.0, 0.0, 61.0, 0.0, 84.0, 81.0, 0.0, 65.0, 0.0, 58.0, 56.0, 0.0, 63.0, 0.0, 60.0, 46.0, 0.0, 39.0, 0.0, 28.0, 18.0, 0.0, 11.0, 10.0, 0.0, 7.0, 0.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0132789611816406e-06, -9.76957380771637e-07, -9.406358003616333e-07, -9.043142199516296e-07, -8.67992639541626e-07, -8.316710591316223e-07, -7.953494787216187e-07, -7.59027898311615e-07, -7.227063179016113e-07, -6.863847374916077e-07, -6.50063157081604e-07, -6.137415766716003e-07, -5.774199962615967e-07, -5.41098415851593e-07, -5.047768354415894e-07, -4.684552550315857e-07, -4.3213367462158203e-07, -3.9581209421157837e-07, -3.594905138015747e-07, -3.2316893339157104e-07, -2.868473529815674e-07, -2.505257725715637e-07, -2.1420419216156006e-07, -1.778826117515564e-07, -1.4156103134155273e-07, -1.0523945093154907e-07, -6.891787052154541e-08, -3.259629011154175e-08, 3.725290298461914e-09, 4.0046870708465576e-08, 7.636845111846924e-08, 1.126900315284729e-07, 1.4901161193847656e-07, 1.8533319234848022e-07, 2.2165477275848389e-07, 2.5797635316848755e-07, 2.942979335784912e-07, 3.3061951398849487e-07, 3.6694109439849854e-07, 4.032626748085022e-07, 4.3958425521850586e-07, 4.759058356285095e-07, 5.122274160385132e-07, 5.485489964485168e-07, 5.848705768585205e-07, 6.211921572685242e-07, 6.575137376785278e-07, 6.938353180885315e-07, 7.301568984985352e-07, 7.664784789085388e-07, 8.028000593185425e-07, 8.391216397285461e-07, 8.754432201385498e-07, 9.117648005485535e-07, 9.480863809585571e-07, 9.844079613685608e-07, 1.0207295417785645e-06, 1.0570511221885681e-06, 1.0933727025985718e-06, 1.1296942830085754e-06, 1.166015863418579e-06, 1.2023374438285828e-06, 1.2386590242385864e-06, 1.27498060464859e-06, 1.3113021850585938e-06]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 26.0, 21.0, 31.0, 50.0, 51.0, 97.0, 116.0, 200.0, 258.0, 1003.0, 858.0, 1253.0, 1869.0, 2652.0, 3841.0, 5801.0, 8516.0, 12660.0, 47203.0, 42959.0, 65183.0, 99547.0, 144072.0, 171660.0, 143936.0, 99740.0, 65706.0, 71038.0, 18849.0, 12770.0, 8574.0, 5674.0, 4001.0, 2640.0, 1793.0, 1204.0, 1411.0, 425.0, 263.0, 206.0, 138.0, 78.0, 50.0, 44.0, 34.0, 35.0, 13.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1457672119140625e-06, -2.0796433091163635e-06, -2.0135194063186646e-06, -1.9473955035209656e-06, -1.8812716007232666e-06, -1.8151476979255676e-06, -1.7490237951278687e-06, -1.6828998923301697e-06, -1.6167759895324707e-06, -1.5506520867347717e-06, -1.4845281839370728e-06, -1.4184042811393738e-06, -1.3522803783416748e-06, -1.2861564755439758e-06, -1.2200325727462769e-06, -1.1539086699485779e-06, -1.087784767150879e-06, -1.02166086435318e-06, -9.55536961555481e-07, -8.89413058757782e-07, -8.23289155960083e-07, -7.57165253162384e-07, -6.910413503646851e-07, -6.249174475669861e-07, -5.587935447692871e-07, -4.926696419715881e-07, -4.2654573917388916e-07, -3.604218363761902e-07, -2.942979335784912e-07, -2.2817403078079224e-07, -1.6205012798309326e-07, -9.592622518539429e-08, -2.9802322387695312e-08, 3.632158041000366e-08, 1.0244548320770264e-07, 1.685693860054016e-07, 2.3469328880310059e-07, 3.0081719160079956e-07, 3.6694109439849854e-07, 4.330649971961975e-07, 4.991888999938965e-07, 5.653128027915955e-07, 6.314367055892944e-07, 6.975606083869934e-07, 7.636845111846924e-07, 8.298084139823914e-07, 8.959323167800903e-07, 9.620562195777893e-07, 1.0281801223754883e-06, 1.0943040251731873e-06, 1.1604279279708862e-06, 1.2265518307685852e-06, 1.2926757335662842e-06, 1.3587996363639832e-06, 1.4249235391616821e-06, 1.491047441959381e-06, 1.55717134475708e-06, 1.623295247554779e-06, 1.689419150352478e-06, 1.755543053150177e-06, 1.821666955947876e-06, 1.887790858745575e-06, 1.953914761543274e-06, 2.020038664340973e-06, 2.086162567138672e-06]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 15.0, 0.0, 0.0, 13.0, 0.0, 33.0, 0.0, 34.0, 0.0, 67.0, 0.0, 0.0, 83.0, 0.0, 82.0, 0.0, 112.0, 0.0, 0.0, 119.0, 0.0, 108.0, 0.0, 76.0, 0.0, 85.0, 0.0, 0.0, 66.0, 0.0, 41.0, 0.0, 30.0, 0.0, 0.0, 11.0, 0.0, 15.0, 0.0, 13.0, 0.0, 8.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.083879947662354e-07, -7.82310962677002e-07, -7.562339305877686e-07, -7.301568984985352e-07, -7.040798664093018e-07, -6.780028343200684e-07, -6.51925802230835e-07, -6.258487701416016e-07, -5.997717380523682e-07, -5.736947059631348e-07, -5.476176738739014e-07, -5.21540641784668e-07, -4.954636096954346e-07, -4.6938657760620117e-07, -4.4330954551696777e-07, -4.172325134277344e-07, -3.91155481338501e-07, -3.650784492492676e-07, -3.390014171600342e-07, -3.129243850708008e-07, -2.868473529815674e-07, -2.60770320892334e-07, -2.3469328880310059e-07, -2.086162567138672e-07, -1.825392246246338e-07, -1.564621925354004e-07, -1.30385160446167e-07, -1.043081283569336e-07, -7.82310962677002e-08, -5.21540641784668e-08, -2.60770320892334e-08, 0.0, 2.60770320892334e-08, 5.21540641784668e-08, 7.82310962677002e-08, 1.043081283569336e-07, 1.30385160446167e-07, 1.564621925354004e-07, 1.825392246246338e-07, 2.086162567138672e-07, 2.3469328880310059e-07, 2.60770320892334e-07, 2.868473529815674e-07, 3.129243850708008e-07, 3.390014171600342e-07, 3.650784492492676e-07, 3.91155481338501e-07, 4.172325134277344e-07, 4.4330954551696777e-07, 4.6938657760620117e-07, 4.954636096954346e-07, 5.21540641784668e-07, 5.476176738739014e-07, 5.736947059631348e-07, 5.997717380523682e-07, 6.258487701416016e-07, 6.51925802230835e-07, 6.780028343200684e-07, 7.040798664093018e-07, 7.301568984985352e-07, 7.562339305877686e-07, 7.82310962677002e-07, 8.083879947662354e-07, 8.344650268554688e-07]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 15.0, 0.0, 0.0, 30.0, 0.0, 0.0, 0.0, 74.0, 0.0, 0.0, 143.0, 0.0, 0.0, 1294.0, 0.0, 0.0, 3939.0, 0.0, 0.0, 10962.0, 0.0, 0.0, 0.0, 22283.0, 0.0, 0.0, 971186.0, 0.0, 0.0, 22255.0, 0.0, 0.0, 10786.0, 0.0, 0.0, 4006.0, 0.0, 0.0, 0.0, 1291.0, 0.0, 0.0, 154.0, 0.0, 0.0, 95.0, 0.0, 0.0, 31.0, 0.0, 0.0, 27.0, 0.0, 0.0, 1.0], "bins": [-6.556510925292969e-07, -6.370246410369873e-07, -6.183981895446777e-07, -5.997717380523682e-07, -5.811452865600586e-07, -5.62518835067749e-07, -5.438923835754395e-07, -5.252659320831299e-07, -5.066394805908203e-07, -4.880130290985107e-07, -4.6938657760620117e-07, -4.507601261138916e-07, -4.3213367462158203e-07, -4.1350722312927246e-07, -3.948807716369629e-07, -3.762543201446533e-07, -3.5762786865234375e-07, -3.390014171600342e-07, -3.203749656677246e-07, -3.0174851417541504e-07, -2.8312206268310547e-07, -2.644956111907959e-07, -2.4586915969848633e-07, -2.2724270820617676e-07, -2.086162567138672e-07, -1.8998980522155762e-07, -1.7136335372924805e-07, -1.5273690223693848e-07, -1.341104507446289e-07, -1.1548399925231934e-07, -9.685754776000977e-08, -7.82310962677002e-08, -5.960464477539063e-08, -4.0978193283081055e-08, -2.2351741790771484e-08, -3.725290298461914e-09, 1.4901161193847656e-08, 3.3527612686157227e-08, 5.21540641784668e-08, 7.078051567077637e-08, 8.940696716308594e-08, 1.0803341865539551e-07, 1.2665987014770508e-07, 1.4528632164001465e-07, 1.6391277313232422e-07, 1.825392246246338e-07, 2.0116567611694336e-07, 2.1979212760925293e-07, 2.384185791015625e-07, 2.5704503059387207e-07, 2.7567148208618164e-07, 2.942979335784912e-07, 3.129243850708008e-07, 3.3155083656311035e-07, 3.501772880554199e-07, 3.688037395477295e-07, 3.8743019104003906e-07, 4.0605664253234863e-07, 4.246830940246582e-07, 4.4330954551696777e-07, 4.6193599700927734e-07, 4.805624485015869e-07, 4.991888999938965e-07, 5.178153514862061e-07, 5.364418029785156e-07]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 24.0, 0.0, 0.0, 60.0, 0.0, 0.0, 0.0, 186.0, 0.0, 0.0, 363.0, 0.0, 0.0, 815.0, 0.0, 0.0, 0.0, 2363.0, 0.0, 0.0, 10727.0, 0.0, 0.0, 32616.0, 0.0, 0.0, 0.0, 954257.0, 0.0, 0.0, 32623.0, 0.0, 0.0, 0.0, 10705.0, 0.0, 0.0, 2392.0, 0.0, 0.0, 838.0, 0.0, 0.0, 0.0, 334.0, 0.0, 0.0, 175.0, 0.0, 0.0, 50.0, 0.0, 0.0, 0.0, 24.0, 0.0, 0.0, 14.0, 0.0, 0.0, 6.0], "bins": [-5.364418029785156e-07, -5.187466740608215e-07, -5.010515451431274e-07, -4.833564162254333e-07, -4.6566128730773926e-07, -4.4796615839004517e-07, -4.302710294723511e-07, -4.12575900554657e-07, -3.948807716369629e-07, -3.771856427192688e-07, -3.594905138015747e-07, -3.417953848838806e-07, -3.241002559661865e-07, -3.0640512704849243e-07, -2.8870999813079834e-07, -2.7101486921310425e-07, -2.5331974029541016e-07, -2.3562461137771606e-07, -2.1792948246002197e-07, -2.0023435354232788e-07, -1.825392246246338e-07, -1.648440957069397e-07, -1.471489667892456e-07, -1.2945383787155151e-07, -1.1175870895385742e-07, -9.406358003616333e-08, -7.636845111846924e-08, -5.8673322200775146e-08, -4.0978193283081055e-08, -2.3283064365386963e-08, -5.587935447692871e-09, 1.210719347000122e-08, 2.9802322387695312e-08, 4.7497451305389404e-08, 6.51925802230835e-08, 8.288770914077759e-08, 1.0058283805847168e-07, 1.1827796697616577e-07, 1.3597309589385986e-07, 1.5366822481155396e-07, 1.7136335372924805e-07, 1.8905848264694214e-07, 2.0675361156463623e-07, 2.2444874048233032e-07, 2.421438694000244e-07, 2.598389983177185e-07, 2.775341272354126e-07, 2.952292561531067e-07, 3.129243850708008e-07, 3.3061951398849487e-07, 3.4831464290618896e-07, 3.6600977182388306e-07, 3.8370490074157715e-07, 4.0140002965927124e-07, 4.1909515857696533e-07, 4.367902874946594e-07, 4.544854164123535e-07, 4.721805453300476e-07, 4.898756742477417e-07, 5.075708031654358e-07, 5.252659320831299e-07, 5.42961061000824e-07, 5.606561899185181e-07, 5.783513188362122e-07, 5.960464477539062e-07]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 64.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 877.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 60.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.7881393432617188e-07, -1.73225998878479e-07, -1.6763806343078613e-07, -1.6205012798309326e-07, -1.564621925354004e-07, -1.5087425708770752e-07, -1.4528632164001465e-07, -1.3969838619232178e-07, -1.341104507446289e-07, -1.2852251529693604e-07, -1.2293457984924316e-07, -1.1734664440155029e-07, -1.1175870895385742e-07, -1.0617077350616455e-07, -1.0058283805847168e-07, -9.499490261077881e-08, -8.940696716308594e-08, -8.381903171539307e-08, -7.82310962677002e-08, -7.264316082000732e-08, -6.705522537231445e-08, -6.146728992462158e-08, -5.587935447692871e-08, -5.029141902923584e-08, -4.470348358154297e-08, -3.91155481338501e-08, -3.3527612686157227e-08, -2.7939677238464355e-08, -2.2351741790771484e-08, -1.6763806343078613e-08, -1.1175870895385742e-08, -5.587935447692871e-09, 0.0, 5.587935447692871e-09, 1.1175870895385742e-08, 1.6763806343078613e-08, 2.2351741790771484e-08, 2.7939677238464355e-08, 3.3527612686157227e-08, 3.91155481338501e-08, 4.470348358154297e-08, 5.029141902923584e-08, 5.587935447692871e-08, 6.146728992462158e-08, 6.705522537231445e-08, 7.264316082000732e-08, 7.82310962677002e-08, 8.381903171539307e-08, 8.940696716308594e-08, 9.499490261077881e-08, 1.0058283805847168e-07, 1.0617077350616455e-07, 1.1175870895385742e-07, 1.1734664440155029e-07, 1.2293457984924316e-07, 1.2852251529693604e-07, 1.341104507446289e-07, 1.3969838619232178e-07, 1.4528632164001465e-07, 1.5087425708770752e-07, 1.564621925354004e-07, 1.6205012798309326e-07, 1.6763806343078613e-07, 1.73225998878479e-07, 1.7881393432617188e-07]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 7.0, 3.0, 9.0, 12.0, 12.0, 24.0, 19.0, 21.0, 33.0, 44.0, 55.0, 64.0, 77.0, 85.0, 87.0, 65.0, 74.0, 67.0, 46.0, 44.0, 25.0, 22.0, 14.0, 18.0, 16.0, 11.0, 10.0, 6.0, 8.0, 7.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5202499525912572e-06, -1.4648586557086674e-06, -1.4094673588260775e-06, -1.35407594825665e-06, -1.2986846513740602e-06, -1.2432933544914704e-06, -1.1879020576088806e-06, -1.1325107607262908e-06, -1.0771193501568632e-06, -1.0217280532742734e-06, -9.663367563916836e-07, -9.109454026656749e-07, -8.555540489396662e-07, -8.001627520570764e-07, -7.447714551744866e-07, -6.893801014484779e-07, -6.339888045658881e-07, -5.785975076832983e-07, -5.232061539572896e-07, -4.6781485707469983e-07, -4.1242350334869116e-07, -3.5703220646610134e-07, -3.016408811618021e-07, -2.4624955585750286e-07, -1.908582305532036e-07, -1.3546690524890437e-07, -8.007558705003248e-08, -2.4684268851160596e-08, 3.070705645313865e-08, 8.609836754658318e-08, 1.4148969285088242e-07, 1.9688101815518166e-07, 2.522723434594809e-07, 3.0766366876378015e-07, 3.630549940680794e-07, 4.184462909506692e-07, 4.738376446766779e-07, 5.292289415592677e-07, 5.846202384418575e-07, 6.400115921678662e-07, 6.954029458938749e-07, 7.507942427764647e-07, 8.061855965024733e-07, 8.615768933850632e-07, 9.169682471110718e-07, 9.723595439936616e-07, 1.0277508408762515e-06, 1.083142251445679e-06, 1.138533434641431e-06, 1.193924731524021e-06, 1.2493160284066107e-06, 1.3047074389760382e-06, 1.360098735858628e-06, 1.4154900327412179e-06, 1.4708813296238077e-06, 1.5262726265063975e-06, 1.581664037075825e-06, 1.6370553339584148e-06, 1.6924466308410047e-06, 1.7478380414104322e-06, 1.803229338293022e-06, 1.8586206351756118e-06, 1.9140120457450394e-06, 1.9694032289407915e-06, 2.024794639510219e-06]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 7.0, 6.0, 9.0, 13.0, 8.0, 12.0, 11.0, 18.0, 20.0, 20.0, 34.0, 36.0, 25.0, 35.0, 37.0, 35.0, 29.0, 47.0, 40.0, 45.0, 43.0, 39.0, 46.0, 44.0, 36.0, 49.0, 27.0, 29.0, 29.0, 21.0, 26.0, 18.0, 13.0, 23.0, 16.0, 13.0, 13.0, 11.0, 6.0, 5.0, 2.0, 3.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1083533308919868e-06, -1.067708694790781e-06, -1.0270640586895752e-06, -9.864193089015316e-07, -9.457746728003258e-07, -9.0513003669912e-07, -8.644854005979141e-07, -8.238407644967083e-07, -7.831960715520836e-07, -7.425514354508778e-07, -7.019067425062531e-07, -6.612621064050472e-07, -6.206174703038414e-07, -5.799727773592167e-07, -5.393281412580109e-07, -4.986834483133862e-07, -4.5803881221218035e-07, -4.173941476892651e-07, -3.767494831663498e-07, -3.36104847065144e-07, -2.954601825422287e-07, -2.5481551801931346e-07, -2.1417088191810763e-07, -1.7352621739519236e-07, -1.328815528722771e-07, -9.223689545478919e-08, -5.1592238037301286e-08, -1.0947587725240737e-08, 2.9697076797674526e-08, 7.034174132058979e-08, 1.1098637742179562e-07, 1.516310419447109e-07, 1.9227559278078843e-07, 2.329202573037037e-07, 2.7356492182661896e-07, 3.142095579278248e-07, 3.5485422245074005e-07, 3.954988869736553e-07, 4.3614352307486115e-07, 4.767881875977764e-07, 5.174328521206917e-07, 5.580774882218975e-07, 5.987221811665222e-07, 6.39366817267728e-07, 6.800114533689339e-07, 7.206561463135586e-07, 7.613007824147644e-07, 8.019454753593891e-07, 8.425901114605949e-07, 8.832347475618008e-07, 9.238794405064255e-07, 9.645241334510501e-07, 1.005168769552256e-06, 1.0458134056534618e-06, 1.0864580417546676e-06, 1.1271026778558735e-06, 1.1677473139570793e-06, 1.2083919500582851e-06, 1.249036586159491e-06, 1.2896812222606968e-06, 1.3303259720487404e-06, 1.3709706081499462e-06, 1.411615244251152e-06, 1.4522598803523579e-06, 1.4929046301404014e-06]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 4.0, 6.0, 9.0, 7.0, 16.0, 0.0, 22.0, 36.0, 53.0, 77.0, 102.0, 146.0, 225.0, 333.0, 0.0, 518.0, 772.0, 1296.0, 1999.0, 3328.0, 5507.0, 9482.0, 16227.0, 0.0, 28890.0, 52986.0, 103295.0, 228149.0, 747591.0, 1781447.0, 756827.0, 237505.0, 0.0, 103937.0, 51748.0, 27272.0, 14529.0, 8200.0, 4667.0, 2827.0, 1627.0, 0.0, 988.0, 631.0, 394.0, 247.0, 151.0, 81.0, 51.0, 37.0, 0.0, 25.0, 17.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7881393432617188e-06, -1.7350539565086365e-06, -1.6819685697555542e-06, -1.628883183002472e-06, -1.5757977962493896e-06, -1.5227124094963074e-06, -1.469627022743225e-06, -1.4165416359901428e-06, -1.3634562492370605e-06, -1.3103708624839783e-06, -1.257285475730896e-06, -1.2042000889778137e-06, -1.1511147022247314e-06, -1.0980293154716492e-06, -1.044943928718567e-06, -9.918585419654846e-07, -9.387731552124023e-07, -8.856877684593201e-07, -8.326023817062378e-07, -7.795169949531555e-07, -7.264316082000732e-07, -6.73346221446991e-07, -6.202608346939087e-07, -5.671754479408264e-07, -5.140900611877441e-07, -4.6100467443466187e-07, -4.079192876815796e-07, -3.548339009284973e-07, -3.0174851417541504e-07, -2.4866312742233276e-07, -1.955777406692505e-07, -1.424923539161682e-07, -8.940696716308594e-08, -3.632158041000366e-08, 1.6763806343078613e-08, 6.984919309616089e-08, 1.2293457984924316e-07, 1.7601996660232544e-07, 2.2910535335540771e-07, 2.8219074010849e-07, 3.3527612686157227e-07, 3.8836151361465454e-07, 4.414469003677368e-07, 4.945322871208191e-07, 5.476176738739014e-07, 6.007030606269836e-07, 6.537884473800659e-07, 7.068738341331482e-07, 7.599592208862305e-07, 8.130446076393127e-07, 8.66129994392395e-07, 9.192153811454773e-07, 9.723007678985596e-07, 1.0253861546516418e-06, 1.0784715414047241e-06, 1.1315569281578064e-06, 1.1846423149108887e-06, 1.237727701663971e-06, 1.2908130884170532e-06, 1.3438984751701355e-06, 1.3969838619232178e-06, 1.4500692486763e-06, 1.5031546354293823e-06, 1.5562400221824646e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 6.0, 0.0, 0.0, 6.0, 0.0, 10.0, 0.0, 0.0, 14.0, 0.0, 19.0, 0.0, 0.0, 37.0, 0.0, 44.0, 0.0, 0.0, 67.0, 0.0, 0.0, 70.0, 0.0, 85.0, 0.0, 0.0, 103.0, 0.0, 106.0, 0.0, 0.0, 99.0, 0.0, 84.0, 0.0, 0.0, 67.0, 0.0, 63.0, 0.0, 0.0, 47.0, 0.0, 0.0, 32.0, 0.0, 26.0, 0.0, 0.0, 17.0, 0.0, 8.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.152557373046875e-07, -6.919726729393005e-07, -6.686896085739136e-07, -6.454065442085266e-07, -6.221234798431396e-07, -5.988404154777527e-07, -5.755573511123657e-07, -5.522742867469788e-07, -5.289912223815918e-07, -5.057081580162048e-07, -4.824250936508179e-07, -4.591420292854309e-07, -4.3585896492004395e-07, -4.12575900554657e-07, -3.8929283618927e-07, -3.6600977182388306e-07, -3.427267074584961e-07, -3.1944364309310913e-07, -2.9616057872772217e-07, -2.728775143623352e-07, -2.4959444999694824e-07, -2.2631138563156128e-07, -2.0302832126617432e-07, -1.7974525690078735e-07, -1.564621925354004e-07, -1.3317912817001343e-07, -1.0989606380462646e-07, -8.66129994392395e-08, -6.332993507385254e-08, -4.0046870708465576e-08, -1.6763806343078613e-08, 6.51925802230835e-09, 2.9802322387695312e-08, 5.3085386753082275e-08, 7.636845111846924e-08, 9.96515154838562e-08, 1.2293457984924316e-07, 1.4621764421463013e-07, 1.695007085800171e-07, 1.9278377294540405e-07, 2.1606683731079102e-07, 2.39349901676178e-07, 2.6263296604156494e-07, 2.859160304069519e-07, 3.0919909477233887e-07, 3.3248215913772583e-07, 3.557652235031128e-07, 3.7904828786849976e-07, 4.023313522338867e-07, 4.256144165992737e-07, 4.4889748096466064e-07, 4.721805453300476e-07, 4.954636096954346e-07, 5.187466740608215e-07, 5.420297384262085e-07, 5.653128027915955e-07, 5.885958671569824e-07, 6.118789315223694e-07, 6.351619958877563e-07, 6.584450602531433e-07, 6.817281246185303e-07, 7.050111889839172e-07, 7.282942533493042e-07, 7.515773177146912e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 8.0, 23.0, 0.0, 30.0, 55.0, 122.0, 0.0, 198.0, 376.0, 689.0, 0.0, 1242.0, 2347.0, 4282.0, 0.0, 8707.0, 16134.0, 32642.0, 0.0, 65685.0, 137400.0, 313343.0, 0.0, 662006.0, 1702481.0, 662917.0, 0.0, 312883.0, 137975.0, 66285.0, 0.0, 32613.0, 16263.0, 8485.0, 0.0, 4272.0, 2215.0, 1182.0, 0.0, 646.0, 341.0, 195.0, 0.0, 101.0, 67.0, 34.0, 0.0, 18.0, 8.0, 15.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.4901161193847656e-06, -1.4454126358032227e-06, -1.4007091522216797e-06, -1.3560056686401367e-06, -1.3113021850585938e-06, -1.2665987014770508e-06, -1.2218952178955078e-06, -1.1771917343139648e-06, -1.1324882507324219e-06, -1.087784767150879e-06, -1.043081283569336e-06, -9.98377799987793e-07, -9.5367431640625e-07, -9.08970832824707e-07, -8.642673492431641e-07, -8.195638656616211e-07, -7.748603820800781e-07, -7.301568984985352e-07, -6.854534149169922e-07, -6.407499313354492e-07, -5.960464477539062e-07, -5.513429641723633e-07, -5.066394805908203e-07, -4.6193599700927734e-07, -4.172325134277344e-07, -3.725290298461914e-07, -3.2782554626464844e-07, -2.8312206268310547e-07, -2.384185791015625e-07, -1.9371509552001953e-07, -1.4901161193847656e-07, -1.043081283569336e-07, -5.960464477539063e-08, -1.4901161193847656e-08, 2.9802322387695312e-08, 7.450580596923828e-08, 1.1920928955078125e-07, 1.6391277313232422e-07, 2.086162567138672e-07, 2.5331974029541016e-07, 2.980232238769531e-07, 3.427267074584961e-07, 3.8743019104003906e-07, 4.3213367462158203e-07, 4.76837158203125e-07, 5.21540641784668e-07, 5.662441253662109e-07, 6.109476089477539e-07, 6.556510925292969e-07, 7.003545761108398e-07, 7.450580596923828e-07, 7.897615432739258e-07, 8.344650268554688e-07, 8.791685104370117e-07, 9.238719940185547e-07, 9.685754776000977e-07, 1.0132789611816406e-06, 1.0579824447631836e-06, 1.1026859283447266e-06, 1.1473894119262695e-06, 1.1920928955078125e-06, 1.2367963790893555e-06, 1.2814998626708984e-06, 1.3262033462524414e-06, 1.3709068298339844e-06]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 12.0, 0.0, 0.0, 0.0, 38.0, 0.0, 0.0, 89.0, 0.0, 0.0, 0.0, 188.0, 0.0, 0.0, 0.0, 396.0, 0.0, 0.0, 0.0, 736.0, 0.0, 0.0, 1236.0, 0.0, 0.0, 0.0, 726.0, 0.0, 0.0, 0.0, 371.0, 0.0, 0.0, 0.0, 191.0, 0.0, 0.0, 70.0, 0.0, 0.0, 0.0, 25.0, 0.0, 0.0, 0.0, 8.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.364418029785156e-07, -5.206093192100525e-07, -5.047768354415894e-07, -4.889443516731262e-07, -4.731118679046631e-07, -4.5727938413619995e-07, -4.414469003677368e-07, -4.256144165992737e-07, -4.0978193283081055e-07, -3.939494490623474e-07, -3.781169652938843e-07, -3.6228448152542114e-07, -3.46451997756958e-07, -3.3061951398849487e-07, -3.1478703022003174e-07, -2.989545464515686e-07, -2.8312206268310547e-07, -2.6728957891464233e-07, -2.514570951461792e-07, -2.3562461137771606e-07, -2.1979212760925293e-07, -2.039596438407898e-07, -1.8812716007232666e-07, -1.7229467630386353e-07, -1.564621925354004e-07, -1.4062970876693726e-07, -1.2479722499847412e-07, -1.0896474123001099e-07, -9.313225746154785e-08, -7.729977369308472e-08, -6.146728992462158e-08, -4.563480615615845e-08, -2.9802322387695312e-08, -1.3969838619232178e-08, 1.862645149230957e-09, 1.7695128917694092e-08, 3.3527612686157227e-08, 4.936009645462036e-08, 6.51925802230835e-08, 8.102506399154663e-08, 9.685754776000977e-08, 1.126900315284729e-07, 1.2852251529693604e-07, 1.4435499906539917e-07, 1.601874828338623e-07, 1.7601996660232544e-07, 1.9185245037078857e-07, 2.076849341392517e-07, 2.2351741790771484e-07, 2.39349901676178e-07, 2.551823854446411e-07, 2.7101486921310425e-07, 2.868473529815674e-07, 3.026798367500305e-07, 3.1851232051849365e-07, 3.343448042869568e-07, 3.501772880554199e-07, 3.6600977182388306e-07, 3.818422555923462e-07, 3.976747393608093e-07, 4.1350722312927246e-07, 4.293397068977356e-07, 4.4517219066619873e-07, 4.6100467443466187e-07, 4.76837158203125e-07]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 6.0, 8.0, 6.0, 8.0, 14.0, 18.0, 9.0, 17.0, 25.0, 27.0, 33.0, 42.0, 51.0, 52.0, 60.0, 58.0, 70.0, 71.0, 57.0, 59.0, 56.0, 49.0, 41.0, 35.0, 23.0, 20.0, 13.0, 10.0, 14.0, 11.0, 3.0, 6.0, 5.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.1811547437901027e-06, -1.144191173807485e-06, -1.1072274901380297e-06, -1.070263920155412e-06, -1.0333003501727944e-06, -9.963367801901768e-07, -9.593732102075592e-07, -9.224095265381038e-07, -8.854459565554862e-07, -8.484823865728686e-07, -8.115187597468321e-07, -7.745551329207956e-07, -7.37591562938178e-07, -7.006279929555603e-07, -6.636643661295238e-07, -6.267007393034874e-07, -5.897371693208697e-07, -5.527735993382521e-07, -5.158099725122156e-07, -4.788463456861791e-07, -4.418827757035615e-07, -4.0491917729923443e-07, -3.679555788949074e-07, -3.309919804905803e-07, -2.9402838208625326e-07, -2.570647836819262e-07, -2.2010118527759914e-07, -1.8313758687327208e-07, -1.4617398846894503e-07, -1.0921039006461797e-07, -7.224679166029091e-08, -3.528319325596385e-08, 1.6804051483632065e-09, 3.8644003552690265e-08, 7.560760195701732e-08, 1.1257120036134438e-07, 1.4953479876567144e-07, 1.864983971699985e-07, 2.2346199557432556e-07, 2.604255939786526e-07, 2.9738919238297967e-07, 3.3435279078730673e-07, 3.713163891916338e-07, 4.0827998759596085e-07, 4.452435860002879e-07, 4.822071559829055e-07, 5.19170782808942e-07, 5.561344096349785e-07, 5.930979796175961e-07, 6.300615496002138e-07, 6.670251764262503e-07, 7.039888032522867e-07, 7.409523732349044e-07, 7.77915943217522e-07, 8.148795700435585e-07, 8.51843196869595e-07, 8.888067668522126e-07, 9.257703368348302e-07, 9.627340205042856e-07, 9.996975904869032e-07, 1.0366611604695208e-06, 1.0736247304521385e-06, 1.110588300434756e-06, 1.1475519841042114e-06, 1.184515554086829e-06]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 3.0, 6.0, 6.0, 7.0, 5.0, 14.0, 6.0, 12.0, 14.0, 18.0, 18.0, 22.0, 25.0, 22.0, 40.0, 30.0, 20.0, 32.0, 31.0, 33.0, 41.0, 31.0, 49.0, 38.0, 41.0, 41.0, 46.0, 40.0, 33.0, 40.0, 29.0, 25.0, 35.0, 21.0, 17.0, 17.0, 20.0, 13.0, 11.0, 12.0, 11.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.379156722388871e-07, -9.085390502150403e-07, -8.791624850346125e-07, -8.497858630107658e-07, -8.204092978303379e-07, -7.910326758064912e-07, -7.616561106260633e-07, -7.322794886022166e-07, -7.029028665783699e-07, -6.735262445545231e-07, -6.441496793740953e-07, -6.147730573502486e-07, -5.853964921698207e-07, -5.56019870145974e-07, -5.266432481221273e-07, -4.972666829416994e-07, -4.678900893395621e-07, -4.385134957374248e-07, -4.0913690213528753e-07, -3.7976030853315024e-07, -3.503836865093035e-07, -3.210070929071662e-07, -2.9163049930502893e-07, -2.622538772811822e-07, -2.3287729788989964e-07, -2.0350070428776235e-07, -1.7412409647477034e-07, -1.4474750287263305e-07, -1.153709021650684e-07, -8.599430145750375e-08, -5.661770785536646e-08, -2.7241100042374455e-08, 2.1354935597628355e-09, 3.1512094267327484e-08, 6.088869497489213e-08, 9.026528857702942e-08, 1.1964189639002143e-07, 1.4901848999215872e-07, 1.78395083594296e-07, 2.0777169140728802e-07, 2.371482850094253e-07, 2.665248928224173e-07, 2.959014864245546e-07, 3.252780800266919e-07, 3.546546736288292e-07, 3.840312956526759e-07, 4.1340786083310377e-07, 4.427844828569505e-07, 4.721610764590878e-07, 5.015376700612251e-07, 5.309142920850718e-07, 5.602908572654997e-07, 5.896674792893464e-07, 6.190440444697742e-07, 6.48420666493621e-07, 6.777972885174677e-07, 7.071738536978955e-07, 7.365504757217423e-07, 7.659270409021701e-07, 7.953036629260168e-07, 8.246802281064447e-07, 8.540568501302914e-07, 8.834334721541381e-07, 9.12810037334566e-07, 9.421866593584127e-07]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 15.0, 21.0, 20.0, 34.0, 45.0, 61.0, 70.0, 110.0, 171.0, 221.0, 351.0, 523.0, 763.0, 1273.0, 2086.0, 3318.0, 5917.0, 10261.0, 19407.0, 37878.0, 81893.0, 190250.0, 529339.0, 82081.0, 38377.0, 19147.0, 10229.0, 5702.0, 3318.0, 1944.0, 1196.0, 825.0, 520.0, 345.0, 247.0, 160.0, 126.0, 81.0, 63.0, 47.0, 28.0, 24.0, 15.0, 8.0, 9.0, 7.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.9669532775878906e-06, -1.905485987663269e-06, -1.8440186977386475e-06, -1.7825514078140259e-06, -1.7210841178894043e-06, -1.6596168279647827e-06, -1.5981495380401611e-06, -1.5366822481155396e-06, -1.475214958190918e-06, -1.4137476682662964e-06, -1.3522803783416748e-06, -1.2908130884170532e-06, -1.2293457984924316e-06, -1.16787850856781e-06, -1.1064112186431885e-06, -1.044943928718567e-06, -9.834766387939453e-07, -9.220093488693237e-07, -8.605420589447021e-07, -7.990747690200806e-07, -7.37607479095459e-07, -6.761401891708374e-07, -6.146728992462158e-07, -5.532056093215942e-07, -4.917383193969727e-07, -4.302710294723511e-07, -3.688037395477295e-07, -3.073364496231079e-07, -2.4586915969848633e-07, -1.8440186977386475e-07, -1.2293457984924316e-07, -6.146728992462158e-08, 0.0, 6.146728992462158e-08, 1.2293457984924316e-07, 1.8440186977386475e-07, 2.4586915969848633e-07, 3.073364496231079e-07, 3.688037395477295e-07, 4.302710294723511e-07, 4.917383193969727e-07, 5.532056093215942e-07, 6.146728992462158e-07, 6.761401891708374e-07, 7.37607479095459e-07, 7.990747690200806e-07, 8.605420589447021e-07, 9.220093488693237e-07, 9.834766387939453e-07, 1.044943928718567e-06, 1.1064112186431885e-06, 1.16787850856781e-06, 1.2293457984924316e-06, 1.2908130884170532e-06, 1.3522803783416748e-06, 1.4137476682662964e-06, 1.475214958190918e-06, 1.5366822481155396e-06, 1.5981495380401611e-06, 1.6596168279647827e-06, 1.7210841178894043e-06, 1.7825514078140259e-06, 1.8440186977386475e-06, 1.905485987663269e-06, 1.9669532775878906e-06]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 0.0, 7.0, 0.0, 13.0, 0.0, 16.0, 0.0, 20.0, 0.0, 25.0, 0.0, 37.0, 0.0, 43.0, 0.0, 51.0, 0.0, 59.0, 0.0, 87.0, 0.0, 88.0, 0.0, 89.0, 0.0, 80.0, 0.0, 91.0, 0.0, 89.0, 0.0, 50.0, 0.0, 58.0, 0.0, 37.0, 0.0, 25.0, 0.0, 12.0, 0.0, 18.0, 0.0, 8.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-07, -9.238719940185547e-07, -8.940696716308594e-07, -8.642673492431641e-07, -8.344650268554688e-07, -8.046627044677734e-07, -7.748603820800781e-07, -7.450580596923828e-07, -7.152557373046875e-07, -6.854534149169922e-07, -6.556510925292969e-07, -6.258487701416016e-07, -5.960464477539062e-07, -5.662441253662109e-07, -5.364418029785156e-07, -5.066394805908203e-07, -4.76837158203125e-07, -4.470348358154297e-07, -4.172325134277344e-07, -3.8743019104003906e-07, -3.5762786865234375e-07, -3.2782554626464844e-07, -2.980232238769531e-07, -2.682209014892578e-07, -2.384185791015625e-07, -2.086162567138672e-07, -1.7881393432617188e-07, -1.4901161193847656e-07, -1.1920928955078125e-07, -8.940696716308594e-08, -5.960464477539063e-08, -2.9802322387695312e-08, 0.0, 2.9802322387695312e-08, 5.960464477539063e-08, 8.940696716308594e-08, 1.1920928955078125e-07, 1.4901161193847656e-07, 1.7881393432617188e-07, 2.086162567138672e-07, 2.384185791015625e-07, 2.682209014892578e-07, 2.980232238769531e-07, 3.2782554626464844e-07, 3.5762786865234375e-07, 3.8743019104003906e-07, 4.172325134277344e-07, 4.470348358154297e-07, 4.76837158203125e-07, 5.066394805908203e-07, 5.364418029785156e-07, 5.662441253662109e-07, 5.960464477539062e-07, 6.258487701416016e-07, 6.556510925292969e-07, 6.854534149169922e-07, 7.152557373046875e-07, 7.450580596923828e-07, 7.748603820800781e-07, 8.046627044677734e-07, 8.344650268554688e-07, 8.642673492431641e-07, 8.940696716308594e-07, 9.238719940185547e-07, 9.5367431640625e-07]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 8.0, 0.0, 9.0, 15.0, 10.0, 8.0, 27.0, 10.0, 38.0, 41.0, 160.0, 66.0, 269.0, 161.0, 678.0, 527.0, 704.0, 3379.0, 4181.0, 35898.0, 956113.0, 36059.0, 4119.0, 3378.0, 716.0, 896.0, 279.0, 327.0, 104.0, 144.0, 63.0, 62.0, 27.0, 22.0, 10.0, 20.0, 1.0, 10.0, 12.0, 4.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2186508178710938e-06, -3.1301751732826233e-06, -3.041699528694153e-06, -2.9532238841056824e-06, -2.864748239517212e-06, -2.7762725949287415e-06, -2.687796950340271e-06, -2.5993213057518005e-06, -2.51084566116333e-06, -2.4223700165748596e-06, -2.333894371986389e-06, -2.2454187273979187e-06, -2.1569430828094482e-06, -2.0684674382209778e-06, -1.9799917936325073e-06, -1.8915161490440369e-06, -1.8030405044555664e-06, -1.714564859867096e-06, -1.6260892152786255e-06, -1.537613570690155e-06, -1.4491379261016846e-06, -1.3606622815132141e-06, -1.2721866369247437e-06, -1.1837109923362732e-06, -1.0952353477478027e-06, -1.0067597031593323e-06, -9.182840585708618e-07, -8.298084139823914e-07, -7.413327693939209e-07, -6.528571248054504e-07, -5.6438148021698e-07, -4.759058356285095e-07, -3.8743019104003906e-07, -2.989545464515686e-07, -2.1047890186309814e-07, -1.2200325727462769e-07, -3.3527612686157227e-08, 5.494803190231323e-08, 1.434236764907837e-07, 2.3189932107925415e-07, 3.203749656677246e-07, 4.0885061025619507e-07, 4.973262548446655e-07, 5.85801899433136e-07, 6.742775440216064e-07, 7.627531886100769e-07, 8.512288331985474e-07, 9.397044777870178e-07, 1.0281801223754883e-06, 1.1166557669639587e-06, 1.2051314115524292e-06, 1.2936070561408997e-06, 1.3820827007293701e-06, 1.4705583453178406e-06, 1.559033989906311e-06, 1.6475096344947815e-06, 1.735985279083252e-06, 1.8244609236717224e-06, 1.912936568260193e-06, 2.0014122128486633e-06, 2.089887857437134e-06, 2.1783635020256042e-06, 2.2668391466140747e-06, 2.355314791202545e-06, 2.4437904357910156e-06]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 77.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 807.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 76.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.7881393432617188e-07, -1.7229467630386353e-07, -1.6577541828155518e-07, -1.5925616025924683e-07, -1.5273690223693848e-07, -1.4621764421463013e-07, -1.3969838619232178e-07, -1.3317912817001343e-07, -1.2665987014770508e-07, -1.2014061212539673e-07, -1.1362135410308838e-07, -1.0710209608078003e-07, -1.0058283805847168e-07, -9.406358003616333e-08, -8.754432201385498e-08, -8.102506399154663e-08, -7.450580596923828e-08, -6.798654794692993e-08, -6.146728992462158e-08, -5.494803190231323e-08, -4.842877388000488e-08, -4.190951585769653e-08, -3.5390257835388184e-08, -2.8870999813079834e-08, -2.2351741790771484e-08, -1.5832483768463135e-08, -9.313225746154785e-09, -2.7939677238464355e-09, 3.725290298461914e-09, 1.0244548320770264e-08, 1.6763806343078613e-08, 2.3283064365386963e-08, 2.9802322387695312e-08, 3.632158041000366e-08, 4.284083843231201e-08, 4.936009645462036e-08, 5.587935447692871e-08, 6.239861249923706e-08, 6.891787052154541e-08, 7.543712854385376e-08, 8.195638656616211e-08, 8.847564458847046e-08, 9.499490261077881e-08, 1.0151416063308716e-07, 1.0803341865539551e-07, 1.1455267667770386e-07, 1.210719347000122e-07, 1.2759119272232056e-07, 1.341104507446289e-07, 1.4062970876693726e-07, 1.471489667892456e-07, 1.5366822481155396e-07, 1.601874828338623e-07, 1.6670674085617065e-07, 1.73225998878479e-07, 1.7974525690078735e-07, 1.862645149230957e-07, 1.9278377294540405e-07, 1.993030309677124e-07, 2.0582228899002075e-07, 2.123415470123291e-07, 2.1886080503463745e-07, 2.253800630569458e-07, 2.3189932107925415e-07, 2.384185791015625e-07]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 9.0, 5.0, 5.0, 9.0, 14.0, 15.0, 17.0, 23.0, 26.0, 35.0, 52.0, 64.0, 53.0, 89.0, 77.0, 85.0, 67.0, 67.0, 72.0, 41.0, 38.0, 30.0, 26.0, 18.0, 10.0, 11.0, 11.0, 6.0, 4.0, 4.0, 3.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0589745897959801e-06, -1.0167534583160887e-06, -9.745324405230349e-07, -9.323113090431434e-07, -8.900901775632519e-07, -8.478690460833604e-07, -8.056479714468878e-07, -7.634268968104152e-07, -7.212057653305237e-07, -6.789846338506322e-07, -6.367635592141596e-07, -5.94542484577687e-07, -5.523213530977955e-07, -5.10100221617904e-07, -4.678791469814314e-07, -4.2565804392324935e-07, -3.834369408650673e-07, -3.4121583780688525e-07, -2.989947347487032e-07, -2.5677363169052114e-07, -2.145525286323391e-07, -1.7233142557415704e-07, -1.3011032251597499e-07, -8.788921945779293e-08, -4.566811639961088e-08, -3.4470133414288284e-09, 3.8774089716753224e-08, 8.099519277493528e-08, 1.2321629583311733e-07, 1.6543739889129938e-07, 2.0765850194948143e-07, 2.498796050076635e-07, 2.9210070806584554e-07, 3.343218111240276e-07, 3.7654291418220964e-07, 4.187640172403917e-07, 4.6098512029857375e-07, 5.032062517784652e-07, 5.454273264149379e-07, 5.876484010514105e-07, 6.29869532531302e-07, 6.720906640111934e-07, 7.143117386476661e-07, 7.565328132841387e-07, 7.987539447640302e-07, 8.409750762439216e-07, 8.831961508803943e-07, 9.254172255168669e-07, 9.676383569967584e-07, 1.0098594884766499e-06, 1.0520805062697036e-06, 1.094301637749595e-06, 1.1365227692294866e-06, 1.178743900709378e-06, 1.2209650321892696e-06, 1.2631860499823233e-06, 1.3054071814622148e-06, 1.3476283129421063e-06, 1.38984933073516e-06, 1.4320704622150515e-06, 1.474291593694943e-06, 1.5165127251748345e-06, 1.558733856654726e-06, 1.6009548744477797e-06, 1.6431760059276712e-06]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 7.0, 2.0, 7.0, 4.0, 10.0, 3.0, 9.0, 12.0, 12.0, 9.0, 19.0, 19.0, 15.0, 24.0, 29.0, 32.0, 31.0, 24.0, 32.0, 28.0, 30.0, 43.0, 37.0, 35.0, 51.0, 33.0, 48.0, 38.0, 46.0, 31.0, 38.0, 37.0, 24.0, 34.0, 24.0, 21.0, 13.0, 21.0, 12.0, 16.0, 11.0, 8.0, 13.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.191335266223177e-07, -8.905509503165376e-07, -8.619684308541764e-07, -8.333858545483963e-07, -8.048033350860351e-07, -7.76220758780255e-07, -7.476381824744749e-07, -7.190556061686948e-07, -6.904730867063336e-07, -6.618905104005535e-07, -6.333079909381922e-07, -6.047254146324121e-07, -5.76142838326632e-07, -5.475603188642708e-07, -5.189777425584907e-07, -4.903952230961295e-07, -4.618126467903494e-07, -4.3323009890627873e-07, -4.0464755102220806e-07, -3.7606497471642797e-07, -3.474824268323573e-07, -3.1889987894828664e-07, -2.9031730264250655e-07, -2.617347547584359e-07, -2.3315220687436522e-07, -2.0456965899029456e-07, -1.7598709689536918e-07, -1.474045348004438e-07, -1.1882198691637313e-07, -9.023943903230247e-08, -6.165687693737709e-08, -3.307431484245171e-08, -4.4917101149621885e-09, 2.4090844874535833e-08, 5.2673399864033854e-08, 8.125595485353188e-08, 1.098385098430299e-07, 1.3842105772710056e-07, 1.6700361982202594e-07, 1.9558618191695132e-07, 2.2416872980102198e-07, 2.5275127768509265e-07, 2.813338255691633e-07, 3.099164018749434e-07, 3.3849894975901407e-07, 3.6708149764308473e-07, 3.956640739488648e-07, 4.242466218329355e-07, 4.5282916971700615e-07, 4.814117460227862e-07, 5.099942654851475e-07, 5.385768417909276e-07, 5.671594180967077e-07, 5.957419375590689e-07, 6.24324513864849e-07, 6.529070333272102e-07, 6.814896096329903e-07, 7.100721859387704e-07, 7.386547054011317e-07, 7.672372817069117e-07, 7.95819801169273e-07, 8.244023774750531e-07, 8.529849537808332e-07, 8.815675300866133e-07, 9.101500495489745e-07]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 0.0, 17.0, 11.0, 23.0, 38.0, 58.0, 84.0, 114.0, 0.0, 187.0, 306.0, 485.0, 725.0, 1203.0, 1957.0, 3213.0, 0.0, 5390.0, 9466.0, 16576.0, 30240.0, 55924.0, 103040.0, 178547.0, 0.0, 233615.0, 178373.0, 102579.0, 55885.0, 30282.0, 16839.0, 9463.0, 0.0, 5511.0, 3205.0, 1924.0, 1206.0, 767.0, 471.0, 300.0, 0.0, 197.0, 104.0, 73.0, 65.0, 37.0, 24.0, 10.0, 0.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.6689300537109375e-06, -1.6167759895324707e-06, -1.564621925354004e-06, -1.5124678611755371e-06, -1.4603137969970703e-06, -1.4081597328186035e-06, -1.3560056686401367e-06, -1.30385160446167e-06, -1.2516975402832031e-06, -1.1995434761047363e-06, -1.1473894119262695e-06, -1.0952353477478027e-06, -1.043081283569336e-06, -9.909272193908691e-07, -9.387731552124023e-07, -8.866190910339355e-07, -8.344650268554688e-07, -7.82310962677002e-07, -7.301568984985352e-07, -6.780028343200684e-07, -6.258487701416016e-07, -5.736947059631348e-07, -5.21540641784668e-07, -4.6938657760620117e-07, -4.172325134277344e-07, -3.650784492492676e-07, -3.129243850708008e-07, -2.60770320892334e-07, -2.086162567138672e-07, -1.564621925354004e-07, -1.043081283569336e-07, -5.21540641784668e-08, 0.0, 5.21540641784668e-08, 1.043081283569336e-07, 1.564621925354004e-07, 2.086162567138672e-07, 2.60770320892334e-07, 3.129243850708008e-07, 3.650784492492676e-07, 4.172325134277344e-07, 4.6938657760620117e-07, 5.21540641784668e-07, 5.736947059631348e-07, 6.258487701416016e-07, 6.780028343200684e-07, 7.301568984985352e-07, 7.82310962677002e-07, 8.344650268554688e-07, 8.866190910339355e-07, 9.387731552124023e-07, 9.909272193908691e-07, 1.043081283569336e-06, 1.0952353477478027e-06, 1.1473894119262695e-06, 1.1995434761047363e-06, 1.2516975402832031e-06, 1.30385160446167e-06, 1.3560056686401367e-06, 1.4081597328186035e-06, 1.4603137969970703e-06, 1.5124678611755371e-06, 1.564621925354004e-06, 1.6167759895324707e-06, 1.6689300537109375e-06]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 5.0, 0.0, 10.0, 0.0, 0.0, 14.0, 0.0, 17.0, 0.0, 32.0, 0.0, 0.0, 43.0, 0.0, 49.0, 0.0, 0.0, 81.0, 0.0, 79.0, 0.0, 99.0, 0.0, 0.0, 122.0, 0.0, 122.0, 0.0, 83.0, 0.0, 0.0, 84.0, 0.0, 66.0, 0.0, 0.0, 41.0, 0.0, 24.0, 0.0, 19.0, 0.0, 0.0, 12.0, 0.0, 3.0, 0.0, 5.0, 0.0, 0.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-07, -8.093193173408508e-07, -7.841736078262329e-07, -7.59027898311615e-07, -7.338821887969971e-07, -7.087364792823792e-07, -6.835907697677612e-07, -6.584450602531433e-07, -6.332993507385254e-07, -6.081536412239075e-07, -5.830079317092896e-07, -5.578622221946716e-07, -5.327165126800537e-07, -5.075708031654358e-07, -4.824250936508179e-07, -4.5727938413619995e-07, -4.3213367462158203e-07, -4.069879651069641e-07, -3.818422555923462e-07, -3.5669654607772827e-07, -3.3155083656311035e-07, -3.0640512704849243e-07, -2.812594175338745e-07, -2.561137080192566e-07, -2.3096799850463867e-07, -2.0582228899002075e-07, -1.8067657947540283e-07, -1.555308699607849e-07, -1.30385160446167e-07, -1.0523945093154907e-07, -8.009374141693115e-08, -5.494803190231323e-08, -2.9802322387695312e-08, -4.6566128730773926e-09, 2.0489096641540527e-08, 4.563480615615845e-08, 7.078051567077637e-08, 9.592622518539429e-08, 1.210719347000122e-07, 1.4621764421463013e-07, 1.7136335372924805e-07, 1.9650906324386597e-07, 2.2165477275848389e-07, 2.468004822731018e-07, 2.7194619178771973e-07, 2.9709190130233765e-07, 3.2223761081695557e-07, 3.473833203315735e-07, 3.725290298461914e-07, 3.976747393608093e-07, 4.2282044887542725e-07, 4.4796615839004517e-07, 4.731118679046631e-07, 4.98257577419281e-07, 5.234032869338989e-07, 5.485489964485168e-07, 5.736947059631348e-07, 5.988404154777527e-07, 6.239861249923706e-07, 6.491318345069885e-07, 6.742775440216064e-07, 6.994232535362244e-07, 7.245689630508423e-07, 7.497146725654602e-07, 7.748603820800781e-07]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 8.0, 2.0, 0.0, 6.0, 13.0, 18.0, 28.0, 38.0, 0.0, 63.0, 120.0, 228.0, 301.0, 521.0, 792.0, 0.0, 1320.0, 2234.0, 3692.0, 6688.0, 11250.0, 0.0, 19553.0, 33436.0, 59013.0, 102384.0, 165107.0, 0.0, 235100.0, 165469.0, 102189.0, 58385.0, 33958.0, 19395.0, 0.0, 11072.0, 6589.0, 3663.0, 2269.0, 1457.0, 0.0, 778.0, 547.0, 335.0, 215.0, 126.0, 68.0, 0.0, 54.0, 34.0, 13.0, 19.0, 7.0, 0.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6093254089355469e-06, -1.559033989906311e-06, -1.5087425708770752e-06, -1.4584511518478394e-06, -1.4081597328186035e-06, -1.3578683137893677e-06, -1.3075768947601318e-06, -1.257285475730896e-06, -1.2069940567016602e-06, -1.1567026376724243e-06, -1.1064112186431885e-06, -1.0561197996139526e-06, -1.0058283805847168e-06, -9.55536961555481e-07, -9.052455425262451e-07, -8.549541234970093e-07, -8.046627044677734e-07, -7.543712854385376e-07, -7.040798664093018e-07, -6.537884473800659e-07, -6.034970283508301e-07, -5.532056093215942e-07, -5.029141902923584e-07, -4.5262277126312256e-07, -4.023313522338867e-07, -3.520399332046509e-07, -3.0174851417541504e-07, -2.514570951461792e-07, -2.0116567611694336e-07, -1.5087425708770752e-07, -1.0058283805847168e-07, -5.029141902923584e-08, 0.0, 5.029141902923584e-08, 1.0058283805847168e-07, 1.5087425708770752e-07, 2.0116567611694336e-07, 2.514570951461792e-07, 3.0174851417541504e-07, 3.520399332046509e-07, 4.023313522338867e-07, 4.5262277126312256e-07, 5.029141902923584e-07, 5.532056093215942e-07, 6.034970283508301e-07, 6.537884473800659e-07, 7.040798664093018e-07, 7.543712854385376e-07, 8.046627044677734e-07, 8.549541234970093e-07, 9.052455425262451e-07, 9.55536961555481e-07, 1.0058283805847168e-06, 1.0561197996139526e-06, 1.1064112186431885e-06, 1.1567026376724243e-06, 1.2069940567016602e-06, 1.257285475730896e-06, 1.3075768947601318e-06, 1.3578683137893677e-06, 1.4081597328186035e-06, 1.4584511518478394e-06, 1.5087425708770752e-06, 1.559033989906311e-06, 1.6093254089355469e-06]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 8.0, 0.0, 0.0, 26.0, 0.0, 0.0, 0.0, 51.0, 0.0, 0.0, 72.0, 0.0, 0.0, 124.0, 0.0, 0.0, 0.0, 134.0, 0.0, 0.0, 145.0, 0.0, 0.0, 0.0, 136.0, 0.0, 0.0, 130.0, 0.0, 0.0, 85.0, 0.0, 0.0, 0.0, 54.0, 0.0, 0.0, 26.0, 0.0, 0.0, 20.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.960464477539062e-07, -5.783513188362122e-07, -5.606561899185181e-07, -5.42961061000824e-07, -5.252659320831299e-07, -5.075708031654358e-07, -4.898756742477417e-07, -4.721805453300476e-07, -4.544854164123535e-07, -4.367902874946594e-07, -4.1909515857696533e-07, -4.0140002965927124e-07, -3.8370490074157715e-07, -3.6600977182388306e-07, -3.4831464290618896e-07, -3.3061951398849487e-07, -3.129243850708008e-07, -2.952292561531067e-07, -2.775341272354126e-07, -2.598389983177185e-07, -2.421438694000244e-07, -2.2444874048233032e-07, -2.0675361156463623e-07, -1.8905848264694214e-07, -1.7136335372924805e-07, -1.5366822481155396e-07, -1.3597309589385986e-07, -1.1827796697616577e-07, -1.0058283805847168e-07, -8.288770914077759e-08, -6.51925802230835e-08, -4.7497451305389404e-08, -2.9802322387695312e-08, -1.210719347000122e-08, 5.587935447692871e-09, 2.3283064365386963e-08, 4.0978193283081055e-08, 5.8673322200775146e-08, 7.636845111846924e-08, 9.406358003616333e-08, 1.1175870895385742e-07, 1.2945383787155151e-07, 1.471489667892456e-07, 1.648440957069397e-07, 1.825392246246338e-07, 2.0023435354232788e-07, 2.1792948246002197e-07, 2.3562461137771606e-07, 2.5331974029541016e-07, 2.7101486921310425e-07, 2.8870999813079834e-07, 3.0640512704849243e-07, 3.241002559661865e-07, 3.417953848838806e-07, 3.594905138015747e-07, 3.771856427192688e-07, 3.948807716369629e-07, 4.12575900554657e-07, 4.302710294723511e-07, 4.4796615839004517e-07, 4.6566128730773926e-07, 4.833564162254333e-07, 5.010515451431274e-07, 5.187466740608215e-07, 5.364418029785156e-07]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1048576.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1024.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0], "bins": [0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 12.0, 12.0, 9.0, 17.0, 11.0, 21.0, 31.0, 41.0, 52.0, 60.0, 77.0, 104.0, 107.0, 98.0, 67.0, 60.0, 49.0, 34.0, 28.0, 31.0, 15.0, 14.0, 11.0, 7.0, 6.0, 10.0, 2.0, 6.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2852927966378047e-06, -1.2400645346133388e-06, -1.194836158902035e-06, -1.1496078968775691e-06, -1.1043796348531032e-06, -1.0591513728286372e-06, -1.0139229971173336e-06, -9.686947350928676e-07, -9.234664162249828e-07, -8.78238097357098e-07, -8.330098353326321e-07, -7.877815164647473e-07, -7.425531975968624e-07, -6.973249355723965e-07, -6.520966167045117e-07, -6.068682978366269e-07, -5.616400358121609e-07, -5.164117169442761e-07, -4.711834549198102e-07, -4.2595513605192536e-07, -3.8072684560575e-07, -3.354985551595746e-07, -2.902702362916898e-07, -2.450419458455144e-07, -1.9981365539933904e-07, -1.5458536495316366e-07, -1.0935706029613357e-07, -6.412875563910347e-08, -1.8900465192928095e-08, 2.6327825253247283e-08, 7.155614412113209e-08, 1.1678443456730747e-07, 1.6201272501348285e-07, 2.0724101545965823e-07, 2.524693059058336e-07, 2.976976247737184e-07, 3.429259152198938e-07, 3.881542056660692e-07, 4.33382524533954e-07, 4.786107865584199e-07, 5.238391054263047e-07, 5.690674242941895e-07, 6.142956863186555e-07, 6.595240051865403e-07, 7.047523240544251e-07, 7.499805860788911e-07, 7.952089049467759e-07, 8.404372238146607e-07, 8.856654858391266e-07, 9.308938047070114e-07, 9.761221235748962e-07, 1.0213503855993622e-06, 1.0665786476238281e-06, 1.1118070233351318e-06, 1.1570352853595978e-06, 1.2022635473840637e-06, 1.2474918094085297e-06, 1.2927200714329956e-06, 1.3379484471442993e-06, 1.3831767091687652e-06, 1.4284049711932312e-06, 1.4736333469045348e-06, 1.5188616089290008e-06, 1.5640898709534667e-06, 1.6093182466647704e-06]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 7.0, 6.0, 9.0, 16.0, 14.0, 23.0, 18.0, 22.0, 31.0, 30.0, 40.0, 23.0, 34.0, 43.0, 39.0, 32.0, 36.0, 63.0, 51.0, 48.0, 43.0, 44.0, 41.0, 46.0, 30.0, 23.0, 22.0, 27.0, 16.0, 37.0, 13.0, 11.0, 14.0, 7.0, 7.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.888183285511332e-07, -9.595192977940314e-07, -9.302203807237674e-07, -9.009213499666657e-07, -8.716223760529829e-07, -8.423234021393e-07, -8.130244282256172e-07, -7.837254543119343e-07, -7.544264803982514e-07, -7.251275064845686e-07, -6.958285325708857e-07, -6.665295586572029e-07, -6.372305279001012e-07, -6.079315539864183e-07, -5.786325800727354e-07, -5.493336061590526e-07, -5.200346322453697e-07, -4.907356583316869e-07, -4.614366559962946e-07, -4.321376820826117e-07, -4.0283870816892886e-07, -3.7353970583353657e-07, -3.442407319198537e-07, -3.1494175800617086e-07, -2.8564272724906914e-07, -2.563437533353863e-07, -2.270447652108487e-07, -1.9774577708631114e-07, -1.6844680317262828e-07, -1.391478150480907e-07, -1.0984882692355313e-07, -8.054985300987028e-08, -5.125087909618742e-08, -2.1951896300720364e-08, 7.347086494746691e-09, 3.6646071066570585e-08, 6.59450520856808e-08, 9.524403310479101e-08, 1.245430212293286e-07, 1.5384199514301145e-07, 1.8314098326754902e-07, 2.124399713920866e-07, 2.4173894530576945e-07, 2.7103794764116174e-07, 3.003369215548446e-07, 3.2963589546852745e-07, 3.589348693822103e-07, 3.8823384329589317e-07, 4.1753284563128545e-07, 4.468318195449683e-07, 4.761308218803606e-07, 5.054297957940435e-07, 5.347287697077263e-07, 5.640277436214092e-07, 5.93326717535092e-07, 6.226257482921937e-07, 6.519247222058766e-07, 6.812236961195595e-07, 7.105226700332423e-07, 7.398216439469252e-07, 7.691206747040269e-07, 7.984196486177098e-07, 8.277186225313926e-07, 8.570175964450755e-07, 8.863165703587583e-07]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 6.0, 6.0, 7.0, 19.0, 15.0, 23.0, 23.0, 35.0, 36.0, 54.0, 53.0, 67.0, 62.0, 83.0, 73.0, 102.0, 131.0, 244.0, 520729.0, 1498.0, 203.0, 110.0, 90.0, 94.0, 87.0, 89.0, 49.0, 55.0, 47.0, 29.0, 40.0, 22.0, 24.0, 14.0, 12.0, 9.0, 5.0, 6.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3836129912524484e-05, -2.3132000933401287e-05, -2.242787195427809e-05, -2.172374297515489e-05, -2.1019615815021098e-05, -2.03154868358979e-05, -1.9611357856774703e-05, -1.8907228877651505e-05, -1.8203099898528308e-05, -1.749897091940511e-05, -1.6794841940281913e-05, -1.6090712961158715e-05, -1.5386583982035518e-05, -1.4682455912407022e-05, -1.3978327842778526e-05, -1.3274198863655329e-05, -1.2570069884532131e-05, -1.1865940905408934e-05, -1.1161811926285736e-05, -1.045768385665724e-05, -9.753554877534043e-06, -9.049425898410846e-06, -8.34529782878235e-06, -7.641168849659152e-06, -6.937039870535955e-06, -6.232910891412757e-06, -5.528782367036911e-06, -4.824653842661064e-06, -4.120524863537867e-06, -3.4163961117883446e-06, -2.7122673600388225e-06, -2.008138835662976e-06, -1.304011675529182e-06, -5.998829237796599e-07, 1.0424582796986215e-07, 8.083745797193842e-07, 1.5125033314689063e-06, 2.2166320832184283e-06, 2.9207608349679504e-06, 3.624889359343797e-06, 4.3290183384669945e-06, 5.033147317590192e-06, 5.7372758419660386e-06, 6.441404366341885e-06, 7.145533345465083e-06, 7.84966232458828e-06, 8.553790394216776e-06, 9.257919373339973e-06, 9.962048352463171e-06, 1.0666177331586368e-05, 1.1370306310709566e-05, 1.2074434380338062e-05, 1.2778563359461259e-05, 1.3482692338584457e-05, 1.4186820408212952e-05, 1.489094938733615e-05, 1.5595078366459347e-05, 1.6299207345582545e-05, 1.7003336324705742e-05, 1.770746530382894e-05, 1.8411592463962734e-05, 1.911572144308593e-05, 1.981985042220913e-05, 2.0523979401332326e-05, 2.1228108380455524e-05]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 7.0, 6.0, 15.0, 13.0, 18.0, 22.0, 18.0, 31.0, 27.0, 44.0, 26.0, 31.0, 38.0, 46.0, 31.0, 33.0, 1077.0, 62.0, 42.0, 46.0, 45.0, 42.0, 39.0, 43.0, 15.0, 33.0, 23.0, 19.0, 29.0, 22.0, 10.0, 14.0, 11.0, 5.0, 7.0, 4.0, 1.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.9159618861740455e-05, -2.83007939287927e-05, -2.744197081483435e-05, -2.6583147700875998e-05, -2.5724322767928243e-05, -2.4865497834980488e-05, -2.4006674721022137e-05, -2.3147851607063785e-05, -2.228902667411603e-05, -2.1430201741168275e-05, -2.0571378627209924e-05, -1.9712555513251573e-05, -1.8853730580303818e-05, -1.7994905647356063e-05, -1.7136082533397712e-05, -1.627725941943936e-05, -1.5418434486491606e-05, -1.4559610463038553e-05, -1.37007864395855e-05, -1.2841962416132446e-05, -1.1983138392679393e-05, -1.112431436922634e-05, -1.0265490345773287e-05, -9.406666322320234e-06, -8.547842298867181e-06, -7.689018275414128e-06, -6.830194251961075e-06, -5.971370228508022e-06, -5.112546205054969e-06, -4.2537221816019155e-06, -3.3948981581488624e-06, -2.5360741346958093e-06, -1.6772519302321598e-06, -8.184279067791067e-07, 4.039611667394638e-08, 8.992201401269995e-07, 1.7580441635800526e-06, 2.6168681870331056e-06, 3.4756922104861587e-06, 4.334516233939212e-06, 5.193340257392265e-06, 6.052164280845318e-06, 6.910988304298371e-06, 7.769812327751424e-06, 8.628636351204477e-06, 9.48746037465753e-06, 1.0346284398110583e-05, 1.1205108421563637e-05, 1.206393244501669e-05, 1.2922756468469743e-05, 1.3781580491922796e-05, 1.4640404515375849e-05, 1.5499228538828902e-05, 1.6358051652787253e-05, 1.7216876585735008e-05, 1.8075701518682763e-05, 1.8934524632641114e-05, 1.9793347746599466e-05, 2.065217267954722e-05, 2.1510997612494975e-05, 2.2369820726453327e-05, 2.3228643840411678e-05, 2.4087468773359433e-05, 2.4946293706307188e-05, 2.580511682026554e-05]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 6.0, 8.0, 15.0, 4.0, 4.0, 18.0, 16.0, 26.0, 28.0, 32.0, 45.0, 54.0, 80.0, 103.0, 173.0, 237.0, 405.0, 653.0, 979.0, 1399.0, 2013.0, 2829.0, 3932.0, 5157.0, 6329.0, 8034.0, 10883.0, 19243.0, 29995964.0, 1087955.0, 39173.0, 56244.0, 5352.0, 4692.0, 1530.0, 366.0, 214.0, 207.0, 187.0, 32.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-377.75, -369.16015625, -360.5703125, -351.98046875, -343.390625, -334.80078125, -326.2109375, -317.62109375, -309.03125, -300.44140625, -291.8515625, -283.26171875, -274.671875, -266.08203125, -257.4921875, -248.90234375, -240.3125, -231.72265625, -223.1328125, -214.54296875, -205.953125, -197.36328125, -188.7734375, -180.18359375, -171.59375, -163.00390625, -154.4140625, -145.82421875, -137.234375, -128.64453125, -120.0546875, -111.46484375, -102.875, -94.28515625, -85.6953125, -77.10546875, -68.515625, -59.92578125, -51.3359375, -42.74609375, -34.15625, -25.56640625, -16.9765625, -8.38671875, 0.203125, 8.79296875, 17.3828125, 25.97265625, 34.5625, 43.15234375, 51.7421875, 60.33203125, 68.921875, 77.51171875, 86.1015625, 94.69140625, 103.28125, 111.87109375, 120.4609375, 129.05078125, 137.640625, 146.23046875, 154.8203125, 163.41015625, 172.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [6.0, 2.0, 4.0, 4.0, 18.0, 13.0, 24.0, 34.0, 23.0, 39.0, 57.0, 66.0, 85.0, 167.0, 203.0, 316.0, 452.0, 650.0, 1068.0, 1512.0, 2317.0, 3332.0, 5364.0, 8702.0, 14519.0, 25674.0, 48271.0, 101153.0, 245034.0, 753132.0, 2997798.0, 1405683.0, 382272.0, 145525.0, 65772.0, 33575.0, 18572.0, 10861.0, 6603.0, 4131.0, 2697.0, 1813.0, 1223.0, 797.0, 569.0, 377.0, 289.0, 168.0, 143.0, 108.0, 75.0, 50.0, 34.0, 20.0, 19.0, 15.0, 10.0, 1.0, 2.0, 4.0, 5.0, 0.0, 3.0, 1.0], "bins": [-46.03125, -44.53271484375, -43.0341796875, -41.53564453125, -40.037109375, -38.53857421875, -37.0400390625, -35.54150390625, -34.04296875, -32.54443359375, -31.0458984375, -29.54736328125, -28.048828125, -26.55029296875, -25.0517578125, -23.55322265625, -22.0546875, -20.55615234375, -19.0576171875, -17.55908203125, -16.060546875, -14.56201171875, -13.0634765625, -11.56494140625, -10.06640625, -8.56787109375, -7.0693359375, -5.57080078125, -4.072265625, -2.57373046875, -1.0751953125, 0.42333984375, 1.921875, 3.42041015625, 4.9189453125, 6.41748046875, 7.916015625, 9.41455078125, 10.9130859375, 12.41162109375, 13.91015625, 15.40869140625, 16.9072265625, 18.40576171875, 19.904296875, 21.40283203125, 22.9013671875, 24.39990234375, 25.8984375, 27.39697265625, 28.8955078125, 30.39404296875, 31.892578125, 33.39111328125, 34.8896484375, 36.38818359375, 37.88671875, 39.38525390625, 40.8837890625, 42.38232421875, 43.880859375, 45.37939453125, 46.8779296875, 48.37646484375, 49.875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 3.0, 2.0, 5.0, 4.0, 12.0, 14.0, 8.0, 15.0, 20.0, 24.0, 27.0, 45.0, 50.0, 72.0, 70.0, 110.0, 169.0, 223.0, 307.0, 239.0, 149.0, 74.0, 63.0, 63.0, 46.0, 32.0, 30.0, 24.0, 21.0, 13.0, 19.0, 18.0, 7.0, 14.0, 4.0, 3.0, 8.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-48.8125, -47.37158203125, -45.9306640625, -44.48974609375, -43.048828125, -41.60791015625, -40.1669921875, -38.72607421875, -37.28515625, -35.84423828125, -34.4033203125, -32.96240234375, -31.521484375, -30.08056640625, -28.6396484375, -27.19873046875, -25.7578125, -24.31689453125, -22.8759765625, -21.43505859375, -19.994140625, -18.55322265625, -17.1123046875, -15.67138671875, -14.23046875, -12.78955078125, -11.3486328125, -9.90771484375, -8.466796875, -7.02587890625, -5.5849609375, -4.14404296875, -2.703125, -1.26220703125, 0.1787109375, 1.61962890625, 3.060546875, 4.50146484375, 5.9423828125, 7.38330078125, 8.82421875, 10.26513671875, 11.7060546875, 13.14697265625, 14.587890625, 16.02880859375, 17.4697265625, 18.91064453125, 20.3515625, 21.79248046875, 23.2333984375, 24.67431640625, 26.115234375, 27.55615234375, 28.9970703125, 30.43798828125, 31.87890625, 33.31982421875, 34.7607421875, 36.20166015625, 37.642578125, 39.08349609375, 40.5244140625, 41.96533203125, 43.40625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 9.0, 16.0, 35.0, 35.0, 36.0, 64.0, 98.0, 153.0, 210.0, 311.0, 457.0, 616.0, 827.0, 1268.0, 1805.0, 2469.0, 3679.0, 5467.0, 8813.0, 14128.0, 22446.0, 37873.0, 66999.0, 122756.0, 243975.0, 517882.0, 1410112.0, 2377736.0, 745239.0, 331127.0, 164722.0, 85842.0, 48125.0, 28038.0, 16716.0, 10368.0, 6678.0, 4409.0, 3020.0, 1987.0, 1435.0, 987.0, 732.0, 523.0, 354.0, 250.0, 186.0, 132.0, 84.0, 57.0, 42.0, 32.0, 24.0, 11.0, 14.0, 12.0, 6.0, 6.0], "bins": [-25.34375, -24.5810546875, -23.818359375, -23.0556640625, -22.29296875, -21.5302734375, -20.767578125, -20.0048828125, -19.2421875, -18.4794921875, -17.716796875, -16.9541015625, -16.19140625, -15.4287109375, -14.666015625, -13.9033203125, -13.140625, -12.3779296875, -11.615234375, -10.8525390625, -10.08984375, -9.3271484375, -8.564453125, -7.8017578125, -7.0390625, -6.2763671875, -5.513671875, -4.7509765625, -3.98828125, -3.2255859375, -2.462890625, -1.7001953125, -0.9375, -0.1748046875, 0.587890625, 1.3505859375, 2.11328125, 2.8759765625, 3.638671875, 4.4013671875, 5.1640625, 5.9267578125, 6.689453125, 7.4521484375, 8.21484375, 8.9775390625, 9.740234375, 10.5029296875, 11.265625, 12.0283203125, 12.791015625, 13.5537109375, 14.31640625, 15.0791015625, 15.841796875, 16.6044921875, 17.3671875, 18.1298828125, 18.892578125, 19.6552734375, 20.41796875, 21.1806640625, 21.943359375, 22.7060546875, 23.46875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 9.0, 8.0, 10.0, 7.0, 9.0, 11.0, 14.0, 15.0, 24.0, 28.0, 27.0, 34.0, 55.0, 74.0, 109.0, 187.0, 395.0, 446.0, 146.0, 75.0, 62.0, 54.0, 44.0, 39.0, 25.0, 20.0, 20.0, 15.0, 9.0, 10.0, 7.0, 5.0, 5.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.5, -90.6103515625, -87.720703125, -84.8310546875, -81.94140625, -79.0517578125, -76.162109375, -73.2724609375, -70.3828125, -67.4931640625, -64.603515625, -61.7138671875, -58.82421875, -55.9345703125, -53.044921875, -50.1552734375, -47.265625, -44.3759765625, -41.486328125, -38.5966796875, -35.70703125, -32.8173828125, -29.927734375, -27.0380859375, -24.1484375, -21.2587890625, -18.369140625, -15.4794921875, -12.58984375, -9.7001953125, -6.810546875, -3.9208984375, -1.03125, 1.8583984375, 4.748046875, 7.6376953125, 10.52734375, 13.4169921875, 16.306640625, 19.1962890625, 22.0859375, 24.9755859375, 27.865234375, 30.7548828125, 33.64453125, 36.5341796875, 39.423828125, 42.3134765625, 45.203125, 48.0927734375, 50.982421875, 53.8720703125, 56.76171875, 59.6513671875, 62.541015625, 65.4306640625, 68.3203125, 71.2099609375, 74.099609375, 76.9892578125, 79.87890625, 82.7685546875, 85.658203125, 88.5478515625, 91.4375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 4.0, 5.0, 5.0, 6.0, 5.0, 12.0, 10.0, 15.0, 20.0, 28.0, 17.0, 28.0, 64.0, 64.0, 84.0, 114.0, 182.0, 258.0, 497.0, 1006.0, 2191.0, 4820.0, 13365.0, 48183.0, 283104.0, 5806576.0, 94266.0, 22691.0, 7617.0, 3013.0, 1326.0, 659.0, 403.0, 244.0, 161.0, 84.0, 55.0, 60.0, 46.0, 46.0, 27.0, 10.0, 10.0, 13.0, 12.0, 6.0, 1.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 6.0, 3.0], "bins": [-168.75, -163.513671875, -158.27734375, -153.041015625, -147.8046875, -142.568359375, -137.33203125, -132.095703125, -126.859375, -121.623046875, -116.38671875, -111.150390625, -105.9140625, -100.677734375, -95.44140625, -90.205078125, -84.96875, -79.732421875, -74.49609375, -69.259765625, -64.0234375, -58.787109375, -53.55078125, -48.314453125, -43.078125, -37.841796875, -32.60546875, -27.369140625, -22.1328125, -16.896484375, -11.66015625, -6.423828125, -1.1875, 4.048828125, 9.28515625, 14.521484375, 19.7578125, 24.994140625, 30.23046875, 35.466796875, 40.703125, 45.939453125, 51.17578125, 56.412109375, 61.6484375, 66.884765625, 72.12109375, 77.357421875, 82.59375, 87.830078125, 93.06640625, 98.302734375, 103.5390625, 108.775390625, 114.01171875, 119.248046875, 124.484375, 129.720703125, 134.95703125, 140.193359375, 145.4296875, 150.666015625, 155.90234375, 161.138671875, 166.375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 8.0, 2.0, 7.0, 7.0, 18.0, 23.0, 22.0, 35.0, 25.0, 35.0, 37.0, 54.0, 64.0, 80.0, 304.0, 792.0, 118.0, 76.0, 52.0, 49.0, 31.0, 33.0, 17.0, 19.0, 17.0, 17.0, 17.0, 14.0, 14.0, 4.0, 3.0, 5.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-193.0, -186.654296875, -180.30859375, -173.962890625, -167.6171875, -161.271484375, -154.92578125, -148.580078125, -142.234375, -135.888671875, -129.54296875, -123.197265625, -116.8515625, -110.505859375, -104.16015625, -97.814453125, -91.46875, -85.123046875, -78.77734375, -72.431640625, -66.0859375, -59.740234375, -53.39453125, -47.048828125, -40.703125, -34.357421875, -28.01171875, -21.666015625, -15.3203125, -8.974609375, -2.62890625, 3.716796875, 10.0625, 16.408203125, 22.75390625, 29.099609375, 35.4453125, 41.791015625, 48.13671875, 54.482421875, 60.828125, 67.173828125, 73.51953125, 79.865234375, 86.2109375, 92.556640625, 98.90234375, 105.248046875, 111.59375, 117.939453125, 124.28515625, 130.630859375, 136.9765625, 143.322265625, 149.66796875, 156.013671875, 162.359375, 168.705078125, 175.05078125, 181.396484375, 187.7421875, 194.087890625, 200.43359375, 206.779296875, 213.125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 12.0, 379.0, 607.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14219.568359375, -13824.8173828125, -13430.06640625, -13035.3154296875, -12640.564453125, -12245.8134765625, -11851.0625, -11456.3125, -11061.560546875, -10666.8095703125, -10272.05859375, -9877.3076171875, -9482.556640625, -9087.8056640625, -8693.0546875, -8298.3046875, -7903.5537109375, -7508.802734375, -7114.0517578125, -6719.30078125, -6324.5498046875, -5929.798828125, -5535.04833984375, -5140.29736328125, -4745.54638671875, -4350.79541015625, -3956.04443359375, -3561.293701171875, -3166.542724609375, -2771.791748046875, -2377.041015625, -1982.2900390625, -1587.5390625, -1192.7880859375, -798.0372314453125, -403.286376953125, -8.535400390625, 386.215576171875, 780.96630859375, 1175.71728515625, 1570.46826171875, 1965.21923828125, 2359.97021484375, 2754.720947265625, 3149.471923828125, 3544.222900390625, 3938.9736328125, 4333.724609375, 4728.4755859375, 5123.2265625, 5517.9775390625, 5912.728515625, 6307.4794921875, 6702.23046875, 7096.98095703125, 7491.73193359375, 7886.48291015625, 8281.2333984375, 8675.984375, 9070.7353515625, 9465.486328125, 9860.2373046875, 10254.98828125, 10649.7392578125, 11044.490234375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 11.0, 25.0, 237.0, 654.0, 41.0, 10.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5052.6259765625, -4851.18408203125, -4649.7421875, -4448.30078125, -4246.85888671875, -4045.4169921875, -3843.975341796875, -3642.53369140625, -3441.091796875, -3239.64990234375, -3038.208251953125, -2836.7666015625, -2635.32470703125, -2433.8828125, -2232.441162109375, -2030.9993896484375, -1829.5576171875, -1628.1158447265625, -1426.674072265625, -1225.2322998046875, -1023.79052734375, -822.3487548828125, -620.906982421875, -419.4652099609375, -218.0234375, -16.5816650390625, 184.860107421875, 386.3018798828125, 587.74365234375, 789.1854248046875, 990.627197265625, 1192.0689697265625, 1393.5107421875, 1594.9525146484375, 1796.394287109375, 1997.8360595703125, 2199.27783203125, 2400.7197265625, 2602.161376953125, 2803.60302734375, 3005.044921875, 3206.48681640625, 3407.928466796875, 3609.3701171875, 3810.81201171875, 4012.25390625, 4213.6953125, 4415.13720703125, 4616.5791015625, 4818.02099609375, 5019.462890625, 5220.904296875, 5422.34619140625, 5623.7880859375, 5825.2294921875, 6026.67138671875, 6228.11328125, 6429.55517578125, 6630.9970703125, 6832.4384765625, 7033.88037109375, 7235.322265625, 7436.763671875, 7638.20556640625, 7839.6474609375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 3.0, 10.0, 5.0, 19.0, 25.0, 24.0, 46.0, 54.0, 114.0, 177.0, 246.0, 503.0, 962.0, 2061.0, 5322.0, 19313.0, 286503.0, 3837219.0, 29435.0, 7067.0, 2549.0, 1153.0, 520.0, 319.0, 201.0, 97.0, 70.0, 75.0, 44.0, 32.0, 21.0, 18.0, 20.0, 18.0, 6.0, 7.0, 8.0, 7.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.375, -15.723388671875, -15.07177734375, -14.420166015625, -13.7685546875, -13.116943359375, -12.46533203125, -11.813720703125, -11.162109375, -10.510498046875, -9.85888671875, -9.207275390625, -8.5556640625, -7.904052734375, -7.25244140625, -6.600830078125, -5.94921875, -5.297607421875, -4.64599609375, -3.994384765625, -3.3427734375, -2.691162109375, -2.03955078125, -1.387939453125, -0.736328125, -0.084716796875, 0.56689453125, 1.218505859375, 1.8701171875, 2.521728515625, 3.17333984375, 3.824951171875, 4.4765625, 5.128173828125, 5.77978515625, 6.431396484375, 7.0830078125, 7.734619140625, 8.38623046875, 9.037841796875, 9.689453125, 10.341064453125, 10.99267578125, 11.644287109375, 12.2958984375, 12.947509765625, 13.59912109375, 14.250732421875, 14.90234375, 15.553955078125, 16.20556640625, 16.857177734375, 17.5087890625, 18.160400390625, 18.81201171875, 19.463623046875, 20.115234375, 20.766845703125, 21.41845703125, 22.070068359375, 22.7216796875, 23.373291015625, 24.02490234375, 24.676513671875, 25.328125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 10.0, 12.0, 9.0, 14.0, 21.0, 28.0, 68.0, 589.0, 135.0, 27.0, 16.0, 13.0, 11.0, 10.0, 7.0, 5.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1171875, -3.9619140625, -3.806640625, -3.6513671875, -3.49609375, -3.3408203125, -3.185546875, -3.0302734375, -2.875, -2.7197265625, -2.564453125, -2.4091796875, -2.25390625, -2.0986328125, -1.943359375, -1.7880859375, -1.6328125, -1.4775390625, -1.322265625, -1.1669921875, -1.01171875, -0.8564453125, -0.701171875, -0.5458984375, -0.390625, -0.2353515625, -0.080078125, 0.0751953125, 0.23046875, 0.3857421875, 0.541015625, 0.6962890625, 0.8515625, 1.0068359375, 1.162109375, 1.3173828125, 1.47265625, 1.6279296875, 1.783203125, 1.9384765625, 2.09375, 2.2490234375, 2.404296875, 2.5595703125, 2.71484375, 2.8701171875, 3.025390625, 3.1806640625, 3.3359375, 3.4912109375, 3.646484375, 3.8017578125, 3.95703125, 4.1123046875, 4.267578125, 4.4228515625, 4.578125, 4.7333984375, 4.888671875, 5.0439453125, 5.19921875, 5.3544921875, 5.509765625, 5.6650390625, 5.8203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 15.0, 14.0, 14.0, 39.0, 69.0, 118.0, 261.0, 609.0, 1812.0, 7010.0, 40036.0, 810046.0, 3260219.0, 61721.0, 8998.0, 2087.0, 638.0, 271.0, 117.0, 66.0, 42.0, 22.0, 19.0, 14.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.1875, -23.535888671875, -22.88427734375, -22.232666015625, -21.5810546875, -20.929443359375, -20.27783203125, -19.626220703125, -18.974609375, -18.322998046875, -17.67138671875, -17.019775390625, -16.3681640625, -15.716552734375, -15.06494140625, -14.413330078125, -13.76171875, -13.110107421875, -12.45849609375, -11.806884765625, -11.1552734375, -10.503662109375, -9.85205078125, -9.200439453125, -8.548828125, -7.897216796875, -7.24560546875, -6.593994140625, -5.9423828125, -5.290771484375, -4.63916015625, -3.987548828125, -3.3359375, -2.684326171875, -2.03271484375, -1.381103515625, -0.7294921875, -0.077880859375, 0.57373046875, 1.225341796875, 1.876953125, 2.528564453125, 3.18017578125, 3.831787109375, 4.4833984375, 5.135009765625, 5.78662109375, 6.438232421875, 7.08984375, 7.741455078125, 8.39306640625, 9.044677734375, 9.6962890625, 10.347900390625, 10.99951171875, 11.651123046875, 12.302734375, 12.954345703125, 13.60595703125, 14.257568359375, 14.9091796875, 15.560791015625, 16.21240234375, 16.864013671875, 17.515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 6.0, 6.0, 4.0, 9.0, 21.0, 18.0, 15.0, 32.0, 36.0, 54.0, 72.0, 108.0, 154.0, 324.0, 822.0, 1428.0, 394.0, 218.0, 119.0, 68.0, 49.0, 26.0, 29.0, 14.0, 19.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.662109375, -3.522491455078125, -3.38287353515625, -3.243255615234375, -3.1036376953125, -2.964019775390625, -2.82440185546875, -2.684783935546875, -2.545166015625, -2.405548095703125, -2.26593017578125, -2.126312255859375, -1.9866943359375, -1.847076416015625, -1.70745849609375, -1.567840576171875, -1.42822265625, -1.288604736328125, -1.14898681640625, -1.009368896484375, -0.8697509765625, -0.730133056640625, -0.59051513671875, -0.450897216796875, -0.311279296875, -0.171661376953125, -0.03204345703125, 0.107574462890625, 0.2471923828125, 0.386810302734375, 0.52642822265625, 0.666046142578125, 0.8056640625, 0.945281982421875, 1.08489990234375, 1.224517822265625, 1.3641357421875, 1.503753662109375, 1.64337158203125, 1.782989501953125, 1.922607421875, 2.062225341796875, 2.20184326171875, 2.341461181640625, 2.4810791015625, 2.620697021484375, 2.76031494140625, 2.899932861328125, 3.03955078125, 3.179168701171875, 3.31878662109375, 3.458404541015625, 3.5980224609375, 3.737640380859375, 3.87725830078125, 4.016876220703125, 4.156494140625, 4.296112060546875, 4.43572998046875, 4.575347900390625, 4.7149658203125, 4.854583740234375, 4.99420166015625, 5.133819580078125, 5.2734375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 17.0, 78.0, 470.0, 374.0, 43.0, 11.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-87.3570556640625, -83.54649353027344, -79.73592376708984, -75.92535400390625, -72.11479187011719, -68.30422973632812, -64.49365997314453, -60.6830940246582, -56.872528076171875, -53.06196212768555, -49.25139617919922, -45.44083023071289, -41.63026428222656, -37.819698333740234, -34.009132385253906, -30.198566436767578, -26.38800048828125, -22.577434539794922, -18.766868591308594, -14.956302642822266, -11.145736694335938, -7.335170745849609, -3.5246047973632812, 0.2859611511230469, 4.096527099609375, 7.907093048095703, 11.717658996582031, 15.52822494506836, 19.338790893554688, 23.149356842041016, 26.959922790527344, 30.770488739013672, 34.5810546875, 38.39162063598633, 42.202186584472656, 46.012752532958984, 49.82331848144531, 53.63388442993164, 57.44445037841797, 61.2550163269043, 65.06558227539062, 68.87614440917969, 72.68671417236328, 76.49728393554688, 80.30784606933594, 84.118408203125, 87.9289779663086, 91.73954772949219, 95.55010986328125, 99.36067199707031, 103.1712417602539, 106.9818115234375, 110.79237365722656, 114.60293579101562, 118.41350555419922, 122.22407531738281, 126.03463745117188, 129.84519958496094, 133.65576171875, 137.46633911132812, 141.2769012451172, 145.08746337890625, 148.89804077148438, 152.70860290527344, 156.5191650390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 18.0, 22.0, 28.0, 53.0, 54.0, 76.0, 87.0, 119.0, 91.0, 122.0, 89.0, 67.0, 59.0, 31.0, 32.0, 21.0, 9.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.208810806274414, -24.011411666870117, -22.81401252746582, -21.616613388061523, -20.419214248657227, -19.22181510925293, -18.0244140625, -16.827014923095703, -15.629616737365723, -14.432217597961426, -13.234818458557129, -12.037418365478516, -10.840019226074219, -9.642620086669922, -8.445220947265625, -7.247821807861328, -6.050422668457031, -4.853023529052734, -3.6556241512298584, -2.4582247734069824, -1.2608256340026855, -0.06342649459838867, 1.1339731216430664, 2.3313722610473633, 3.52877140045166, 4.726170539855957, 5.923569679260254, 7.120969295501709, 8.318368911743164, 9.515768051147461, 10.713167190551758, 11.910566329956055, 13.107963562011719, 14.305362701416016, 15.502761840820312, 16.70016098022461, 17.897560119628906, 19.094959259033203, 20.2923583984375, 21.489757537841797, 22.687156677246094, 23.88455581665039, 25.081954956054688, 26.279354095458984, 27.47675323486328, 28.674152374267578, 29.871551513671875, 31.068950653076172, 32.26634979248047, 33.463748931884766, 34.66114807128906, 35.85854721069336, 37.055946350097656, 38.25334548950195, 39.45074462890625, 40.64814376831055, 41.84554672241211, 43.042945861816406, 44.2403450012207, 45.437744140625, 46.6351432800293, 47.832542419433594, 49.02994155883789, 50.22734069824219, 51.424739837646484]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 5.0, 12.0, 13.0, 18.0, 24.0, 25.0, 46.0, 61.0, 66.0, 105.0, 140.0, 200.0, 320.0, 500.0, 860.0, 1506.0, 2778.0, 6002.0, 15193.0, 51921.0, 857246.0, 77668.0, 18888.0, 7224.0, 3353.0, 1674.0, 957.0, 543.0, 357.0, 257.0, 166.0, 131.0, 77.0, 51.0, 46.0, 23.0, 30.0, 15.0, 12.0, 14.0, 3.0, 12.0, 3.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.5, -17.9326171875, -17.365234375, -16.7978515625, -16.23046875, -15.6630859375, -15.095703125, -14.5283203125, -13.9609375, -13.3935546875, -12.826171875, -12.2587890625, -11.69140625, -11.1240234375, -10.556640625, -9.9892578125, -9.421875, -8.8544921875, -8.287109375, -7.7197265625, -7.15234375, -6.5849609375, -6.017578125, -5.4501953125, -4.8828125, -4.3154296875, -3.748046875, -3.1806640625, -2.61328125, -2.0458984375, -1.478515625, -0.9111328125, -0.34375, 0.2236328125, 0.791015625, 1.3583984375, 1.92578125, 2.4931640625, 3.060546875, 3.6279296875, 4.1953125, 4.7626953125, 5.330078125, 5.8974609375, 6.46484375, 7.0322265625, 7.599609375, 8.1669921875, 8.734375, 9.3017578125, 9.869140625, 10.4365234375, 11.00390625, 11.5712890625, 12.138671875, 12.7060546875, 13.2734375, 13.8408203125, 14.408203125, 14.9755859375, 15.54296875, 16.1103515625, 16.677734375, 17.2451171875, 17.8125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 8.0, 8.0, 12.0, 11.0, 19.0, 23.0, 22.0, 105.0, 506.0, 178.0, 27.0, 15.0, 15.0, 13.0, 7.0, 9.0, 2.0, 1.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.9542236328125, -3.799072265625, -3.6439208984375, -3.48876953125, -3.3336181640625, -3.178466796875, -3.0233154296875, -2.8681640625, -2.7130126953125, -2.557861328125, -2.4027099609375, -2.24755859375, -2.0924072265625, -1.937255859375, -1.7821044921875, -1.626953125, -1.4718017578125, -1.316650390625, -1.1614990234375, -1.00634765625, -0.8511962890625, -0.696044921875, -0.5408935546875, -0.3857421875, -0.2305908203125, -0.075439453125, 0.0797119140625, 0.23486328125, 0.3900146484375, 0.545166015625, 0.7003173828125, 0.85546875, 1.0106201171875, 1.165771484375, 1.3209228515625, 1.47607421875, 1.6312255859375, 1.786376953125, 1.9415283203125, 2.0966796875, 2.2518310546875, 2.406982421875, 2.5621337890625, 2.71728515625, 2.8724365234375, 3.027587890625, 3.1827392578125, 3.337890625, 3.4930419921875, 3.648193359375, 3.8033447265625, 3.95849609375, 4.1136474609375, 4.268798828125, 4.4239501953125, 4.5791015625, 4.7342529296875, 4.889404296875, 5.0445556640625, 5.19970703125, 5.3548583984375, 5.510009765625, 5.6651611328125, 5.8203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 13.0, 18.0, 25.0, 26.0, 56.0, 90.0, 167.0, 347.0, 770.0, 2645.0, 17719.0, 225242.0, 741151.0, 51730.0, 6238.0, 1345.0, 452.0, 203.0, 106.0, 73.0, 41.0, 31.0, 18.0, 8.0, 15.0, 9.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.9375, -21.132080078125, -20.32666015625, -19.521240234375, -18.7158203125, -17.910400390625, -17.10498046875, -16.299560546875, -15.494140625, -14.688720703125, -13.88330078125, -13.077880859375, -12.2724609375, -11.467041015625, -10.66162109375, -9.856201171875, -9.05078125, -8.245361328125, -7.43994140625, -6.634521484375, -5.8291015625, -5.023681640625, -4.21826171875, -3.412841796875, -2.607421875, -1.802001953125, -0.99658203125, -0.191162109375, 0.6142578125, 1.419677734375, 2.22509765625, 3.030517578125, 3.8359375, 4.641357421875, 5.44677734375, 6.252197265625, 7.0576171875, 7.863037109375, 8.66845703125, 9.473876953125, 10.279296875, 11.084716796875, 11.89013671875, 12.695556640625, 13.5009765625, 14.306396484375, 15.11181640625, 15.917236328125, 16.72265625, 17.528076171875, 18.33349609375, 19.138916015625, 19.9443359375, 20.749755859375, 21.55517578125, 22.360595703125, 23.166015625, 23.971435546875, 24.77685546875, 25.582275390625, 26.3876953125, 27.193115234375, 27.99853515625, 28.803955078125, 29.609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 13.0, 12.0, 11.0, 11.0, 9.0, 16.0, 15.0, 19.0, 20.0, 29.0, 28.0, 19.0, 33.0, 32.0, 37.0, 36.0, 50.0, 42.0, 34.0, 51.0, 39.0, 39.0, 36.0, 40.0, 40.0, 38.0, 37.0, 29.0, 33.0, 20.0, 21.0, 14.0, 21.0, 12.0, 11.0, 10.0, 7.0, 5.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 3.0], "bins": [-11.625, -11.309814453125, -10.99462890625, -10.679443359375, -10.3642578125, -10.049072265625, -9.73388671875, -9.418701171875, -9.103515625, -8.788330078125, -8.47314453125, -8.157958984375, -7.8427734375, -7.527587890625, -7.21240234375, -6.897216796875, -6.58203125, -6.266845703125, -5.95166015625, -5.636474609375, -5.3212890625, -5.006103515625, -4.69091796875, -4.375732421875, -4.060546875, -3.745361328125, -3.43017578125, -3.114990234375, -2.7998046875, -2.484619140625, -2.16943359375, -1.854248046875, -1.5390625, -1.223876953125, -0.90869140625, -0.593505859375, -0.2783203125, 0.036865234375, 0.35205078125, 0.667236328125, 0.982421875, 1.297607421875, 1.61279296875, 1.927978515625, 2.2431640625, 2.558349609375, 2.87353515625, 3.188720703125, 3.50390625, 3.819091796875, 4.13427734375, 4.449462890625, 4.7646484375, 5.079833984375, 5.39501953125, 5.710205078125, 6.025390625, 6.340576171875, 6.65576171875, 6.970947265625, 7.2861328125, 7.601318359375, 7.91650390625, 8.231689453125, 8.546875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 10.0, 10.0, 11.0, 17.0, 25.0, 44.0, 72.0, 139.0, 228.0, 409.0, 904.0, 1962.0, 5113.0, 16993.0, 94060.0, 735304.0, 158724.0, 23236.0, 6661.0, 2449.0, 1034.0, 490.0, 245.0, 143.0, 100.0, 51.0, 35.0, 27.0, 12.0, 16.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2421875, -11.7447509765625, -11.247314453125, -10.7498779296875, -10.25244140625, -9.7550048828125, -9.257568359375, -8.7601318359375, -8.2626953125, -7.7652587890625, -7.267822265625, -6.7703857421875, -6.27294921875, -5.7755126953125, -5.278076171875, -4.7806396484375, -4.283203125, -3.7857666015625, -3.288330078125, -2.7908935546875, -2.29345703125, -1.7960205078125, -1.298583984375, -0.8011474609375, -0.3037109375, 0.1937255859375, 0.691162109375, 1.1885986328125, 1.68603515625, 2.1834716796875, 2.680908203125, 3.1783447265625, 3.67578125, 4.1732177734375, 4.670654296875, 5.1680908203125, 5.66552734375, 6.1629638671875, 6.660400390625, 7.1578369140625, 7.6552734375, 8.1527099609375, 8.650146484375, 9.1475830078125, 9.64501953125, 10.1424560546875, 10.639892578125, 11.1373291015625, 11.634765625, 12.1322021484375, 12.629638671875, 13.1270751953125, 13.62451171875, 14.1219482421875, 14.619384765625, 15.1168212890625, 15.6142578125, 16.1116943359375, 16.609130859375, 17.1065673828125, 17.60400390625, 18.1014404296875, 18.598876953125, 19.0963134765625, 19.59375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 8.0, 12.0, 11.0, 14.0, 18.0, 16.0, 27.0, 27.0, 36.0, 62.0, 69.0, 95.0, 111.0, 109.0, 87.0, 75.0, 58.0, 40.0, 35.0, 18.0, 9.0, 17.0, 7.0, 10.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004410743713378906, -0.0004271268844604492, -0.0004131793975830078, -0.0003992319107055664, -0.000385284423828125, -0.0003713369369506836, -0.0003573894500732422, -0.0003434419631958008, -0.0003294944763183594, -0.00031554698944091797, -0.00030159950256347656, -0.00028765201568603516, -0.00027370452880859375, -0.00025975704193115234, -0.00024580955505371094, -0.00023186206817626953, -0.00021791458129882812, -0.00020396709442138672, -0.0001900196075439453, -0.0001760721206665039, -0.0001621246337890625, -0.0001481771469116211, -0.0001342296600341797, -0.00012028217315673828, -0.00010633468627929688, -9.238719940185547e-05, -7.843971252441406e-05, -6.449222564697266e-05, -5.054473876953125e-05, -3.6597251892089844e-05, -2.2649765014648438e-05, -8.702278137207031e-06, 5.245208740234375e-06, 1.919269561767578e-05, 3.314018249511719e-05, 4.7087669372558594e-05, 6.103515625e-05, 7.49826431274414e-05, 8.893013000488281e-05, 0.00010287761688232422, 0.00011682510375976562, 0.00013077259063720703, 0.00014472007751464844, 0.00015866756439208984, 0.00017261505126953125, 0.00018656253814697266, 0.00020051002502441406, 0.00021445751190185547, 0.00022840499877929688, 0.00024235248565673828, 0.0002562999725341797, 0.0002702474594116211, 0.0002841949462890625, 0.0002981424331665039, 0.0003120899200439453, 0.0003260374069213867, 0.0003399848937988281, 0.00035393238067626953, 0.00036787986755371094, 0.00038182735443115234, 0.00039577484130859375, 0.00040972232818603516, 0.00042366981506347656, 0.00043761730194091797, 0.0004515647888183594]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 8.0, 10.0, 16.0, 13.0, 12.0, 11.0, 29.0, 46.0, 65.0, 104.0, 120.0, 253.0, 355.0, 660.0, 1158.0, 2191.0, 4658.0, 10677.0, 29741.0, 102465.0, 411176.0, 353044.0, 87095.0, 25961.0, 9757.0, 4248.0, 2097.0, 999.0, 624.0, 318.0, 221.0, 119.0, 114.0, 45.0, 40.0, 21.0, 23.0, 21.0, 8.0, 12.0, 7.0, 10.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.0390625, -8.7646484375, -8.490234375, -8.2158203125, -7.94140625, -7.6669921875, -7.392578125, -7.1181640625, -6.84375, -6.5693359375, -6.294921875, -6.0205078125, -5.74609375, -5.4716796875, -5.197265625, -4.9228515625, -4.6484375, -4.3740234375, -4.099609375, -3.8251953125, -3.55078125, -3.2763671875, -3.001953125, -2.7275390625, -2.453125, -2.1787109375, -1.904296875, -1.6298828125, -1.35546875, -1.0810546875, -0.806640625, -0.5322265625, -0.2578125, 0.0166015625, 0.291015625, 0.5654296875, 0.83984375, 1.1142578125, 1.388671875, 1.6630859375, 1.9375, 2.2119140625, 2.486328125, 2.7607421875, 3.03515625, 3.3095703125, 3.583984375, 3.8583984375, 4.1328125, 4.4072265625, 4.681640625, 4.9560546875, 5.23046875, 5.5048828125, 5.779296875, 6.0537109375, 6.328125, 6.6025390625, 6.876953125, 7.1513671875, 7.42578125, 7.7001953125, 7.974609375, 8.2490234375, 8.5234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 9.0, 17.0, 19.0, 22.0, 29.0, 39.0, 26.0, 51.0, 38.0, 47.0, 48.0, 63.0, 66.0, 83.0, 60.0, 66.0, 48.0, 50.0, 33.0, 36.0, 25.0, 22.0, 13.0, 12.0, 12.0, 12.0, 6.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.8101806640625, -7.557861328125, -7.3055419921875, -7.05322265625, -6.8009033203125, -6.548583984375, -6.2962646484375, -6.0439453125, -5.7916259765625, -5.539306640625, -5.2869873046875, -5.03466796875, -4.7823486328125, -4.530029296875, -4.2777099609375, -4.025390625, -3.7730712890625, -3.520751953125, -3.2684326171875, -3.01611328125, -2.7637939453125, -2.511474609375, -2.2591552734375, -2.0068359375, -1.7545166015625, -1.502197265625, -1.2498779296875, -0.99755859375, -0.7452392578125, -0.492919921875, -0.2406005859375, 0.01171875, 0.2640380859375, 0.516357421875, 0.7686767578125, 1.02099609375, 1.2733154296875, 1.525634765625, 1.7779541015625, 2.0302734375, 2.2825927734375, 2.534912109375, 2.7872314453125, 3.03955078125, 3.2918701171875, 3.544189453125, 3.7965087890625, 4.048828125, 4.3011474609375, 4.553466796875, 4.8057861328125, 5.05810546875, 5.3104248046875, 5.562744140625, 5.8150634765625, 6.0673828125, 6.3197021484375, 6.572021484375, 6.8243408203125, 7.07666015625, 7.3289794921875, 7.581298828125, 7.8336181640625, 8.0859375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 11.0, 22.0, 256.0, 534.0, 137.0, 29.0, 7.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-425.1136169433594, -411.51708984375, -397.9205627441406, -384.32403564453125, -370.72747802734375, -357.1309509277344, -343.534423828125, -329.9378967285156, -316.34136962890625, -302.7448425292969, -289.1483154296875, -275.5517578125, -261.9552307128906, -248.35870361328125, -234.76217651367188, -221.1656494140625, -207.569091796875, -193.97256469726562, -180.3760223388672, -166.7794952392578, -153.18295288085938, -139.58642578125, -125.98989868164062, -112.39336395263672, -98.79682922363281, -85.2002944946289, -71.603759765625, -58.007232666015625, -44.41069793701172, -30.814163208007812, -17.217636108398438, -3.6211013793945312, 9.97540283203125, 23.571935653686523, 37.1684684753418, 50.76499938964844, 64.36153411865234, 77.95806884765625, 91.55459594726562, 105.15113067626953, 118.74766540527344, 132.3441925048828, 145.94073486328125, 159.53726196289062, 173.1337890625, 186.73033142089844, 200.3268585205078, 213.92340087890625, 227.51992797851562, 241.116455078125, 254.71299743652344, 268.30950927734375, 281.90606689453125, 295.5025939941406, 309.09912109375, 322.6956481933594, 336.29217529296875, 349.8887023925781, 363.4852294921875, 377.081787109375, 390.6783142089844, 404.27484130859375, 417.8713684082031, 431.4678955078125, 445.064453125]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 5.0, 12.0, 11.0, 11.0, 35.0, 56.0, 82.0, 134.0, 157.0, 140.0, 103.0, 100.0, 38.0, 22.0, 15.0, 9.0, 11.0, 2.0, 6.0, 6.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.03836059570312, -182.28524780273438, -175.5321502685547, -168.77903747558594, -162.0259246826172, -155.2728271484375, -148.51971435546875, -141.7666015625, -135.01348876953125, -128.2603759765625, -121.50727081298828, -114.75416564941406, -108.00105285644531, -101.2479476928711, -94.49484252929688, -87.74172973632812, -80.98863220214844, -74.23552703857422, -67.48241424560547, -60.72930908203125, -53.976200103759766, -47.22309112548828, -40.46998596191406, -33.71687698364258, -26.963768005371094, -20.21065902709961, -13.457551956176758, -6.704444885253906, 0.048664093017578125, 6.8017730712890625, 13.554878234863281, 20.307987213134766, 27.06109619140625, 33.814205169677734, 40.56731414794922, 47.32041931152344, 54.07352828979492, 60.826637268066406, 67.57974243164062, 74.33285522460938, 81.0859603881836, 87.83906555175781, 94.59217834472656, 101.34528350830078, 108.098388671875, 114.85150146484375, 121.60460662841797, 128.3577117919922, 135.11082458496094, 141.8639373779297, 148.61703491210938, 155.37014770507812, 162.12326049804688, 168.87637329101562, 175.6294708251953, 182.38258361816406, 189.13568115234375, 195.8887939453125, 202.6418914794922, 209.39500427246094, 216.1481170654297, 222.90121459960938, 229.65432739257812, 236.40744018554688, 243.16055297851562]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 7.0, 6.0, 8.0, 29.0, 46.0, 40.0, 120.0, 215.0, 589.0, 2120.0, 14208.0, 4085049.0, 85028.0, 4783.0, 1146.0, 396.0, 215.0, 104.0, 54.0, 39.0, 25.0, 21.0, 11.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.5, -80.380859375, -77.26171875, -74.142578125, -71.0234375, -67.904296875, -64.78515625, -61.666015625, -58.546875, -55.427734375, -52.30859375, -49.189453125, -46.0703125, -42.951171875, -39.83203125, -36.712890625, -33.59375, -30.474609375, -27.35546875, -24.236328125, -21.1171875, -17.998046875, -14.87890625, -11.759765625, -8.640625, -5.521484375, -2.40234375, 0.716796875, 3.8359375, 6.955078125, 10.07421875, 13.193359375, 16.3125, 19.431640625, 22.55078125, 25.669921875, 28.7890625, 31.908203125, 35.02734375, 38.146484375, 41.265625, 44.384765625, 47.50390625, 50.623046875, 53.7421875, 56.861328125, 59.98046875, 63.099609375, 66.21875, 69.337890625, 72.45703125, 75.576171875, 78.6953125, 81.814453125, 84.93359375, 88.052734375, 91.171875, 94.291015625, 97.41015625, 100.529296875, 103.6484375, 106.767578125, 109.88671875, 113.005859375, 116.125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 3.0, 10.0, 14.0, 22.0, 21.0, 32.0, 125.0, 392.0, 250.0, 59.0, 20.0, 11.0, 16.0, 11.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.0718994140625, -3.913330078125, -3.7547607421875, -3.59619140625, -3.4376220703125, -3.279052734375, -3.1204833984375, -2.9619140625, -2.8033447265625, -2.644775390625, -2.4862060546875, -2.32763671875, -2.1690673828125, -2.010498046875, -1.8519287109375, -1.693359375, -1.5347900390625, -1.376220703125, -1.2176513671875, -1.05908203125, -0.9005126953125, -0.741943359375, -0.5833740234375, -0.4248046875, -0.2662353515625, -0.107666015625, 0.0509033203125, 0.20947265625, 0.3680419921875, 0.526611328125, 0.6851806640625, 0.84375, 1.0023193359375, 1.160888671875, 1.3194580078125, 1.47802734375, 1.6365966796875, 1.795166015625, 1.9537353515625, 2.1123046875, 2.2708740234375, 2.429443359375, 2.5880126953125, 2.74658203125, 2.9051513671875, 3.063720703125, 3.2222900390625, 3.380859375, 3.5394287109375, 3.697998046875, 3.8565673828125, 4.01513671875, 4.1737060546875, 4.332275390625, 4.4908447265625, 4.6494140625, 4.8079833984375, 4.966552734375, 5.1251220703125, 5.28369140625, 5.4422607421875, 5.600830078125, 5.7593994140625, 5.91796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 6.0, 12.0, 13.0, 21.0, 32.0, 41.0, 84.0, 108.0, 215.0, 400.0, 690.0, 1310.0, 2748.0, 6523.0, 16592.0, 50903.0, 241917.0, 3462712.0, 315570.0, 61143.0, 19220.0, 7453.0, 3194.0, 1518.0, 799.0, 423.0, 246.0, 120.0, 89.0, 58.0, 43.0, 33.0, 13.0, 8.0, 10.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-25.65625, -24.990966796875, -24.32568359375, -23.660400390625, -22.9951171875, -22.329833984375, -21.66455078125, -20.999267578125, -20.333984375, -19.668701171875, -19.00341796875, -18.338134765625, -17.6728515625, -17.007568359375, -16.34228515625, -15.677001953125, -15.01171875, -14.346435546875, -13.68115234375, -13.015869140625, -12.3505859375, -11.685302734375, -11.02001953125, -10.354736328125, -9.689453125, -9.024169921875, -8.35888671875, -7.693603515625, -7.0283203125, -6.363037109375, -5.69775390625, -5.032470703125, -4.3671875, -3.701904296875, -3.03662109375, -2.371337890625, -1.7060546875, -1.040771484375, -0.37548828125, 0.289794921875, 0.955078125, 1.620361328125, 2.28564453125, 2.950927734375, 3.6162109375, 4.281494140625, 4.94677734375, 5.612060546875, 6.27734375, 6.942626953125, 7.60791015625, 8.273193359375, 8.9384765625, 9.603759765625, 10.26904296875, 10.934326171875, 11.599609375, 12.264892578125, 12.93017578125, 13.595458984375, 14.2607421875, 14.926025390625, 15.59130859375, 16.256591796875, 16.921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 8.0, 12.0, 13.0, 14.0, 27.0, 47.0, 65.0, 79.0, 109.0, 193.0, 383.0, 1973.0, 465.0, 212.0, 135.0, 81.0, 62.0, 41.0, 34.0, 17.0, 13.0, 14.0, 9.0, 11.0, 7.0, 9.0, 5.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.82421875, -2.72564697265625, -2.6270751953125, -2.52850341796875, -2.429931640625, -2.33135986328125, -2.2327880859375, -2.13421630859375, -2.03564453125, -1.93707275390625, -1.8385009765625, -1.73992919921875, -1.641357421875, -1.54278564453125, -1.4442138671875, -1.34564208984375, -1.2470703125, -1.14849853515625, -1.0499267578125, -0.95135498046875, -0.852783203125, -0.75421142578125, -0.6556396484375, -0.55706787109375, -0.45849609375, -0.35992431640625, -0.2613525390625, -0.16278076171875, -0.064208984375, 0.03436279296875, 0.1329345703125, 0.23150634765625, 0.330078125, 0.42864990234375, 0.5272216796875, 0.62579345703125, 0.724365234375, 0.82293701171875, 0.9215087890625, 1.02008056640625, 1.11865234375, 1.21722412109375, 1.3157958984375, 1.41436767578125, 1.512939453125, 1.61151123046875, 1.7100830078125, 1.80865478515625, 1.9072265625, 2.00579833984375, 2.1043701171875, 2.20294189453125, 2.301513671875, 2.40008544921875, 2.4986572265625, 2.59722900390625, 2.69580078125, 2.79437255859375, 2.8929443359375, 2.99151611328125, 3.090087890625, 3.18865966796875, 3.2872314453125, 3.38580322265625, 3.484375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 6.0, 30.0, 135.0, 324.0, 322.0, 130.0, 36.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.28564453125, -57.49095916748047, -55.69627380371094, -53.901588439941406, -52.106903076171875, -50.312217712402344, -48.51752853393555, -46.722843170166016, -44.928157806396484, -43.13347244262695, -41.33878707885742, -39.54410171508789, -37.749412536621094, -35.95472717285156, -34.16004180908203, -32.3653564453125, -30.57067108154297, -28.775985717773438, -26.981300354003906, -25.186613082885742, -23.39192771911621, -21.59724235534668, -19.802555084228516, -18.007869720458984, -16.213184356689453, -14.418498992919922, -12.623812675476074, -10.829126358032227, -9.034440994262695, -7.239755630493164, -5.445069313049316, -3.6503829956054688, -1.8556938171386719, -0.06100797653198242, 1.733677864074707, 3.5283637046813965, 5.323049545288086, 7.117734909057617, 8.912421226501465, 10.707107543945312, 12.501792907714844, 14.296478271484375, 16.091163635253906, 17.88585090637207, 19.6805362701416, 21.475221633911133, 23.269908905029297, 25.064594268798828, 26.85927963256836, 28.65396499633789, 30.448650360107422, 32.24333572387695, 34.03802490234375, 35.83271026611328, 37.62739562988281, 39.422080993652344, 41.216766357421875, 43.011451721191406, 44.80613708496094, 46.60082244873047, 48.3955078125, 50.19019317626953, 51.98488235473633, 53.77956771850586, 55.57425308227539]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 1.0, 5.0, 6.0, 6.0, 11.0, 20.0, 16.0, 27.0, 23.0, 41.0, 48.0, 56.0, 65.0, 59.0, 80.0, 70.0, 73.0, 58.0, 59.0, 62.0, 47.0, 37.0, 33.0, 25.0, 15.0, 19.0, 8.0, 9.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.208098411560059, -11.720442771911621, -11.232787132263184, -10.745131492614746, -10.257475852966309, -9.769820213317871, -9.282163619995117, -8.79450798034668, -8.306852340698242, -7.819196701049805, -7.331541061401367, -6.84388542175293, -6.356229782104492, -5.868574142456055, -5.380918025970459, -4.8932623863220215, -4.405607223510742, -3.9179515838623047, -3.430295944213867, -2.9426400661468506, -2.454984426498413, -1.9673287868499756, -1.479672908782959, -0.9920172691345215, -0.504361629486084, -0.01670593023300171, 0.47094976902008057, 0.9586055278778076, 1.4462611675262451, 1.9339168071746826, 2.421572685241699, 2.9092283248901367, 3.396883010864258, 3.8845386505126953, 4.372194290161133, 4.85984992980957, 5.347505569458008, 5.835161209106445, 6.322817325592041, 6.8104729652404785, 7.298128604888916, 7.7857842445373535, 8.27344036102295, 8.761096000671387, 9.248751640319824, 9.736407279968262, 10.2240629196167, 10.711718559265137, 11.199374198913574, 11.687029838562012, 12.17468547821045, 12.662341117858887, 13.149996757507324, 13.637652397155762, 14.125308990478516, 14.612964630126953, 15.10062026977539, 15.588275909423828, 16.075931549072266, 16.563587188720703, 17.05124282836914, 17.538898468017578, 18.026554107666016, 18.514209747314453, 19.00186538696289]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 3.0, 3.0, 7.0, 14.0, 10.0, 15.0, 23.0, 41.0, 66.0, 69.0, 186.0, 311.0, 613.0, 1666.0, 6354.0, 134108.0, 888768.0, 12203.0, 2379.0, 849.0, 375.0, 179.0, 106.0, 58.0, 36.0, 28.0, 24.0, 17.0, 11.0, 6.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.25, -65.826171875, -63.40234375, -60.978515625, -58.5546875, -56.130859375, -53.70703125, -51.283203125, -48.859375, -46.435546875, -44.01171875, -41.587890625, -39.1640625, -36.740234375, -34.31640625, -31.892578125, -29.46875, -27.044921875, -24.62109375, -22.197265625, -19.7734375, -17.349609375, -14.92578125, -12.501953125, -10.078125, -7.654296875, -5.23046875, -2.806640625, -0.3828125, 2.041015625, 4.46484375, 6.888671875, 9.3125, 11.736328125, 14.16015625, 16.583984375, 19.0078125, 21.431640625, 23.85546875, 26.279296875, 28.703125, 31.126953125, 33.55078125, 35.974609375, 38.3984375, 40.822265625, 43.24609375, 45.669921875, 48.09375, 50.517578125, 52.94140625, 55.365234375, 57.7890625, 60.212890625, 62.63671875, 65.060546875, 67.484375, 69.908203125, 72.33203125, 74.755859375, 77.1796875, 79.603515625, 82.02734375, 84.451171875, 86.875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 8.0, 16.0, 15.0, 26.0, 38.0, 123.0, 323.0, 264.0, 100.0, 35.0, 16.0, 12.0, 9.0, 6.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.06915283203125, -3.9117431640625, -3.75433349609375, -3.596923828125, -3.43951416015625, -3.2821044921875, -3.12469482421875, -2.96728515625, -2.80987548828125, -2.6524658203125, -2.49505615234375, -2.337646484375, -2.18023681640625, -2.0228271484375, -1.86541748046875, -1.7080078125, -1.55059814453125, -1.3931884765625, -1.23577880859375, -1.078369140625, -0.92095947265625, -0.7635498046875, -0.60614013671875, -0.44873046875, -0.29132080078125, -0.1339111328125, 0.02349853515625, 0.180908203125, 0.33831787109375, 0.4957275390625, 0.65313720703125, 0.810546875, 0.96795654296875, 1.1253662109375, 1.28277587890625, 1.440185546875, 1.59759521484375, 1.7550048828125, 1.91241455078125, 2.06982421875, 2.22723388671875, 2.3846435546875, 2.54205322265625, 2.699462890625, 2.85687255859375, 3.0142822265625, 3.17169189453125, 3.3291015625, 3.48651123046875, 3.6439208984375, 3.80133056640625, 3.958740234375, 4.11614990234375, 4.2735595703125, 4.43096923828125, 4.58837890625, 4.74578857421875, 4.9031982421875, 5.06060791015625, 5.218017578125, 5.37542724609375, 5.5328369140625, 5.69024658203125, 5.84765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 0.0, 5.0, 7.0, 24.0, 85.0, 496.0, 9135.0, 1019078.0, 18816.0, 694.0, 102.0, 29.0, 8.0, 6.0, 6.0, 6.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.875, -79.009765625, -76.14453125, -73.279296875, -70.4140625, -67.548828125, -64.68359375, -61.818359375, -58.953125, -56.087890625, -53.22265625, -50.357421875, -47.4921875, -44.626953125, -41.76171875, -38.896484375, -36.03125, -33.166015625, -30.30078125, -27.435546875, -24.5703125, -21.705078125, -18.83984375, -15.974609375, -13.109375, -10.244140625, -7.37890625, -4.513671875, -1.6484375, 1.216796875, 4.08203125, 6.947265625, 9.8125, 12.677734375, 15.54296875, 18.408203125, 21.2734375, 24.138671875, 27.00390625, 29.869140625, 32.734375, 35.599609375, 38.46484375, 41.330078125, 44.1953125, 47.060546875, 49.92578125, 52.791015625, 55.65625, 58.521484375, 61.38671875, 64.251953125, 67.1171875, 69.982421875, 72.84765625, 75.712890625, 78.578125, 81.443359375, 84.30859375, 87.173828125, 90.0390625, 92.904296875, 95.76953125, 98.634765625, 101.5]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 6.0, 8.0, 12.0, 15.0, 18.0, 14.0, 23.0, 23.0, 31.0, 26.0, 39.0, 41.0, 36.0, 52.0, 72.0, 52.0, 59.0, 60.0, 53.0, 53.0, 44.0, 36.0, 39.0, 35.0, 29.0, 30.0, 28.0, 17.0, 8.0, 13.0, 11.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8125, -8.5572509765625, -8.302001953125, -8.0467529296875, -7.79150390625, -7.5362548828125, -7.281005859375, -7.0257568359375, -6.7705078125, -6.5152587890625, -6.260009765625, -6.0047607421875, -5.74951171875, -5.4942626953125, -5.239013671875, -4.9837646484375, -4.728515625, -4.4732666015625, -4.218017578125, -3.9627685546875, -3.70751953125, -3.4522705078125, -3.197021484375, -2.9417724609375, -2.6865234375, -2.4312744140625, -2.176025390625, -1.9207763671875, -1.66552734375, -1.4102783203125, -1.155029296875, -0.8997802734375, -0.64453125, -0.3892822265625, -0.134033203125, 0.1212158203125, 0.37646484375, 0.6317138671875, 0.886962890625, 1.1422119140625, 1.3974609375, 1.6527099609375, 1.907958984375, 2.1632080078125, 2.41845703125, 2.6737060546875, 2.928955078125, 3.1842041015625, 3.439453125, 3.6947021484375, 3.949951171875, 4.2052001953125, 4.46044921875, 4.7156982421875, 4.970947265625, 5.2261962890625, 5.4814453125, 5.7366943359375, 5.991943359375, 6.2471923828125, 6.50244140625, 6.7576904296875, 7.012939453125, 7.2681884765625, 7.5234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 11.0, 8.0, 10.0, 16.0, 22.0, 34.0, 48.0, 78.0, 148.0, 326.0, 746.0, 2460.0, 10743.0, 95585.0, 819905.0, 103147.0, 11199.0, 2492.0, 860.0, 323.0, 130.0, 107.0, 46.0, 28.0, 22.0, 11.0, 13.0, 7.0, 2.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.296875, -23.4736328125, -22.650390625, -21.8271484375, -21.00390625, -20.1806640625, -19.357421875, -18.5341796875, -17.7109375, -16.8876953125, -16.064453125, -15.2412109375, -14.41796875, -13.5947265625, -12.771484375, -11.9482421875, -11.125, -10.3017578125, -9.478515625, -8.6552734375, -7.83203125, -7.0087890625, -6.185546875, -5.3623046875, -4.5390625, -3.7158203125, -2.892578125, -2.0693359375, -1.24609375, -0.4228515625, 0.400390625, 1.2236328125, 2.046875, 2.8701171875, 3.693359375, 4.5166015625, 5.33984375, 6.1630859375, 6.986328125, 7.8095703125, 8.6328125, 9.4560546875, 10.279296875, 11.1025390625, 11.92578125, 12.7490234375, 13.572265625, 14.3955078125, 15.21875, 16.0419921875, 16.865234375, 17.6884765625, 18.51171875, 19.3349609375, 20.158203125, 20.9814453125, 21.8046875, 22.6279296875, 23.451171875, 24.2744140625, 25.09765625, 25.9208984375, 26.744140625, 27.5673828125, 28.390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 6.0, 9.0, 11.0, 21.0, 37.0, 66.0, 109.0, 162.0, 194.0, 151.0, 92.0, 49.0, 32.0, 25.0, 11.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010471343994140625, -0.001012563705444336, -0.0009779930114746094, -0.0009434223175048828, -0.0009088516235351562, -0.0008742809295654297, -0.0008397102355957031, -0.0008051395416259766, -0.00077056884765625, -0.0007359981536865234, -0.0007014274597167969, -0.0006668567657470703, -0.0006322860717773438, -0.0005977153778076172, -0.0005631446838378906, -0.0005285739898681641, -0.0004940032958984375, -0.00045943260192871094, -0.0004248619079589844, -0.0003902912139892578, -0.00035572052001953125, -0.0003211498260498047, -0.0002865791320800781, -0.00025200843811035156, -0.000217437744140625, -0.00018286705017089844, -0.00014829635620117188, -0.00011372566223144531, -7.915496826171875e-05, -4.458427429199219e-05, -1.0013580322265625e-05, 2.4557113647460938e-05, 5.91278076171875e-05, 9.369850158691406e-05, 0.00012826919555664062, 0.0001628398895263672, 0.00019741058349609375, 0.0002319812774658203, 0.0002665519714355469, 0.00030112266540527344, 0.000335693359375, 0.00037026405334472656, 0.0004048347473144531, 0.0004394054412841797, 0.00047397613525390625, 0.0005085468292236328, 0.0005431175231933594, 0.0005776882171630859, 0.0006122589111328125, 0.0006468296051025391, 0.0006814002990722656, 0.0007159709930419922, 0.0007505416870117188, 0.0007851123809814453, 0.0008196830749511719, 0.0008542537689208984, 0.000888824462890625, 0.0009233951568603516, 0.0009579658508300781, 0.0009925365447998047, 0.0010271072387695312, 0.0010616779327392578, 0.0010962486267089844, 0.001130819320678711, 0.0011653900146484375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 8.0, 5.0, 14.0, 26.0, 43.0, 63.0, 86.0, 198.0, 376.0, 768.0, 1933.0, 5302.0, 17103.0, 78648.0, 546174.0, 330137.0, 49410.0, 11613.0, 3846.0, 1438.0, 648.0, 304.0, 182.0, 94.0, 46.0, 28.0, 11.0, 15.0, 16.0, 3.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.09375, -16.57373046875, -16.0537109375, -15.53369140625, -15.013671875, -14.49365234375, -13.9736328125, -13.45361328125, -12.93359375, -12.41357421875, -11.8935546875, -11.37353515625, -10.853515625, -10.33349609375, -9.8134765625, -9.29345703125, -8.7734375, -8.25341796875, -7.7333984375, -7.21337890625, -6.693359375, -6.17333984375, -5.6533203125, -5.13330078125, -4.61328125, -4.09326171875, -3.5732421875, -3.05322265625, -2.533203125, -2.01318359375, -1.4931640625, -0.97314453125, -0.453125, 0.06689453125, 0.5869140625, 1.10693359375, 1.626953125, 2.14697265625, 2.6669921875, 3.18701171875, 3.70703125, 4.22705078125, 4.7470703125, 5.26708984375, 5.787109375, 6.30712890625, 6.8271484375, 7.34716796875, 7.8671875, 8.38720703125, 8.9072265625, 9.42724609375, 9.947265625, 10.46728515625, 10.9873046875, 11.50732421875, 12.02734375, 12.54736328125, 13.0673828125, 13.58740234375, 14.107421875, 14.62744140625, 15.1474609375, 15.66748046875, 16.1875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 6.0, 9.0, 8.0, 12.0, 9.0, 21.0, 11.0, 20.0, 29.0, 35.0, 54.0, 46.0, 49.0, 74.0, 90.0, 128.0, 60.0, 59.0, 53.0, 44.0, 38.0, 36.0, 20.0, 15.0, 16.0, 6.0, 10.0, 6.0, 5.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.3203125, -8.084228515625, -7.84814453125, -7.612060546875, -7.3759765625, -7.139892578125, -6.90380859375, -6.667724609375, -6.431640625, -6.195556640625, -5.95947265625, -5.723388671875, -5.4873046875, -5.251220703125, -5.01513671875, -4.779052734375, -4.54296875, -4.306884765625, -4.07080078125, -3.834716796875, -3.5986328125, -3.362548828125, -3.12646484375, -2.890380859375, -2.654296875, -2.418212890625, -2.18212890625, -1.946044921875, -1.7099609375, -1.473876953125, -1.23779296875, -1.001708984375, -0.765625, -0.529541015625, -0.29345703125, -0.057373046875, 0.1787109375, 0.414794921875, 0.65087890625, 0.886962890625, 1.123046875, 1.359130859375, 1.59521484375, 1.831298828125, 2.0673828125, 2.303466796875, 2.53955078125, 2.775634765625, 3.01171875, 3.247802734375, 3.48388671875, 3.719970703125, 3.9560546875, 4.192138671875, 4.42822265625, 4.664306640625, 4.900390625, 5.136474609375, 5.37255859375, 5.608642578125, 5.8447265625, 6.080810546875, 6.31689453125, 6.552978515625, 6.7890625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 22.0, 32.0, 92.0, 215.0, 298.0, 191.0, 88.0, 31.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.6951904296875, -123.1673583984375, -117.6395263671875, -112.1116943359375, -106.5838623046875, -101.0560302734375, -95.5281982421875, -90.0003662109375, -84.4725341796875, -78.9447021484375, -73.4168701171875, -67.8890380859375, -62.3612060546875, -56.8333740234375, -51.305538177490234, -45.777706146240234, -40.24987030029297, -34.72203826904297, -29.19420623779297, -23.666372299194336, -18.138540267944336, -12.610708236694336, -7.082874298095703, -1.5550422668457031, 3.972789764404297, 9.500621795654297, 15.028454780578613, 20.55628776550293, 26.08411979675293, 31.61195182800293, 37.13978576660156, 42.66761779785156, 48.19544982910156, 53.72328186035156, 59.25111389160156, 64.77894592285156, 70.30677795410156, 75.83460998535156, 81.36244201660156, 86.89027404785156, 92.41810607910156, 97.94593811035156, 103.47377014160156, 109.00160217285156, 114.52943420410156, 120.05726623535156, 125.58509826660156, 131.11293029785156, 136.64077758789062, 142.16860961914062, 147.69644165039062, 153.22427368164062, 158.75210571289062, 164.27993774414062, 169.80776977539062, 175.33560180664062, 180.86343383789062, 186.39126586914062, 191.91909790039062, 197.44692993164062, 202.97476196289062, 208.50259399414062, 214.03042602539062, 219.55825805664062, 225.08609008789062]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 7.0, 6.0, 9.0, 13.0, 21.0, 28.0, 24.0, 39.0, 50.0, 64.0, 89.0, 80.0, 70.0, 80.0, 72.0, 68.0, 77.0, 48.0, 38.0, 31.0, 29.0, 20.0, 10.0, 10.0, 3.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.92555236816406, -89.06329345703125, -86.20104217529297, -83.33878326416016, -80.47653198242188, -77.61427307128906, -74.75201416015625, -71.88976287841797, -69.02750396728516, -66.16524505615234, -63.30299377441406, -60.44073486328125, -57.5784797668457, -54.716224670410156, -51.85396957397461, -48.99171447753906, -46.129459381103516, -43.26720428466797, -40.40494918823242, -37.542694091796875, -34.68043518066406, -31.818180084228516, -28.95592498779297, -26.09366798400879, -23.231412887573242, -20.369157791137695, -17.506900787353516, -14.644645690917969, -11.782389640808105, -8.920133590698242, -6.057878494262695, -3.1956214904785156, -0.33336639404296875, 2.5288894176483154, 5.3911452293396, 8.253400802612305, 11.115656852722168, 13.977912902832031, 16.840167999267578, 19.702425003051758, 22.564680099487305, 25.42693519592285, 28.28919219970703, 31.151447296142578, 34.013702392578125, 36.87596130371094, 39.73821258544922, 42.60047149658203, 45.46272659301758, 48.324981689453125, 51.18723678588867, 54.04949188232422, 56.91175079345703, 59.77400588989258, 62.636260986328125, 65.49851989746094, 68.36077117919922, 71.22303009033203, 74.08528137207031, 76.94754028320312, 79.8097915649414, 82.67205047607422, 85.5343017578125, 88.39656066894531, 91.25881958007812]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 7.0, 8.0, 11.0, 9.0, 15.0, 23.0, 23.0, 39.0, 46.0, 66.0, 96.0, 176.0, 343.0, 715.0, 1685.0, 6142.0, 151563.0, 4020478.0, 8944.0, 1994.0, 820.0, 393.0, 215.0, 136.0, 88.0, 59.0, 37.0, 39.0, 24.0, 7.0, 19.0, 9.0, 9.0, 5.0, 9.0, 5.0, 4.0, 5.0, 1.0, 5.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.125, -108.79296875, -104.4609375, -100.12890625, -95.796875, -91.46484375, -87.1328125, -82.80078125, -78.46875, -74.13671875, -69.8046875, -65.47265625, -61.140625, -56.80859375, -52.4765625, -48.14453125, -43.8125, -39.48046875, -35.1484375, -30.81640625, -26.484375, -22.15234375, -17.8203125, -13.48828125, -9.15625, -4.82421875, -0.4921875, 3.83984375, 8.171875, 12.50390625, 16.8359375, 21.16796875, 25.5, 29.83203125, 34.1640625, 38.49609375, 42.828125, 47.16015625, 51.4921875, 55.82421875, 60.15625, 64.48828125, 68.8203125, 73.15234375, 77.484375, 81.81640625, 86.1484375, 90.48046875, 94.8125, 99.14453125, 103.4765625, 107.80859375, 112.140625, 116.47265625, 120.8046875, 125.13671875, 129.46875, 133.80078125, 138.1328125, 142.46484375, 146.796875, 151.12890625, 155.4609375, 159.79296875, 164.125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 10.0, 19.0, 19.0, 41.0, 98.0, 238.0, 291.0, 160.0, 58.0, 24.0, 13.0, 8.0, 7.0, 7.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34765625, -4.187744140625, -4.02783203125, -3.867919921875, -3.7080078125, -3.548095703125, -3.38818359375, -3.228271484375, -3.068359375, -2.908447265625, -2.74853515625, -2.588623046875, -2.4287109375, -2.268798828125, -2.10888671875, -1.948974609375, -1.7890625, -1.629150390625, -1.46923828125, -1.309326171875, -1.1494140625, -0.989501953125, -0.82958984375, -0.669677734375, -0.509765625, -0.349853515625, -0.18994140625, -0.030029296875, 0.1298828125, 0.289794921875, 0.44970703125, 0.609619140625, 0.76953125, 0.929443359375, 1.08935546875, 1.249267578125, 1.4091796875, 1.569091796875, 1.72900390625, 1.888916015625, 2.048828125, 2.208740234375, 2.36865234375, 2.528564453125, 2.6884765625, 2.848388671875, 3.00830078125, 3.168212890625, 3.328125, 3.488037109375, 3.64794921875, 3.807861328125, 3.9677734375, 4.127685546875, 4.28759765625, 4.447509765625, 4.607421875, 4.767333984375, 4.92724609375, 5.087158203125, 5.2470703125, 5.406982421875, 5.56689453125, 5.726806640625, 5.88671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 8.0, 7.0, 7.0, 9.0, 8.0, 12.0, 18.0, 23.0, 31.0, 40.0, 89.0, 231.0, 1614.0, 74456.0, 4108538.0, 8102.0, 699.0, 162.0, 63.0, 48.0, 33.0, 26.0, 19.0, 11.0, 8.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.125, -136.75, -132.375, -128.0, -123.625, -119.25, -114.875, -110.5, -106.125, -101.75, -97.375, -93.0, -88.625, -84.25, -79.875, -75.5, -71.125, -66.75, -62.375, -58.0, -53.625, -49.25, -44.875, -40.5, -36.125, -31.75, -27.375, -23.0, -18.625, -14.25, -9.875, -5.5, -1.125, 3.25, 7.625, 12.0, 16.375, 20.75, 25.125, 29.5, 33.875, 38.25, 42.625, 47.0, 51.375, 55.75, 60.125, 64.5, 68.875, 73.25, 77.625, 82.0, 86.375, 90.75, 95.125, 99.5, 103.875, 108.25, 112.625, 117.0, 121.375, 125.75, 130.125, 134.5, 138.875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 11.0, 15.0, 29.0, 30.0, 28.0, 44.0, 81.0, 128.0, 262.0, 794.0, 1963.0, 274.0, 136.0, 86.0, 43.0, 28.0, 20.0, 22.0, 12.0, 8.0, 9.0, 6.0, 11.0, 7.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.14453125, -4.0155029296875, -3.886474609375, -3.7574462890625, -3.62841796875, -3.4993896484375, -3.370361328125, -3.2413330078125, -3.1123046875, -2.9832763671875, -2.854248046875, -2.7252197265625, -2.59619140625, -2.4671630859375, -2.338134765625, -2.2091064453125, -2.080078125, -1.9510498046875, -1.822021484375, -1.6929931640625, -1.56396484375, -1.4349365234375, -1.305908203125, -1.1768798828125, -1.0478515625, -0.9188232421875, -0.789794921875, -0.6607666015625, -0.53173828125, -0.4027099609375, -0.273681640625, -0.1446533203125, -0.015625, 0.1134033203125, 0.242431640625, 0.3714599609375, 0.50048828125, 0.6295166015625, 0.758544921875, 0.8875732421875, 1.0166015625, 1.1456298828125, 1.274658203125, 1.4036865234375, 1.53271484375, 1.6617431640625, 1.790771484375, 1.9197998046875, 2.048828125, 2.1778564453125, 2.306884765625, 2.4359130859375, 2.56494140625, 2.6939697265625, 2.822998046875, 2.9520263671875, 3.0810546875, 3.2100830078125, 3.339111328125, 3.4681396484375, 3.59716796875, 3.7261962890625, 3.855224609375, 3.9842529296875, 4.11328125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 21.0, 29.0, 42.0, 117.0, 239.0, 248.0, 161.0, 67.0, 35.0, 17.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.626405715942383, -21.111913681030273, -19.59741973876953, -18.082927703857422, -16.568435668945312, -15.05394172668457, -13.539449691772461, -12.024956703186035, -10.51046371459961, -8.995970726013184, -7.481478214263916, -5.966985702514648, -4.452492713928223, -2.937999725341797, -1.4235076904296875, 0.09098529815673828, 1.605478286743164, 3.1199710369110107, 4.634463787078857, 6.148956298828125, 7.663449287414551, 9.177942276000977, 10.692434310913086, 12.206927299499512, 13.721420288085938, 15.235913276672363, 16.75040626525879, 18.2648983001709, 19.77939224243164, 21.29388427734375, 22.80837631225586, 24.32286834716797, 25.837364196777344, 27.351856231689453, 28.866350173950195, 30.380842208862305, 31.895336151123047, 33.409828186035156, 34.924320220947266, 36.438812255859375, 37.95330810546875, 39.46780014038086, 40.98229217529297, 42.496788024902344, 44.01128005981445, 45.52577209472656, 47.04026412963867, 48.55475616455078, 50.06924819946289, 51.583740234375, 53.09823226928711, 54.61272430419922, 56.127220153808594, 57.6417121887207, 59.15620422363281, 60.67069625854492, 62.18518829345703, 63.69968032836914, 65.21417236328125, 66.72866821289062, 68.24315643310547, 69.75765228271484, 71.27214050292969, 72.78663635253906, 74.30113220214844]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 5.0, 9.0, 8.0, 17.0, 24.0, 20.0, 34.0, 28.0, 39.0, 40.0, 47.0, 35.0, 73.0, 56.0, 59.0, 62.0, 61.0, 54.0, 52.0, 36.0, 36.0, 29.0, 38.0, 39.0, 28.0, 20.0, 12.0, 7.0, 6.0, 8.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.083532333374023, -14.552916526794434, -14.02230167388916, -13.49168586730957, -12.961071014404297, -12.430455207824707, -11.899839401245117, -11.369224548339844, -10.838608741760254, -10.307992935180664, -9.77737808227539, -9.2467622756958, -8.716146469116211, -8.185531616210938, -7.654915809631348, -7.124300479888916, -6.593685150146484, -6.063069820404053, -5.532454490661621, -5.001838684082031, -4.4712233543396, -3.940608024597168, -3.4099924564361572, -2.8793768882751465, -2.348761558532715, -1.8181461095809937, -1.2875306606292725, -0.7569152116775513, -0.22629976272583008, 0.30431556701660156, 0.8349311351776123, 1.365546703338623, 1.8961601257324219, 2.4267754554748535, 2.9573910236358643, 3.488006591796875, 4.018621921539307, 4.549237251281738, 5.079853057861328, 5.61046838760376, 6.141083717346191, 6.671699047088623, 7.202314376831055, 7.7329301834106445, 8.263545989990234, 8.794160842895508, 9.324776649475098, 9.855392456054688, 10.386007308959961, 10.91662311553955, 11.447237968444824, 11.977853775024414, 12.508468627929688, 13.039084434509277, 13.569700241088867, 14.10031509399414, 14.63093090057373, 15.16154670715332, 15.692161560058594, 16.222776412963867, 16.753393173217773, 17.284008026123047, 17.81462287902832, 18.345239639282227, 18.8758544921875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 7.0, 11.0, 9.0, 10.0, 18.0, 21.0, 35.0, 49.0, 73.0, 109.0, 173.0, 263.0, 420.0, 921.0, 2206.0, 9065.0, 122990.0, 860651.0, 42795.0, 5305.0, 1625.0, 724.0, 421.0, 227.0, 141.0, 79.0, 65.0, 51.0, 24.0, 12.0, 25.0, 8.0, 4.0, 7.0, 3.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.71875, -54.9091796875, -53.099609375, -51.2900390625, -49.48046875, -47.6708984375, -45.861328125, -44.0517578125, -42.2421875, -40.4326171875, -38.623046875, -36.8134765625, -35.00390625, -33.1943359375, -31.384765625, -29.5751953125, -27.765625, -25.9560546875, -24.146484375, -22.3369140625, -20.52734375, -18.7177734375, -16.908203125, -15.0986328125, -13.2890625, -11.4794921875, -9.669921875, -7.8603515625, -6.05078125, -4.2412109375, -2.431640625, -0.6220703125, 1.1875, 2.9970703125, 4.806640625, 6.6162109375, 8.42578125, 10.2353515625, 12.044921875, 13.8544921875, 15.6640625, 17.4736328125, 19.283203125, 21.0927734375, 22.90234375, 24.7119140625, 26.521484375, 28.3310546875, 30.140625, 31.9501953125, 33.759765625, 35.5693359375, 37.37890625, 39.1884765625, 40.998046875, 42.8076171875, 44.6171875, 46.4267578125, 48.236328125, 50.0458984375, 51.85546875, 53.6650390625, 55.474609375, 57.2841796875, 59.09375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 9.0, 18.0, 39.0, 79.0, 162.0, 259.0, 226.0, 104.0, 54.0, 18.0, 7.0, 4.0, 6.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5078125, -4.34478759765625, -4.1817626953125, -4.01873779296875, -3.855712890625, -3.69268798828125, -3.5296630859375, -3.36663818359375, -3.20361328125, -3.04058837890625, -2.8775634765625, -2.71453857421875, -2.551513671875, -2.38848876953125, -2.2254638671875, -2.06243896484375, -1.8994140625, -1.73638916015625, -1.5733642578125, -1.41033935546875, -1.247314453125, -1.08428955078125, -0.9212646484375, -0.75823974609375, -0.59521484375, -0.43218994140625, -0.2691650390625, -0.10614013671875, 0.056884765625, 0.21990966796875, 0.3829345703125, 0.54595947265625, 0.708984375, 0.87200927734375, 1.0350341796875, 1.19805908203125, 1.361083984375, 1.52410888671875, 1.6871337890625, 1.85015869140625, 2.01318359375, 2.17620849609375, 2.3392333984375, 2.50225830078125, 2.665283203125, 2.82830810546875, 2.9913330078125, 3.15435791015625, 3.3173828125, 3.48040771484375, 3.6434326171875, 3.80645751953125, 3.969482421875, 4.13250732421875, 4.2955322265625, 4.45855712890625, 4.62158203125, 4.78460693359375, 4.9476318359375, 5.11065673828125, 5.273681640625, 5.43670654296875, 5.5997314453125, 5.76275634765625, 5.92578125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 10.0, 18.0, 19.0, 25.0, 31.0, 59.0, 56.0, 102.0, 148.0, 180.0, 239.0, 366.0, 525.0, 892.0, 1685.0, 3534.0, 8712.0, 28329.0, 120477.0, 473943.0, 313099.0, 66348.0, 17475.0, 5960.0, 2660.0, 1310.0, 775.0, 496.0, 294.0, 214.0, 145.0, 108.0, 90.0, 47.0, 31.0, 36.0, 27.0, 27.0, 12.0, 5.0, 4.0, 8.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-26.828125, -26.03466796875, -25.2412109375, -24.44775390625, -23.654296875, -22.86083984375, -22.0673828125, -21.27392578125, -20.48046875, -19.68701171875, -18.8935546875, -18.10009765625, -17.306640625, -16.51318359375, -15.7197265625, -14.92626953125, -14.1328125, -13.33935546875, -12.5458984375, -11.75244140625, -10.958984375, -10.16552734375, -9.3720703125, -8.57861328125, -7.78515625, -6.99169921875, -6.1982421875, -5.40478515625, -4.611328125, -3.81787109375, -3.0244140625, -2.23095703125, -1.4375, -0.64404296875, 0.1494140625, 0.94287109375, 1.736328125, 2.52978515625, 3.3232421875, 4.11669921875, 4.91015625, 5.70361328125, 6.4970703125, 7.29052734375, 8.083984375, 8.87744140625, 9.6708984375, 10.46435546875, 11.2578125, 12.05126953125, 12.8447265625, 13.63818359375, 14.431640625, 15.22509765625, 16.0185546875, 16.81201171875, 17.60546875, 18.39892578125, 19.1923828125, 19.98583984375, 20.779296875, 21.57275390625, 22.3662109375, 23.15966796875, 23.953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 6.0, 8.0, 7.0, 4.0, 7.0, 9.0, 13.0, 13.0, 18.0, 18.0, 22.0, 36.0, 39.0, 35.0, 38.0, 34.0, 30.0, 38.0, 55.0, 48.0, 44.0, 49.0, 46.0, 42.0, 39.0, 36.0, 38.0, 40.0, 24.0, 25.0, 21.0, 18.0, 15.0, 18.0, 16.0, 4.0, 7.0, 4.0, 3.0, 8.0, 4.0, 2.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.953125, -9.62744140625, -9.3017578125, -8.97607421875, -8.650390625, -8.32470703125, -7.9990234375, -7.67333984375, -7.34765625, -7.02197265625, -6.6962890625, -6.37060546875, -6.044921875, -5.71923828125, -5.3935546875, -5.06787109375, -4.7421875, -4.41650390625, -4.0908203125, -3.76513671875, -3.439453125, -3.11376953125, -2.7880859375, -2.46240234375, -2.13671875, -1.81103515625, -1.4853515625, -1.15966796875, -0.833984375, -0.50830078125, -0.1826171875, 0.14306640625, 0.46875, 0.79443359375, 1.1201171875, 1.44580078125, 1.771484375, 2.09716796875, 2.4228515625, 2.74853515625, 3.07421875, 3.39990234375, 3.7255859375, 4.05126953125, 4.376953125, 4.70263671875, 5.0283203125, 5.35400390625, 5.6796875, 6.00537109375, 6.3310546875, 6.65673828125, 6.982421875, 7.30810546875, 7.6337890625, 7.95947265625, 8.28515625, 8.61083984375, 8.9365234375, 9.26220703125, 9.587890625, 9.91357421875, 10.2392578125, 10.56494140625, 10.890625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 4.0, 7.0, 7.0, 11.0, 12.0, 18.0, 33.0, 39.0, 97.0, 140.0, 271.0, 528.0, 1483.0, 5554.0, 34603.0, 533011.0, 436162.0, 29089.0, 4995.0, 1388.0, 528.0, 230.0, 145.0, 72.0, 40.0, 28.0, 18.0, 11.0, 9.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-46.1875, -45.001953125, -43.81640625, -42.630859375, -41.4453125, -40.259765625, -39.07421875, -37.888671875, -36.703125, -35.517578125, -34.33203125, -33.146484375, -31.9609375, -30.775390625, -29.58984375, -28.404296875, -27.21875, -26.033203125, -24.84765625, -23.662109375, -22.4765625, -21.291015625, -20.10546875, -18.919921875, -17.734375, -16.548828125, -15.36328125, -14.177734375, -12.9921875, -11.806640625, -10.62109375, -9.435546875, -8.25, -7.064453125, -5.87890625, -4.693359375, -3.5078125, -2.322265625, -1.13671875, 0.048828125, 1.234375, 2.419921875, 3.60546875, 4.791015625, 5.9765625, 7.162109375, 8.34765625, 9.533203125, 10.71875, 11.904296875, 13.08984375, 14.275390625, 15.4609375, 16.646484375, 17.83203125, 19.017578125, 20.203125, 21.388671875, 22.57421875, 23.759765625, 24.9453125, 26.130859375, 27.31640625, 28.501953125, 29.6875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 13.0, 12.0, 18.0, 19.0, 25.0, 31.0, 72.0, 66.0, 79.0, 104.0, 104.0, 91.0, 81.0, 63.0, 48.0, 41.0, 35.0, 28.0, 17.0, 12.0, 5.0, 10.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001438140869140625, -0.0013911277055740356, -0.0013441145420074463, -0.001297101378440857, -0.0012500882148742676, -0.0012030750513076782, -0.0011560618877410889, -0.0011090487241744995, -0.0010620355606079102, -0.0010150223970413208, -0.0009680092334747314, -0.0009209960699081421, -0.0008739829063415527, -0.0008269697427749634, -0.000779956579208374, -0.0007329434156417847, -0.0006859302520751953, -0.000638917088508606, -0.0005919039249420166, -0.0005448907613754272, -0.0004978775978088379, -0.00045086443424224854, -0.0004038512706756592, -0.0003568381071090698, -0.00030982494354248047, -0.0002628117799758911, -0.00021579861640930176, -0.0001687854528427124, -0.00012177228927612305, -7.475912570953369e-05, -2.7745962142944336e-05, 1.926720142364502e-05, 6.628036499023438e-05, 0.00011329352855682373, 0.00016030669212341309, 0.00020731985569000244, 0.0002543330192565918, 0.00030134618282318115, 0.0003483593463897705, 0.00039537250995635986, 0.0004423856735229492, 0.0004893988370895386, 0.0005364120006561279, 0.0005834251642227173, 0.0006304383277893066, 0.000677451491355896, 0.0007244646549224854, 0.0007714778184890747, 0.0008184909820556641, 0.0008655041456222534, 0.0009125173091888428, 0.0009595304727554321, 0.0010065436363220215, 0.0010535567998886108, 0.0011005699634552002, 0.0011475831270217896, 0.001194596290588379, 0.0012416094541549683, 0.0012886226177215576, 0.001335635781288147, 0.0013826489448547363, 0.0014296621084213257, 0.001476675271987915, 0.0015236884355545044, 0.0015707015991210938]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 10.0, 11.0, 11.0, 25.0, 38.0, 70.0, 101.0, 148.0, 243.0, 536.0, 1151.0, 3475.0, 15037.0, 143416.0, 786444.0, 82500.0, 10656.0, 2676.0, 945.0, 470.0, 254.0, 118.0, 69.0, 38.0, 39.0, 16.0, 18.0, 12.0, 4.0, 7.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.09375, -31.96826171875, -30.8427734375, -29.71728515625, -28.591796875, -27.46630859375, -26.3408203125, -25.21533203125, -24.08984375, -22.96435546875, -21.8388671875, -20.71337890625, -19.587890625, -18.46240234375, -17.3369140625, -16.21142578125, -15.0859375, -13.96044921875, -12.8349609375, -11.70947265625, -10.583984375, -9.45849609375, -8.3330078125, -7.20751953125, -6.08203125, -4.95654296875, -3.8310546875, -2.70556640625, -1.580078125, -0.45458984375, 0.6708984375, 1.79638671875, 2.921875, 4.04736328125, 5.1728515625, 6.29833984375, 7.423828125, 8.54931640625, 9.6748046875, 10.80029296875, 11.92578125, 13.05126953125, 14.1767578125, 15.30224609375, 16.427734375, 17.55322265625, 18.6787109375, 19.80419921875, 20.9296875, 22.05517578125, 23.1806640625, 24.30615234375, 25.431640625, 26.55712890625, 27.6826171875, 28.80810546875, 29.93359375, 31.05908203125, 32.1845703125, 33.31005859375, 34.435546875, 35.56103515625, 36.6865234375, 37.81201171875, 38.9375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 7.0, 3.0, 7.0, 9.0, 20.0, 25.0, 42.0, 55.0, 75.0, 105.0, 123.0, 138.0, 105.0, 83.0, 60.0, 45.0, 25.0, 14.0, 15.0, 13.0, 7.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-21.078125, -20.578369140625, -20.07861328125, -19.578857421875, -19.0791015625, -18.579345703125, -18.07958984375, -17.579833984375, -17.080078125, -16.580322265625, -16.08056640625, -15.580810546875, -15.0810546875, -14.581298828125, -14.08154296875, -13.581787109375, -13.08203125, -12.582275390625, -12.08251953125, -11.582763671875, -11.0830078125, -10.583251953125, -10.08349609375, -9.583740234375, -9.083984375, -8.584228515625, -8.08447265625, -7.584716796875, -7.0849609375, -6.585205078125, -6.08544921875, -5.585693359375, -5.0859375, -4.586181640625, -4.08642578125, -3.586669921875, -3.0869140625, -2.587158203125, -2.08740234375, -1.587646484375, -1.087890625, -0.588134765625, -0.08837890625, 0.411376953125, 0.9111328125, 1.410888671875, 1.91064453125, 2.410400390625, 2.91015625, 3.409912109375, 3.90966796875, 4.409423828125, 4.9091796875, 5.408935546875, 5.90869140625, 6.408447265625, 6.908203125, 7.407958984375, 7.90771484375, 8.407470703125, 8.9072265625, 9.406982421875, 9.90673828125, 10.406494140625, 10.90625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 13.0, 24.0, 80.0, 210.0, 313.0, 220.0, 68.0, 34.0, 18.0, 8.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-366.717529296875, -357.88861083984375, -349.0596923828125, -340.23077392578125, -331.40185546875, -322.57293701171875, -313.7440185546875, -304.91510009765625, -296.086181640625, -287.25726318359375, -278.4283447265625, -269.59942626953125, -260.7705078125, -251.94158935546875, -243.11265563964844, -234.2837371826172, -225.45480346679688, -216.62588500976562, -207.79696655273438, -198.96804809570312, -190.13912963867188, -181.31021118164062, -172.4812774658203, -163.65235900878906, -154.8234405517578, -145.99452209472656, -137.1656036376953, -128.33668518066406, -119.50775909423828, -110.67884063720703, -101.84991455078125, -93.02099609375, -84.19204711914062, -75.36312866210938, -66.53421020507812, -57.705284118652344, -48.876365661621094, -40.047447204589844, -31.218524932861328, -22.389602661132812, -13.560684204101562, -4.73176383972168, 4.097156524658203, 12.926076889038086, 21.75499725341797, 30.58391571044922, 39.412837982177734, 48.24176025390625, 57.0706787109375, 65.89959716796875, 74.728515625, 83.55744171142578, 92.38636016845703, 101.21527862548828, 110.04420471191406, 118.87312316894531, 127.70204162597656, 136.5309600830078, 145.35987854003906, 154.1887969970703, 163.01773071289062, 171.84664916992188, 180.67556762695312, 189.50448608398438, 198.33340454101562]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 5.0, 3.0, 12.0, 25.0, 36.0, 26.0, 31.0, 32.0, 50.0, 53.0, 66.0, 77.0, 54.0, 85.0, 60.0, 73.0, 57.0, 54.0, 37.0, 34.0, 36.0, 18.0, 26.0, 22.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-97.95089721679688, -94.25940704345703, -90.56790924072266, -86.87641906738281, -83.18492126464844, -79.4934310913086, -75.80193328857422, -72.11044311523438, -68.4189453125, -64.72745513916016, -61.03595733642578, -57.34446334838867, -53.65296936035156, -49.96147918701172, -46.269981384277344, -42.5784912109375, -38.88699722290039, -35.19550323486328, -31.504009246826172, -27.812515258789062, -24.121021270751953, -20.429529190063477, -16.738035202026367, -13.046541213989258, -9.355047225952148, -5.663553237915039, -1.972059726715088, 1.7194337844848633, 5.410927772521973, 9.102420806884766, 12.793914794921875, 16.485408782958984, 20.176902770996094, 23.868396759033203, 27.559890747070312, 31.251384735107422, 34.94287872314453, 38.634368896484375, 42.32586669921875, 46.017356872558594, 49.70885467529297, 53.40034866333008, 57.09184265136719, 60.7833366394043, 64.4748306274414, 68.16632080078125, 71.85781860351562, 75.54930877685547, 79.24079895019531, 82.93228912353516, 86.62378692626953, 90.31527709960938, 94.00677490234375, 97.6982650756836, 101.38976287841797, 105.08125305175781, 108.77275085449219, 112.46424102783203, 116.1557388305664, 119.84722900390625, 123.53872680664062, 127.23021697998047, 130.9217071533203, 134.6132049560547, 138.30470275878906]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 9.0, 16.0, 26.0, 52.0, 161.0, 458.0, 2363.0, 4105409.0, 83843.0, 1330.0, 348.0, 145.0, 55.0, 25.0, 17.0, 10.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-215.75, -207.71875, -199.6875, -191.65625, -183.625, -175.59375, -167.5625, -159.53125, -151.5, -143.46875, -135.4375, -127.40625, -119.375, -111.34375, -103.3125, -95.28125, -87.25, -79.21875, -71.1875, -63.15625, -55.125, -47.09375, -39.0625, -31.03125, -23.0, -14.96875, -6.9375, 1.09375, 9.125, 17.15625, 25.1875, 33.21875, 41.25, 49.28125, 57.3125, 65.34375, 73.375, 81.40625, 89.4375, 97.46875, 105.5, 113.53125, 121.5625, 129.59375, 137.625, 145.65625, 153.6875, 161.71875, 169.75, 177.78125, 185.8125, 193.84375, 201.875, 209.90625, 217.9375, 225.96875, 234.0, 242.03125, 250.0625, 258.09375, 266.125, 274.15625, 282.1875, 290.21875, 298.25]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 12.0, 19.0, 44.0, 83.0, 121.0, 158.0, 197.0, 145.0, 101.0, 55.0, 23.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.75189208984375, -4.5701904296875, -4.38848876953125, -4.206787109375, -4.02508544921875, -3.8433837890625, -3.66168212890625, -3.47998046875, -3.29827880859375, -3.1165771484375, -2.93487548828125, -2.753173828125, -2.57147216796875, -2.3897705078125, -2.20806884765625, -2.0263671875, -1.84466552734375, -1.6629638671875, -1.48126220703125, -1.299560546875, -1.11785888671875, -0.9361572265625, -0.75445556640625, -0.57275390625, -0.39105224609375, -0.2093505859375, -0.02764892578125, 0.154052734375, 0.33575439453125, 0.5174560546875, 0.69915771484375, 0.880859375, 1.06256103515625, 1.2442626953125, 1.42596435546875, 1.607666015625, 1.78936767578125, 1.9710693359375, 2.15277099609375, 2.33447265625, 2.51617431640625, 2.6978759765625, 2.87957763671875, 3.061279296875, 3.24298095703125, 3.4246826171875, 3.60638427734375, 3.7880859375, 3.96978759765625, 4.1514892578125, 4.33319091796875, 4.514892578125, 4.69659423828125, 4.8782958984375, 5.05999755859375, 5.24169921875, 5.42340087890625, 5.6051025390625, 5.78680419921875, 5.968505859375, 6.15020751953125, 6.3319091796875, 6.51361083984375, 6.6953125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 15.0, 12.0, 11.0, 24.0, 41.0, 66.0, 114.0, 220.0, 525.0, 1688.0, 6724.0, 37243.0, 722622.0, 3349474.0, 61896.0, 9717.0, 2402.0, 747.0, 311.0, 121.0, 86.0, 40.0, 28.0, 38.0, 22.0, 22.0, 8.0, 9.0, 6.0, 7.0, 8.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.28125, -38.89794921875, -37.5146484375, -36.13134765625, -34.748046875, -33.36474609375, -31.9814453125, -30.59814453125, -29.21484375, -27.83154296875, -26.4482421875, -25.06494140625, -23.681640625, -22.29833984375, -20.9150390625, -19.53173828125, -18.1484375, -16.76513671875, -15.3818359375, -13.99853515625, -12.615234375, -11.23193359375, -9.8486328125, -8.46533203125, -7.08203125, -5.69873046875, -4.3154296875, -2.93212890625, -1.548828125, -0.16552734375, 1.2177734375, 2.60107421875, 3.984375, 5.36767578125, 6.7509765625, 8.13427734375, 9.517578125, 10.90087890625, 12.2841796875, 13.66748046875, 15.05078125, 16.43408203125, 17.8173828125, 19.20068359375, 20.583984375, 21.96728515625, 23.3505859375, 24.73388671875, 26.1171875, 27.50048828125, 28.8837890625, 30.26708984375, 31.650390625, 33.03369140625, 34.4169921875, 35.80029296875, 37.18359375, 38.56689453125, 39.9501953125, 41.33349609375, 42.716796875, 44.10009765625, 45.4833984375, 46.86669921875, 48.25]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 1.0, 4.0, 11.0, 6.0, 15.0, 22.0, 21.0, 20.0, 56.0, 73.0, 107.0, 193.0, 477.0, 1848.0, 598.0, 252.0, 134.0, 67.0, 40.0, 39.0, 27.0, 15.0, 10.0, 5.0, 9.0, 1.0, 6.0, 7.0, 7.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8671875, -4.69110107421875, -4.5150146484375, -4.33892822265625, -4.162841796875, -3.98675537109375, -3.8106689453125, -3.63458251953125, -3.45849609375, -3.28240966796875, -3.1063232421875, -2.93023681640625, -2.754150390625, -2.57806396484375, -2.4019775390625, -2.22589111328125, -2.0498046875, -1.87371826171875, -1.6976318359375, -1.52154541015625, -1.345458984375, -1.16937255859375, -0.9932861328125, -0.81719970703125, -0.64111328125, -0.46502685546875, -0.2889404296875, -0.11285400390625, 0.063232421875, 0.23931884765625, 0.4154052734375, 0.59149169921875, 0.767578125, 0.94366455078125, 1.1197509765625, 1.29583740234375, 1.471923828125, 1.64801025390625, 1.8240966796875, 2.00018310546875, 2.17626953125, 2.35235595703125, 2.5284423828125, 2.70452880859375, 2.880615234375, 3.05670166015625, 3.2327880859375, 3.40887451171875, 3.5849609375, 3.76104736328125, 3.9371337890625, 4.11322021484375, 4.289306640625, 4.46539306640625, 4.6414794921875, 4.81756591796875, 4.99365234375, 5.16973876953125, 5.3458251953125, 5.52191162109375, 5.697998046875, 5.87408447265625, 6.0501708984375, 6.22625732421875, 6.40234375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 7.0, 32.0, 81.0, 204.0, 300.0, 193.0, 109.0, 37.0, 16.0, 9.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.83592987060547, -79.59486389160156, -77.35379028320312, -75.11272430419922, -72.87165069580078, -70.63058471679688, -68.38951110839844, -66.14844512939453, -63.907379150390625, -61.66630935668945, -59.42523956298828, -57.184173583984375, -54.9431037902832, -52.70203399658203, -50.46096420288086, -48.21989440917969, -45.978824615478516, -43.737754821777344, -41.49668502807617, -39.255615234375, -37.014549255371094, -34.77347946166992, -32.53240966796875, -30.291339874267578, -28.05027198791504, -25.809202194213867, -23.568134307861328, -21.327064514160156, -19.085994720458984, -16.844926834106445, -14.603857040405273, -12.362788200378418, -10.121723175048828, -7.880654335021973, -5.639585018157959, -3.3985157012939453, -1.1574468612670898, 1.0836219787597656, 3.3246917724609375, 5.565760612487793, 7.806829452514648, 10.047898292541504, 12.28896713256836, 14.530036926269531, 16.771106719970703, 19.012174606323242, 21.253244400024414, 23.494312286376953, 25.735382080078125, 27.976451873779297, 30.217519760131836, 32.458587646484375, 34.69965744018555, 36.94072723388672, 39.18179702758789, 41.42286682128906, 43.66393280029297, 45.90500259399414, 48.14607238769531, 50.38713836669922, 52.62820816040039, 54.86927795410156, 57.110347747802734, 59.351417541503906, 61.59248733520508]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 5.0, 9.0, 16.0, 12.0, 14.0, 18.0, 20.0, 24.0, 37.0, 36.0, 31.0, 40.0, 36.0, 39.0, 51.0, 39.0, 52.0, 44.0, 48.0, 44.0, 48.0, 44.0, 34.0, 33.0, 28.0, 37.0, 27.0, 31.0, 21.0, 17.0, 11.0, 10.0, 7.0, 3.0, 8.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-18.93552017211914, -18.376623153686523, -17.817724227905273, -17.258827209472656, -16.69993019104004, -16.141033172607422, -15.582134246826172, -15.023237228393555, -14.464340209960938, -13.905442237854004, -13.346545219421387, -12.787647247314453, -12.228750228881836, -11.669852256774902, -11.110954284667969, -10.552057266235352, -9.993159294128418, -9.434261322021484, -8.875364303588867, -8.316466331481934, -7.757569313049316, -7.198671340942383, -6.639773845672607, -6.080876350402832, -5.521978855133057, -4.963081359863281, -4.404183864593506, -3.8452861309051514, -3.286388635635376, -2.7274911403656006, -2.168593406677246, -1.6096959114074707, -1.0507984161376953, -0.49190086126327515, 0.06699669361114502, 0.62589430809021, 1.1847918033599854, 1.7436892986297607, 2.3025870323181152, 2.8614845275878906, 3.420382022857666, 3.9792795181274414, 4.538177013397217, 5.097074508666992, 5.655972480773926, 6.214869499206543, 6.773767471313477, 7.332664966583252, 7.891562461853027, 8.450460433959961, 9.009357452392578, 9.568255424499512, 10.127152442932129, 10.686050415039062, 11.24494743347168, 11.803845405578613, 12.362743377685547, 12.92164134979248, 13.480538368225098, 14.039436340332031, 14.598333358764648, 15.157231330871582, 15.716129302978516, 16.275026321411133, 16.83392333984375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 0.0, 7.0, 4.0, 9.0, 9.0, 9.0, 12.0, 16.0, 24.0, 42.0, 52.0, 75.0, 100.0, 129.0, 204.0, 305.0, 519.0, 948.0, 2078.0, 5963.0, 32558.0, 379213.0, 561602.0, 51276.0, 8138.0, 2495.0, 1076.0, 587.0, 354.0, 222.0, 151.0, 104.0, 72.0, 52.0, 41.0, 27.0, 24.0, 13.0, 11.0, 11.0, 5.0, 4.0, 8.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-42.78125, -41.52685546875, -40.2724609375, -39.01806640625, -37.763671875, -36.50927734375, -35.2548828125, -34.00048828125, -32.74609375, -31.49169921875, -30.2373046875, -28.98291015625, -27.728515625, -26.47412109375, -25.2197265625, -23.96533203125, -22.7109375, -21.45654296875, -20.2021484375, -18.94775390625, -17.693359375, -16.43896484375, -15.1845703125, -13.93017578125, -12.67578125, -11.42138671875, -10.1669921875, -8.91259765625, -7.658203125, -6.40380859375, -5.1494140625, -3.89501953125, -2.640625, -1.38623046875, -0.1318359375, 1.12255859375, 2.376953125, 3.63134765625, 4.8857421875, 6.14013671875, 7.39453125, 8.64892578125, 9.9033203125, 11.15771484375, 12.412109375, 13.66650390625, 14.9208984375, 16.17529296875, 17.4296875, 18.68408203125, 19.9384765625, 21.19287109375, 22.447265625, 23.70166015625, 24.9560546875, 26.21044921875, 27.46484375, 28.71923828125, 29.9736328125, 31.22802734375, 32.482421875, 33.73681640625, 34.9912109375, 36.24560546875, 37.5]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 4.0, 11.0, 22.0, 39.0, 67.0, 113.0, 123.0, 188.0, 169.0, 123.0, 73.0, 31.0, 15.0, 12.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.90875244140625, -4.7237548828125, -4.53875732421875, -4.353759765625, -4.16876220703125, -3.9837646484375, -3.79876708984375, -3.61376953125, -3.42877197265625, -3.2437744140625, -3.05877685546875, -2.873779296875, -2.68878173828125, -2.5037841796875, -2.31878662109375, -2.1337890625, -1.94879150390625, -1.7637939453125, -1.57879638671875, -1.393798828125, -1.20880126953125, -1.0238037109375, -0.83880615234375, -0.65380859375, -0.46881103515625, -0.2838134765625, -0.09881591796875, 0.086181640625, 0.27117919921875, 0.4561767578125, 0.64117431640625, 0.826171875, 1.01116943359375, 1.1961669921875, 1.38116455078125, 1.566162109375, 1.75115966796875, 1.9361572265625, 2.12115478515625, 2.30615234375, 2.49114990234375, 2.6761474609375, 2.86114501953125, 3.046142578125, 3.23114013671875, 3.4161376953125, 3.60113525390625, 3.7861328125, 3.97113037109375, 4.1561279296875, 4.34112548828125, 4.526123046875, 4.71112060546875, 4.8961181640625, 5.08111572265625, 5.26611328125, 5.45111083984375, 5.6361083984375, 5.82110595703125, 6.006103515625, 6.19110107421875, 6.3760986328125, 6.56109619140625, 6.74609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 4.0, 3.0, 13.0, 8.0, 10.0, 16.0, 34.0, 33.0, 49.0, 73.0, 92.0, 125.0, 166.0, 256.0, 409.0, 700.0, 1155.0, 2421.0, 6074.0, 20643.0, 99771.0, 501075.0, 335236.0, 57906.0, 13482.0, 4366.0, 1847.0, 945.0, 541.0, 369.0, 208.0, 155.0, 107.0, 63.0, 59.0, 39.0, 34.0, 23.0, 7.0, 6.0, 13.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-34.8125, -33.892578125, -32.97265625, -32.052734375, -31.1328125, -30.212890625, -29.29296875, -28.373046875, -27.453125, -26.533203125, -25.61328125, -24.693359375, -23.7734375, -22.853515625, -21.93359375, -21.013671875, -20.09375, -19.173828125, -18.25390625, -17.333984375, -16.4140625, -15.494140625, -14.57421875, -13.654296875, -12.734375, -11.814453125, -10.89453125, -9.974609375, -9.0546875, -8.134765625, -7.21484375, -6.294921875, -5.375, -4.455078125, -3.53515625, -2.615234375, -1.6953125, -0.775390625, 0.14453125, 1.064453125, 1.984375, 2.904296875, 3.82421875, 4.744140625, 5.6640625, 6.583984375, 7.50390625, 8.423828125, 9.34375, 10.263671875, 11.18359375, 12.103515625, 13.0234375, 13.943359375, 14.86328125, 15.783203125, 16.703125, 17.623046875, 18.54296875, 19.462890625, 20.3828125, 21.302734375, 22.22265625, 23.142578125, 24.0625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 9.0, 5.0, 3.0, 6.0, 11.0, 8.0, 15.0, 26.0, 30.0, 27.0, 34.0, 47.0, 48.0, 62.0, 59.0, 61.0, 53.0, 57.0, 60.0, 43.0, 44.0, 47.0, 42.0, 30.0, 32.0, 34.0, 22.0, 25.0, 18.0, 15.0, 11.0, 8.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.700927734375, -17.16748046875, -16.634033203125, -16.1005859375, -15.567138671875, -15.03369140625, -14.500244140625, -13.966796875, -13.433349609375, -12.89990234375, -12.366455078125, -11.8330078125, -11.299560546875, -10.76611328125, -10.232666015625, -9.69921875, -9.165771484375, -8.63232421875, -8.098876953125, -7.5654296875, -7.031982421875, -6.49853515625, -5.965087890625, -5.431640625, -4.898193359375, -4.36474609375, -3.831298828125, -3.2978515625, -2.764404296875, -2.23095703125, -1.697509765625, -1.1640625, -0.630615234375, -0.09716796875, 0.436279296875, 0.9697265625, 1.503173828125, 2.03662109375, 2.570068359375, 3.103515625, 3.636962890625, 4.17041015625, 4.703857421875, 5.2373046875, 5.770751953125, 6.30419921875, 6.837646484375, 7.37109375, 7.904541015625, 8.43798828125, 8.971435546875, 9.5048828125, 10.038330078125, 10.57177734375, 11.105224609375, 11.638671875, 12.172119140625, 12.70556640625, 13.239013671875, 13.7724609375, 14.305908203125, 14.83935546875, 15.372802734375, 15.90625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 7.0, 15.0, 10.0, 14.0, 20.0, 33.0, 32.0, 50.0, 65.0, 122.0, 181.0, 352.0, 730.0, 2070.0, 6783.0, 38530.0, 681622.0, 290337.0, 20339.0, 4429.0, 1456.0, 616.0, 286.0, 150.0, 82.0, 48.0, 42.0, 28.0, 27.0, 20.0, 12.0, 13.0, 9.0, 4.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0], "bins": [-51.0, -49.61572265625, -48.2314453125, -46.84716796875, -45.462890625, -44.07861328125, -42.6943359375, -41.31005859375, -39.92578125, -38.54150390625, -37.1572265625, -35.77294921875, -34.388671875, -33.00439453125, -31.6201171875, -30.23583984375, -28.8515625, -27.46728515625, -26.0830078125, -24.69873046875, -23.314453125, -21.93017578125, -20.5458984375, -19.16162109375, -17.77734375, -16.39306640625, -15.0087890625, -13.62451171875, -12.240234375, -10.85595703125, -9.4716796875, -8.08740234375, -6.703125, -5.31884765625, -3.9345703125, -2.55029296875, -1.166015625, 0.21826171875, 1.6025390625, 2.98681640625, 4.37109375, 5.75537109375, 7.1396484375, 8.52392578125, 9.908203125, 11.29248046875, 12.6767578125, 14.06103515625, 15.4453125, 16.82958984375, 18.2138671875, 19.59814453125, 20.982421875, 22.36669921875, 23.7509765625, 25.13525390625, 26.51953125, 27.90380859375, 29.2880859375, 30.67236328125, 32.056640625, 33.44091796875, 34.8251953125, 36.20947265625, 37.59375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 12.0, 11.0, 9.0, 29.0, 27.0, 46.0, 59.0, 90.0, 103.0, 142.0, 124.0, 96.0, 76.0, 54.0, 33.0, 25.0, 18.0, 15.0, 8.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002017974853515625, -0.0019543468952178955, -0.001890718936920166, -0.0018270909786224365, -0.001763463020324707, -0.0016998350620269775, -0.001636207103729248, -0.0015725791454315186, -0.001508951187133789, -0.0014453232288360596, -0.00138169527053833, -0.0013180673122406006, -0.001254439353942871, -0.0011908113956451416, -0.0011271834373474121, -0.0010635554790496826, -0.0009999275207519531, -0.0009362995624542236, -0.0008726716041564941, -0.0008090436458587646, -0.0007454156875610352, -0.0006817877292633057, -0.0006181597709655762, -0.0005545318126678467, -0.0004909038543701172, -0.0004272758960723877, -0.0003636479377746582, -0.0003000199794769287, -0.00023639202117919922, -0.00017276406288146973, -0.00010913610458374023, -4.550814628601074e-05, 1.811981201171875e-05, 8.174777030944824e-05, 0.00014537572860717773, 0.00020900368690490723, 0.0002726316452026367, 0.0003362596035003662, 0.0003998875617980957, 0.0004635155200958252, 0.0005271434783935547, 0.0005907714366912842, 0.0006543993949890137, 0.0007180273532867432, 0.0007816553115844727, 0.0008452832698822021, 0.0009089112281799316, 0.0009725391864776611, 0.0010361671447753906, 0.0010997951030731201, 0.0011634230613708496, 0.001227051019668579, 0.0012906789779663086, 0.001354306936264038, 0.0014179348945617676, 0.001481562852859497, 0.0015451908111572266, 0.001608818769454956, 0.0016724467277526855, 0.001736074686050415, 0.0017997026443481445, 0.001863330602645874, 0.0019269585609436035, 0.001990586519241333, 0.0020542144775390625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 3.0, 12.0, 14.0, 16.0, 27.0, 24.0, 38.0, 45.0, 63.0, 111.0, 168.0, 290.0, 520.0, 1198.0, 3234.0, 11302.0, 62890.0, 664073.0, 265835.0, 28238.0, 6435.0, 2027.0, 864.0, 405.0, 237.0, 130.0, 91.0, 61.0, 49.0, 43.0, 20.0, 19.0, 10.0, 13.0, 9.0, 10.0, 6.0, 4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-35.0625, -33.9931640625, -32.923828125, -31.8544921875, -30.78515625, -29.7158203125, -28.646484375, -27.5771484375, -26.5078125, -25.4384765625, -24.369140625, -23.2998046875, -22.23046875, -21.1611328125, -20.091796875, -19.0224609375, -17.953125, -16.8837890625, -15.814453125, -14.7451171875, -13.67578125, -12.6064453125, -11.537109375, -10.4677734375, -9.3984375, -8.3291015625, -7.259765625, -6.1904296875, -5.12109375, -4.0517578125, -2.982421875, -1.9130859375, -0.84375, 0.2255859375, 1.294921875, 2.3642578125, 3.43359375, 4.5029296875, 5.572265625, 6.6416015625, 7.7109375, 8.7802734375, 9.849609375, 10.9189453125, 11.98828125, 13.0576171875, 14.126953125, 15.1962890625, 16.265625, 17.3349609375, 18.404296875, 19.4736328125, 20.54296875, 21.6123046875, 22.681640625, 23.7509765625, 24.8203125, 25.8896484375, 26.958984375, 28.0283203125, 29.09765625, 30.1669921875, 31.236328125, 32.3056640625, 33.375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 4.0, 4.0, 7.0, 8.0, 10.0, 11.0, 18.0, 17.0, 37.0, 34.0, 62.0, 66.0, 81.0, 129.0, 119.0, 92.0, 70.0, 43.0, 41.0, 28.0, 28.0, 23.0, 15.0, 10.0, 2.0, 7.0, 9.0, 6.0, 3.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.265625, -14.756103515625, -14.24658203125, -13.737060546875, -13.2275390625, -12.718017578125, -12.20849609375, -11.698974609375, -11.189453125, -10.679931640625, -10.17041015625, -9.660888671875, -9.1513671875, -8.641845703125, -8.13232421875, -7.622802734375, -7.11328125, -6.603759765625, -6.09423828125, -5.584716796875, -5.0751953125, -4.565673828125, -4.05615234375, -3.546630859375, -3.037109375, -2.527587890625, -2.01806640625, -1.508544921875, -0.9990234375, -0.489501953125, 0.02001953125, 0.529541015625, 1.0390625, 1.548583984375, 2.05810546875, 2.567626953125, 3.0771484375, 3.586669921875, 4.09619140625, 4.605712890625, 5.115234375, 5.624755859375, 6.13427734375, 6.643798828125, 7.1533203125, 7.662841796875, 8.17236328125, 8.681884765625, 9.19140625, 9.700927734375, 10.21044921875, 10.719970703125, 11.2294921875, 11.739013671875, 12.24853515625, 12.758056640625, 13.267578125, 13.777099609375, 14.28662109375, 14.796142578125, 15.3056640625, 15.815185546875, 16.32470703125, 16.834228515625, 17.34375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 14.0, 25.0, 63.0, 109.0, 186.0, 236.0, 162.0, 92.0, 49.0, 25.0, 16.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-268.768310546875, -260.9114074707031, -253.05450439453125, -245.1975860595703, -237.34068298339844, -229.48377990722656, -221.6268768310547, -213.76995849609375, -205.91305541992188, -198.05615234375, -190.19924926757812, -182.3423309326172, -174.4854278564453, -166.62852478027344, -158.77162170410156, -150.91470336914062, -143.05780029296875, -135.20089721679688, -127.34398651123047, -119.4870834350586, -111.63017272949219, -103.77326965332031, -95.91636657714844, -88.05945587158203, -80.20256042480469, -72.34565734863281, -64.4887466430664, -56.63184356689453, -48.774932861328125, -40.91802978515625, -33.06112289428711, -25.20421600341797, -17.347305297851562, -9.490398406982422, -1.6334924697875977, 6.223413467407227, 14.080320358276367, 21.937225341796875, 29.794132232666016, 37.651039123535156, 45.5079460144043, 53.36485290527344, 61.22175979614258, 69.07866668701172, 76.9355697631836, 84.79248046875, 92.64938354492188, 100.50628662109375, 108.36319732666016, 116.22010040283203, 124.07701110839844, 131.9339141845703, 139.7908172607422, 147.64773559570312, 155.504638671875, 163.36154174804688, 171.21844482421875, 179.07534790039062, 186.9322509765625, 194.78916931152344, 202.6460723876953, 210.5029754638672, 218.35987854003906, 226.216796875, 234.07369995117188]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 12.0, 19.0, 23.0, 29.0, 33.0, 41.0, 52.0, 44.0, 49.0, 54.0, 67.0, 68.0, 66.0, 50.0, 60.0, 60.0, 50.0, 48.0, 44.0, 27.0, 19.0, 24.0, 14.0, 9.0, 10.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.94523620605469, -98.15853118896484, -93.37183380126953, -88.58512878417969, -83.79843139648438, -79.01172637939453, -74.22502136230469, -69.43832397460938, -64.65161895751953, -59.86491775512695, -55.078216552734375, -50.29151153564453, -45.50481033325195, -40.718109130859375, -35.93140411376953, -31.144702911376953, -26.358001708984375, -21.571300506591797, -16.784597396850586, -11.997895240783691, -7.211193084716797, -2.4244918823242188, 2.362211227416992, 7.148914337158203, 11.935615539550781, 16.72231674194336, 21.50901985168457, 26.29572296142578, 31.08242416381836, 35.86912536621094, 40.65583038330078, 45.44253158569336, 50.229248046875, 55.01594924926758, 59.802650451660156, 64.58935546875, 69.37605285644531, 74.16275787353516, 78.949462890625, 83.73616027832031, 88.52286529541016, 93.3095703125, 98.09626770019531, 102.88297271728516, 107.669677734375, 112.45637512207031, 117.24308013916016, 122.02978515625, 126.81648254394531, 131.60317993164062, 136.389892578125, 141.1765899658203, 145.96328735351562, 150.75, 155.5366973876953, 160.32339477539062, 165.110107421875, 169.8968048095703, 174.6835174560547, 179.47021484375, 184.2569122314453, 189.04360961914062, 193.830322265625, 198.6170196533203, 203.40371704101562]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 5.0, 9.0, 19.0, 23.0, 44.0, 90.0, 132.0, 279.0, 665.0, 2764.0, 22931.0, 3994752.0, 162072.0, 7597.0, 1596.0, 622.0, 284.0, 163.0, 75.0, 56.0, 24.0, 26.0, 18.0, 11.0, 5.0, 3.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.1875, -68.712890625, -66.23828125, -63.763671875, -61.2890625, -58.814453125, -56.33984375, -53.865234375, -51.390625, -48.916015625, -46.44140625, -43.966796875, -41.4921875, -39.017578125, -36.54296875, -34.068359375, -31.59375, -29.119140625, -26.64453125, -24.169921875, -21.6953125, -19.220703125, -16.74609375, -14.271484375, -11.796875, -9.322265625, -6.84765625, -4.373046875, -1.8984375, 0.576171875, 3.05078125, 5.525390625, 8.0, 10.474609375, 12.94921875, 15.423828125, 17.8984375, 20.373046875, 22.84765625, 25.322265625, 27.796875, 30.271484375, 32.74609375, 35.220703125, 37.6953125, 40.169921875, 42.64453125, 45.119140625, 47.59375, 50.068359375, 52.54296875, 55.017578125, 57.4921875, 59.966796875, 62.44140625, 64.916015625, 67.390625, 69.865234375, 72.33984375, 74.814453125, 77.2890625, 79.763671875, 82.23828125, 84.712890625, 87.1875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 12.0, 19.0, 19.0, 21.0, 60.0, 74.0, 101.0, 128.0, 119.0, 119.0, 119.0, 77.0, 54.0, 23.0, 16.0, 14.0, 7.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.73046875, -5.52947998046875, -5.3284912109375, -5.12750244140625, -4.926513671875, -4.72552490234375, -4.5245361328125, -4.32354736328125, -4.12255859375, -3.92156982421875, -3.7205810546875, -3.51959228515625, -3.318603515625, -3.11761474609375, -2.9166259765625, -2.71563720703125, -2.5146484375, -2.31365966796875, -2.1126708984375, -1.91168212890625, -1.710693359375, -1.50970458984375, -1.3087158203125, -1.10772705078125, -0.90673828125, -0.70574951171875, -0.5047607421875, -0.30377197265625, -0.102783203125, 0.09820556640625, 0.2991943359375, 0.50018310546875, 0.701171875, 0.90216064453125, 1.1031494140625, 1.30413818359375, 1.505126953125, 1.70611572265625, 1.9071044921875, 2.10809326171875, 2.30908203125, 2.51007080078125, 2.7110595703125, 2.91204833984375, 3.113037109375, 3.31402587890625, 3.5150146484375, 3.71600341796875, 3.9169921875, 4.11798095703125, 4.3189697265625, 4.51995849609375, 4.720947265625, 4.92193603515625, 5.1229248046875, 5.32391357421875, 5.52490234375, 5.72589111328125, 5.9268798828125, 6.12786865234375, 6.328857421875, 6.52984619140625, 6.7308349609375, 6.93182373046875, 7.1328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 12.0, 9.0, 13.0, 23.0, 41.0, 63.0, 90.0, 180.0, 346.0, 642.0, 1374.0, 2893.0, 7876.0, 24333.0, 116753.0, 3111965.0, 829220.0, 70230.0, 16967.0, 5919.0, 2527.0, 1244.0, 619.0, 329.0, 225.0, 122.0, 85.0, 66.0, 38.0, 27.0, 20.0, 11.0, 6.0, 2.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.3125, -32.432861328125, -31.55322265625, -30.673583984375, -29.7939453125, -28.914306640625, -28.03466796875, -27.155029296875, -26.275390625, -25.395751953125, -24.51611328125, -23.636474609375, -22.7568359375, -21.877197265625, -20.99755859375, -20.117919921875, -19.23828125, -18.358642578125, -17.47900390625, -16.599365234375, -15.7197265625, -14.840087890625, -13.96044921875, -13.080810546875, -12.201171875, -11.321533203125, -10.44189453125, -9.562255859375, -8.6826171875, -7.802978515625, -6.92333984375, -6.043701171875, -5.1640625, -4.284423828125, -3.40478515625, -2.525146484375, -1.6455078125, -0.765869140625, 0.11376953125, 0.993408203125, 1.873046875, 2.752685546875, 3.63232421875, 4.511962890625, 5.3916015625, 6.271240234375, 7.15087890625, 8.030517578125, 8.91015625, 9.789794921875, 10.66943359375, 11.549072265625, 12.4287109375, 13.308349609375, 14.18798828125, 15.067626953125, 15.947265625, 16.826904296875, 17.70654296875, 18.586181640625, 19.4658203125, 20.345458984375, 21.22509765625, 22.104736328125, 22.984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 3.0, 6.0, 10.0, 21.0, 21.0, 16.0, 31.0, 50.0, 90.0, 144.0, 321.0, 1510.0, 1208.0, 289.0, 132.0, 76.0, 48.0, 25.0, 11.0, 13.0, 14.0, 6.0, 8.0, 4.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.109375, -5.843505859375, -5.57763671875, -5.311767578125, -5.0458984375, -4.780029296875, -4.51416015625, -4.248291015625, -3.982421875, -3.716552734375, -3.45068359375, -3.184814453125, -2.9189453125, -2.653076171875, -2.38720703125, -2.121337890625, -1.85546875, -1.589599609375, -1.32373046875, -1.057861328125, -0.7919921875, -0.526123046875, -0.26025390625, 0.005615234375, 0.271484375, 0.537353515625, 0.80322265625, 1.069091796875, 1.3349609375, 1.600830078125, 1.86669921875, 2.132568359375, 2.3984375, 2.664306640625, 2.93017578125, 3.196044921875, 3.4619140625, 3.727783203125, 3.99365234375, 4.259521484375, 4.525390625, 4.791259765625, 5.05712890625, 5.322998046875, 5.5888671875, 5.854736328125, 6.12060546875, 6.386474609375, 6.65234375, 6.918212890625, 7.18408203125, 7.449951171875, 7.7158203125, 7.981689453125, 8.24755859375, 8.513427734375, 8.779296875, 9.045166015625, 9.31103515625, 9.576904296875, 9.8427734375, 10.108642578125, 10.37451171875, 10.640380859375, 10.90625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 13.0, 22.0, 54.0, 81.0, 138.0, 207.0, 161.0, 132.0, 74.0, 35.0, 23.0, 21.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.4171142578125, -45.73039245605469, -44.04367446899414, -42.356956481933594, -40.67023468017578, -38.98351287841797, -37.29679489135742, -35.610076904296875, -33.92335510253906, -32.23663330078125, -30.549915313720703, -28.863195419311523, -27.176475524902344, -25.489755630493164, -23.803035736083984, -22.116315841674805, -20.429595947265625, -18.742876052856445, -17.056156158447266, -15.369436264038086, -13.682716369628906, -11.995996475219727, -10.309276580810547, -8.622556686401367, -6.9358367919921875, -5.249116897583008, -3.562397003173828, -1.8756771087646484, -0.18895721435546875, 1.497762680053711, 3.1844825744628906, 4.87120246887207, 6.557918548583984, 8.244638442993164, 9.931358337402344, 11.618078231811523, 13.304798126220703, 14.991518020629883, 16.678237915039062, 18.364957809448242, 20.051677703857422, 21.7383975982666, 23.42511749267578, 25.11183738708496, 26.79855728149414, 28.48527717590332, 30.1719970703125, 31.85871696472168, 33.54543685913086, 35.232154846191406, 36.91887664794922, 38.60559844970703, 40.29231643676758, 41.979034423828125, 43.66575622558594, 45.35247802734375, 47.0391960144043, 48.725914001464844, 50.412635803222656, 52.09935760498047, 53.786075592041016, 55.47279357910156, 57.159515380859375, 58.84623718261719, 60.532955169677734]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 10.0, 11.0, 14.0, 13.0, 21.0, 32.0, 32.0, 47.0, 53.0, 56.0, 56.0, 71.0, 69.0, 57.0, 52.0, 65.0, 50.0, 63.0, 48.0, 31.0, 34.0, 26.0, 20.0, 17.0, 15.0, 11.0, 8.0, 9.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.90068435668945, -40.81103515625, -39.72138214111328, -38.63173294067383, -37.54207992553711, -36.452430725097656, -35.36277770996094, -34.273128509521484, -33.18347930908203, -32.09383010864258, -31.00417709350586, -29.914527893066406, -28.82487678527832, -27.735225677490234, -26.64557456970215, -25.555923461914062, -24.466272354125977, -23.37662124633789, -22.286970138549805, -21.19731903076172, -20.107669830322266, -19.01801872253418, -17.928367614746094, -16.838716506958008, -15.749066352844238, -14.659415245056152, -13.569765090942383, -12.480113983154297, -11.390462875366211, -10.300812721252441, -9.211161613464355, -8.121511459350586, -7.0318603515625, -5.942209720611572, -4.8525590896606445, -3.7629079818725586, -2.673257350921631, -1.5836067199707031, -0.4939556121826172, 0.5956950187683105, 1.6853456497192383, 2.774996280670166, 3.864647150039673, 4.95429801940918, 6.043948650360107, 7.133599281311035, 8.223250389099121, 9.31290054321289, 10.402551651000977, 11.492202758789062, 12.581852912902832, 13.671504020690918, 14.761154174804688, 15.850805282592773, 16.94045639038086, 18.030107498168945, 19.11975860595703, 20.209409713745117, 21.299060821533203, 22.388710021972656, 23.478361129760742, 24.568012237548828, 25.657663345336914, 26.747314453125, 27.836963653564453]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 1.0, 6.0, 8.0, 10.0, 16.0, 18.0, 23.0, 27.0, 37.0, 64.0, 95.0, 129.0, 176.0, 286.0, 422.0, 764.0, 1527.0, 3770.0, 11339.0, 43551.0, 199256.0, 512889.0, 209065.0, 45507.0, 11901.0, 3979.0, 1609.0, 721.0, 455.0, 295.0, 190.0, 112.0, 68.0, 77.0, 44.0, 28.0, 27.0, 11.0, 15.0, 8.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.9375, -23.153076171875, -22.36865234375, -21.584228515625, -20.7998046875, -20.015380859375, -19.23095703125, -18.446533203125, -17.662109375, -16.877685546875, -16.09326171875, -15.308837890625, -14.5244140625, -13.739990234375, -12.95556640625, -12.171142578125, -11.38671875, -10.602294921875, -9.81787109375, -9.033447265625, -8.2490234375, -7.464599609375, -6.68017578125, -5.895751953125, -5.111328125, -4.326904296875, -3.54248046875, -2.758056640625, -1.9736328125, -1.189208984375, -0.40478515625, 0.379638671875, 1.1640625, 1.948486328125, 2.73291015625, 3.517333984375, 4.3017578125, 5.086181640625, 5.87060546875, 6.655029296875, 7.439453125, 8.223876953125, 9.00830078125, 9.792724609375, 10.5771484375, 11.361572265625, 12.14599609375, 12.930419921875, 13.71484375, 14.499267578125, 15.28369140625, 16.068115234375, 16.8525390625, 17.636962890625, 18.42138671875, 19.205810546875, 19.990234375, 20.774658203125, 21.55908203125, 22.343505859375, 23.1279296875, 23.912353515625, 24.69677734375, 25.481201171875, 26.265625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 7.0, 13.0, 18.0, 21.0, 55.0, 56.0, 86.0, 112.0, 84.0, 120.0, 117.0, 99.0, 82.0, 57.0, 29.0, 14.0, 18.0, 4.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69921875, -5.49774169921875, -5.2962646484375, -5.09478759765625, -4.893310546875, -4.69183349609375, -4.4903564453125, -4.28887939453125, -4.08740234375, -3.88592529296875, -3.6844482421875, -3.48297119140625, -3.281494140625, -3.08001708984375, -2.8785400390625, -2.67706298828125, -2.4755859375, -2.27410888671875, -2.0726318359375, -1.87115478515625, -1.669677734375, -1.46820068359375, -1.2667236328125, -1.06524658203125, -0.86376953125, -0.66229248046875, -0.4608154296875, -0.25933837890625, -0.057861328125, 0.14361572265625, 0.3450927734375, 0.54656982421875, 0.748046875, 0.94952392578125, 1.1510009765625, 1.35247802734375, 1.553955078125, 1.75543212890625, 1.9569091796875, 2.15838623046875, 2.35986328125, 2.56134033203125, 2.7628173828125, 2.96429443359375, 3.165771484375, 3.36724853515625, 3.5687255859375, 3.77020263671875, 3.9716796875, 4.17315673828125, 4.3746337890625, 4.57611083984375, 4.777587890625, 4.97906494140625, 5.1805419921875, 5.38201904296875, 5.58349609375, 5.78497314453125, 5.9864501953125, 6.18792724609375, 6.389404296875, 6.59088134765625, 6.7923583984375, 6.99383544921875, 7.1953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 7.0, 4.0, 7.0, 14.0, 25.0, 44.0, 76.0, 128.0, 223.0, 386.0, 967.0, 2780.0, 14881.0, 203210.0, 755891.0, 60224.0, 6833.0, 1583.0, 616.0, 279.0, 173.0, 91.0, 53.0, 26.0, 19.0, 9.0, 8.0, 1.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.21875, -61.60986328125, -60.0009765625, -58.39208984375, -56.783203125, -55.17431640625, -53.5654296875, -51.95654296875, -50.34765625, -48.73876953125, -47.1298828125, -45.52099609375, -43.912109375, -42.30322265625, -40.6943359375, -39.08544921875, -37.4765625, -35.86767578125, -34.2587890625, -32.64990234375, -31.041015625, -29.43212890625, -27.8232421875, -26.21435546875, -24.60546875, -22.99658203125, -21.3876953125, -19.77880859375, -18.169921875, -16.56103515625, -14.9521484375, -13.34326171875, -11.734375, -10.12548828125, -8.5166015625, -6.90771484375, -5.298828125, -3.68994140625, -2.0810546875, -0.47216796875, 1.13671875, 2.74560546875, 4.3544921875, 5.96337890625, 7.572265625, 9.18115234375, 10.7900390625, 12.39892578125, 14.0078125, 15.61669921875, 17.2255859375, 18.83447265625, 20.443359375, 22.05224609375, 23.6611328125, 25.27001953125, 26.87890625, 28.48779296875, 30.0966796875, 31.70556640625, 33.314453125, 34.92333984375, 36.5322265625, 38.14111328125, 39.75]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 8.0, 5.0, 9.0, 16.0, 11.0, 17.0, 19.0, 17.0, 31.0, 30.0, 44.0, 53.0, 60.0, 60.0, 78.0, 58.0, 64.0, 74.0, 56.0, 43.0, 49.0, 45.0, 42.0, 27.0, 23.0, 17.0, 13.0, 12.0, 12.0, 9.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.28125, -22.5087890625, -21.736328125, -20.9638671875, -20.19140625, -19.4189453125, -18.646484375, -17.8740234375, -17.1015625, -16.3291015625, -15.556640625, -14.7841796875, -14.01171875, -13.2392578125, -12.466796875, -11.6943359375, -10.921875, -10.1494140625, -9.376953125, -8.6044921875, -7.83203125, -7.0595703125, -6.287109375, -5.5146484375, -4.7421875, -3.9697265625, -3.197265625, -2.4248046875, -1.65234375, -0.8798828125, -0.107421875, 0.6650390625, 1.4375, 2.2099609375, 2.982421875, 3.7548828125, 4.52734375, 5.2998046875, 6.072265625, 6.8447265625, 7.6171875, 8.3896484375, 9.162109375, 9.9345703125, 10.70703125, 11.4794921875, 12.251953125, 13.0244140625, 13.796875, 14.5693359375, 15.341796875, 16.1142578125, 16.88671875, 17.6591796875, 18.431640625, 19.2041015625, 19.9765625, 20.7490234375, 21.521484375, 22.2939453125, 23.06640625, 23.8388671875, 24.611328125, 25.3837890625, 26.15625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 5.0, 4.0, 9.0, 5.0, 10.0, 15.0, 21.0, 30.0, 55.0, 82.0, 103.0, 227.0, 426.0, 882.0, 2554.0, 9904.0, 63066.0, 620494.0, 311818.0, 29709.0, 5889.0, 1776.0, 669.0, 336.0, 158.0, 108.0, 64.0, 40.0, 35.0, 16.0, 8.0, 8.0, 10.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.5, -21.834716796875, -21.16943359375, -20.504150390625, -19.8388671875, -19.173583984375, -18.50830078125, -17.843017578125, -17.177734375, -16.512451171875, -15.84716796875, -15.181884765625, -14.5166015625, -13.851318359375, -13.18603515625, -12.520751953125, -11.85546875, -11.190185546875, -10.52490234375, -9.859619140625, -9.1943359375, -8.529052734375, -7.86376953125, -7.198486328125, -6.533203125, -5.867919921875, -5.20263671875, -4.537353515625, -3.8720703125, -3.206787109375, -2.54150390625, -1.876220703125, -1.2109375, -0.545654296875, 0.11962890625, 0.784912109375, 1.4501953125, 2.115478515625, 2.78076171875, 3.446044921875, 4.111328125, 4.776611328125, 5.44189453125, 6.107177734375, 6.7724609375, 7.437744140625, 8.10302734375, 8.768310546875, 9.43359375, 10.098876953125, 10.76416015625, 11.429443359375, 12.0947265625, 12.760009765625, 13.42529296875, 14.090576171875, 14.755859375, 15.421142578125, 16.08642578125, 16.751708984375, 17.4169921875, 18.082275390625, 18.74755859375, 19.412841796875, 20.078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 3.0, 10.0, 13.0, 11.0, 14.0, 24.0, 42.0, 48.0, 62.0, 79.0, 82.0, 139.0, 115.0, 83.0, 62.0, 46.0, 46.0, 32.0, 16.0, 8.0, 10.0, 14.0, 5.0, 4.0, 3.0, 2.0, 1.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001529693603515625, -0.0014866441488265991, -0.0014435946941375732, -0.0014005452394485474, -0.0013574957847595215, -0.0013144463300704956, -0.0012713968753814697, -0.0012283474206924438, -0.001185297966003418, -0.001142248511314392, -0.0010991990566253662, -0.0010561496019363403, -0.0010131001472473145, -0.0009700506925582886, -0.0009270012378692627, -0.0008839517831802368, -0.0008409023284912109, -0.0007978528738021851, -0.0007548034191131592, -0.0007117539644241333, -0.0006687045097351074, -0.0006256550550460815, -0.0005826056003570557, -0.0005395561456680298, -0.0004965066909790039, -0.00045345723628997803, -0.00041040778160095215, -0.00036735832691192627, -0.0003243088722229004, -0.0002812594175338745, -0.00023820996284484863, -0.00019516050815582275, -0.00015211105346679688, -0.000109061598777771, -6.601214408874512e-05, -2.2962689399719238e-05, 2.008676528930664e-05, 6.313621997833252e-05, 0.0001061856746673584, 0.00014923512935638428, 0.00019228458404541016, 0.00023533403873443604, 0.0002783834934234619, 0.0003214329481124878, 0.00036448240280151367, 0.00040753185749053955, 0.00045058131217956543, 0.0004936307668685913, 0.0005366802215576172, 0.0005797296762466431, 0.0006227791309356689, 0.0006658285856246948, 0.0007088780403137207, 0.0007519274950027466, 0.0007949769496917725, 0.0008380264043807983, 0.0008810758590698242, 0.0009241253137588501, 0.000967174768447876, 0.0010102242231369019, 0.0010532736778259277, 0.0010963231325149536, 0.0011393725872039795, 0.0011824220418930054, 0.0012254714965820312]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 11.0, 3.0, 10.0, 10.0, 10.0, 13.0, 21.0, 34.0, 48.0, 79.0, 126.0, 214.0, 417.0, 943.0, 2889.0, 12798.0, 127806.0, 809348.0, 79756.0, 9776.0, 2478.0, 831.0, 363.0, 201.0, 119.0, 66.0, 40.0, 36.0, 23.0, 21.0, 8.0, 11.0, 11.0, 9.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.859375, -23.984619140625, -23.10986328125, -22.235107421875, -21.3603515625, -20.485595703125, -19.61083984375, -18.736083984375, -17.861328125, -16.986572265625, -16.11181640625, -15.237060546875, -14.3623046875, -13.487548828125, -12.61279296875, -11.738037109375, -10.86328125, -9.988525390625, -9.11376953125, -8.239013671875, -7.3642578125, -6.489501953125, -5.61474609375, -4.739990234375, -3.865234375, -2.990478515625, -2.11572265625, -1.240966796875, -0.3662109375, 0.508544921875, 1.38330078125, 2.258056640625, 3.1328125, 4.007568359375, 4.88232421875, 5.757080078125, 6.6318359375, 7.506591796875, 8.38134765625, 9.256103515625, 10.130859375, 11.005615234375, 11.88037109375, 12.755126953125, 13.6298828125, 14.504638671875, 15.37939453125, 16.254150390625, 17.12890625, 18.003662109375, 18.87841796875, 19.753173828125, 20.6279296875, 21.502685546875, 22.37744140625, 23.252197265625, 24.126953125, 25.001708984375, 25.87646484375, 26.751220703125, 27.6259765625, 28.500732421875, 29.37548828125, 30.250244140625, 31.125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 6.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 7.0, 10.0, 15.0, 7.0, 25.0, 17.0, 30.0, 34.0, 35.0, 52.0, 80.0, 73.0, 72.0, 93.0, 75.0, 63.0, 71.0, 44.0, 34.0, 36.0, 25.0, 13.0, 12.0, 16.0, 11.0, 10.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.0703125, -8.7457275390625, -8.421142578125, -8.0965576171875, -7.77197265625, -7.4473876953125, -7.122802734375, -6.7982177734375, -6.4736328125, -6.1490478515625, -5.824462890625, -5.4998779296875, -5.17529296875, -4.8507080078125, -4.526123046875, -4.2015380859375, -3.876953125, -3.5523681640625, -3.227783203125, -2.9031982421875, -2.57861328125, -2.2540283203125, -1.929443359375, -1.6048583984375, -1.2802734375, -0.9556884765625, -0.631103515625, -0.3065185546875, 0.01806640625, 0.3426513671875, 0.667236328125, 0.9918212890625, 1.31640625, 1.6409912109375, 1.965576171875, 2.2901611328125, 2.61474609375, 2.9393310546875, 3.263916015625, 3.5885009765625, 3.9130859375, 4.2376708984375, 4.562255859375, 4.8868408203125, 5.21142578125, 5.5360107421875, 5.860595703125, 6.1851806640625, 6.509765625, 6.8343505859375, 7.158935546875, 7.4835205078125, 7.80810546875, 8.1326904296875, 8.457275390625, 8.7818603515625, 9.1064453125, 9.4310302734375, 9.755615234375, 10.0802001953125, 10.40478515625, 10.7293701171875, 11.053955078125, 11.3785400390625, 11.703125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 15.0, 27.0, 44.0, 103.0, 228.0, 234.0, 169.0, 76.0, 38.0, 24.0, 12.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-277.29296875, -270.2442321777344, -263.19549560546875, -256.146728515625, -249.09799194335938, -242.04925537109375, -235.00050354003906, -227.95176696777344, -220.90301513671875, -213.85427856445312, -206.80552673339844, -199.7567901611328, -192.70803833007812, -185.6593017578125, -178.6105499267578, -171.5618133544922, -164.5130615234375, -157.46432495117188, -150.4155731201172, -143.36683654785156, -136.31808471679688, -129.26934814453125, -122.22059631347656, -115.17185974121094, -108.12312316894531, -101.07437896728516, -94.025634765625, -86.97689056396484, -79.92814636230469, -72.87940979003906, -65.83065795898438, -58.781917572021484, -51.73316955566406, -44.684425354003906, -37.63568115234375, -30.586938858032227, -23.53819465637207, -16.489452362060547, -9.44070816040039, -2.3919639587402344, 4.656780242919922, 11.705524444580078, 18.754268646240234, 25.803010940551758, 32.85175323486328, 39.90049743652344, 46.949241638183594, 53.99798583984375, 61.046730041503906, 68.09547424316406, 75.14421844482422, 82.19296264648438, 89.24170684814453, 96.29045104980469, 103.33918762207031, 110.387939453125, 117.43667602539062, 124.48542022705078, 131.53416442871094, 138.58290100097656, 145.63165283203125, 152.68038940429688, 159.72914123535156, 166.7778778076172, 173.82662963867188]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 12.0, 20.0, 15.0, 10.0, 29.0, 26.0, 31.0, 26.0, 55.0, 30.0, 48.0, 56.0, 46.0, 47.0, 53.0, 55.0, 42.0, 42.0, 68.0, 41.0, 38.0, 41.0, 30.0, 19.0, 27.0, 13.0, 20.0, 13.0, 11.0, 6.0, 8.0, 8.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.71200561523438, -111.81444549560547, -107.91688537597656, -104.01932525634766, -100.12176513671875, -96.22421264648438, -92.32665252685547, -88.42909240722656, -84.53153228759766, -80.63397216796875, -76.73641204833984, -72.83885192871094, -68.94129943847656, -65.04373168945312, -61.14617919921875, -57.248619079589844, -53.35105895996094, -49.45349884033203, -45.555938720703125, -41.658382415771484, -37.76082229614258, -33.86326217651367, -29.9657039642334, -26.068145751953125, -22.17058563232422, -18.273025512695312, -14.375467300415039, -10.47790813446045, -6.580348968505859, -2.682788848876953, 1.2147693634033203, 5.112327575683594, 9.0098876953125, 12.90744686126709, 16.80500602722168, 20.702564239501953, 24.60012435913086, 28.497684478759766, 32.395240783691406, 36.29280090332031, 40.19036102294922, 44.087921142578125, 47.98548126220703, 51.88303756713867, 55.78059768676758, 59.678157806396484, 63.575714111328125, 67.47327423095703, 71.37083435058594, 75.26839447021484, 79.16595458984375, 83.06351470947266, 86.96107482910156, 90.85862731933594, 94.75618743896484, 98.65374755859375, 102.55130767822266, 106.44886779785156, 110.34642791748047, 114.24398803710938, 118.14154052734375, 122.03910827636719, 125.93666076660156, 129.834228515625, 133.73178100585938]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 5.0, 10.0, 10.0, 18.0, 26.0, 52.0, 62.0, 120.0, 229.0, 782.0, 5573.0, 160520.0, 4006259.0, 17639.0, 1960.0, 490.0, 210.0, 101.0, 74.0, 51.0, 29.0, 25.0, 12.0, 11.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.5625, -35.6083984375, -33.654296875, -31.7001953125, -29.74609375, -27.7919921875, -25.837890625, -23.8837890625, -21.9296875, -19.9755859375, -18.021484375, -16.0673828125, -14.11328125, -12.1591796875, -10.205078125, -8.2509765625, -6.296875, -4.3427734375, -2.388671875, -0.4345703125, 1.51953125, 3.4736328125, 5.427734375, 7.3818359375, 9.3359375, 11.2900390625, 13.244140625, 15.1982421875, 17.15234375, 19.1064453125, 21.060546875, 23.0146484375, 24.96875, 26.9228515625, 28.876953125, 30.8310546875, 32.78515625, 34.7392578125, 36.693359375, 38.6474609375, 40.6015625, 42.5556640625, 44.509765625, 46.4638671875, 48.41796875, 50.3720703125, 52.326171875, 54.2802734375, 56.234375, 58.1884765625, 60.142578125, 62.0966796875, 64.05078125, 66.0048828125, 67.958984375, 69.9130859375, 71.8671875, 73.8212890625, 75.775390625, 77.7294921875, 79.68359375, 81.6376953125, 83.591796875, 85.5458984375, 87.5]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 10.0, 25.0, 28.0, 36.0, 42.0, 65.0, 88.0, 94.0, 118.0, 113.0, 106.0, 66.0, 56.0, 57.0, 37.0, 23.0, 10.0, 7.0, 6.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1015625, -5.88287353515625, -5.6641845703125, -5.44549560546875, -5.226806640625, -5.00811767578125, -4.7894287109375, -4.57073974609375, -4.35205078125, -4.13336181640625, -3.9146728515625, -3.69598388671875, -3.477294921875, -3.25860595703125, -3.0399169921875, -2.82122802734375, -2.6025390625, -2.38385009765625, -2.1651611328125, -1.94647216796875, -1.727783203125, -1.50909423828125, -1.2904052734375, -1.07171630859375, -0.85302734375, -0.63433837890625, -0.4156494140625, -0.19696044921875, 0.021728515625, 0.24041748046875, 0.4591064453125, 0.67779541015625, 0.896484375, 1.11517333984375, 1.3338623046875, 1.55255126953125, 1.771240234375, 1.98992919921875, 2.2086181640625, 2.42730712890625, 2.64599609375, 2.86468505859375, 3.0833740234375, 3.30206298828125, 3.520751953125, 3.73944091796875, 3.9581298828125, 4.17681884765625, 4.3955078125, 4.61419677734375, 4.8328857421875, 5.05157470703125, 5.270263671875, 5.48895263671875, 5.7076416015625, 5.92633056640625, 6.14501953125, 6.36370849609375, 6.5823974609375, 6.80108642578125, 7.019775390625, 7.23846435546875, 7.4571533203125, 7.67584228515625, 7.89453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 4.0, 7.0, 7.0, 19.0, 14.0, 21.0, 31.0, 54.0, 79.0, 106.0, 172.0, 255.0, 424.0, 725.0, 1303.0, 2668.0, 6337.0, 17518.0, 63931.0, 465822.0, 3379299.0, 195296.0, 39080.0, 11906.0, 4528.0, 2005.0, 1080.0, 595.0, 338.0, 182.0, 149.0, 96.0, 68.0, 50.0, 33.0, 32.0, 10.0, 12.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-20.484375, -19.887451171875, -19.29052734375, -18.693603515625, -18.0966796875, -17.499755859375, -16.90283203125, -16.305908203125, -15.708984375, -15.112060546875, -14.51513671875, -13.918212890625, -13.3212890625, -12.724365234375, -12.12744140625, -11.530517578125, -10.93359375, -10.336669921875, -9.73974609375, -9.142822265625, -8.5458984375, -7.948974609375, -7.35205078125, -6.755126953125, -6.158203125, -5.561279296875, -4.96435546875, -4.367431640625, -3.7705078125, -3.173583984375, -2.57666015625, -1.979736328125, -1.3828125, -0.785888671875, -0.18896484375, 0.407958984375, 1.0048828125, 1.601806640625, 2.19873046875, 2.795654296875, 3.392578125, 3.989501953125, 4.58642578125, 5.183349609375, 5.7802734375, 6.377197265625, 6.97412109375, 7.571044921875, 8.16796875, 8.764892578125, 9.36181640625, 9.958740234375, 10.5556640625, 11.152587890625, 11.74951171875, 12.346435546875, 12.943359375, 13.540283203125, 14.13720703125, 14.734130859375, 15.3310546875, 15.927978515625, 16.52490234375, 17.121826171875, 17.71875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 9.0, 9.0, 12.0, 21.0, 22.0, 36.0, 77.0, 116.0, 214.0, 729.0, 1956.0, 404.0, 165.0, 107.0, 66.0, 34.0, 31.0, 18.0, 11.0, 8.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3046875, -7.07867431640625, -6.8526611328125, -6.62664794921875, -6.400634765625, -6.17462158203125, -5.9486083984375, -5.72259521484375, -5.49658203125, -5.27056884765625, -5.0445556640625, -4.81854248046875, -4.592529296875, -4.36651611328125, -4.1405029296875, -3.91448974609375, -3.6884765625, -3.46246337890625, -3.2364501953125, -3.01043701171875, -2.784423828125, -2.55841064453125, -2.3323974609375, -2.10638427734375, -1.88037109375, -1.65435791015625, -1.4283447265625, -1.20233154296875, -0.976318359375, -0.75030517578125, -0.5242919921875, -0.29827880859375, -0.072265625, 0.15374755859375, 0.3797607421875, 0.60577392578125, 0.831787109375, 1.05780029296875, 1.2838134765625, 1.50982666015625, 1.73583984375, 1.96185302734375, 2.1878662109375, 2.41387939453125, 2.639892578125, 2.86590576171875, 3.0919189453125, 3.31793212890625, 3.5439453125, 3.76995849609375, 3.9959716796875, 4.22198486328125, 4.447998046875, 4.67401123046875, 4.9000244140625, 5.12603759765625, 5.35205078125, 5.57806396484375, 5.8040771484375, 6.03009033203125, 6.256103515625, 6.48211669921875, 6.7081298828125, 6.93414306640625, 7.16015625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 11.0, 16.0, 20.0, 43.0, 63.0, 118.0, 156.0, 164.0, 143.0, 106.0, 69.0, 31.0, 34.0, 6.0, 7.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.224361419677734, -27.91451644897461, -26.60466957092285, -25.294824600219727, -23.98497772216797, -22.675132751464844, -21.36528778076172, -20.05544090270996, -18.745594024658203, -17.435749053955078, -16.12590217590332, -14.816057205200195, -13.506210327148438, -12.196365356445312, -10.886519432067871, -9.57667350769043, -8.266828536987305, -6.956982612609863, -5.647136688232422, -4.337291240692139, -3.0274453163146973, -1.7175993919372559, -0.40775394439697266, 0.9020919799804688, 2.21193790435791, 3.5217838287353516, 4.831629753112793, 6.141475200653076, 7.451321125030518, 8.761167526245117, 10.071012496948242, 11.380858421325684, 12.690704345703125, 14.000550270080566, 15.310396194458008, 16.620241165161133, 17.93008804321289, 19.239933013916016, 20.54977798461914, 21.8596248626709, 23.169471740722656, 24.47931671142578, 25.78916358947754, 27.099008560180664, 28.408855438232422, 29.718700408935547, 31.028545379638672, 32.33839416503906, 33.64823913574219, 34.95808410644531, 36.26792907714844, 37.57777786254883, 38.88762283325195, 40.19746780395508, 41.5073127746582, 42.817161560058594, 44.12700271606445, 45.43684768676758, 46.7466926574707, 48.056541442871094, 49.36638641357422, 50.676231384277344, 51.98607635498047, 53.295921325683594, 54.605770111083984]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 8.0, 6.0, 6.0, 15.0, 15.0, 18.0, 35.0, 48.0, 55.0, 61.0, 60.0, 66.0, 68.0, 70.0, 81.0, 59.0, 54.0, 60.0, 51.0, 36.0, 28.0, 32.0, 20.0, 16.0, 15.0, 7.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.04438781738281, -33.10906982421875, -32.17375183105469, -31.238433837890625, -30.303115844726562, -29.3677978515625, -28.432479858398438, -27.497161865234375, -26.561843872070312, -25.62652587890625, -24.691207885742188, -23.755889892578125, -22.820571899414062, -21.88525390625, -20.949935913085938, -20.014617919921875, -19.07929801940918, -18.143980026245117, -17.208662033081055, -16.273344039916992, -15.33802604675293, -14.402708053588867, -13.467389106750488, -12.532071113586426, -11.596753120422363, -10.6614351272583, -9.726117134094238, -8.79079818725586, -7.855480670928955, -6.920162677764893, -5.984844207763672, -5.049526214599609, -4.114208221435547, -3.1788902282714844, -2.2435719966888428, -1.3082537651062012, -0.37293577194213867, 0.5623822212219238, 1.4977006912231445, 2.433018684387207, 3.3683366775512695, 4.303654670715332, 5.2389726638793945, 6.174291133880615, 7.109609127044678, 8.044927597045898, 8.980245590209961, 9.915563583374023, 10.850881576538086, 11.786199569702148, 12.721517562866211, 13.656835556030273, 14.592153549194336, 15.527471542358398, 16.462791442871094, 17.398109436035156, 18.33342742919922, 19.26874542236328, 20.204063415527344, 21.139381408691406, 22.07469940185547, 23.01001739501953, 23.945335388183594, 24.880653381347656, 25.81597137451172]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 10.0, 14.0, 23.0, 45.0, 52.0, 103.0, 128.0, 237.0, 462.0, 991.0, 2671.0, 8942.0, 41487.0, 283203.0, 575759.0, 107698.0, 18858.0, 4796.0, 1553.0, 647.0, 336.0, 203.0, 116.0, 77.0, 45.0, 28.0, 24.0, 5.0, 11.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.4375, -32.46142578125, -31.4853515625, -30.50927734375, -29.533203125, -28.55712890625, -27.5810546875, -26.60498046875, -25.62890625, -24.65283203125, -23.6767578125, -22.70068359375, -21.724609375, -20.74853515625, -19.7724609375, -18.79638671875, -17.8203125, -16.84423828125, -15.8681640625, -14.89208984375, -13.916015625, -12.93994140625, -11.9638671875, -10.98779296875, -10.01171875, -9.03564453125, -8.0595703125, -7.08349609375, -6.107421875, -5.13134765625, -4.1552734375, -3.17919921875, -2.203125, -1.22705078125, -0.2509765625, 0.72509765625, 1.701171875, 2.67724609375, 3.6533203125, 4.62939453125, 5.60546875, 6.58154296875, 7.5576171875, 8.53369140625, 9.509765625, 10.48583984375, 11.4619140625, 12.43798828125, 13.4140625, 14.39013671875, 15.3662109375, 16.34228515625, 17.318359375, 18.29443359375, 19.2705078125, 20.24658203125, 21.22265625, 22.19873046875, 23.1748046875, 24.15087890625, 25.126953125, 26.10302734375, 27.0791015625, 28.05517578125, 29.03125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 11.0, 18.0, 27.0, 45.0, 52.0, 64.0, 68.0, 113.0, 117.0, 102.0, 88.0, 87.0, 61.0, 46.0, 39.0, 27.0, 12.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.18359375, -5.96209716796875, -5.7406005859375, -5.51910400390625, -5.297607421875, -5.07611083984375, -4.8546142578125, -4.63311767578125, -4.41162109375, -4.19012451171875, -3.9686279296875, -3.74713134765625, -3.525634765625, -3.30413818359375, -3.0826416015625, -2.86114501953125, -2.6396484375, -2.41815185546875, -2.1966552734375, -1.97515869140625, -1.753662109375, -1.53216552734375, -1.3106689453125, -1.08917236328125, -0.86767578125, -0.64617919921875, -0.4246826171875, -0.20318603515625, 0.018310546875, 0.23980712890625, 0.4613037109375, 0.68280029296875, 0.904296875, 1.12579345703125, 1.3472900390625, 1.56878662109375, 1.790283203125, 2.01177978515625, 2.2332763671875, 2.45477294921875, 2.67626953125, 2.89776611328125, 3.1192626953125, 3.34075927734375, 3.562255859375, 3.78375244140625, 4.0052490234375, 4.22674560546875, 4.4482421875, 4.66973876953125, 4.8912353515625, 5.11273193359375, 5.334228515625, 5.55572509765625, 5.7772216796875, 5.99871826171875, 6.22021484375, 6.44171142578125, 6.6632080078125, 6.88470458984375, 7.106201171875, 7.32769775390625, 7.5491943359375, 7.77069091796875, 7.9921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 8.0, 5.0, 7.0, 13.0, 21.0, 25.0, 40.0, 34.0, 45.0, 78.0, 134.0, 189.0, 308.0, 497.0, 998.0, 2128.0, 5816.0, 23468.0, 168368.0, 680734.0, 135720.0, 20195.0, 5418.0, 2047.0, 866.0, 476.0, 301.0, 169.0, 116.0, 92.0, 57.0, 39.0, 38.0, 23.0, 22.0, 17.0, 7.0, 13.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.1875, -29.087890625, -27.98828125, -26.888671875, -25.7890625, -24.689453125, -23.58984375, -22.490234375, -21.390625, -20.291015625, -19.19140625, -18.091796875, -16.9921875, -15.892578125, -14.79296875, -13.693359375, -12.59375, -11.494140625, -10.39453125, -9.294921875, -8.1953125, -7.095703125, -5.99609375, -4.896484375, -3.796875, -2.697265625, -1.59765625, -0.498046875, 0.6015625, 1.701171875, 2.80078125, 3.900390625, 5.0, 6.099609375, 7.19921875, 8.298828125, 9.3984375, 10.498046875, 11.59765625, 12.697265625, 13.796875, 14.896484375, 15.99609375, 17.095703125, 18.1953125, 19.294921875, 20.39453125, 21.494140625, 22.59375, 23.693359375, 24.79296875, 25.892578125, 26.9921875, 28.091796875, 29.19140625, 30.291015625, 31.390625, 32.490234375, 33.58984375, 34.689453125, 35.7890625, 36.888671875, 37.98828125, 39.087890625, 40.1875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 13.0, 13.0, 13.0, 13.0, 15.0, 20.0, 29.0, 31.0, 39.0, 60.0, 53.0, 65.0, 83.0, 65.0, 62.0, 58.0, 59.0, 42.0, 49.0, 40.0, 39.0, 30.0, 24.0, 18.0, 15.0, 7.0, 4.0, 3.0, 6.0, 3.0, 4.0, 1.0, 4.0, 2.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.796875, -21.96533203125, -21.1337890625, -20.30224609375, -19.470703125, -18.63916015625, -17.8076171875, -16.97607421875, -16.14453125, -15.31298828125, -14.4814453125, -13.64990234375, -12.818359375, -11.98681640625, -11.1552734375, -10.32373046875, -9.4921875, -8.66064453125, -7.8291015625, -6.99755859375, -6.166015625, -5.33447265625, -4.5029296875, -3.67138671875, -2.83984375, -2.00830078125, -1.1767578125, -0.34521484375, 0.486328125, 1.31787109375, 2.1494140625, 2.98095703125, 3.8125, 4.64404296875, 5.4755859375, 6.30712890625, 7.138671875, 7.97021484375, 8.8017578125, 9.63330078125, 10.46484375, 11.29638671875, 12.1279296875, 12.95947265625, 13.791015625, 14.62255859375, 15.4541015625, 16.28564453125, 17.1171875, 17.94873046875, 18.7802734375, 19.61181640625, 20.443359375, 21.27490234375, 22.1064453125, 22.93798828125, 23.76953125, 24.60107421875, 25.4326171875, 26.26416015625, 27.095703125, 27.92724609375, 28.7587890625, 29.59033203125, 30.421875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 17.0, 9.0, 21.0, 25.0, 42.0, 64.0, 97.0, 166.0, 315.0, 812.0, 2278.0, 9726.0, 126767.0, 878165.0, 23392.0, 4309.0, 1226.0, 552.0, 237.0, 118.0, 61.0, 48.0, 22.0, 23.0, 19.0, 15.0, 7.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.78125, -37.49853515625, -36.2158203125, -34.93310546875, -33.650390625, -32.36767578125, -31.0849609375, -29.80224609375, -28.51953125, -27.23681640625, -25.9541015625, -24.67138671875, -23.388671875, -22.10595703125, -20.8232421875, -19.54052734375, -18.2578125, -16.97509765625, -15.6923828125, -14.40966796875, -13.126953125, -11.84423828125, -10.5615234375, -9.27880859375, -7.99609375, -6.71337890625, -5.4306640625, -4.14794921875, -2.865234375, -1.58251953125, -0.2998046875, 0.98291015625, 2.265625, 3.54833984375, 4.8310546875, 6.11376953125, 7.396484375, 8.67919921875, 9.9619140625, 11.24462890625, 12.52734375, 13.81005859375, 15.0927734375, 16.37548828125, 17.658203125, 18.94091796875, 20.2236328125, 21.50634765625, 22.7890625, 24.07177734375, 25.3544921875, 26.63720703125, 27.919921875, 29.20263671875, 30.4853515625, 31.76806640625, 33.05078125, 34.33349609375, 35.6162109375, 36.89892578125, 38.181640625, 39.46435546875, 40.7470703125, 42.02978515625, 43.3125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 8.0, 12.0, 18.0, 24.0, 53.0, 109.0, 195.0, 245.0, 161.0, 67.0, 32.0, 27.0, 19.0, 12.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00312042236328125, -0.0030317306518554688, -0.0029430389404296875, -0.0028543472290039062, -0.002765655517578125, -0.0026769638061523438, -0.0025882720947265625, -0.0024995803833007812, -0.002410888671875, -0.0023221969604492188, -0.0022335052490234375, -0.0021448135375976562, -0.002056121826171875, -0.0019674301147460938, -0.0018787384033203125, -0.0017900466918945312, -0.00170135498046875, -0.0016126632690429688, -0.0015239715576171875, -0.0014352798461914062, -0.001346588134765625, -0.0012578964233398438, -0.0011692047119140625, -0.0010805130004882812, -0.0009918212890625, -0.0009031295776367188, -0.0008144378662109375, -0.0007257461547851562, -0.000637054443359375, -0.0005483627319335938, -0.0004596710205078125, -0.00037097930908203125, -0.00028228759765625, -0.00019359588623046875, -0.0001049041748046875, -1.621246337890625e-05, 7.2479248046875e-05, 0.00016117095947265625, 0.0002498626708984375, 0.00033855438232421875, 0.00042724609375, 0.0005159378051757812, 0.0006046295166015625, 0.0006933212280273438, 0.000782012939453125, 0.0008707046508789062, 0.0009593963623046875, 0.0010480880737304688, 0.00113677978515625, 0.0012254714965820312, 0.0013141632080078125, 0.0014028549194335938, 0.001491546630859375, 0.0015802383422851562, 0.0016689300537109375, 0.0017576217651367188, 0.0018463134765625, 0.0019350051879882812, 0.0020236968994140625, 0.0021123886108398438, 0.002201080322265625, 0.0022897720336914062, 0.0023784637451171875, 0.0024671554565429688, 0.00255584716796875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 2.0, 3.0, 3.0, 10.0, 8.0, 14.0, 12.0, 14.0, 24.0, 40.0, 60.0, 99.0, 204.0, 514.0, 1778.0, 9148.0, 486397.0, 538022.0, 9298.0, 1864.0, 525.0, 208.0, 119.0, 63.0, 30.0, 27.0, 17.0, 8.0, 14.0, 7.0, 6.0, 3.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.4375, -53.4580078125, -51.478515625, -49.4990234375, -47.51953125, -45.5400390625, -43.560546875, -41.5810546875, -39.6015625, -37.6220703125, -35.642578125, -33.6630859375, -31.68359375, -29.7041015625, -27.724609375, -25.7451171875, -23.765625, -21.7861328125, -19.806640625, -17.8271484375, -15.84765625, -13.8681640625, -11.888671875, -9.9091796875, -7.9296875, -5.9501953125, -3.970703125, -1.9912109375, -0.01171875, 1.9677734375, 3.947265625, 5.9267578125, 7.90625, 9.8857421875, 11.865234375, 13.8447265625, 15.82421875, 17.8037109375, 19.783203125, 21.7626953125, 23.7421875, 25.7216796875, 27.701171875, 29.6806640625, 31.66015625, 33.6396484375, 35.619140625, 37.5986328125, 39.578125, 41.5576171875, 43.537109375, 45.5166015625, 47.49609375, 49.4755859375, 51.455078125, 53.4345703125, 55.4140625, 57.3935546875, 59.373046875, 61.3525390625, 63.33203125, 65.3115234375, 67.291015625, 69.2705078125, 71.25]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 6.0, 22.0, 21.0, 54.0, 164.0, 327.0, 219.0, 54.0, 20.0, 23.0, 12.0, 13.0, 10.0, 6.0, 6.0, 5.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.28125, -34.317138671875, -33.35302734375, -32.388916015625, -31.4248046875, -30.460693359375, -29.49658203125, -28.532470703125, -27.568359375, -26.604248046875, -25.64013671875, -24.676025390625, -23.7119140625, -22.747802734375, -21.78369140625, -20.819580078125, -19.85546875, -18.891357421875, -17.92724609375, -16.963134765625, -15.9990234375, -15.034912109375, -14.07080078125, -13.106689453125, -12.142578125, -11.178466796875, -10.21435546875, -9.250244140625, -8.2861328125, -7.322021484375, -6.35791015625, -5.393798828125, -4.4296875, -3.465576171875, -2.50146484375, -1.537353515625, -0.5732421875, 0.390869140625, 1.35498046875, 2.319091796875, 3.283203125, 4.247314453125, 5.21142578125, 6.175537109375, 7.1396484375, 8.103759765625, 9.06787109375, 10.031982421875, 10.99609375, 11.960205078125, 12.92431640625, 13.888427734375, 14.8525390625, 15.816650390625, 16.78076171875, 17.744873046875, 18.708984375, 19.673095703125, 20.63720703125, 21.601318359375, 22.5654296875, 23.529541015625, 24.49365234375, 25.457763671875, 26.421875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 17.0, 60.0, 156.0, 301.0, 273.0, 107.0, 38.0, 20.0, 13.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-460.02301025390625, -448.4735107421875, -436.92401123046875, -425.37451171875, -413.82501220703125, -402.2755126953125, -390.72601318359375, -379.176513671875, -367.62701416015625, -356.0775146484375, -344.52801513671875, -332.978515625, -321.42901611328125, -309.8795166015625, -298.33001708984375, -286.780517578125, -275.23101806640625, -263.6815185546875, -252.13201904296875, -240.58251953125, -229.03302001953125, -217.4835205078125, -205.93402099609375, -194.384521484375, -182.83502197265625, -171.2855224609375, -159.73602294921875, -148.1865234375, -136.63702392578125, -125.0875244140625, -113.53802490234375, -101.988525390625, -90.43902587890625, -78.8895263671875, -67.34002685546875, -55.79052734375, -44.24102783203125, -32.6915283203125, -21.14202880859375, -9.592529296875, 1.95697021484375, 13.5064697265625, 25.05596923828125, 36.60546875, 48.15496826171875, 59.7044677734375, 71.25396728515625, 82.803466796875, 94.35296630859375, 105.9024658203125, 117.45196533203125, 129.00146484375, 140.55096435546875, 152.1004638671875, 163.64996337890625, 175.199462890625, 186.74896240234375, 198.2984619140625, 209.84796142578125, 221.3974609375, 232.94696044921875, 244.4964599609375, 256.04595947265625, 267.595458984375, 279.14495849609375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 4.0, 6.0, 8.0, 11.0, 11.0, 19.0, 26.0, 22.0, 29.0, 32.0, 30.0, 39.0, 43.0, 43.0, 39.0, 45.0, 49.0, 58.0, 49.0, 45.0, 44.0, 34.0, 63.0, 35.0, 31.0, 22.0, 32.0, 19.0, 22.0, 16.0, 14.0, 8.0, 3.0, 7.0, 10.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-150.17935180664062, -145.4374237060547, -140.69549560546875, -135.9535675048828, -131.21163940429688, -126.46971130371094, -121.727783203125, -116.98585510253906, -112.24392700195312, -107.50199890136719, -102.76007080078125, -98.01814270019531, -93.27621459960938, -88.53428649902344, -83.7923583984375, -79.05043029785156, -74.30850219726562, -69.56657409667969, -64.82464599609375, -60.08271789550781, -55.340789794921875, -50.59886169433594, -45.85693359375, -41.11500549316406, -36.373077392578125, -31.631149291992188, -26.88922119140625, -22.147293090820312, -17.405364990234375, -12.663436889648438, -7.9215087890625, -3.1795806884765625, 1.562347412109375, 6.3042755126953125, 11.04620361328125, 15.788131713867188, 20.530059814453125, 25.271987915039062, 30.013916015625, 34.75584411621094, 39.497772216796875, 44.23970031738281, 48.98162841796875, 53.72355651855469, 58.465484619140625, 63.20741271972656, 67.9493408203125, 72.69126892089844, 77.43319702148438, 82.17512512207031, 86.91705322265625, 91.65898132324219, 96.40090942382812, 101.14283752441406, 105.884765625, 110.62669372558594, 115.36862182617188, 120.11054992675781, 124.85247802734375, 129.5944061279297, 134.33633422851562, 139.07826232910156, 143.8201904296875, 148.56211853027344, 153.30404663085938]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 8.0, 4.0, 6.0, 5.0, 28.0, 35.0, 46.0, 112.0, 175.0, 336.0, 776.0, 1989.0, 6340.0, 37522.0, 3137232.0, 970703.0, 29636.0, 5724.0, 1881.0, 759.0, 404.0, 233.0, 122.0, 61.0, 43.0, 16.0, 24.0, 18.0, 7.0, 14.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.46875, -35.16357421875, -33.8583984375, -32.55322265625, -31.248046875, -29.94287109375, -28.6376953125, -27.33251953125, -26.02734375, -24.72216796875, -23.4169921875, -22.11181640625, -20.806640625, -19.50146484375, -18.1962890625, -16.89111328125, -15.5859375, -14.28076171875, -12.9755859375, -11.67041015625, -10.365234375, -9.06005859375, -7.7548828125, -6.44970703125, -5.14453125, -3.83935546875, -2.5341796875, -1.22900390625, 0.076171875, 1.38134765625, 2.6865234375, 3.99169921875, 5.296875, 6.60205078125, 7.9072265625, 9.21240234375, 10.517578125, 11.82275390625, 13.1279296875, 14.43310546875, 15.73828125, 17.04345703125, 18.3486328125, 19.65380859375, 20.958984375, 22.26416015625, 23.5693359375, 24.87451171875, 26.1796875, 27.48486328125, 28.7900390625, 30.09521484375, 31.400390625, 32.70556640625, 34.0107421875, 35.31591796875, 36.62109375, 37.92626953125, 39.2314453125, 40.53662109375, 41.841796875, 43.14697265625, 44.4521484375, 45.75732421875, 47.0625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 20.0, 29.0, 48.0, 56.0, 73.0, 96.0, 104.0, 100.0, 104.0, 110.0, 76.0, 53.0, 33.0, 31.0, 16.0, 11.0, 15.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.795166015625, -7.51220703125, -7.229248046875, -6.9462890625, -6.663330078125, -6.38037109375, -6.097412109375, -5.814453125, -5.531494140625, -5.24853515625, -4.965576171875, -4.6826171875, -4.399658203125, -4.11669921875, -3.833740234375, -3.55078125, -3.267822265625, -2.98486328125, -2.701904296875, -2.4189453125, -2.135986328125, -1.85302734375, -1.570068359375, -1.287109375, -1.004150390625, -0.72119140625, -0.438232421875, -0.1552734375, 0.127685546875, 0.41064453125, 0.693603515625, 0.9765625, 1.259521484375, 1.54248046875, 1.825439453125, 2.1083984375, 2.391357421875, 2.67431640625, 2.957275390625, 3.240234375, 3.523193359375, 3.80615234375, 4.089111328125, 4.3720703125, 4.655029296875, 4.93798828125, 5.220947265625, 5.50390625, 5.786865234375, 6.06982421875, 6.352783203125, 6.6357421875, 6.918701171875, 7.20166015625, 7.484619140625, 7.767578125, 8.050537109375, 8.33349609375, 8.616455078125, 8.8994140625, 9.182373046875, 9.46533203125, 9.748291015625, 10.03125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 10.0, 13.0, 21.0, 23.0, 42.0, 65.0, 84.0, 118.0, 176.0, 285.0, 487.0, 824.0, 1504.0, 3056.0, 7385.0, 21967.0, 94584.0, 1193931.0, 2695823.0, 131302.0, 26412.0, 8535.0, 3485.0, 1703.0, 932.0, 500.0, 304.0, 194.0, 134.0, 102.0, 76.0, 42.0, 34.0, 34.0, 22.0, 20.0, 8.0, 10.0, 3.0, 11.0, 5.0, 9.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.765625, -18.12060546875, -17.4755859375, -16.83056640625, -16.185546875, -15.54052734375, -14.8955078125, -14.25048828125, -13.60546875, -12.96044921875, -12.3154296875, -11.67041015625, -11.025390625, -10.38037109375, -9.7353515625, -9.09033203125, -8.4453125, -7.80029296875, -7.1552734375, -6.51025390625, -5.865234375, -5.22021484375, -4.5751953125, -3.93017578125, -3.28515625, -2.64013671875, -1.9951171875, -1.35009765625, -0.705078125, -0.06005859375, 0.5849609375, 1.22998046875, 1.875, 2.52001953125, 3.1650390625, 3.81005859375, 4.455078125, 5.10009765625, 5.7451171875, 6.39013671875, 7.03515625, 7.68017578125, 8.3251953125, 8.97021484375, 9.615234375, 10.26025390625, 10.9052734375, 11.55029296875, 12.1953125, 12.84033203125, 13.4853515625, 14.13037109375, 14.775390625, 15.42041015625, 16.0654296875, 16.71044921875, 17.35546875, 18.00048828125, 18.6455078125, 19.29052734375, 19.935546875, 20.58056640625, 21.2255859375, 21.87060546875, 22.515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 13.0, 15.0, 11.0, 25.0, 47.0, 95.0, 152.0, 345.0, 1523.0, 1186.0, 369.0, 134.0, 50.0, 30.0, 21.0, 14.0, 19.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.265625, -9.81787109375, -9.3701171875, -8.92236328125, -8.474609375, -8.02685546875, -7.5791015625, -7.13134765625, -6.68359375, -6.23583984375, -5.7880859375, -5.34033203125, -4.892578125, -4.44482421875, -3.9970703125, -3.54931640625, -3.1015625, -2.65380859375, -2.2060546875, -1.75830078125, -1.310546875, -0.86279296875, -0.4150390625, 0.03271484375, 0.48046875, 0.92822265625, 1.3759765625, 1.82373046875, 2.271484375, 2.71923828125, 3.1669921875, 3.61474609375, 4.0625, 4.51025390625, 4.9580078125, 5.40576171875, 5.853515625, 6.30126953125, 6.7490234375, 7.19677734375, 7.64453125, 8.09228515625, 8.5400390625, 8.98779296875, 9.435546875, 9.88330078125, 10.3310546875, 10.77880859375, 11.2265625, 11.67431640625, 12.1220703125, 12.56982421875, 13.017578125, 13.46533203125, 13.9130859375, 14.36083984375, 14.80859375, 15.25634765625, 15.7041015625, 16.15185546875, 16.599609375, 17.04736328125, 17.4951171875, 17.94287109375, 18.390625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 9.0, 14.0, 24.0, 87.0, 129.0, 175.0, 177.0, 169.0, 112.0, 59.0, 26.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.53042602539062, -75.12693786621094, -72.72344970703125, -70.31996154785156, -67.91646575927734, -65.51297760009766, -63.10948944091797, -60.70600128173828, -58.302513122558594, -55.899024963378906, -53.49553298950195, -51.092044830322266, -48.68855667114258, -46.285064697265625, -43.88157653808594, -41.47808837890625, -39.0745964050293, -36.67110824584961, -34.267616271972656, -31.86412811279297, -29.46063995361328, -27.05714988708496, -24.65365982055664, -22.250171661376953, -19.846681594848633, -17.443191528320312, -15.039703369140625, -12.636213302612305, -10.2327241897583, -7.829235076904297, -5.425745010375977, -3.022256851196289, -0.6187667846679688, 1.7847225666046143, 4.188211917877197, 6.591701507568359, 8.995190620422363, 11.398679733276367, 13.802169799804688, 16.205657958984375, 18.609148025512695, 21.012638092041016, 23.416126251220703, 25.819616317749023, 28.223106384277344, 30.62659454345703, 33.03008270263672, 35.433570861816406, 37.83706283569336, 40.24055099487305, 42.64404296875, 45.04753112792969, 47.451019287109375, 49.85450744628906, 52.257999420166016, 54.6614875793457, 57.064979553222656, 59.468467712402344, 61.8719596862793, 64.27545166015625, 66.67893981933594, 69.08242797851562, 71.48591613769531, 73.889404296875, 76.29289245605469]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 9.0, 13.0, 29.0, 37.0, 45.0, 59.0, 74.0, 80.0, 91.0, 103.0, 94.0, 78.0, 77.0, 69.0, 43.0, 25.0, 29.0, 22.0, 11.0, 9.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.79353332519531, -72.56404876708984, -70.33456420898438, -68.1050796508789, -65.87559509277344, -63.64611053466797, -61.4166259765625, -59.18714141845703, -56.95765686035156, -54.728172302246094, -52.498687744140625, -50.269203186035156, -48.03971862792969, -45.81023406982422, -43.58074951171875, -41.35126495361328, -39.12178039550781, -36.892295837402344, -34.662811279296875, -32.433326721191406, -30.203842163085938, -27.97435760498047, -25.744873046875, -23.51538848876953, -21.285903930664062, -19.056419372558594, -16.826934814453125, -14.597450256347656, -12.367965698242188, -10.138481140136719, -7.90899658203125, -5.679512023925781, -3.4500274658203125, -1.2205429077148438, 1.008941650390625, 3.2384262084960938, 5.4679107666015625, 7.697395324707031, 9.9268798828125, 12.156364440917969, 14.385848999023438, 16.615333557128906, 18.844818115234375, 21.074302673339844, 23.303787231445312, 25.53327178955078, 27.76275634765625, 29.99224090576172, 32.22172546386719, 34.451210021972656, 36.680694580078125, 38.910179138183594, 41.13966369628906, 43.36914825439453, 45.5986328125, 47.82811737060547, 50.05760192871094, 52.287086486816406, 54.516571044921875, 56.746055603027344, 58.97554016113281, 61.20502471923828, 63.43450927734375, 65.66399383544922, 67.89347839355469]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 9.0, 7.0, 18.0, 9.0, 25.0, 39.0, 74.0, 94.0, 196.0, 425.0, 985.0, 2936.0, 11622.0, 74096.0, 600378.0, 311633.0, 35817.0, 6870.0, 1890.0, 679.0, 329.0, 170.0, 101.0, 56.0, 32.0, 26.0, 12.0, 15.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.78125, -49.47314453125, -48.1650390625, -46.85693359375, -45.548828125, -44.24072265625, -42.9326171875, -41.62451171875, -40.31640625, -39.00830078125, -37.7001953125, -36.39208984375, -35.083984375, -33.77587890625, -32.4677734375, -31.15966796875, -29.8515625, -28.54345703125, -27.2353515625, -25.92724609375, -24.619140625, -23.31103515625, -22.0029296875, -20.69482421875, -19.38671875, -18.07861328125, -16.7705078125, -15.46240234375, -14.154296875, -12.84619140625, -11.5380859375, -10.22998046875, -8.921875, -7.61376953125, -6.3056640625, -4.99755859375, -3.689453125, -2.38134765625, -1.0732421875, 0.23486328125, 1.54296875, 2.85107421875, 4.1591796875, 5.46728515625, 6.775390625, 8.08349609375, 9.3916015625, 10.69970703125, 12.0078125, 13.31591796875, 14.6240234375, 15.93212890625, 17.240234375, 18.54833984375, 19.8564453125, 21.16455078125, 22.47265625, 23.78076171875, 25.0888671875, 26.39697265625, 27.705078125, 29.01318359375, 30.3212890625, 31.62939453125, 32.9375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 11.0, 15.0, 36.0, 37.0, 56.0, 72.0, 88.0, 106.0, 102.0, 90.0, 91.0, 87.0, 66.0, 37.0, 22.0, 28.0, 15.0, 13.0, 5.0, 8.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7890625, -6.525634765625, -6.26220703125, -5.998779296875, -5.7353515625, -5.471923828125, -5.20849609375, -4.945068359375, -4.681640625, -4.418212890625, -4.15478515625, -3.891357421875, -3.6279296875, -3.364501953125, -3.10107421875, -2.837646484375, -2.57421875, -2.310791015625, -2.04736328125, -1.783935546875, -1.5205078125, -1.257080078125, -0.99365234375, -0.730224609375, -0.466796875, -0.203369140625, 0.06005859375, 0.323486328125, 0.5869140625, 0.850341796875, 1.11376953125, 1.377197265625, 1.640625, 1.904052734375, 2.16748046875, 2.430908203125, 2.6943359375, 2.957763671875, 3.22119140625, 3.484619140625, 3.748046875, 4.011474609375, 4.27490234375, 4.538330078125, 4.8017578125, 5.065185546875, 5.32861328125, 5.592041015625, 5.85546875, 6.118896484375, 6.38232421875, 6.645751953125, 6.9091796875, 7.172607421875, 7.43603515625, 7.699462890625, 7.962890625, 8.226318359375, 8.48974609375, 8.753173828125, 9.0166015625, 9.280029296875, 9.54345703125, 9.806884765625, 10.0703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 4.0, 4.0, 15.0, 14.0, 35.0, 39.0, 69.0, 146.0, 243.0, 658.0, 1662.0, 5292.0, 28839.0, 432855.0, 534760.0, 34626.0, 6155.0, 1783.0, 703.0, 277.0, 165.0, 75.0, 45.0, 29.0, 13.0, 10.0, 9.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.625, -46.138671875, -44.65234375, -43.166015625, -41.6796875, -40.193359375, -38.70703125, -37.220703125, -35.734375, -34.248046875, -32.76171875, -31.275390625, -29.7890625, -28.302734375, -26.81640625, -25.330078125, -23.84375, -22.357421875, -20.87109375, -19.384765625, -17.8984375, -16.412109375, -14.92578125, -13.439453125, -11.953125, -10.466796875, -8.98046875, -7.494140625, -6.0078125, -4.521484375, -3.03515625, -1.548828125, -0.0625, 1.423828125, 2.91015625, 4.396484375, 5.8828125, 7.369140625, 8.85546875, 10.341796875, 11.828125, 13.314453125, 14.80078125, 16.287109375, 17.7734375, 19.259765625, 20.74609375, 22.232421875, 23.71875, 25.205078125, 26.69140625, 28.177734375, 29.6640625, 31.150390625, 32.63671875, 34.123046875, 35.609375, 37.095703125, 38.58203125, 40.068359375, 41.5546875, 43.041015625, 44.52734375, 46.013671875, 47.5]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 5.0, 3.0, 8.0, 5.0, 7.0, 11.0, 17.0, 27.0, 22.0, 36.0, 53.0, 57.0, 82.0, 85.0, 101.0, 86.0, 67.0, 67.0, 63.0, 63.0, 29.0, 30.0, 19.0, 14.0, 13.0, 10.0, 4.0, 5.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.46875, -40.28125, -39.09375, -37.90625, -36.71875, -35.53125, -34.34375, -33.15625, -31.96875, -30.78125, -29.59375, -28.40625, -27.21875, -26.03125, -24.84375, -23.65625, -22.46875, -21.28125, -20.09375, -18.90625, -17.71875, -16.53125, -15.34375, -14.15625, -12.96875, -11.78125, -10.59375, -9.40625, -8.21875, -7.03125, -5.84375, -4.65625, -3.46875, -2.28125, -1.09375, 0.09375, 1.28125, 2.46875, 3.65625, 4.84375, 6.03125, 7.21875, 8.40625, 9.59375, 10.78125, 11.96875, 13.15625, 14.34375, 15.53125, 16.71875, 17.90625, 19.09375, 20.28125, 21.46875, 22.65625, 23.84375, 25.03125, 26.21875, 27.40625, 28.59375, 29.78125, 30.96875, 32.15625, 33.34375, 34.53125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 5.0, 9.0, 5.0, 12.0, 28.0, 26.0, 47.0, 74.0, 124.0, 268.0, 710.0, 2536.0, 16842.0, 979988.0, 42420.0, 3758.0, 936.0, 343.0, 162.0, 95.0, 60.0, 30.0, 15.0, 15.0, 12.0, 9.0, 4.0, 5.0, 7.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-88.0625, -85.72265625, -83.3828125, -81.04296875, -78.703125, -76.36328125, -74.0234375, -71.68359375, -69.34375, -67.00390625, -64.6640625, -62.32421875, -59.984375, -57.64453125, -55.3046875, -52.96484375, -50.625, -48.28515625, -45.9453125, -43.60546875, -41.265625, -38.92578125, -36.5859375, -34.24609375, -31.90625, -29.56640625, -27.2265625, -24.88671875, -22.546875, -20.20703125, -17.8671875, -15.52734375, -13.1875, -10.84765625, -8.5078125, -6.16796875, -3.828125, -1.48828125, 0.8515625, 3.19140625, 5.53125, 7.87109375, 10.2109375, 12.55078125, 14.890625, 17.23046875, 19.5703125, 21.91015625, 24.25, 26.58984375, 28.9296875, 31.26953125, 33.609375, 35.94921875, 38.2890625, 40.62890625, 42.96875, 45.30859375, 47.6484375, 49.98828125, 52.328125, 54.66796875, 57.0078125, 59.34765625, 61.6875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 9.0, 9.0, 10.0, 10.0, 24.0, 26.0, 42.0, 48.0, 105.0, 135.0, 170.0, 164.0, 62.0, 49.0, 43.0, 23.0, 19.0, 19.0, 10.0, 6.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0023288726806640625, -0.002271205186843872, -0.0022135376930236816, -0.002155870199203491, -0.0020982027053833008, -0.0020405352115631104, -0.00198286771774292, -0.0019252002239227295, -0.001867532730102539, -0.0018098652362823486, -0.0017521977424621582, -0.0016945302486419678, -0.0016368627548217773, -0.001579195261001587, -0.0015215277671813965, -0.001463860273361206, -0.0014061927795410156, -0.0013485252857208252, -0.0012908577919006348, -0.0012331902980804443, -0.001175522804260254, -0.0011178553104400635, -0.001060187816619873, -0.0010025203227996826, -0.0009448528289794922, -0.0008871853351593018, -0.0008295178413391113, -0.0007718503475189209, -0.0007141828536987305, -0.00065651535987854, -0.0005988478660583496, -0.0005411803722381592, -0.00048351287841796875, -0.0004258453845977783, -0.0003681778907775879, -0.00031051039695739746, -0.00025284290313720703, -0.0001951754093170166, -0.00013750791549682617, -7.984042167663574e-05, -2.2172927856445312e-05, 3.549456596374512e-05, 9.316205978393555e-05, 0.00015082955360412598, 0.0002084970474243164, 0.00026616454124450684, 0.00032383203506469727, 0.0003814995288848877, 0.0004391670227050781, 0.0004968345165252686, 0.000554502010345459, 0.0006121695041656494, 0.0006698369979858398, 0.0007275044918060303, 0.0007851719856262207, 0.0008428394794464111, 0.0009005069732666016, 0.000958174467086792, 0.0010158419609069824, 0.0010735094547271729, 0.0011311769485473633, 0.0011888444423675537, 0.0012465119361877441, 0.0013041794300079346, 0.001361846923828125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 7.0, 5.0, 7.0, 13.0, 12.0, 31.0, 41.0, 50.0, 119.0, 252.0, 584.0, 1446.0, 4082.0, 23184.0, 968432.0, 41932.0, 5189.0, 1716.0, 804.0, 270.0, 162.0, 64.0, 44.0, 25.0, 10.0, 12.0, 6.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-60.59375, -58.67578125, -56.7578125, -54.83984375, -52.921875, -51.00390625, -49.0859375, -47.16796875, -45.25, -43.33203125, -41.4140625, -39.49609375, -37.578125, -35.66015625, -33.7421875, -31.82421875, -29.90625, -27.98828125, -26.0703125, -24.15234375, -22.234375, -20.31640625, -18.3984375, -16.48046875, -14.5625, -12.64453125, -10.7265625, -8.80859375, -6.890625, -4.97265625, -3.0546875, -1.13671875, 0.78125, 2.69921875, 4.6171875, 6.53515625, 8.453125, 10.37109375, 12.2890625, 14.20703125, 16.125, 18.04296875, 19.9609375, 21.87890625, 23.796875, 25.71484375, 27.6328125, 29.55078125, 31.46875, 33.38671875, 35.3046875, 37.22265625, 39.140625, 41.05859375, 42.9765625, 44.89453125, 46.8125, 48.73046875, 50.6484375, 52.56640625, 54.484375, 56.40234375, 58.3203125, 60.23828125, 62.15625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 10.0, 20.0, 39.0, 158.0, 326.0, 289.0, 79.0, 31.0, 14.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.5625, -54.939453125, -53.31640625, -51.693359375, -50.0703125, -48.447265625, -46.82421875, -45.201171875, -43.578125, -41.955078125, -40.33203125, -38.708984375, -37.0859375, -35.462890625, -33.83984375, -32.216796875, -30.59375, -28.970703125, -27.34765625, -25.724609375, -24.1015625, -22.478515625, -20.85546875, -19.232421875, -17.609375, -15.986328125, -14.36328125, -12.740234375, -11.1171875, -9.494140625, -7.87109375, -6.248046875, -4.625, -3.001953125, -1.37890625, 0.244140625, 1.8671875, 3.490234375, 5.11328125, 6.736328125, 8.359375, 9.982421875, 11.60546875, 13.228515625, 14.8515625, 16.474609375, 18.09765625, 19.720703125, 21.34375, 22.966796875, 24.58984375, 26.212890625, 27.8359375, 29.458984375, 31.08203125, 32.705078125, 34.328125, 35.951171875, 37.57421875, 39.197265625, 40.8203125, 42.443359375, 44.06640625, 45.689453125, 47.3125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 13.0, 19.0, 36.0, 64.0, 191.0, 252.0, 203.0, 109.0, 56.0, 34.0, 12.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.50088500976562, -188.31272888183594, -178.12457275390625, -167.9364013671875, -157.7482452392578, -147.56008911132812, -137.37191772460938, -127.18376159667969, -116.99560546875, -106.80744934082031, -96.6192855834961, -86.43112182617188, -76.24296569824219, -66.0548095703125, -55.86664581298828, -45.67848205566406, -35.490325927734375, -25.302165985107422, -15.114006042480469, -4.925846099853516, 5.2623138427734375, 15.45047378540039, 25.638633728027344, 35.82679748535156, 46.01495361328125, 56.2031135559082, 66.39127349853516, 76.57943725585938, 86.76759338378906, 96.95574951171875, 107.14391326904297, 117.33207702636719, 127.52023315429688, 137.70838928222656, 147.89654541015625, 158.084716796875, 168.2728729248047, 178.46102905273438, 188.64920043945312, 198.8373565673828, 209.0255126953125, 219.2136688232422, 229.40182495117188, 239.58999633789062, 249.7781524658203, 259.96630859375, 270.15447998046875, 280.3426513671875, 290.5307922363281, 300.7189636230469, 310.9071044921875, 321.09527587890625, 331.283447265625, 341.4715881347656, 351.6597595214844, 361.847900390625, 372.03607177734375, 382.2242431640625, 392.4123840332031, 402.6005554199219, 412.7886962890625, 422.97686767578125, 433.1650390625, 443.35321044921875, 453.5413513183594]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 9.0, 21.0, 15.0, 27.0, 40.0, 36.0, 45.0, 50.0, 52.0, 63.0, 51.0, 63.0, 75.0, 59.0, 59.0, 52.0, 57.0, 41.0, 46.0, 27.0, 26.0, 20.0, 20.0, 11.0, 11.0, 11.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-234.2310791015625, -226.9092254638672, -219.5873565673828, -212.2655029296875, -204.9436492919922, -197.62179565429688, -190.2999267578125, -182.9780731201172, -175.65621948242188, -168.33436584472656, -161.0124969482422, -153.69064331054688, -146.36878967285156, -139.04693603515625, -131.72506713867188, -124.40321350097656, -117.08134460449219, -109.75948333740234, -102.43762969970703, -95.11576843261719, -87.79391479492188, -80.47205352783203, -73.15019226074219, -65.82833862304688, -58.50647735595703, -51.18461990356445, -43.862762451171875, -36.54090118408203, -29.219043731689453, -21.897186279296875, -14.575325012207031, -7.253467559814453, 0.068389892578125, 7.3902482986450195, 14.712106704711914, 22.033966064453125, 29.355823516845703, 36.67768096923828, 43.999542236328125, 51.3213996887207, 58.64325714111328, 65.96511840820312, 73.28697204589844, 80.60883331298828, 87.93069458007812, 95.25254821777344, 102.57440948486328, 109.89627075195312, 117.21812438964844, 124.53998565673828, 131.86184692382812, 139.18370056152344, 146.50555419921875, 153.82742309570312, 161.14927673339844, 168.47113037109375, 175.79299926757812, 183.11485290527344, 190.4367218017578, 197.75857543945312, 205.08042907714844, 212.40228271484375, 219.72415161132812, 227.04600524902344, 234.36785888671875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 3.0, 7.0, 11.0, 31.0, 34.0, 71.0, 140.0, 277.0, 634.0, 2362.0, 22997.0, 4010357.0, 148918.0, 6440.0, 1168.0, 386.0, 185.0, 110.0, 67.0, 25.0, 18.0, 13.0, 8.0, 3.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.6875, -68.86279296875, -67.0380859375, -65.21337890625, -63.388671875, -61.56396484375, -59.7392578125, -57.91455078125, -56.08984375, -54.26513671875, -52.4404296875, -50.61572265625, -48.791015625, -46.96630859375, -45.1416015625, -43.31689453125, -41.4921875, -39.66748046875, -37.8427734375, -36.01806640625, -34.193359375, -32.36865234375, -30.5439453125, -28.71923828125, -26.89453125, -25.06982421875, -23.2451171875, -21.42041015625, -19.595703125, -17.77099609375, -15.9462890625, -14.12158203125, -12.296875, -10.47216796875, -8.6474609375, -6.82275390625, -4.998046875, -3.17333984375, -1.3486328125, 0.47607421875, 2.30078125, 4.12548828125, 5.9501953125, 7.77490234375, 9.599609375, 11.42431640625, 13.2490234375, 15.07373046875, 16.8984375, 18.72314453125, 20.5478515625, 22.37255859375, 24.197265625, 26.02197265625, 27.8466796875, 29.67138671875, 31.49609375, 33.32080078125, 35.1455078125, 36.97021484375, 38.794921875, 40.61962890625, 42.4443359375, 44.26904296875, 46.09375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 12.0, 11.0, 23.0, 36.0, 64.0, 100.0, 101.0, 129.0, 139.0, 108.0, 97.0, 80.0, 46.0, 17.0, 16.0, 10.0, 9.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4140625, -13.043212890625, -12.67236328125, -12.301513671875, -11.9306640625, -11.559814453125, -11.18896484375, -10.818115234375, -10.447265625, -10.076416015625, -9.70556640625, -9.334716796875, -8.9638671875, -8.593017578125, -8.22216796875, -7.851318359375, -7.48046875, -7.109619140625, -6.73876953125, -6.367919921875, -5.9970703125, -5.626220703125, -5.25537109375, -4.884521484375, -4.513671875, -4.142822265625, -3.77197265625, -3.401123046875, -3.0302734375, -2.659423828125, -2.28857421875, -1.917724609375, -1.546875, -1.176025390625, -0.80517578125, -0.434326171875, -0.0634765625, 0.307373046875, 0.67822265625, 1.049072265625, 1.419921875, 1.790771484375, 2.16162109375, 2.532470703125, 2.9033203125, 3.274169921875, 3.64501953125, 4.015869140625, 4.38671875, 4.757568359375, 5.12841796875, 5.499267578125, 5.8701171875, 6.240966796875, 6.61181640625, 6.982666015625, 7.353515625, 7.724365234375, 8.09521484375, 8.466064453125, 8.8369140625, 9.207763671875, 9.57861328125, 9.949462890625, 10.3203125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 8.0, 10.0, 18.0, 20.0, 23.0, 38.0, 57.0, 94.0, 135.0, 206.0, 356.0, 526.0, 865.0, 1395.0, 2375.0, 4226.0, 8353.0, 20228.0, 63935.0, 424350.0, 3384045.0, 209973.0, 43681.0, 14849.0, 6550.0, 3334.0, 1791.0, 1040.0, 660.0, 404.0, 249.0, 159.0, 102.0, 84.0, 49.0, 31.0, 25.0, 12.0, 8.0, 5.0, 9.0, 0.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.34375, -16.7529296875, -16.162109375, -15.5712890625, -14.98046875, -14.3896484375, -13.798828125, -13.2080078125, -12.6171875, -12.0263671875, -11.435546875, -10.8447265625, -10.25390625, -9.6630859375, -9.072265625, -8.4814453125, -7.890625, -7.2998046875, -6.708984375, -6.1181640625, -5.52734375, -4.9365234375, -4.345703125, -3.7548828125, -3.1640625, -2.5732421875, -1.982421875, -1.3916015625, -0.80078125, -0.2099609375, 0.380859375, 0.9716796875, 1.5625, 2.1533203125, 2.744140625, 3.3349609375, 3.92578125, 4.5166015625, 5.107421875, 5.6982421875, 6.2890625, 6.8798828125, 7.470703125, 8.0615234375, 8.65234375, 9.2431640625, 9.833984375, 10.4248046875, 11.015625, 11.6064453125, 12.197265625, 12.7880859375, 13.37890625, 13.9697265625, 14.560546875, 15.1513671875, 15.7421875, 16.3330078125, 16.923828125, 17.5146484375, 18.10546875, 18.6962890625, 19.287109375, 19.8779296875, 20.46875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 2.0, 2.0, 10.0, 9.0, 8.0, 17.0, 23.0, 27.0, 40.0, 66.0, 115.0, 329.0, 1552.0, 1245.0, 301.0, 125.0, 70.0, 38.0, 22.0, 19.0, 11.0, 4.0, 6.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4453125, -10.084716796875, -9.72412109375, -9.363525390625, -9.0029296875, -8.642333984375, -8.28173828125, -7.921142578125, -7.560546875, -7.199951171875, -6.83935546875, -6.478759765625, -6.1181640625, -5.757568359375, -5.39697265625, -5.036376953125, -4.67578125, -4.315185546875, -3.95458984375, -3.593994140625, -3.2333984375, -2.872802734375, -2.51220703125, -2.151611328125, -1.791015625, -1.430419921875, -1.06982421875, -0.709228515625, -0.3486328125, 0.011962890625, 0.37255859375, 0.733154296875, 1.09375, 1.454345703125, 1.81494140625, 2.175537109375, 2.5361328125, 2.896728515625, 3.25732421875, 3.617919921875, 3.978515625, 4.339111328125, 4.69970703125, 5.060302734375, 5.4208984375, 5.781494140625, 6.14208984375, 6.502685546875, 6.86328125, 7.223876953125, 7.58447265625, 7.945068359375, 8.3056640625, 8.666259765625, 9.02685546875, 9.387451171875, 9.748046875, 10.108642578125, 10.46923828125, 10.829833984375, 11.1904296875, 11.551025390625, 11.91162109375, 12.272216796875, 12.6328125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 9.0, 21.0, 34.0, 103.0, 167.0, 213.0, 216.0, 118.0, 63.0, 27.0, 8.0, 9.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.47527313232422, -110.83724212646484, -108.19921112060547, -105.56117248535156, -102.92314147949219, -100.28511047363281, -97.64707946777344, -95.00904846191406, -92.37100982666016, -89.73297882080078, -87.0949478149414, -84.4569091796875, -81.81887817382812, -79.18084716796875, -76.54281616210938, -73.90478515625, -71.26675415039062, -68.62872314453125, -65.99069213867188, -63.352657318115234, -60.714622497558594, -58.07659149169922, -55.438560485839844, -52.8005256652832, -50.16249084472656, -47.52445983886719, -44.88642501831055, -42.24839401245117, -39.61035919189453, -36.972328186035156, -34.33429718017578, -31.69626235961914, -29.058223724365234, -26.420190811157227, -23.78215789794922, -21.144126892089844, -18.506092071533203, -15.868060111999512, -13.23002815246582, -10.591995239257812, -7.953962326049805, -5.315929412841797, -2.6778969764709473, -0.039864540100097656, 2.59816837310791, 5.236201286315918, 7.874233245849609, 10.512266159057617, 13.150299072265625, 15.788331985473633, 18.42636489868164, 21.064395904541016, 23.702430725097656, 26.34046173095703, 28.97849464416504, 31.616527557373047, 34.25456237792969, 36.89259338378906, 39.5306282043457, 42.16865921020508, 44.80669403076172, 47.444725036621094, 50.08275604248047, 52.72079086303711, 55.358821868896484]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 11.0, 8.0, 16.0, 27.0, 29.0, 43.0, 56.0, 50.0, 57.0, 86.0, 84.0, 71.0, 84.0, 85.0, 49.0, 51.0, 53.0, 39.0, 32.0, 24.0, 20.0, 5.0, 6.0, 10.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.36634063720703, -43.465248107910156, -41.564151763916016, -39.66305923461914, -37.761966705322266, -35.860870361328125, -33.95977783203125, -32.058685302734375, -30.1575927734375, -28.256498336791992, -26.355405807495117, -24.45431137084961, -22.553218841552734, -20.652124404907227, -18.75102996826172, -16.849937438964844, -14.948843002319336, -13.047749519348145, -11.146656036376953, -9.245561599731445, -7.344468593597412, -5.4433746337890625, -3.542281150817871, -1.6411876678466797, 0.2599058151245117, 2.160999298095703, 4.0620927810668945, 5.963186740875244, 7.8642802238464355, 9.765374183654785, 11.666467666625977, 13.567561149597168, 15.46865463256836, 17.369749069213867, 19.270841598510742, 21.17193603515625, 23.073028564453125, 24.974123001098633, 26.87521743774414, 28.776309967041016, 30.67740249633789, 32.578495025634766, 34.479591369628906, 36.38068389892578, 38.281776428222656, 40.18286895751953, 42.08396530151367, 43.98505783081055, 45.88615417480469, 47.78724670410156, 49.6883430480957, 51.58943557739258, 53.49052810668945, 55.391624450683594, 57.29271697998047, 59.193809509277344, 61.09490203857422, 62.995994567871094, 64.89708709716797, 66.79817962646484, 68.69927978515625, 70.60037231445312, 72.50146484375, 74.40255737304688, 76.30364990234375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 5.0, 16.0, 21.0, 41.0, 40.0, 48.0, 106.0, 156.0, 278.0, 477.0, 904.0, 2042.0, 5413.0, 17244.0, 69043.0, 323204.0, 470384.0, 118967.0, 26853.0, 7821.0, 2853.0, 1180.0, 567.0, 299.0, 184.0, 121.0, 81.0, 59.0, 38.0, 25.0, 25.0, 13.0, 15.0, 6.0, 2.0, 2.0, 7.0, 1.0, 4.0, 1.0], "bins": [-36.40625, -35.5, -34.59375, -33.6875, -32.78125, -31.875, -30.96875, -30.0625, -29.15625, -28.25, -27.34375, -26.4375, -25.53125, -24.625, -23.71875, -22.8125, -21.90625, -21.0, -20.09375, -19.1875, -18.28125, -17.375, -16.46875, -15.5625, -14.65625, -13.75, -12.84375, -11.9375, -11.03125, -10.125, -9.21875, -8.3125, -7.40625, -6.5, -5.59375, -4.6875, -3.78125, -2.875, -1.96875, -1.0625, -0.15625, 0.75, 1.65625, 2.5625, 3.46875, 4.375, 5.28125, 6.1875, 7.09375, 8.0, 8.90625, 9.8125, 10.71875, 11.625, 12.53125, 13.4375, 14.34375, 15.25, 16.15625, 17.0625, 17.96875, 18.875, 19.78125, 20.6875, 21.59375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 9.0, 10.0, 15.0, 30.0, 35.0, 55.0, 72.0, 92.0, 120.0, 114.0, 93.0, 84.0, 79.0, 54.0, 49.0, 33.0, 21.0, 13.0, 6.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.46875, -8.1734619140625, -7.878173828125, -7.5828857421875, -7.28759765625, -6.9923095703125, -6.697021484375, -6.4017333984375, -6.1064453125, -5.8111572265625, -5.515869140625, -5.2205810546875, -4.92529296875, -4.6300048828125, -4.334716796875, -4.0394287109375, -3.744140625, -3.4488525390625, -3.153564453125, -2.8582763671875, -2.56298828125, -2.2677001953125, -1.972412109375, -1.6771240234375, -1.3818359375, -1.0865478515625, -0.791259765625, -0.4959716796875, -0.20068359375, 0.0946044921875, 0.389892578125, 0.6851806640625, 0.98046875, 1.2757568359375, 1.571044921875, 1.8663330078125, 2.16162109375, 2.4569091796875, 2.752197265625, 3.0474853515625, 3.3427734375, 3.6380615234375, 3.933349609375, 4.2286376953125, 4.52392578125, 4.8192138671875, 5.114501953125, 5.4097900390625, 5.705078125, 6.0003662109375, 6.295654296875, 6.5909423828125, 6.88623046875, 7.1815185546875, 7.476806640625, 7.7720947265625, 8.0673828125, 8.3626708984375, 8.657958984375, 8.9532470703125, 9.24853515625, 9.5438232421875, 9.839111328125, 10.1343994140625, 10.4296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 0.0, 4.0, 3.0, 2.0, 9.0, 11.0, 8.0, 19.0, 22.0, 60.0, 75.0, 91.0, 149.0, 211.0, 469.0, 892.0, 2459.0, 13534.0, 249439.0, 735675.0, 38351.0, 4458.0, 1231.0, 603.0, 299.0, 189.0, 84.0, 70.0, 40.0, 31.0, 33.0, 13.0, 9.0, 6.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.125, -49.3125, -47.5, -45.6875, -43.875, -42.0625, -40.25, -38.4375, -36.625, -34.8125, -33.0, -31.1875, -29.375, -27.5625, -25.75, -23.9375, -22.125, -20.3125, -18.5, -16.6875, -14.875, -13.0625, -11.25, -9.4375, -7.625, -5.8125, -4.0, -2.1875, -0.375, 1.4375, 3.25, 5.0625, 6.875, 8.6875, 10.5, 12.3125, 14.125, 15.9375, 17.75, 19.5625, 21.375, 23.1875, 25.0, 26.8125, 28.625, 30.4375, 32.25, 34.0625, 35.875, 37.6875, 39.5, 41.3125, 43.125, 44.9375, 46.75, 48.5625, 50.375, 52.1875, 54.0, 55.8125, 57.625, 59.4375, 61.25, 63.0625, 64.875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 12.0, 16.0, 13.0, 18.0, 20.0, 28.0, 38.0, 31.0, 52.0, 66.0, 65.0, 71.0, 72.0, 78.0, 70.0, 60.0, 60.0, 45.0, 40.0, 26.0, 38.0, 18.0, 11.0, 12.0, 9.0, 9.0, 3.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.796875, -28.646240234375, -27.49560546875, -26.344970703125, -25.1943359375, -24.043701171875, -22.89306640625, -21.742431640625, -20.591796875, -19.441162109375, -18.29052734375, -17.139892578125, -15.9892578125, -14.838623046875, -13.68798828125, -12.537353515625, -11.38671875, -10.236083984375, -9.08544921875, -7.934814453125, -6.7841796875, -5.633544921875, -4.48291015625, -3.332275390625, -2.181640625, -1.031005859375, 0.11962890625, 1.270263671875, 2.4208984375, 3.571533203125, 4.72216796875, 5.872802734375, 7.0234375, 8.174072265625, 9.32470703125, 10.475341796875, 11.6259765625, 12.776611328125, 13.92724609375, 15.077880859375, 16.228515625, 17.379150390625, 18.52978515625, 19.680419921875, 20.8310546875, 21.981689453125, 23.13232421875, 24.282958984375, 25.43359375, 26.584228515625, 27.73486328125, 28.885498046875, 30.0361328125, 31.186767578125, 32.33740234375, 33.488037109375, 34.638671875, 35.789306640625, 36.93994140625, 38.090576171875, 39.2412109375, 40.391845703125, 41.54248046875, 42.693115234375, 43.84375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 7.0, 11.0, 14.0, 17.0, 15.0, 38.0, 47.0, 69.0, 110.0, 165.0, 352.0, 685.0, 1622.0, 4716.0, 18614.0, 129128.0, 736618.0, 129749.0, 18679.0, 4649.0, 1668.0, 702.0, 336.0, 168.0, 112.0, 73.0, 43.0, 30.0, 20.0, 19.0, 12.0, 8.0, 11.0, 8.0, 6.0, 3.0, 3.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.703125, -17.10302734375, -16.5029296875, -15.90283203125, -15.302734375, -14.70263671875, -14.1025390625, -13.50244140625, -12.90234375, -12.30224609375, -11.7021484375, -11.10205078125, -10.501953125, -9.90185546875, -9.3017578125, -8.70166015625, -8.1015625, -7.50146484375, -6.9013671875, -6.30126953125, -5.701171875, -5.10107421875, -4.5009765625, -3.90087890625, -3.30078125, -2.70068359375, -2.1005859375, -1.50048828125, -0.900390625, -0.30029296875, 0.2998046875, 0.89990234375, 1.5, 2.10009765625, 2.7001953125, 3.30029296875, 3.900390625, 4.50048828125, 5.1005859375, 5.70068359375, 6.30078125, 6.90087890625, 7.5009765625, 8.10107421875, 8.701171875, 9.30126953125, 9.9013671875, 10.50146484375, 11.1015625, 11.70166015625, 12.3017578125, 12.90185546875, 13.501953125, 14.10205078125, 14.7021484375, 15.30224609375, 15.90234375, 16.50244140625, 17.1025390625, 17.70263671875, 18.302734375, 18.90283203125, 19.5029296875, 20.10302734375, 20.703125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 7.0, 20.0, 27.0, 27.0, 50.0, 90.0, 144.0, 221.0, 165.0, 108.0, 58.0, 28.0, 17.0, 18.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003009796142578125, -0.002931833267211914, -0.002853870391845703, -0.002775907516479492, -0.0026979446411132812, -0.0026199817657470703, -0.0025420188903808594, -0.0024640560150146484, -0.0023860931396484375, -0.0023081302642822266, -0.0022301673889160156, -0.0021522045135498047, -0.0020742416381835938, -0.001996278762817383, -0.0019183158874511719, -0.001840353012084961, -0.00176239013671875, -0.001684427261352539, -0.0016064643859863281, -0.0015285015106201172, -0.0014505386352539062, -0.0013725757598876953, -0.0012946128845214844, -0.0012166500091552734, -0.0011386871337890625, -0.0010607242584228516, -0.0009827613830566406, -0.0009047985076904297, -0.0008268356323242188, -0.0007488727569580078, -0.0006709098815917969, -0.0005929470062255859, -0.000514984130859375, -0.00043702125549316406, -0.0003590583801269531, -0.0002810955047607422, -0.00020313262939453125, -0.0001251697540283203, -4.7206878662109375e-05, 3.075599670410156e-05, 0.0001087188720703125, 0.00018668174743652344, 0.0002646446228027344, 0.0003426074981689453, 0.00042057037353515625, 0.0004985332489013672, 0.0005764961242675781, 0.0006544589996337891, 0.000732421875, 0.0008103847503662109, 0.0008883476257324219, 0.0009663105010986328, 0.0010442733764648438, 0.0011222362518310547, 0.0012001991271972656, 0.0012781620025634766, 0.0013561248779296875, 0.0014340877532958984, 0.0015120506286621094, 0.0015900135040283203, 0.0016679763793945312, 0.0017459392547607422, 0.0018239021301269531, 0.001901865005493164, 0.001979827880859375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 9.0, 8.0, 4.0, 9.0, 16.0, 34.0, 43.0, 56.0, 110.0, 270.0, 587.0, 1826.0, 10776.0, 374528.0, 643117.0, 13671.0, 2212.0, 709.0, 263.0, 128.0, 63.0, 38.0, 23.0, 17.0, 8.0, 12.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-44.84375, -43.564453125, -42.28515625, -41.005859375, -39.7265625, -38.447265625, -37.16796875, -35.888671875, -34.609375, -33.330078125, -32.05078125, -30.771484375, -29.4921875, -28.212890625, -26.93359375, -25.654296875, -24.375, -23.095703125, -21.81640625, -20.537109375, -19.2578125, -17.978515625, -16.69921875, -15.419921875, -14.140625, -12.861328125, -11.58203125, -10.302734375, -9.0234375, -7.744140625, -6.46484375, -5.185546875, -3.90625, -2.626953125, -1.34765625, -0.068359375, 1.2109375, 2.490234375, 3.76953125, 5.048828125, 6.328125, 7.607421875, 8.88671875, 10.166015625, 11.4453125, 12.724609375, 14.00390625, 15.283203125, 16.5625, 17.841796875, 19.12109375, 20.400390625, 21.6796875, 22.958984375, 24.23828125, 25.517578125, 26.796875, 28.076171875, 29.35546875, 30.634765625, 31.9140625, 33.193359375, 34.47265625, 35.751953125, 37.03125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 8.0, 17.0, 21.0, 42.0, 55.0, 108.0, 198.0, 215.0, 128.0, 72.0, 43.0, 25.0, 16.0, 9.0, 9.0, 11.0, 5.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.96875, -23.2001953125, -22.431640625, -21.6630859375, -20.89453125, -20.1259765625, -19.357421875, -18.5888671875, -17.8203125, -17.0517578125, -16.283203125, -15.5146484375, -14.74609375, -13.9775390625, -13.208984375, -12.4404296875, -11.671875, -10.9033203125, -10.134765625, -9.3662109375, -8.59765625, -7.8291015625, -7.060546875, -6.2919921875, -5.5234375, -4.7548828125, -3.986328125, -3.2177734375, -2.44921875, -1.6806640625, -0.912109375, -0.1435546875, 0.625, 1.3935546875, 2.162109375, 2.9306640625, 3.69921875, 4.4677734375, 5.236328125, 6.0048828125, 6.7734375, 7.5419921875, 8.310546875, 9.0791015625, 9.84765625, 10.6162109375, 11.384765625, 12.1533203125, 12.921875, 13.6904296875, 14.458984375, 15.2275390625, 15.99609375, 16.7646484375, 17.533203125, 18.3017578125, 19.0703125, 19.8388671875, 20.607421875, 21.3759765625, 22.14453125, 22.9130859375, 23.681640625, 24.4501953125, 25.21875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 11.0, 30.0, 153.0, 394.0, 295.0, 92.0, 18.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-475.1171569824219, -459.5964050292969, -444.07568359375, -428.554931640625, -413.0341796875, -397.513427734375, -381.99267578125, -366.4719543457031, -350.9512023925781, -335.4304504394531, -319.90972900390625, -304.38897705078125, -288.86822509765625, -273.34747314453125, -257.82672119140625, -242.30599975585938, -226.78524780273438, -211.26449584960938, -195.74375915527344, -180.2230224609375, -164.7022705078125, -149.1815185546875, -133.66078186035156, -118.1400375366211, -102.61929321289062, -87.09854888916016, -71.57780456542969, -56.05706024169922, -40.53631591796875, -25.01557159423828, -9.494827270507812, 6.025917053222656, 21.546630859375, 37.06737518310547, 52.58811950683594, 68.1088638305664, 83.62960815429688, 99.15035247802734, 114.67109680175781, 130.19183349609375, 145.71258544921875, 161.23333740234375, 176.7540740966797, 192.27481079101562, 207.79556274414062, 223.31631469726562, 238.83705139160156, 254.3577880859375, 269.8785400390625, 285.3992919921875, 300.9200439453125, 316.4407653808594, 331.9615173339844, 347.4822692871094, 363.00299072265625, 378.52374267578125, 394.04449462890625, 409.56524658203125, 425.08599853515625, 440.6067199707031, 456.1274719238281, 471.6482238769531, 487.1689453125, 502.689697265625, 518.21044921875]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 8.0, 12.0, 8.0, 7.0, 8.0, 11.0, 12.0, 15.0, 18.0, 14.0, 25.0, 32.0, 28.0, 36.0, 44.0, 39.0, 43.0, 58.0, 50.0, 51.0, 40.0, 29.0, 35.0, 43.0, 29.0, 48.0, 34.0, 30.0, 30.0, 17.0, 21.0, 19.0, 17.0, 19.0, 14.0, 6.0, 8.0, 12.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.11732482910156, -114.18535614013672, -110.25337982177734, -106.3214111328125, -102.38943481445312, -98.45746612548828, -94.5254898071289, -90.59352111816406, -86.66154479980469, -82.72957611083984, -78.79759979248047, -74.86563110351562, -70.93365478515625, -67.0016860961914, -63.06970977783203, -59.13774108886719, -55.20576858520508, -51.27379608154297, -47.34182357788086, -43.40985107421875, -39.47787857055664, -35.54590606689453, -31.613935470581055, -27.681962966918945, -23.749990463256836, -19.818017959594727, -15.886045455932617, -11.954073905944824, -8.022101402282715, -4.090129852294922, -0.1581573486328125, 3.773815155029297, 7.705787658691406, 11.637760162353516, 15.569732666015625, 19.501705169677734, 23.433677673339844, 27.36564826965332, 31.29762077331543, 35.229591369628906, 39.16156768798828, 43.09354019165039, 47.0255126953125, 50.95748519897461, 54.88945770263672, 58.82142639160156, 62.75340270996094, 66.68537139892578, 70.61734008789062, 74.54930877685547, 78.48128509521484, 82.41325378417969, 86.34523010253906, 90.2771987915039, 94.20917510986328, 98.14114379882812, 102.0731201171875, 106.00508880615234, 109.93706512451172, 113.86903381347656, 117.80101013183594, 121.73297882080078, 125.66495513916016, 129.596923828125, 133.52890014648438]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 2.0, 7.0, 3.0, 7.0, 9.0, 5.0, 10.0, 19.0, 24.0, 51.0, 102.0, 135.0, 354.0, 811.0, 2256.0, 8637.0, 78753.0, 3945293.0, 140226.0, 12526.0, 3034.0, 1058.0, 443.0, 215.0, 114.0, 78.0, 36.0, 27.0, 14.0, 9.0, 11.0, 4.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.0625, -34.53369140625, -33.0048828125, -31.47607421875, -29.947265625, -28.41845703125, -26.8896484375, -25.36083984375, -23.83203125, -22.30322265625, -20.7744140625, -19.24560546875, -17.716796875, -16.18798828125, -14.6591796875, -13.13037109375, -11.6015625, -10.07275390625, -8.5439453125, -7.01513671875, -5.486328125, -3.95751953125, -2.4287109375, -0.89990234375, 0.62890625, 2.15771484375, 3.6865234375, 5.21533203125, 6.744140625, 8.27294921875, 9.8017578125, 11.33056640625, 12.859375, 14.38818359375, 15.9169921875, 17.44580078125, 18.974609375, 20.50341796875, 22.0322265625, 23.56103515625, 25.08984375, 26.61865234375, 28.1474609375, 29.67626953125, 31.205078125, 32.73388671875, 34.2626953125, 35.79150390625, 37.3203125, 38.84912109375, 40.3779296875, 41.90673828125, 43.435546875, 44.96435546875, 46.4931640625, 48.02197265625, 49.55078125, 51.07958984375, 52.6083984375, 54.13720703125, 55.666015625, 57.19482421875, 58.7236328125, 60.25244140625, 61.78125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 5.0, 17.0, 19.0, 34.0, 56.0, 67.0, 92.0, 89.0, 125.0, 109.0, 91.0, 72.0, 64.0, 59.0, 37.0, 22.0, 16.0, 10.0, 4.0, 2.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.359375, -10.01513671875, -9.6708984375, -9.32666015625, -8.982421875, -8.63818359375, -8.2939453125, -7.94970703125, -7.60546875, -7.26123046875, -6.9169921875, -6.57275390625, -6.228515625, -5.88427734375, -5.5400390625, -5.19580078125, -4.8515625, -4.50732421875, -4.1630859375, -3.81884765625, -3.474609375, -3.13037109375, -2.7861328125, -2.44189453125, -2.09765625, -1.75341796875, -1.4091796875, -1.06494140625, -0.720703125, -0.37646484375, -0.0322265625, 0.31201171875, 0.65625, 1.00048828125, 1.3447265625, 1.68896484375, 2.033203125, 2.37744140625, 2.7216796875, 3.06591796875, 3.41015625, 3.75439453125, 4.0986328125, 4.44287109375, 4.787109375, 5.13134765625, 5.4755859375, 5.81982421875, 6.1640625, 6.50830078125, 6.8525390625, 7.19677734375, 7.541015625, 7.88525390625, 8.2294921875, 8.57373046875, 8.91796875, 9.26220703125, 9.6064453125, 9.95068359375, 10.294921875, 10.63916015625, 10.9833984375, 11.32763671875, 11.671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 6.0, 4.0, 12.0, 19.0, 25.0, 36.0, 55.0, 73.0, 142.0, 180.0, 330.0, 543.0, 1132.0, 2349.0, 5603.0, 15407.0, 55795.0, 425033.0, 3368872.0, 256490.0, 41344.0, 12145.0, 4451.0, 1991.0, 928.0, 516.0, 251.0, 176.0, 93.0, 83.0, 55.0, 46.0, 39.0, 15.0, 11.0, 9.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.015625, -22.3466796875, -21.677734375, -21.0087890625, -20.33984375, -19.6708984375, -19.001953125, -18.3330078125, -17.6640625, -16.9951171875, -16.326171875, -15.6572265625, -14.98828125, -14.3193359375, -13.650390625, -12.9814453125, -12.3125, -11.6435546875, -10.974609375, -10.3056640625, -9.63671875, -8.9677734375, -8.298828125, -7.6298828125, -6.9609375, -6.2919921875, -5.623046875, -4.9541015625, -4.28515625, -3.6162109375, -2.947265625, -2.2783203125, -1.609375, -0.9404296875, -0.271484375, 0.3974609375, 1.06640625, 1.7353515625, 2.404296875, 3.0732421875, 3.7421875, 4.4111328125, 5.080078125, 5.7490234375, 6.41796875, 7.0869140625, 7.755859375, 8.4248046875, 9.09375, 9.7626953125, 10.431640625, 11.1005859375, 11.76953125, 12.4384765625, 13.107421875, 13.7763671875, 14.4453125, 15.1142578125, 15.783203125, 16.4521484375, 17.12109375, 17.7900390625, 18.458984375, 19.1279296875, 19.796875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 8.0, 8.0, 13.0, 23.0, 26.0, 37.0, 55.0, 104.0, 227.0, 465.0, 1524.0, 940.0, 322.0, 135.0, 56.0, 30.0, 22.0, 17.0, 12.0, 9.0, 5.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8828125, -9.4493408203125, -9.015869140625, -8.5823974609375, -8.14892578125, -7.7154541015625, -7.281982421875, -6.8485107421875, -6.4150390625, -5.9815673828125, -5.548095703125, -5.1146240234375, -4.68115234375, -4.2476806640625, -3.814208984375, -3.3807373046875, -2.947265625, -2.5137939453125, -2.080322265625, -1.6468505859375, -1.21337890625, -0.7799072265625, -0.346435546875, 0.0870361328125, 0.5205078125, 0.9539794921875, 1.387451171875, 1.8209228515625, 2.25439453125, 2.6878662109375, 3.121337890625, 3.5548095703125, 3.98828125, 4.4217529296875, 4.855224609375, 5.2886962890625, 5.72216796875, 6.1556396484375, 6.589111328125, 7.0225830078125, 7.4560546875, 7.8895263671875, 8.322998046875, 8.7564697265625, 9.18994140625, 9.6234130859375, 10.056884765625, 10.4903564453125, 10.923828125, 11.3572998046875, 11.790771484375, 12.2242431640625, 12.65771484375, 13.0911865234375, 13.524658203125, 13.9581298828125, 14.3916015625, 14.8250732421875, 15.258544921875, 15.6920166015625, 16.12548828125, 16.5589599609375, 16.992431640625, 17.4259033203125, 17.859375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 40.0, 267.0, 555.0, 133.0, 9.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-496.1182556152344, -487.1654357910156, -478.212646484375, -469.25982666015625, -460.3070068359375, -451.3542175292969, -442.4013977050781, -433.4486083984375, -424.49578857421875, -415.54296875, -406.5901794433594, -397.6373596191406, -388.6845703125, -379.73175048828125, -370.7789306640625, -361.8261413574219, -352.8733215332031, -343.9205017089844, -334.96771240234375, -326.014892578125, -317.06207275390625, -308.1092834472656, -299.1564636230469, -290.20367431640625, -281.2508544921875, -272.29803466796875, -263.3452453613281, -254.39242553710938, -245.4396209716797, -236.48681640625, -227.53399658203125, -218.58119201660156, -209.62835693359375, -200.67555236816406, -191.72274780273438, -182.76992797851562, -173.81712341308594, -164.86431884765625, -155.9114990234375, -146.9586944580078, -138.00588989257812, -129.05308532714844, -120.10027313232422, -111.1474609375, -102.19465637207031, -93.24185180664062, -84.2890396118164, -75.33622741699219, -66.3834228515625, -57.43061447143555, -48.477806091308594, -39.52499771118164, -30.572189331054688, -21.619380950927734, -12.666572570800781, -3.713764190673828, 5.239044189453125, 14.191852569580078, 23.14466094970703, 32.097469329833984, 41.05027770996094, 50.00308609008789, 58.955894470214844, 67.90870666503906, 76.86151123046875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 10.0, 11.0, 25.0, 25.0, 32.0, 39.0, 63.0, 62.0, 78.0, 63.0, 80.0, 84.0, 88.0, 73.0, 56.0, 42.0, 43.0, 41.0, 31.0, 15.0, 12.0, 11.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.04608154296875, -69.70710754394531, -67.3681411743164, -65.02916717529297, -62.69019317626953, -60.35122299194336, -58.01225280761719, -55.67327880859375, -53.33430862426758, -50.995338439941406, -48.65636444091797, -46.3173942565918, -43.978424072265625, -41.63945007324219, -39.300479888916016, -36.961509704589844, -34.622535705566406, -32.283565521240234, -29.944591522216797, -27.605621337890625, -25.26664924621582, -22.927677154541016, -20.588706970214844, -18.24973487854004, -15.910762786865234, -13.57179069519043, -11.232819557189941, -8.893848419189453, -6.554876327514648, -4.215904235839844, -1.8769330978393555, 0.4620380401611328, 2.8010101318359375, 5.139981746673584, 7.4789533615112305, 9.817924499511719, 12.156896591186523, 14.495868682861328, 16.8348388671875, 19.173810958862305, 21.51278305053711, 23.851755142211914, 26.19072723388672, 28.52969741821289, 30.868669509887695, 33.2076416015625, 35.54661178588867, 37.885581970214844, 40.22455596923828, 42.56352615356445, 44.90250015258789, 47.24147033691406, 49.5804443359375, 51.91941452026367, 54.258384704589844, 56.59735870361328, 58.93632888793945, 61.275299072265625, 63.61427307128906, 65.9532470703125, 68.2922134399414, 70.63118743896484, 72.97016143798828, 75.30912780761719, 77.64810180664062]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 5.0, 5.0, 6.0, 18.0, 14.0, 29.0, 29.0, 46.0, 89.0, 153.0, 245.0, 541.0, 1081.0, 2689.0, 7718.0, 29562.0, 158703.0, 676857.0, 133172.0, 26135.0, 6964.0, 2385.0, 991.0, 470.0, 260.0, 143.0, 84.0, 50.0, 27.0, 33.0, 12.0, 12.0, 10.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.84375, -35.7744140625, -34.705078125, -33.6357421875, -32.56640625, -31.4970703125, -30.427734375, -29.3583984375, -28.2890625, -27.2197265625, -26.150390625, -25.0810546875, -24.01171875, -22.9423828125, -21.873046875, -20.8037109375, -19.734375, -18.6650390625, -17.595703125, -16.5263671875, -15.45703125, -14.3876953125, -13.318359375, -12.2490234375, -11.1796875, -10.1103515625, -9.041015625, -7.9716796875, -6.90234375, -5.8330078125, -4.763671875, -3.6943359375, -2.625, -1.5556640625, -0.486328125, 0.5830078125, 1.65234375, 2.7216796875, 3.791015625, 4.8603515625, 5.9296875, 6.9990234375, 8.068359375, 9.1376953125, 10.20703125, 11.2763671875, 12.345703125, 13.4150390625, 14.484375, 15.5537109375, 16.623046875, 17.6923828125, 18.76171875, 19.8310546875, 20.900390625, 21.9697265625, 23.0390625, 24.1083984375, 25.177734375, 26.2470703125, 27.31640625, 28.3857421875, 29.455078125, 30.5244140625, 31.59375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 12.0, 14.0, 26.0, 34.0, 49.0, 71.0, 85.0, 92.0, 114.0, 93.0, 78.0, 67.0, 59.0, 53.0, 52.0, 29.0, 23.0, 13.0, 10.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66015625, -7.35711669921875, -7.0540771484375, -6.75103759765625, -6.447998046875, -6.14495849609375, -5.8419189453125, -5.53887939453125, -5.23583984375, -4.93280029296875, -4.6297607421875, -4.32672119140625, -4.023681640625, -3.72064208984375, -3.4176025390625, -3.11456298828125, -2.8115234375, -2.50848388671875, -2.2054443359375, -1.90240478515625, -1.599365234375, -1.29632568359375, -0.9932861328125, -0.69024658203125, -0.38720703125, -0.08416748046875, 0.2188720703125, 0.52191162109375, 0.824951171875, 1.12799072265625, 1.4310302734375, 1.73406982421875, 2.037109375, 2.34014892578125, 2.6431884765625, 2.94622802734375, 3.249267578125, 3.55230712890625, 3.8553466796875, 4.15838623046875, 4.46142578125, 4.76446533203125, 5.0675048828125, 5.37054443359375, 5.673583984375, 5.97662353515625, 6.2796630859375, 6.58270263671875, 6.8857421875, 7.18878173828125, 7.4918212890625, 7.79486083984375, 8.097900390625, 8.40093994140625, 8.7039794921875, 9.00701904296875, 9.31005859375, 9.61309814453125, 9.9161376953125, 10.21917724609375, 10.522216796875, 10.82525634765625, 11.1282958984375, 11.43133544921875, 11.734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 14.0, 5.0, 13.0, 12.0, 19.0, 32.0, 37.0, 62.0, 97.0, 178.0, 252.0, 486.0, 1081.0, 3408.0, 22455.0, 804491.0, 202134.0, 9835.0, 2158.0, 817.0, 368.0, 183.0, 118.0, 90.0, 56.0, 38.0, 26.0, 24.0, 16.0, 11.0, 13.0, 4.0, 6.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-89.3125, -86.951171875, -84.58984375, -82.228515625, -79.8671875, -77.505859375, -75.14453125, -72.783203125, -70.421875, -68.060546875, -65.69921875, -63.337890625, -60.9765625, -58.615234375, -56.25390625, -53.892578125, -51.53125, -49.169921875, -46.80859375, -44.447265625, -42.0859375, -39.724609375, -37.36328125, -35.001953125, -32.640625, -30.279296875, -27.91796875, -25.556640625, -23.1953125, -20.833984375, -18.47265625, -16.111328125, -13.75, -11.388671875, -9.02734375, -6.666015625, -4.3046875, -1.943359375, 0.41796875, 2.779296875, 5.140625, 7.501953125, 9.86328125, 12.224609375, 14.5859375, 16.947265625, 19.30859375, 21.669921875, 24.03125, 26.392578125, 28.75390625, 31.115234375, 33.4765625, 35.837890625, 38.19921875, 40.560546875, 42.921875, 45.283203125, 47.64453125, 50.005859375, 52.3671875, 54.728515625, 57.08984375, 59.451171875, 61.8125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 15.0, 7.0, 14.0, 26.0, 37.0, 61.0, 52.0, 80.0, 99.0, 97.0, 108.0, 73.0, 77.0, 70.0, 52.0, 44.0, 26.0, 16.0, 8.0, 7.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.28125, -61.57421875, -59.8671875, -58.16015625, -56.453125, -54.74609375, -53.0390625, -51.33203125, -49.625, -47.91796875, -46.2109375, -44.50390625, -42.796875, -41.08984375, -39.3828125, -37.67578125, -35.96875, -34.26171875, -32.5546875, -30.84765625, -29.140625, -27.43359375, -25.7265625, -24.01953125, -22.3125, -20.60546875, -18.8984375, -17.19140625, -15.484375, -13.77734375, -12.0703125, -10.36328125, -8.65625, -6.94921875, -5.2421875, -3.53515625, -1.828125, -0.12109375, 1.5859375, 3.29296875, 5.0, 6.70703125, 8.4140625, 10.12109375, 11.828125, 13.53515625, 15.2421875, 16.94921875, 18.65625, 20.36328125, 22.0703125, 23.77734375, 25.484375, 27.19140625, 28.8984375, 30.60546875, 32.3125, 34.01953125, 35.7265625, 37.43359375, 39.140625, 40.84765625, 42.5546875, 44.26171875, 45.96875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 10.0, 10.0, 9.0, 6.0, 16.0, 12.0, 21.0, 24.0, 51.0, 58.0, 108.0, 197.0, 522.0, 1707.0, 11522.0, 602631.0, 418914.0, 10108.0, 1619.0, 498.0, 206.0, 111.0, 47.0, 32.0, 22.0, 19.0, 18.0, 17.0, 8.0, 7.0, 6.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.90625, -35.5869140625, -34.267578125, -32.9482421875, -31.62890625, -30.3095703125, -28.990234375, -27.6708984375, -26.3515625, -25.0322265625, -23.712890625, -22.3935546875, -21.07421875, -19.7548828125, -18.435546875, -17.1162109375, -15.796875, -14.4775390625, -13.158203125, -11.8388671875, -10.51953125, -9.2001953125, -7.880859375, -6.5615234375, -5.2421875, -3.9228515625, -2.603515625, -1.2841796875, 0.03515625, 1.3544921875, 2.673828125, 3.9931640625, 5.3125, 6.6318359375, 7.951171875, 9.2705078125, 10.58984375, 11.9091796875, 13.228515625, 14.5478515625, 15.8671875, 17.1865234375, 18.505859375, 19.8251953125, 21.14453125, 22.4638671875, 23.783203125, 25.1025390625, 26.421875, 27.7412109375, 29.060546875, 30.3798828125, 31.69921875, 33.0185546875, 34.337890625, 35.6572265625, 36.9765625, 38.2958984375, 39.615234375, 40.9345703125, 42.25390625, 43.5732421875, 44.892578125, 46.2119140625, 47.53125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 10.0, 9.0, 18.0, 24.0, 27.0, 36.0, 70.0, 207.0, 276.0, 112.0, 48.0, 32.0, 29.0, 22.0, 19.0, 11.0, 14.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.002384185791015625, -0.002318471670150757, -0.0022527575492858887, -0.0021870434284210205, -0.0021213293075561523, -0.002055615186691284, -0.001989901065826416, -0.0019241869449615479, -0.0018584728240966797, -0.0017927587032318115, -0.0017270445823669434, -0.0016613304615020752, -0.001595616340637207, -0.0015299022197723389, -0.0014641880989074707, -0.0013984739780426025, -0.0013327598571777344, -0.0012670457363128662, -0.001201331615447998, -0.0011356174945831299, -0.0010699033737182617, -0.0010041892528533936, -0.0009384751319885254, -0.0008727610111236572, -0.0008070468902587891, -0.0007413327693939209, -0.0006756186485290527, -0.0006099045276641846, -0.0005441904067993164, -0.00047847628593444824, -0.0004127621650695801, -0.0003470480442047119, -0.00028133392333984375, -0.00021561980247497559, -0.00014990568161010742, -8.419156074523926e-05, -1.8477439880371094e-05, 4.723668098449707e-05, 0.00011295080184936523, 0.0001786649227142334, 0.00024437904357910156, 0.0003100931644439697, 0.0003758072853088379, 0.00044152140617370605, 0.0005072355270385742, 0.0005729496479034424, 0.0006386637687683105, 0.0007043778896331787, 0.0007700920104980469, 0.000835806131362915, 0.0009015202522277832, 0.0009672343730926514, 0.0010329484939575195, 0.0010986626148223877, 0.0011643767356872559, 0.001230090856552124, 0.0012958049774169922, 0.0013615190982818604, 0.0014272332191467285, 0.0014929473400115967, 0.0015586614608764648, 0.001624375581741333, 0.0016900897026062012, 0.0017558038234710693, 0.0018215179443359375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 5.0, 3.0, 4.0, 13.0, 12.0, 15.0, 30.0, 34.0, 58.0, 81.0, 224.0, 544.0, 2543.0, 30045.0, 995003.0, 17199.0, 1883.0, 432.0, 176.0, 73.0, 57.0, 36.0, 20.0, 14.0, 14.0, 5.0, 11.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.5, -56.44140625, -54.3828125, -52.32421875, -50.265625, -48.20703125, -46.1484375, -44.08984375, -42.03125, -39.97265625, -37.9140625, -35.85546875, -33.796875, -31.73828125, -29.6796875, -27.62109375, -25.5625, -23.50390625, -21.4453125, -19.38671875, -17.328125, -15.26953125, -13.2109375, -11.15234375, -9.09375, -7.03515625, -4.9765625, -2.91796875, -0.859375, 1.19921875, 3.2578125, 5.31640625, 7.375, 9.43359375, 11.4921875, 13.55078125, 15.609375, 17.66796875, 19.7265625, 21.78515625, 23.84375, 25.90234375, 27.9609375, 30.01953125, 32.078125, 34.13671875, 36.1953125, 38.25390625, 40.3125, 42.37109375, 44.4296875, 46.48828125, 48.546875, 50.60546875, 52.6640625, 54.72265625, 56.78125, 58.83984375, 60.8984375, 62.95703125, 65.015625, 67.07421875, 69.1328125, 71.19140625, 73.25]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 11.0, 21.0, 34.0, 134.0, 390.0, 261.0, 65.0, 23.0, 14.0, 8.0, 5.0, 3.0, 2.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.21875, -47.916015625, -46.61328125, -45.310546875, -44.0078125, -42.705078125, -41.40234375, -40.099609375, -38.796875, -37.494140625, -36.19140625, -34.888671875, -33.5859375, -32.283203125, -30.98046875, -29.677734375, -28.375, -27.072265625, -25.76953125, -24.466796875, -23.1640625, -21.861328125, -20.55859375, -19.255859375, -17.953125, -16.650390625, -15.34765625, -14.044921875, -12.7421875, -11.439453125, -10.13671875, -8.833984375, -7.53125, -6.228515625, -4.92578125, -3.623046875, -2.3203125, -1.017578125, 0.28515625, 1.587890625, 2.890625, 4.193359375, 5.49609375, 6.798828125, 8.1015625, 9.404296875, 10.70703125, 12.009765625, 13.3125, 14.615234375, 15.91796875, 17.220703125, 18.5234375, 19.826171875, 21.12890625, 22.431640625, 23.734375, 25.037109375, 26.33984375, 27.642578125, 28.9453125, 30.248046875, 31.55078125, 32.853515625, 34.15625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 11.0, 21.0, 110.0, 341.0, 352.0, 119.0, 27.0, 13.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-666.03369140625, -650.8236083984375, -635.6135864257812, -620.4035034179688, -605.1934204101562, -589.9833374023438, -574.7733154296875, -559.563232421875, -544.3531494140625, -529.14306640625, -513.9330444335938, -498.72296142578125, -483.51287841796875, -468.3028259277344, -453.0927429199219, -437.8826904296875, -422.672607421875, -407.4625549316406, -392.2524719238281, -377.04241943359375, -361.83233642578125, -346.6222839355469, -331.4122009277344, -316.2021484375, -300.9920959472656, -285.78204345703125, -270.57196044921875, -255.3618927001953, -240.15182495117188, -224.9417724609375, -209.731689453125, -194.52163696289062, -179.31155395507812, -164.1014862060547, -148.89141845703125, -133.6813507080078, -118.47128295898438, -103.26122283935547, -88.05115509033203, -72.8410873413086, -57.631019592285156, -42.42095184326172, -27.210886001586914, -12.00082015991211, 3.209247589111328, 18.4193115234375, 33.62937927246094, 48.839447021484375, 64.04951477050781, 79.25958251953125, 94.46965026855469, 109.67971801757812, 124.88978576660156, 140.099853515625, 155.30990600585938, 170.51998901367188, 185.73004150390625, 200.9401092529297, 216.15017700195312, 231.36024475097656, 246.5703125, 261.7803649902344, 276.9904479980469, 292.20050048828125, 307.41058349609375]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 6.0, 14.0, 23.0, 21.0, 25.0, 37.0, 48.0, 54.0, 69.0, 73.0, 79.0, 73.0, 79.0, 76.0, 65.0, 60.0, 61.0, 33.0, 33.0, 20.0, 20.0, 16.0, 10.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-277.38763427734375, -269.22467041015625, -261.06170654296875, -252.8987274169922, -244.73574829101562, -236.57278442382812, -228.40982055664062, -220.24685668945312, -212.08387756347656, -203.92091369628906, -195.7579345703125, -187.594970703125, -179.4320068359375, -171.26902770996094, -163.10606384277344, -154.94308471679688, -146.78012084960938, -138.61715698242188, -130.4541778564453, -122.29121398925781, -114.12824249267578, -105.96527099609375, -97.80230712890625, -89.63933563232422, -81.47636413574219, -73.31339263916016, -65.15042114257812, -56.987457275390625, -48.824485778808594, -40.66151428222656, -32.4985466003418, -24.33557891845703, -16.172637939453125, -8.009668350219727, 0.15330123901367188, 8.31627082824707, 16.47924041748047, 24.6422119140625, 32.805179595947266, 40.96814727783203, 49.13111877441406, 57.294090270996094, 65.45706176757812, 73.62002563476562, 81.78299713134766, 89.94596862792969, 98.10893249511719, 106.27190399169922, 114.43487548828125, 122.59784698486328, 130.7608184814453, 138.9237823486328, 147.08676147460938, 155.24972534179688, 163.41268920898438, 171.57565307617188, 179.73863220214844, 187.90159606933594, 196.0645751953125, 204.2275390625, 212.3905029296875, 220.55348205566406, 228.71644592285156, 236.87942504882812, 245.04238891601562]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 21.0, 20.0, 32.0, 60.0, 117.0, 215.0, 546.0, 1700.0, 7023.0, 55037.0, 3926251.0, 185501.0, 13085.0, 2992.0, 911.0, 355.0, 166.0, 76.0, 47.0, 35.0, 26.0, 8.0, 18.0, 9.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.09375, -52.27099609375, -50.4482421875, -48.62548828125, -46.802734375, -44.97998046875, -43.1572265625, -41.33447265625, -39.51171875, -37.68896484375, -35.8662109375, -34.04345703125, -32.220703125, -30.39794921875, -28.5751953125, -26.75244140625, -24.9296875, -23.10693359375, -21.2841796875, -19.46142578125, -17.638671875, -15.81591796875, -13.9931640625, -12.17041015625, -10.34765625, -8.52490234375, -6.7021484375, -4.87939453125, -3.056640625, -1.23388671875, 0.5888671875, 2.41162109375, 4.234375, 6.05712890625, 7.8798828125, 9.70263671875, 11.525390625, 13.34814453125, 15.1708984375, 16.99365234375, 18.81640625, 20.63916015625, 22.4619140625, 24.28466796875, 26.107421875, 27.93017578125, 29.7529296875, 31.57568359375, 33.3984375, 35.22119140625, 37.0439453125, 38.86669921875, 40.689453125, 42.51220703125, 44.3349609375, 46.15771484375, 47.98046875, 49.80322265625, 51.6259765625, 53.44873046875, 55.271484375, 57.09423828125, 58.9169921875, 60.73974609375, 62.5625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 13.0, 19.0, 31.0, 49.0, 78.0, 95.0, 119.0, 113.0, 119.0, 97.0, 67.0, 69.0, 54.0, 28.0, 16.0, 14.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.703125, -11.2666015625, -10.830078125, -10.3935546875, -9.95703125, -9.5205078125, -9.083984375, -8.6474609375, -8.2109375, -7.7744140625, -7.337890625, -6.9013671875, -6.46484375, -6.0283203125, -5.591796875, -5.1552734375, -4.71875, -4.2822265625, -3.845703125, -3.4091796875, -2.97265625, -2.5361328125, -2.099609375, -1.6630859375, -1.2265625, -0.7900390625, -0.353515625, 0.0830078125, 0.51953125, 0.9560546875, 1.392578125, 1.8291015625, 2.265625, 2.7021484375, 3.138671875, 3.5751953125, 4.01171875, 4.4482421875, 4.884765625, 5.3212890625, 5.7578125, 6.1943359375, 6.630859375, 7.0673828125, 7.50390625, 7.9404296875, 8.376953125, 8.8134765625, 9.25, 9.6865234375, 10.123046875, 10.5595703125, 10.99609375, 11.4326171875, 11.869140625, 12.3056640625, 12.7421875, 13.1787109375, 13.615234375, 14.0517578125, 14.48828125, 14.9248046875, 15.361328125, 15.7978515625, 16.234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 9.0, 18.0, 21.0, 25.0, 43.0, 51.0, 80.0, 122.0, 193.0, 374.0, 756.0, 1632.0, 4269.0, 13420.0, 67380.0, 3025597.0, 1018817.0, 45613.0, 9958.0, 3266.0, 1320.0, 586.0, 253.0, 165.0, 131.0, 62.0, 44.0, 20.0, 16.0, 13.0, 10.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.890625, -29.822021484375, -28.75341796875, -27.684814453125, -26.6162109375, -25.547607421875, -24.47900390625, -23.410400390625, -22.341796875, -21.273193359375, -20.20458984375, -19.135986328125, -18.0673828125, -16.998779296875, -15.93017578125, -14.861572265625, -13.79296875, -12.724365234375, -11.65576171875, -10.587158203125, -9.5185546875, -8.449951171875, -7.38134765625, -6.312744140625, -5.244140625, -4.175537109375, -3.10693359375, -2.038330078125, -0.9697265625, 0.098876953125, 1.16748046875, 2.236083984375, 3.3046875, 4.373291015625, 5.44189453125, 6.510498046875, 7.5791015625, 8.647705078125, 9.71630859375, 10.784912109375, 11.853515625, 12.922119140625, 13.99072265625, 15.059326171875, 16.1279296875, 17.196533203125, 18.26513671875, 19.333740234375, 20.40234375, 21.470947265625, 22.53955078125, 23.608154296875, 24.6767578125, 25.745361328125, 26.81396484375, 27.882568359375, 28.951171875, 30.019775390625, 31.08837890625, 32.156982421875, 33.2255859375, 34.294189453125, 35.36279296875, 36.431396484375, 37.5]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 5.0, 7.0, 12.0, 13.0, 11.0, 25.0, 30.0, 54.0, 160.0, 365.0, 1961.0, 1036.0, 210.0, 91.0, 39.0, 18.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.296875, -21.7073974609375, -21.117919921875, -20.5284423828125, -19.93896484375, -19.3494873046875, -18.760009765625, -18.1705322265625, -17.5810546875, -16.9915771484375, -16.402099609375, -15.8126220703125, -15.22314453125, -14.6336669921875, -14.044189453125, -13.4547119140625, -12.865234375, -12.2757568359375, -11.686279296875, -11.0968017578125, -10.50732421875, -9.9178466796875, -9.328369140625, -8.7388916015625, -8.1494140625, -7.5599365234375, -6.970458984375, -6.3809814453125, -5.79150390625, -5.2020263671875, -4.612548828125, -4.0230712890625, -3.43359375, -2.8441162109375, -2.254638671875, -1.6651611328125, -1.07568359375, -0.4862060546875, 0.103271484375, 0.6927490234375, 1.2822265625, 1.8717041015625, 2.461181640625, 3.0506591796875, 3.64013671875, 4.2296142578125, 4.819091796875, 5.4085693359375, 5.998046875, 6.5875244140625, 7.177001953125, 7.7664794921875, 8.35595703125, 8.9454345703125, 9.534912109375, 10.1243896484375, 10.7138671875, 11.3033447265625, 11.892822265625, 12.4822998046875, 13.07177734375, 13.6612548828125, 14.250732421875, 14.8402099609375, 15.4296875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 8.0, 20.0, 69.0, 468.0, 406.0, 34.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-537.8612060546875, -527.7481079101562, -517.635009765625, -507.5219421386719, -497.4088439941406, -487.2957458496094, -477.1826477050781, -467.069580078125, -456.95648193359375, -446.8433837890625, -436.73028564453125, -426.6172180175781, -416.5041198730469, -406.3910217285156, -396.2779235839844, -386.16485595703125, -376.0517578125, -365.93865966796875, -355.8255615234375, -345.7124938964844, -335.5993957519531, -325.4862976074219, -315.3731994628906, -305.2601318359375, -295.1470031738281, -285.0339050292969, -274.9208068847656, -264.8077392578125, -254.69464111328125, -244.58154296875, -234.46844482421875, -224.35536193847656, -214.24227905273438, -204.12918090820312, -194.01609802246094, -183.9029998779297, -173.7899169921875, -163.67681884765625, -153.563720703125, -143.4506378173828, -133.33755493164062, -123.2244644165039, -113.11137390136719, -102.99827575683594, -92.88519287109375, -82.7720947265625, -72.65900421142578, -62.54591369628906, -52.43281555175781, -42.319725036621094, -32.206634521484375, -22.09354019165039, -11.980449676513672, -1.8673591613769531, 8.245735168457031, 18.35882568359375, 28.47191619873047, 38.58500671386719, 48.698097229003906, 58.81119155883789, 68.92428588867188, 79.03736877441406, 89.15046691894531, 99.26355743408203, 109.37664794921875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 15.0, 14.0, 13.0, 26.0, 27.0, 49.0, 53.0, 54.0, 70.0, 70.0, 48.0, 71.0, 61.0, 70.0, 59.0, 70.0, 50.0, 40.0, 30.0, 20.0, 21.0, 21.0, 15.0, 12.0, 3.0, 4.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.38117218017578, -48.9798583984375, -46.57854461669922, -44.17722702026367, -41.77591323852539, -39.37459945678711, -36.97328186035156, -34.57196807861328, -32.170654296875, -29.76934051513672, -27.368024826049805, -24.96670913696289, -22.56539535522461, -20.164081573486328, -17.762765884399414, -15.3614501953125, -12.960136413574219, -10.558821678161621, -8.157506942749023, -5.756192207336426, -3.354877471923828, -0.9535627365112305, 1.4477519989013672, 3.8490676879882812, 6.2503814697265625, 8.65169620513916, 11.053010940551758, 13.454325675964355, 15.855640411376953, 18.256954193115234, 20.65826988220215, 23.059585571289062, 25.460899353027344, 27.862213134765625, 30.26352882385254, 32.66484451293945, 35.066158294677734, 37.467472076416016, 39.86878967285156, 42.270103454589844, 44.671417236328125, 47.072731018066406, 49.47404479980469, 51.875362396240234, 54.276676177978516, 56.6779899597168, 59.079307556152344, 61.480621337890625, 63.881935119628906, 66.28324890136719, 68.68456268310547, 71.08587646484375, 73.48719787597656, 75.88851165771484, 78.28982543945312, 80.6911392211914, 83.09245300292969, 85.49376678466797, 87.89508056640625, 90.29639434814453, 92.69770812988281, 95.09902954101562, 97.5003433227539, 99.90165710449219, 102.30297088623047]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 11.0, 10.0, 21.0, 34.0, 83.0, 119.0, 236.0, 536.0, 1394.0, 7985.0, 89819.0, 834715.0, 102340.0, 8645.0, 1551.0, 490.0, 253.0, 124.0, 90.0, 29.0, 23.0, 20.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-49.71875, -48.03466796875, -46.3505859375, -44.66650390625, -42.982421875, -41.29833984375, -39.6142578125, -37.93017578125, -36.24609375, -34.56201171875, -32.8779296875, -31.19384765625, -29.509765625, -27.82568359375, -26.1416015625, -24.45751953125, -22.7734375, -21.08935546875, -19.4052734375, -17.72119140625, -16.037109375, -14.35302734375, -12.6689453125, -10.98486328125, -9.30078125, -7.61669921875, -5.9326171875, -4.24853515625, -2.564453125, -0.88037109375, 0.8037109375, 2.48779296875, 4.171875, 5.85595703125, 7.5400390625, 9.22412109375, 10.908203125, 12.59228515625, 14.2763671875, 15.96044921875, 17.64453125, 19.32861328125, 21.0126953125, 22.69677734375, 24.380859375, 26.06494140625, 27.7490234375, 29.43310546875, 31.1171875, 32.80126953125, 34.4853515625, 36.16943359375, 37.853515625, 39.53759765625, 41.2216796875, 42.90576171875, 44.58984375, 46.27392578125, 47.9580078125, 49.64208984375, 51.326171875, 53.01025390625, 54.6943359375, 56.37841796875, 58.0625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 11.0, 23.0, 50.0, 63.0, 77.0, 93.0, 106.0, 127.0, 113.0, 87.0, 75.0, 63.0, 46.0, 25.0, 14.0, 10.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6796875, -11.2398681640625, -10.800048828125, -10.3602294921875, -9.92041015625, -9.4805908203125, -9.040771484375, -8.6009521484375, -8.1611328125, -7.7213134765625, -7.281494140625, -6.8416748046875, -6.40185546875, -5.9620361328125, -5.522216796875, -5.0823974609375, -4.642578125, -4.2027587890625, -3.762939453125, -3.3231201171875, -2.88330078125, -2.4434814453125, -2.003662109375, -1.5638427734375, -1.1240234375, -0.6842041015625, -0.244384765625, 0.1954345703125, 0.63525390625, 1.0750732421875, 1.514892578125, 1.9547119140625, 2.39453125, 2.8343505859375, 3.274169921875, 3.7139892578125, 4.15380859375, 4.5936279296875, 5.033447265625, 5.4732666015625, 5.9130859375, 6.3529052734375, 6.792724609375, 7.2325439453125, 7.67236328125, 8.1121826171875, 8.552001953125, 8.9918212890625, 9.431640625, 9.8714599609375, 10.311279296875, 10.7510986328125, 11.19091796875, 11.6307373046875, 12.070556640625, 12.5103759765625, 12.9501953125, 13.3900146484375, 13.829833984375, 14.2696533203125, 14.70947265625, 15.1492919921875, 15.589111328125, 16.0289306640625, 16.46875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 1.0, 4.0, 9.0, 10.0, 7.0, 19.0, 29.0, 44.0, 51.0, 107.0, 114.0, 200.0, 379.0, 750.0, 1722.0, 5243.0, 20166.0, 115303.0, 688017.0, 177085.0, 28364.0, 6713.0, 2166.0, 930.0, 406.0, 242.0, 152.0, 101.0, 62.0, 47.0, 24.0, 28.0, 21.0, 10.0, 7.0, 5.0, 9.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.90625, -24.9677734375, -24.029296875, -23.0908203125, -22.15234375, -21.2138671875, -20.275390625, -19.3369140625, -18.3984375, -17.4599609375, -16.521484375, -15.5830078125, -14.64453125, -13.7060546875, -12.767578125, -11.8291015625, -10.890625, -9.9521484375, -9.013671875, -8.0751953125, -7.13671875, -6.1982421875, -5.259765625, -4.3212890625, -3.3828125, -2.4443359375, -1.505859375, -0.5673828125, 0.37109375, 1.3095703125, 2.248046875, 3.1865234375, 4.125, 5.0634765625, 6.001953125, 6.9404296875, 7.87890625, 8.8173828125, 9.755859375, 10.6943359375, 11.6328125, 12.5712890625, 13.509765625, 14.4482421875, 15.38671875, 16.3251953125, 17.263671875, 18.2021484375, 19.140625, 20.0791015625, 21.017578125, 21.9560546875, 22.89453125, 23.8330078125, 24.771484375, 25.7099609375, 26.6484375, 27.5869140625, 28.525390625, 29.4638671875, 30.40234375, 31.3408203125, 32.279296875, 33.2177734375, 34.15625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 7.0, 15.0, 10.0, 8.0, 20.0, 20.0, 26.0, 27.0, 41.0, 33.0, 42.0, 57.0, 36.0, 59.0, 60.0, 46.0, 52.0, 50.0, 50.0, 57.0, 54.0, 31.0, 38.0, 25.0, 35.0, 14.0, 18.0, 17.0, 12.0, 5.0, 10.0, 5.0, 6.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.859375, -23.845947265625, -22.83251953125, -21.819091796875, -20.8056640625, -19.792236328125, -18.77880859375, -17.765380859375, -16.751953125, -15.738525390625, -14.72509765625, -13.711669921875, -12.6982421875, -11.684814453125, -10.67138671875, -9.657958984375, -8.64453125, -7.631103515625, -6.61767578125, -5.604248046875, -4.5908203125, -3.577392578125, -2.56396484375, -1.550537109375, -0.537109375, 0.476318359375, 1.48974609375, 2.503173828125, 3.5166015625, 4.530029296875, 5.54345703125, 6.556884765625, 7.5703125, 8.583740234375, 9.59716796875, 10.610595703125, 11.6240234375, 12.637451171875, 13.65087890625, 14.664306640625, 15.677734375, 16.691162109375, 17.70458984375, 18.718017578125, 19.7314453125, 20.744873046875, 21.75830078125, 22.771728515625, 23.78515625, 24.798583984375, 25.81201171875, 26.825439453125, 27.8388671875, 28.852294921875, 29.86572265625, 30.879150390625, 31.892578125, 32.906005859375, 33.91943359375, 34.932861328125, 35.9462890625, 36.959716796875, 37.97314453125, 38.986572265625, 40.0]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 12.0, 11.0, 12.0, 12.0, 28.0, 33.0, 36.0, 78.0, 138.0, 265.0, 696.0, 2009.0, 7006.0, 42690.0, 729287.0, 240968.0, 18826.0, 4173.0, 1300.0, 479.0, 193.0, 125.0, 60.0, 37.0, 18.0, 18.0, 13.0, 10.0, 8.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.25, -17.7796630859375, -17.309326171875, -16.8389892578125, -16.36865234375, -15.8983154296875, -15.427978515625, -14.9576416015625, -14.4873046875, -14.0169677734375, -13.546630859375, -13.0762939453125, -12.60595703125, -12.1356201171875, -11.665283203125, -11.1949462890625, -10.724609375, -10.2542724609375, -9.783935546875, -9.3135986328125, -8.84326171875, -8.3729248046875, -7.902587890625, -7.4322509765625, -6.9619140625, -6.4915771484375, -6.021240234375, -5.5509033203125, -5.08056640625, -4.6102294921875, -4.139892578125, -3.6695556640625, -3.19921875, -2.7288818359375, -2.258544921875, -1.7882080078125, -1.31787109375, -0.8475341796875, -0.377197265625, 0.0931396484375, 0.5634765625, 1.0338134765625, 1.504150390625, 1.9744873046875, 2.44482421875, 2.9151611328125, 3.385498046875, 3.8558349609375, 4.326171875, 4.7965087890625, 5.266845703125, 5.7371826171875, 6.20751953125, 6.6778564453125, 7.148193359375, 7.6185302734375, 8.0888671875, 8.5592041015625, 9.029541015625, 9.4998779296875, 9.97021484375, 10.4405517578125, 10.910888671875, 11.3812255859375, 11.8515625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 5.0, 5.0, 11.0, 5.0, 10.0, 12.0, 8.0, 12.0, 29.0, 28.0, 34.0, 56.0, 116.0, 230.0, 180.0, 97.0, 46.0, 27.0, 18.0, 16.0, 6.0, 8.0, 5.0, 8.0, 7.0, 4.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010776519775390625, -0.0010389834642410278, -0.0010003149509429932, -0.0009616464376449585, -0.0009229779243469238, -0.0008843094110488892, -0.0008456408977508545, -0.0008069723844528198, -0.0007683038711547852, -0.0007296353578567505, -0.0006909668445587158, -0.0006522983312606812, -0.0006136298179626465, -0.0005749613046646118, -0.0005362927913665771, -0.0004976242780685425, -0.0004589557647705078, -0.00042028725147247314, -0.0003816187381744385, -0.0003429502248764038, -0.00030428171157836914, -0.00026561319828033447, -0.0002269446849822998, -0.00018827617168426514, -0.00014960765838623047, -0.0001109391450881958, -7.227063179016113e-05, -3.3602118492126465e-05, 5.066394805908203e-06, 4.373490810394287e-05, 8.240342140197754e-05, 0.00012107193470001221, 0.00015974044799804688, 0.00019840896129608154, 0.0002370774745941162, 0.0002757459878921509, 0.00031441450119018555, 0.0003530830144882202, 0.0003917515277862549, 0.00043042004108428955, 0.0004690885543823242, 0.0005077570676803589, 0.0005464255809783936, 0.0005850940942764282, 0.0006237626075744629, 0.0006624311208724976, 0.0007010996341705322, 0.0007397681474685669, 0.0007784366607666016, 0.0008171051740646362, 0.0008557736873626709, 0.0008944422006607056, 0.0009331107139587402, 0.0009717792272567749, 0.0010104477405548096, 0.0010491162538528442, 0.001087784767150879, 0.0011264532804489136, 0.0011651217937469482, 0.001203790307044983, 0.0012424588203430176, 0.0012811273336410522, 0.001319795846939087, 0.0013584643602371216, 0.0013971328735351562]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 10.0, 8.0, 14.0, 16.0, 23.0, 30.0, 45.0, 80.0, 101.0, 199.0, 402.0, 1063.0, 4192.0, 29390.0, 698476.0, 293617.0, 16540.0, 2745.0, 803.0, 302.0, 162.0, 113.0, 70.0, 46.0, 24.0, 24.0, 16.0, 12.0, 16.0, 10.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.796875, -10.30322265625, -9.8095703125, -9.31591796875, -8.822265625, -8.32861328125, -7.8349609375, -7.34130859375, -6.84765625, -6.35400390625, -5.8603515625, -5.36669921875, -4.873046875, -4.37939453125, -3.8857421875, -3.39208984375, -2.8984375, -2.40478515625, -1.9111328125, -1.41748046875, -0.923828125, -0.43017578125, 0.0634765625, 0.55712890625, 1.05078125, 1.54443359375, 2.0380859375, 2.53173828125, 3.025390625, 3.51904296875, 4.0126953125, 4.50634765625, 5.0, 5.49365234375, 5.9873046875, 6.48095703125, 6.974609375, 7.46826171875, 7.9619140625, 8.45556640625, 8.94921875, 9.44287109375, 9.9365234375, 10.43017578125, 10.923828125, 11.41748046875, 11.9111328125, 12.40478515625, 12.8984375, 13.39208984375, 13.8857421875, 14.37939453125, 14.873046875, 15.36669921875, 15.8603515625, 16.35400390625, 16.84765625, 17.34130859375, 17.8349609375, 18.32861328125, 18.822265625, 19.31591796875, 19.8095703125, 20.30322265625, 20.796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 11.0, 23.0, 29.0, 48.0, 62.0, 115.0, 155.0, 169.0, 131.0, 103.0, 54.0, 30.0, 25.0, 10.0, 15.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.375, -8.916015625, -8.45703125, -7.998046875, -7.5390625, -7.080078125, -6.62109375, -6.162109375, -5.703125, -5.244140625, -4.78515625, -4.326171875, -3.8671875, -3.408203125, -2.94921875, -2.490234375, -2.03125, -1.572265625, -1.11328125, -0.654296875, -0.1953125, 0.263671875, 0.72265625, 1.181640625, 1.640625, 2.099609375, 2.55859375, 3.017578125, 3.4765625, 3.935546875, 4.39453125, 4.853515625, 5.3125, 5.771484375, 6.23046875, 6.689453125, 7.1484375, 7.607421875, 8.06640625, 8.525390625, 8.984375, 9.443359375, 9.90234375, 10.361328125, 10.8203125, 11.279296875, 11.73828125, 12.197265625, 12.65625, 13.115234375, 13.57421875, 14.033203125, 14.4921875, 14.951171875, 15.41015625, 15.869140625, 16.328125, 16.787109375, 17.24609375, 17.705078125, 18.1640625, 18.623046875, 19.08203125, 19.541015625, 20.0]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 23.0, 47.0, 200.0, 411.0, 238.0, 67.0, 17.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-601.9779663085938, -588.9923706054688, -576.0067138671875, -563.0211181640625, -550.0355224609375, -537.0498657226562, -524.0642700195312, -511.0786437988281, -498.093017578125, -485.1073913574219, -472.1217956542969, -459.13616943359375, -446.1505432128906, -433.1649169921875, -420.1793212890625, -407.1936950683594, -394.20806884765625, -381.2224426269531, -368.2368469238281, -355.251220703125, -342.2655944824219, -329.27996826171875, -316.29437255859375, -303.3087463378906, -290.3231506347656, -277.3375244140625, -264.3519287109375, -251.36630249023438, -238.38067626953125, -225.3950653076172, -212.40945434570312, -199.423828125, -186.4381866455078, -173.45257568359375, -160.46694946289062, -147.48133850097656, -134.49571228027344, -121.51010131835938, -108.52448272705078, -95.53886413574219, -82.5532455444336, -69.567626953125, -56.582008361816406, -43.59639358520508, -30.610774993896484, -17.625160217285156, -4.6395416259765625, 8.346076965332031, 21.331695556640625, 34.31731414794922, 47.30293273925781, 60.28854751586914, 73.274169921875, 86.25978088378906, 99.24539947509766, 112.23101806640625, 125.21663665771484, 138.20225524902344, 151.1878662109375, 164.17349243164062, 177.1591033935547, 190.14471435546875, 203.13034057617188, 216.115966796875, 229.10157775878906]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 5.0, 8.0, 7.0, 11.0, 11.0, 21.0, 18.0, 33.0, 28.0, 36.0, 39.0, 50.0, 37.0, 51.0, 49.0, 49.0, 51.0, 66.0, 47.0, 43.0, 37.0, 48.0, 32.0, 43.0, 40.0, 27.0, 20.0, 17.0, 20.0, 18.0, 11.0, 8.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-174.9173126220703, -170.01104736328125, -165.10476684570312, -160.198486328125, -155.29222106933594, -150.38595581054688, -145.47967529296875, -140.57339477539062, -135.66712951660156, -130.7608642578125, -125.85458374023438, -120.94831085205078, -116.04203796386719, -111.1357650756836, -106.2294921875, -101.3232192993164, -96.41694641113281, -91.51067352294922, -86.60440063476562, -81.69812774658203, -76.79185485839844, -71.88558197021484, -66.97930908203125, -62.073036193847656, -57.16676330566406, -52.26049041748047, -47.354217529296875, -42.44794464111328, -37.54167175292969, -32.635398864746094, -27.7291259765625, -22.822853088378906, -17.916595458984375, -13.010322570800781, -8.104049682617188, -3.1977767944335938, 1.70849609375, 6.614768981933594, 11.521041870117188, 16.42731475830078, 21.333587646484375, 26.23986053466797, 31.146133422851562, 36.052406311035156, 40.95867919921875, 45.864952087402344, 50.77122497558594, 55.67749786376953, 60.583770751953125, 65.49004364013672, 70.39631652832031, 75.3025894165039, 80.2088623046875, 85.1151351928711, 90.02140808105469, 94.92768096923828, 99.83395385742188, 104.74022674560547, 109.64649963378906, 114.55277252197266, 119.45904541015625, 124.36531829833984, 129.27159118652344, 134.1778564453125, 139.08413696289062]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 18.0, 16.0, 22.0, 31.0, 44.0, 65.0, 86.0, 159.0, 282.0, 513.0, 1039.0, 2306.0, 6307.0, 20628.0, 96680.0, 3283128.0, 700244.0, 58945.0, 14618.0, 4999.0, 1974.0, 889.0, 448.0, 268.0, 166.0, 107.0, 69.0, 41.0, 45.0, 27.0, 22.0, 16.0, 13.0, 10.0, 7.0, 5.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-33.125, -32.0517578125, -30.978515625, -29.9052734375, -28.83203125, -27.7587890625, -26.685546875, -25.6123046875, -24.5390625, -23.4658203125, -22.392578125, -21.3193359375, -20.24609375, -19.1728515625, -18.099609375, -17.0263671875, -15.953125, -14.8798828125, -13.806640625, -12.7333984375, -11.66015625, -10.5869140625, -9.513671875, -8.4404296875, -7.3671875, -6.2939453125, -5.220703125, -4.1474609375, -3.07421875, -2.0009765625, -0.927734375, 0.1455078125, 1.21875, 2.2919921875, 3.365234375, 4.4384765625, 5.51171875, 6.5849609375, 7.658203125, 8.7314453125, 9.8046875, 10.8779296875, 11.951171875, 13.0244140625, 14.09765625, 15.1708984375, 16.244140625, 17.3173828125, 18.390625, 19.4638671875, 20.537109375, 21.6103515625, 22.68359375, 23.7568359375, 24.830078125, 25.9033203125, 26.9765625, 28.0498046875, 29.123046875, 30.1962890625, 31.26953125, 32.3427734375, 33.416015625, 34.4892578125, 35.5625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 7.0, 10.0, 11.0, 17.0, 46.0, 39.0, 75.0, 84.0, 100.0, 115.0, 102.0, 88.0, 93.0, 56.0, 47.0, 43.0, 25.0, 20.0, 12.0, 6.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7109375, -11.279052734375, -10.84716796875, -10.415283203125, -9.9833984375, -9.551513671875, -9.11962890625, -8.687744140625, -8.255859375, -7.823974609375, -7.39208984375, -6.960205078125, -6.5283203125, -6.096435546875, -5.66455078125, -5.232666015625, -4.80078125, -4.368896484375, -3.93701171875, -3.505126953125, -3.0732421875, -2.641357421875, -2.20947265625, -1.777587890625, -1.345703125, -0.913818359375, -0.48193359375, -0.050048828125, 0.3818359375, 0.813720703125, 1.24560546875, 1.677490234375, 2.109375, 2.541259765625, 2.97314453125, 3.405029296875, 3.8369140625, 4.268798828125, 4.70068359375, 5.132568359375, 5.564453125, 5.996337890625, 6.42822265625, 6.860107421875, 7.2919921875, 7.723876953125, 8.15576171875, 8.587646484375, 9.01953125, 9.451416015625, 9.88330078125, 10.315185546875, 10.7470703125, 11.178955078125, 11.61083984375, 12.042724609375, 12.474609375, 12.906494140625, 13.33837890625, 13.770263671875, 14.2021484375, 14.634033203125, 15.06591796875, 15.497802734375, 15.9296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 11.0, 8.0, 15.0, 18.0, 25.0, 30.0, 41.0, 47.0, 69.0, 94.0, 109.0, 185.0, 345.0, 619.0, 1258.0, 2795.0, 7422.0, 23142.0, 102035.0, 2566635.0, 1368054.0, 88858.0, 20545.0, 6732.0, 2560.0, 1136.0, 554.0, 327.0, 153.0, 119.0, 85.0, 57.0, 36.0, 34.0, 30.0, 25.0, 24.0, 11.0, 9.0, 11.0, 3.0, 5.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-29.90625, -29.025634765625, -28.14501953125, -27.264404296875, -26.3837890625, -25.503173828125, -24.62255859375, -23.741943359375, -22.861328125, -21.980712890625, -21.10009765625, -20.219482421875, -19.3388671875, -18.458251953125, -17.57763671875, -16.697021484375, -15.81640625, -14.935791015625, -14.05517578125, -13.174560546875, -12.2939453125, -11.413330078125, -10.53271484375, -9.652099609375, -8.771484375, -7.890869140625, -7.01025390625, -6.129638671875, -5.2490234375, -4.368408203125, -3.48779296875, -2.607177734375, -1.7265625, -0.845947265625, 0.03466796875, 0.915283203125, 1.7958984375, 2.676513671875, 3.55712890625, 4.437744140625, 5.318359375, 6.198974609375, 7.07958984375, 7.960205078125, 8.8408203125, 9.721435546875, 10.60205078125, 11.482666015625, 12.36328125, 13.243896484375, 14.12451171875, 15.005126953125, 15.8857421875, 16.766357421875, 17.64697265625, 18.527587890625, 19.408203125, 20.288818359375, 21.16943359375, 22.050048828125, 22.9306640625, 23.811279296875, 24.69189453125, 25.572509765625, 26.453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 9.0, 7.0, 13.0, 22.0, 45.0, 100.0, 237.0, 1181.0, 2043.0, 232.0, 82.0, 43.0, 29.0, 19.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.171875, -23.367919921875, -22.56396484375, -21.760009765625, -20.9560546875, -20.152099609375, -19.34814453125, -18.544189453125, -17.740234375, -16.936279296875, -16.13232421875, -15.328369140625, -14.5244140625, -13.720458984375, -12.91650390625, -12.112548828125, -11.30859375, -10.504638671875, -9.70068359375, -8.896728515625, -8.0927734375, -7.288818359375, -6.48486328125, -5.680908203125, -4.876953125, -4.072998046875, -3.26904296875, -2.465087890625, -1.6611328125, -0.857177734375, -0.05322265625, 0.750732421875, 1.5546875, 2.358642578125, 3.16259765625, 3.966552734375, 4.7705078125, 5.574462890625, 6.37841796875, 7.182373046875, 7.986328125, 8.790283203125, 9.59423828125, 10.398193359375, 11.2021484375, 12.006103515625, 12.81005859375, 13.614013671875, 14.41796875, 15.221923828125, 16.02587890625, 16.829833984375, 17.6337890625, 18.437744140625, 19.24169921875, 20.045654296875, 20.849609375, 21.653564453125, 22.45751953125, 23.261474609375, 24.0654296875, 24.869384765625, 25.67333984375, 26.477294921875, 27.28125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 14.0, 77.0, 375.0, 429.0, 90.0, 15.0, 4.0, 1.0, 2.0], "bins": [-420.2679443359375, -413.0373229980469, -405.8066711425781, -398.5760498046875, -391.34539794921875, -384.1147766113281, -376.8841552734375, -369.65350341796875, -362.4228820800781, -355.1922607421875, -347.96160888671875, -340.7309875488281, -333.5003356933594, -326.26971435546875, -319.0390625, -311.8084411621094, -304.57781982421875, -297.3471984863281, -290.1165466308594, -282.88592529296875, -275.6552734375, -268.4246520996094, -261.19403076171875, -253.96337890625, -246.73272705078125, -239.50209045410156, -232.27145385742188, -225.04083251953125, -217.81019592285156, -210.57955932617188, -203.3489227294922, -196.1182861328125, -188.88766479492188, -181.6570281982422, -174.4263916015625, -167.19577026367188, -159.9651336669922, -152.7344970703125, -145.5038604736328, -138.27322387695312, -131.0426025390625, -123.81196594238281, -116.58133697509766, -109.35070037841797, -102.12007141113281, -94.88943481445312, -87.65879821777344, -80.42816162109375, -73.1975326538086, -65.9668960571289, -58.73626708984375, -51.50563049316406, -44.27499771118164, -37.04436492919922, -29.81372833251953, -22.58309555053711, -15.352462768554688, -8.12182903289795, -0.8911952972412109, 6.339439392089844, 13.570072174072266, 20.800704956054688, 28.031341552734375, 35.2619743347168, 42.49260711669922]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 9.0, 7.0, 14.0, 12.0, 27.0, 21.0, 25.0, 45.0, 41.0, 42.0, 55.0, 53.0, 51.0, 71.0, 61.0, 47.0, 57.0, 49.0, 51.0, 55.0, 47.0, 28.0, 26.0, 22.0, 22.0, 12.0, 14.0, 13.0, 2.0, 3.0, 4.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.321712493896484, -50.57841873168945, -48.83512878417969, -47.091835021972656, -45.348541259765625, -43.60525131225586, -41.86195755004883, -40.11866760253906, -38.37537384033203, -36.632080078125, -34.888790130615234, -33.1454963684082, -31.402204513549805, -29.658912658691406, -27.915618896484375, -26.172327041625977, -24.429035186767578, -22.68574333190918, -20.94245147705078, -19.19915771484375, -17.45586585998535, -15.712574005126953, -13.969281196594238, -12.225988388061523, -10.482696533203125, -8.739404678344727, -6.996111869812012, -5.252819538116455, -3.5095272064208984, -1.7662353515625, -0.022942543029785156, 1.7203502655029297, 3.463642120361328, 5.206934452056885, 6.950226783752441, 8.693519592285156, 10.436811447143555, 12.180103302001953, 13.923396110534668, 15.666688919067383, 17.40998077392578, 19.15327262878418, 20.896564483642578, 22.63985824584961, 24.383150100708008, 26.126441955566406, 27.869735717773438, 29.613027572631836, 31.356319427490234, 33.099613189697266, 34.84290313720703, 36.58619689941406, 38.329490661621094, 40.07278060913086, 41.81607437133789, 43.559364318847656, 45.30265808105469, 47.04595184326172, 48.789241790771484, 50.532535552978516, 52.27582550048828, 54.01911926269531, 55.762413024902344, 57.505706787109375, 59.24899673461914]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 8.0, 18.0, 31.0, 30.0, 53.0, 84.0, 99.0, 151.0, 259.0, 500.0, 959.0, 2170.0, 6315.0, 19926.0, 75414.0, 295536.0, 465702.0, 131576.0, 33905.0, 9669.0, 3296.0, 1353.0, 571.0, 342.0, 208.0, 122.0, 64.0, 63.0, 39.0, 23.0, 15.0, 13.0, 9.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-29.109375, -28.232666015625, -27.35595703125, -26.479248046875, -25.6025390625, -24.725830078125, -23.84912109375, -22.972412109375, -22.095703125, -21.218994140625, -20.34228515625, -19.465576171875, -18.5888671875, -17.712158203125, -16.83544921875, -15.958740234375, -15.08203125, -14.205322265625, -13.32861328125, -12.451904296875, -11.5751953125, -10.698486328125, -9.82177734375, -8.945068359375, -8.068359375, -7.191650390625, -6.31494140625, -5.438232421875, -4.5615234375, -3.684814453125, -2.80810546875, -1.931396484375, -1.0546875, -0.177978515625, 0.69873046875, 1.575439453125, 2.4521484375, 3.328857421875, 4.20556640625, 5.082275390625, 5.958984375, 6.835693359375, 7.71240234375, 8.589111328125, 9.4658203125, 10.342529296875, 11.21923828125, 12.095947265625, 12.97265625, 13.849365234375, 14.72607421875, 15.602783203125, 16.4794921875, 17.356201171875, 18.23291015625, 19.109619140625, 19.986328125, 20.863037109375, 21.73974609375, 22.616455078125, 23.4931640625, 24.369873046875, 25.24658203125, 26.123291015625, 27.0]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 6.0, 15.0, 26.0, 38.0, 51.0, 69.0, 92.0, 91.0, 104.0, 104.0, 101.0, 82.0, 65.0, 49.0, 38.0, 20.0, 22.0, 11.0, 8.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.3677978515625, -10.930908203125, -10.4940185546875, -10.05712890625, -9.6202392578125, -9.183349609375, -8.7464599609375, -8.3095703125, -7.8726806640625, -7.435791015625, -6.9989013671875, -6.56201171875, -6.1251220703125, -5.688232421875, -5.2513427734375, -4.814453125, -4.3775634765625, -3.940673828125, -3.5037841796875, -3.06689453125, -2.6300048828125, -2.193115234375, -1.7562255859375, -1.3193359375, -0.8824462890625, -0.445556640625, -0.0086669921875, 0.42822265625, 0.8651123046875, 1.302001953125, 1.7388916015625, 2.17578125, 2.6126708984375, 3.049560546875, 3.4864501953125, 3.92333984375, 4.3602294921875, 4.797119140625, 5.2340087890625, 5.6708984375, 6.1077880859375, 6.544677734375, 6.9815673828125, 7.41845703125, 7.8553466796875, 8.292236328125, 8.7291259765625, 9.166015625, 9.6029052734375, 10.039794921875, 10.4766845703125, 10.91357421875, 11.3504638671875, 11.787353515625, 12.2242431640625, 12.6611328125, 13.0980224609375, 13.534912109375, 13.9718017578125, 14.40869140625, 14.8455810546875, 15.282470703125, 15.7193603515625, 16.15625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 9.0, 9.0, 23.0, 19.0, 22.0, 31.0, 54.0, 91.0, 119.0, 167.0, 295.0, 436.0, 748.0, 1482.0, 5211.0, 51155.0, 782590.0, 189290.0, 11949.0, 2345.0, 947.0, 514.0, 330.0, 221.0, 154.0, 116.0, 62.0, 46.0, 38.0, 26.0, 16.0, 14.0, 6.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-65.0625, -63.33740234375, -61.6123046875, -59.88720703125, -58.162109375, -56.43701171875, -54.7119140625, -52.98681640625, -51.26171875, -49.53662109375, -47.8115234375, -46.08642578125, -44.361328125, -42.63623046875, -40.9111328125, -39.18603515625, -37.4609375, -35.73583984375, -34.0107421875, -32.28564453125, -30.560546875, -28.83544921875, -27.1103515625, -25.38525390625, -23.66015625, -21.93505859375, -20.2099609375, -18.48486328125, -16.759765625, -15.03466796875, -13.3095703125, -11.58447265625, -9.859375, -8.13427734375, -6.4091796875, -4.68408203125, -2.958984375, -1.23388671875, 0.4912109375, 2.21630859375, 3.94140625, 5.66650390625, 7.3916015625, 9.11669921875, 10.841796875, 12.56689453125, 14.2919921875, 16.01708984375, 17.7421875, 19.46728515625, 21.1923828125, 22.91748046875, 24.642578125, 26.36767578125, 28.0927734375, 29.81787109375, 31.54296875, 33.26806640625, 34.9931640625, 36.71826171875, 38.443359375, 40.16845703125, 41.8935546875, 43.61865234375, 45.34375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 7.0, 3.0, 6.0, 14.0, 16.0, 19.0, 12.0, 23.0, 25.0, 29.0, 42.0, 33.0, 40.0, 43.0, 60.0, 65.0, 72.0, 69.0, 50.0, 44.0, 58.0, 48.0, 42.0, 33.0, 32.0, 20.0, 20.0, 9.0, 15.0, 14.0, 9.0, 6.0, 8.0, 7.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-45.28125, -44.013671875, -42.74609375, -41.478515625, -40.2109375, -38.943359375, -37.67578125, -36.408203125, -35.140625, -33.873046875, -32.60546875, -31.337890625, -30.0703125, -28.802734375, -27.53515625, -26.267578125, -25.0, -23.732421875, -22.46484375, -21.197265625, -19.9296875, -18.662109375, -17.39453125, -16.126953125, -14.859375, -13.591796875, -12.32421875, -11.056640625, -9.7890625, -8.521484375, -7.25390625, -5.986328125, -4.71875, -3.451171875, -2.18359375, -0.916015625, 0.3515625, 1.619140625, 2.88671875, 4.154296875, 5.421875, 6.689453125, 7.95703125, 9.224609375, 10.4921875, 11.759765625, 13.02734375, 14.294921875, 15.5625, 16.830078125, 18.09765625, 19.365234375, 20.6328125, 21.900390625, 23.16796875, 24.435546875, 25.703125, 26.970703125, 28.23828125, 29.505859375, 30.7734375, 32.041015625, 33.30859375, 34.576171875, 35.84375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 1.0, 0.0, 5.0, 8.0, 4.0, 8.0, 14.0, 18.0, 11.0, 33.0, 40.0, 59.0, 101.0, 158.0, 260.0, 481.0, 1001.0, 2284.0, 6416.0, 24962.0, 124529.0, 625029.0, 208753.0, 39373.0, 9376.0, 2957.0, 1303.0, 561.0, 306.0, 190.0, 99.0, 65.0, 41.0, 28.0, 23.0, 14.0, 7.0, 3.0, 5.0, 7.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-11.953125, -11.575439453125, -11.19775390625, -10.820068359375, -10.4423828125, -10.064697265625, -9.68701171875, -9.309326171875, -8.931640625, -8.553955078125, -8.17626953125, -7.798583984375, -7.4208984375, -7.043212890625, -6.66552734375, -6.287841796875, -5.91015625, -5.532470703125, -5.15478515625, -4.777099609375, -4.3994140625, -4.021728515625, -3.64404296875, -3.266357421875, -2.888671875, -2.510986328125, -2.13330078125, -1.755615234375, -1.3779296875, -1.000244140625, -0.62255859375, -0.244873046875, 0.1328125, 0.510498046875, 0.88818359375, 1.265869140625, 1.6435546875, 2.021240234375, 2.39892578125, 2.776611328125, 3.154296875, 3.531982421875, 3.90966796875, 4.287353515625, 4.6650390625, 5.042724609375, 5.42041015625, 5.798095703125, 6.17578125, 6.553466796875, 6.93115234375, 7.308837890625, 7.6865234375, 8.064208984375, 8.44189453125, 8.819580078125, 9.197265625, 9.574951171875, 9.95263671875, 10.330322265625, 10.7080078125, 11.085693359375, 11.46337890625, 11.841064453125, 12.21875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 9.0, 15.0, 20.0, 30.0, 32.0, 27.0, 62.0, 63.0, 107.0, 196.0, 135.0, 71.0, 60.0, 40.0, 31.0, 19.0, 23.0, 16.0, 13.0, 12.0, 4.0, 3.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010499954223632812, -0.000993475317955017, -0.0009369552135467529, -0.0008804351091384888, -0.0008239150047302246, -0.0007673949003219604, -0.0007108747959136963, -0.0006543546915054321, -0.000597834587097168, -0.0005413144826889038, -0.00048479437828063965, -0.0004282742738723755, -0.00037175416946411133, -0.00031523406505584717, -0.000258713960647583, -0.00020219385623931885, -0.0001456737518310547, -8.915364742279053e-05, -3.263354301452637e-05, 2.3886561393737793e-05, 8.040666580200195e-05, 0.0001369267702102661, 0.00019344687461853027, 0.00024996697902679443, 0.0003064870834350586, 0.00036300718784332275, 0.0004195272922515869, 0.0004760473966598511, 0.0005325675010681152, 0.0005890876054763794, 0.0006456077098846436, 0.0007021278142929077, 0.0007586479187011719, 0.000815168023109436, 0.0008716881275177002, 0.0009282082319259644, 0.0009847283363342285, 0.0010412484407424927, 0.0010977685451507568, 0.001154288649559021, 0.0012108087539672852, 0.0012673288583755493, 0.0013238489627838135, 0.0013803690671920776, 0.0014368891716003418, 0.001493409276008606, 0.0015499293804168701, 0.0016064494848251343, 0.0016629695892333984, 0.0017194896936416626, 0.0017760097980499268, 0.001832529902458191, 0.001889050006866455, 0.0019455701112747192, 0.0020020902156829834, 0.0020586103200912476, 0.0021151304244995117, 0.002171650528907776, 0.00222817063331604, 0.002284690737724304, 0.0023412108421325684, 0.0023977309465408325, 0.0024542510509490967, 0.002510771155357361, 0.002567291259765625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 13.0, 10.0, 18.0, 30.0, 49.0, 65.0, 100.0, 159.0, 252.0, 462.0, 944.0, 2578.0, 14024.0, 329564.0, 668263.0, 26180.0, 3321.0, 1180.0, 562.0, 267.0, 150.0, 100.0, 79.0, 50.0, 37.0, 21.0, 24.0, 11.0, 8.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.96875, -20.294921875, -19.62109375, -18.947265625, -18.2734375, -17.599609375, -16.92578125, -16.251953125, -15.578125, -14.904296875, -14.23046875, -13.556640625, -12.8828125, -12.208984375, -11.53515625, -10.861328125, -10.1875, -9.513671875, -8.83984375, -8.166015625, -7.4921875, -6.818359375, -6.14453125, -5.470703125, -4.796875, -4.123046875, -3.44921875, -2.775390625, -2.1015625, -1.427734375, -0.75390625, -0.080078125, 0.59375, 1.267578125, 1.94140625, 2.615234375, 3.2890625, 3.962890625, 4.63671875, 5.310546875, 5.984375, 6.658203125, 7.33203125, 8.005859375, 8.6796875, 9.353515625, 10.02734375, 10.701171875, 11.375, 12.048828125, 12.72265625, 13.396484375, 14.0703125, 14.744140625, 15.41796875, 16.091796875, 16.765625, 17.439453125, 18.11328125, 18.787109375, 19.4609375, 20.134765625, 20.80859375, 21.482421875, 22.15625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 19.0, 20.0, 30.0, 32.0, 41.0, 45.0, 62.0, 72.0, 86.0, 99.0, 98.0, 91.0, 67.0, 55.0, 48.0, 30.0, 17.0, 19.0, 10.0, 6.0, 7.0, 5.0, 7.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.765625, -9.369873046875, -8.97412109375, -8.578369140625, -8.1826171875, -7.786865234375, -7.39111328125, -6.995361328125, -6.599609375, -6.203857421875, -5.80810546875, -5.412353515625, -5.0166015625, -4.620849609375, -4.22509765625, -3.829345703125, -3.43359375, -3.037841796875, -2.64208984375, -2.246337890625, -1.8505859375, -1.454833984375, -1.05908203125, -0.663330078125, -0.267578125, 0.128173828125, 0.52392578125, 0.919677734375, 1.3154296875, 1.711181640625, 2.10693359375, 2.502685546875, 2.8984375, 3.294189453125, 3.68994140625, 4.085693359375, 4.4814453125, 4.877197265625, 5.27294921875, 5.668701171875, 6.064453125, 6.460205078125, 6.85595703125, 7.251708984375, 7.6474609375, 8.043212890625, 8.43896484375, 8.834716796875, 9.23046875, 9.626220703125, 10.02197265625, 10.417724609375, 10.8134765625, 11.209228515625, 11.60498046875, 12.000732421875, 12.396484375, 12.792236328125, 13.18798828125, 13.583740234375, 13.9794921875, 14.375244140625, 14.77099609375, 15.166748046875, 15.5625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 75.0, 465.0, 372.0, 71.0, 17.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1122.242431640625, -1097.734130859375, -1073.2257080078125, -1048.7174072265625, -1024.2091064453125, -999.7007446289062, -975.1923828125, -950.68408203125, -926.17578125, -901.6674194335938, -877.1591186523438, -852.6507568359375, -828.1424560546875, -803.6340942382812, -779.125732421875, -754.617431640625, -730.1090698242188, -705.6007080078125, -681.0924072265625, -656.5840454101562, -632.0757446289062, -607.5673828125, -583.05908203125, -558.5507202148438, -534.0423583984375, -509.5340270996094, -485.02569580078125, -460.517333984375, -436.009033203125, -411.50067138671875, -386.9923400878906, -362.4840087890625, -337.9757385253906, -313.4674072265625, -288.9590759277344, -264.45074462890625, -239.94239807128906, -215.43406677246094, -190.92572021484375, -166.41738891601562, -141.9090576171875, -117.40072631835938, -92.89238739013672, -68.38404846191406, -43.87571716308594, -19.367385864257812, 5.140960693359375, 29.6492919921875, 54.157623291015625, 78.66595458984375, 103.1742935180664, 127.68263244628906, 152.1909637451172, 176.6992950439453, 201.2076416015625, 225.71597290039062, 250.22430419921875, 274.7326354980469, 299.240966796875, 323.74932861328125, 348.25762939453125, 372.7659912109375, 397.2743225097656, 421.78265380859375, 446.2909851074219]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 4.0, 8.0, 10.0, 7.0, 9.0, 18.0, 13.0, 16.0, 22.0, 23.0, 26.0, 32.0, 28.0, 37.0, 37.0, 32.0, 37.0, 36.0, 43.0, 41.0, 33.0, 42.0, 44.0, 33.0, 32.0, 32.0, 40.0, 39.0, 23.0, 30.0, 22.0, 22.0, 20.0, 17.0, 15.0, 16.0, 13.0, 10.0, 5.0, 6.0, 6.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-148.94924926757812, -144.28082275390625, -139.6123809814453, -134.94395446777344, -130.2755126953125, -125.60708618164062, -120.93865203857422, -116.27021789550781, -111.60179138183594, -106.93335723876953, -102.26492309570312, -97.59649658203125, -92.92806243896484, -88.25962829589844, -83.59119415283203, -78.92276000976562, -74.25432586669922, -69.58589172363281, -64.9174575805664, -60.249027252197266, -55.580596923828125, -50.91216278076172, -46.24372863769531, -41.57529830932617, -36.906864166259766, -32.23843002319336, -27.56999969482422, -22.901565551757812, -18.23313331604004, -13.564701080322266, -8.89626693725586, -4.227836608886719, 0.4405975341796875, 5.109030246734619, 9.77746295928955, 14.44589614868164, 19.114328384399414, 23.782760620117188, 28.451194763183594, 33.119625091552734, 37.78805923461914, 42.45649337768555, 47.12492370605469, 51.793357849121094, 56.4617919921875, 61.13022232055664, 65.79866027832031, 70.46708679199219, 75.1355209350586, 79.803955078125, 84.4723892211914, 89.14082336425781, 93.80924987792969, 98.4776840209961, 103.1461181640625, 107.81454467773438, 112.48298645019531, 117.15142059326172, 121.81985473632812, 126.48828125, 131.15672302246094, 135.8251495361328, 140.49359130859375, 145.16201782226562, 149.8304443359375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 9.0, 6.0, 17.0, 17.0, 19.0, 24.0, 46.0, 57.0, 103.0, 215.0, 410.0, 878.0, 2346.0, 6731.0, 23716.0, 143595.0, 3612607.0, 347987.0, 39576.0, 9897.0, 3330.0, 1308.0, 600.0, 295.0, 164.0, 102.0, 67.0, 33.0, 24.0, 15.0, 12.0, 19.0, 9.0, 5.0, 9.0, 6.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.5625, -32.3916015625, -31.220703125, -30.0498046875, -28.87890625, -27.7080078125, -26.537109375, -25.3662109375, -24.1953125, -23.0244140625, -21.853515625, -20.6826171875, -19.51171875, -18.3408203125, -17.169921875, -15.9990234375, -14.828125, -13.6572265625, -12.486328125, -11.3154296875, -10.14453125, -8.9736328125, -7.802734375, -6.6318359375, -5.4609375, -4.2900390625, -3.119140625, -1.9482421875, -0.77734375, 0.3935546875, 1.564453125, 2.7353515625, 3.90625, 5.0771484375, 6.248046875, 7.4189453125, 8.58984375, 9.7607421875, 10.931640625, 12.1025390625, 13.2734375, 14.4443359375, 15.615234375, 16.7861328125, 17.95703125, 19.1279296875, 20.298828125, 21.4697265625, 22.640625, 23.8115234375, 24.982421875, 26.1533203125, 27.32421875, 28.4951171875, 29.666015625, 30.8369140625, 32.0078125, 33.1787109375, 34.349609375, 35.5205078125, 36.69140625, 37.8623046875, 39.033203125, 40.2041015625, 41.375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 5.0, 16.0, 20.0, 24.0, 41.0, 72.0, 73.0, 75.0, 92.0, 94.0, 91.0, 100.0, 79.0, 68.0, 61.0, 30.0, 16.0, 15.0, 10.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.796875, -13.316650390625, -12.83642578125, -12.356201171875, -11.8759765625, -11.395751953125, -10.91552734375, -10.435302734375, -9.955078125, -9.474853515625, -8.99462890625, -8.514404296875, -8.0341796875, -7.553955078125, -7.07373046875, -6.593505859375, -6.11328125, -5.633056640625, -5.15283203125, -4.672607421875, -4.1923828125, -3.712158203125, -3.23193359375, -2.751708984375, -2.271484375, -1.791259765625, -1.31103515625, -0.830810546875, -0.3505859375, 0.129638671875, 0.60986328125, 1.090087890625, 1.5703125, 2.050537109375, 2.53076171875, 3.010986328125, 3.4912109375, 3.971435546875, 4.45166015625, 4.931884765625, 5.412109375, 5.892333984375, 6.37255859375, 6.852783203125, 7.3330078125, 7.813232421875, 8.29345703125, 8.773681640625, 9.25390625, 9.734130859375, 10.21435546875, 10.694580078125, 11.1748046875, 11.655029296875, 12.13525390625, 12.615478515625, 13.095703125, 13.575927734375, 14.05615234375, 14.536376953125, 15.0166015625, 15.496826171875, 15.97705078125, 16.457275390625, 16.9375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 10.0, 13.0, 6.0, 16.0, 29.0, 42.0, 62.0, 97.0, 135.0, 251.0, 386.0, 668.0, 1195.0, 2390.0, 5300.0, 12421.0, 33450.0, 117578.0, 876068.0, 2851359.0, 211127.0, 50490.0, 17474.0, 6967.0, 3130.0, 1512.0, 816.0, 527.0, 289.0, 173.0, 100.0, 73.0, 43.0, 28.0, 22.0, 14.0, 11.0, 6.0, 6.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.09375, -16.46484375, -15.8359375, -15.20703125, -14.578125, -13.94921875, -13.3203125, -12.69140625, -12.0625, -11.43359375, -10.8046875, -10.17578125, -9.546875, -8.91796875, -8.2890625, -7.66015625, -7.03125, -6.40234375, -5.7734375, -5.14453125, -4.515625, -3.88671875, -3.2578125, -2.62890625, -2.0, -1.37109375, -0.7421875, -0.11328125, 0.515625, 1.14453125, 1.7734375, 2.40234375, 3.03125, 3.66015625, 4.2890625, 4.91796875, 5.546875, 6.17578125, 6.8046875, 7.43359375, 8.0625, 8.69140625, 9.3203125, 9.94921875, 10.578125, 11.20703125, 11.8359375, 12.46484375, 13.09375, 13.72265625, 14.3515625, 14.98046875, 15.609375, 16.23828125, 16.8671875, 17.49609375, 18.125, 18.75390625, 19.3828125, 20.01171875, 20.640625, 21.26953125, 21.8984375, 22.52734375, 23.15625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 6.0, 14.0, 18.0, 5.0, 21.0, 33.0, 43.0, 43.0, 100.0, 140.0, 266.0, 533.0, 1637.0, 602.0, 225.0, 138.0, 87.0, 47.0, 31.0, 16.0, 19.0, 11.0, 9.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6484375, -14.184326171875, -13.72021484375, -13.256103515625, -12.7919921875, -12.327880859375, -11.86376953125, -11.399658203125, -10.935546875, -10.471435546875, -10.00732421875, -9.543212890625, -9.0791015625, -8.614990234375, -8.15087890625, -7.686767578125, -7.22265625, -6.758544921875, -6.29443359375, -5.830322265625, -5.3662109375, -4.902099609375, -4.43798828125, -3.973876953125, -3.509765625, -3.045654296875, -2.58154296875, -2.117431640625, -1.6533203125, -1.189208984375, -0.72509765625, -0.260986328125, 0.203125, 0.667236328125, 1.13134765625, 1.595458984375, 2.0595703125, 2.523681640625, 2.98779296875, 3.451904296875, 3.916015625, 4.380126953125, 4.84423828125, 5.308349609375, 5.7724609375, 6.236572265625, 6.70068359375, 7.164794921875, 7.62890625, 8.093017578125, 8.55712890625, 9.021240234375, 9.4853515625, 9.949462890625, 10.41357421875, 10.877685546875, 11.341796875, 11.805908203125, 12.27001953125, 12.734130859375, 13.1982421875, 13.662353515625, 14.12646484375, 14.590576171875, 15.0546875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 34.0, 101.0, 391.0, 355.0, 100.0, 16.0, 0.0, 2.0], "bins": [-510.11517333984375, -501.5164794921875, -492.91778564453125, -484.3191223144531, -475.7204284667969, -467.1217346191406, -458.5230407714844, -449.9243469238281, -441.32568359375, -432.72698974609375, -424.1282958984375, -415.5296325683594, -406.9309387207031, -398.3322448730469, -389.7335510253906, -381.1348571777344, -372.5361633300781, -363.9374694824219, -355.3387756347656, -346.7401123046875, -338.14141845703125, -329.542724609375, -320.94403076171875, -312.3453369140625, -303.74664306640625, -295.14794921875, -286.54925537109375, -277.9505920410156, -269.3518981933594, -260.7532043457031, -252.15451049804688, -243.55581665039062, -234.95713806152344, -226.3584442138672, -217.759765625, -209.16107177734375, -200.5623779296875, -191.9636993408203, -183.36500549316406, -174.76632690429688, -166.16763305664062, -157.56893920898438, -148.9702606201172, -140.37156677246094, -131.77288818359375, -123.1741943359375, -114.57550048828125, -105.97681427001953, -97.37812805175781, -88.7794418334961, -80.18075561523438, -71.58206176757812, -62.983375549316406, -54.38468933105469, -45.7859992980957, -37.18730926513672, -28.588623046875, -19.98993492126465, -11.391246795654297, -2.7925586700439453, 5.806129455566406, 14.404815673828125, 23.00350570678711, 31.602195739746094, 40.20088195800781]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 4.0, 6.0, 3.0, 10.0, 7.0, 11.0, 20.0, 13.0, 15.0, 16.0, 24.0, 21.0, 22.0, 26.0, 27.0, 46.0, 33.0, 46.0, 37.0, 58.0, 40.0, 47.0, 46.0, 38.0, 37.0, 43.0, 36.0, 30.0, 38.0, 26.0, 30.0, 26.0, 24.0, 14.0, 14.0, 9.0, 13.0, 8.0, 11.0, 5.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-55.14617919921875, -53.54331588745117, -51.940452575683594, -50.33759307861328, -48.7347297668457, -47.131866455078125, -45.52900314331055, -43.92613983154297, -42.323280334472656, -40.72041702270508, -39.1175537109375, -37.51469421386719, -35.91183090209961, -34.30896759033203, -32.70610427856445, -31.103242874145508, -29.50037956237793, -27.89751625061035, -26.294654846191406, -24.691791534423828, -23.088930130004883, -21.486066818237305, -19.88320541381836, -18.28034210205078, -16.677478790283203, -15.074616432189941, -13.47175407409668, -11.868890762329102, -10.266029357910156, -8.663166046142578, -7.060303688049316, -5.457441329956055, -3.8545799255371094, -2.2517175674438477, -0.6488549709320068, 0.954007625579834, 2.5568699836730957, 4.159732818603516, 5.762595176696777, 7.365457534790039, 8.9683198928833, 10.571182250976562, 12.174044609069824, 13.776906967163086, 15.379770278930664, 16.98263168334961, 18.585494995117188, 20.188358306884766, 21.79121971130371, 23.39408302307129, 24.996944427490234, 26.599807739257812, 28.202669143676758, 29.805532455444336, 31.40839385986328, 33.01125717163086, 34.61412048339844, 36.216983795166016, 37.819847106933594, 39.422706604003906, 41.025569915771484, 42.62843322753906, 44.23129653930664, 45.83415985107422, 47.43701934814453]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 10.0, 10.0, 15.0, 22.0, 38.0, 69.0, 108.0, 183.0, 275.0, 537.0, 1196.0, 3162.0, 11580.0, 58666.0, 341090.0, 500347.0, 104545.0, 18947.0, 4524.0, 1555.0, 768.0, 357.0, 215.0, 127.0, 64.0, 44.0, 31.0, 20.0, 14.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.3125, -34.1015625, -32.890625, -31.6796875, -30.46875, -29.2578125, -28.046875, -26.8359375, -25.625, -24.4140625, -23.203125, -21.9921875, -20.78125, -19.5703125, -18.359375, -17.1484375, -15.9375, -14.7265625, -13.515625, -12.3046875, -11.09375, -9.8828125, -8.671875, -7.4609375, -6.25, -5.0390625, -3.828125, -2.6171875, -1.40625, -0.1953125, 1.015625, 2.2265625, 3.4375, 4.6484375, 5.859375, 7.0703125, 8.28125, 9.4921875, 10.703125, 11.9140625, 13.125, 14.3359375, 15.546875, 16.7578125, 17.96875, 19.1796875, 20.390625, 21.6015625, 22.8125, 24.0234375, 25.234375, 26.4453125, 27.65625, 28.8671875, 30.078125, 31.2890625, 32.5, 33.7109375, 34.921875, 36.1328125, 37.34375, 38.5546875, 39.765625, 40.9765625, 42.1875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 1.0, 8.0, 9.0, 9.0, 27.0, 30.0, 42.0, 53.0, 75.0, 89.0, 90.0, 92.0, 101.0, 82.0, 77.0, 74.0, 56.0, 27.0, 30.0, 13.0, 7.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0546875, -13.5643310546875, -13.073974609375, -12.5836181640625, -12.09326171875, -11.6029052734375, -11.112548828125, -10.6221923828125, -10.1318359375, -9.6414794921875, -9.151123046875, -8.6607666015625, -8.17041015625, -7.6800537109375, -7.189697265625, -6.6993408203125, -6.208984375, -5.7186279296875, -5.228271484375, -4.7379150390625, -4.24755859375, -3.7572021484375, -3.266845703125, -2.7764892578125, -2.2861328125, -1.7957763671875, -1.305419921875, -0.8150634765625, -0.32470703125, 0.1656494140625, 0.656005859375, 1.1463623046875, 1.63671875, 2.1270751953125, 2.617431640625, 3.1077880859375, 3.59814453125, 4.0885009765625, 4.578857421875, 5.0692138671875, 5.5595703125, 6.0499267578125, 6.540283203125, 7.0306396484375, 7.52099609375, 8.0113525390625, 8.501708984375, 8.9920654296875, 9.482421875, 9.9727783203125, 10.463134765625, 10.9534912109375, 11.44384765625, 11.9342041015625, 12.424560546875, 12.9149169921875, 13.4052734375, 13.8956298828125, 14.385986328125, 14.8763427734375, 15.36669921875, 15.8570556640625, 16.347412109375, 16.8377685546875, 17.328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 3.0, 6.0, 7.0, 9.0, 10.0, 20.0, 29.0, 31.0, 49.0, 84.0, 129.0, 174.0, 378.0, 681.0, 1607.0, 6628.0, 123612.0, 875016.0, 33876.0, 3735.0, 1130.0, 565.0, 315.0, 171.0, 108.0, 57.0, 42.0, 34.0, 18.0, 10.0, 6.0, 4.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-116.875, -114.046875, -111.21875, -108.390625, -105.5625, -102.734375, -99.90625, -97.078125, -94.25, -91.421875, -88.59375, -85.765625, -82.9375, -80.109375, -77.28125, -74.453125, -71.625, -68.796875, -65.96875, -63.140625, -60.3125, -57.484375, -54.65625, -51.828125, -49.0, -46.171875, -43.34375, -40.515625, -37.6875, -34.859375, -32.03125, -29.203125, -26.375, -23.546875, -20.71875, -17.890625, -15.0625, -12.234375, -9.40625, -6.578125, -3.75, -0.921875, 1.90625, 4.734375, 7.5625, 10.390625, 13.21875, 16.046875, 18.875, 21.703125, 24.53125, 27.359375, 30.1875, 33.015625, 35.84375, 38.671875, 41.5, 44.328125, 47.15625, 49.984375, 52.8125, 55.640625, 58.46875, 61.296875, 64.125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 8.0, 8.0, 11.0, 13.0, 15.0, 22.0, 20.0, 24.0, 33.0, 39.0, 56.0, 55.0, 66.0, 70.0, 61.0, 70.0, 63.0, 79.0, 52.0, 47.0, 37.0, 27.0, 14.0, 14.0, 18.0, 17.0, 14.0, 10.0, 7.0, 3.0, 3.0, 5.0, 6.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.28125, -54.24560546875, -52.2099609375, -50.17431640625, -48.138671875, -46.10302734375, -44.0673828125, -42.03173828125, -39.99609375, -37.96044921875, -35.9248046875, -33.88916015625, -31.853515625, -29.81787109375, -27.7822265625, -25.74658203125, -23.7109375, -21.67529296875, -19.6396484375, -17.60400390625, -15.568359375, -13.53271484375, -11.4970703125, -9.46142578125, -7.42578125, -5.39013671875, -3.3544921875, -1.31884765625, 0.716796875, 2.75244140625, 4.7880859375, 6.82373046875, 8.859375, 10.89501953125, 12.9306640625, 14.96630859375, 17.001953125, 19.03759765625, 21.0732421875, 23.10888671875, 25.14453125, 27.18017578125, 29.2158203125, 31.25146484375, 33.287109375, 35.32275390625, 37.3583984375, 39.39404296875, 41.4296875, 43.46533203125, 45.5009765625, 47.53662109375, 49.572265625, 51.60791015625, 53.6435546875, 55.67919921875, 57.71484375, 59.75048828125, 61.7861328125, 63.82177734375, 65.857421875, 67.89306640625, 69.9287109375, 71.96435546875, 74.0]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 14.0, 14.0, 16.0, 20.0, 30.0, 52.0, 90.0, 163.0, 448.0, 1979.0, 41283.0, 940085.0, 60913.0, 2515.0, 477.0, 190.0, 93.0, 51.0, 43.0, 17.0, 16.0, 4.0, 12.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.6875, -38.50439453125, -37.3212890625, -36.13818359375, -34.955078125, -33.77197265625, -32.5888671875, -31.40576171875, -30.22265625, -29.03955078125, -27.8564453125, -26.67333984375, -25.490234375, -24.30712890625, -23.1240234375, -21.94091796875, -20.7578125, -19.57470703125, -18.3916015625, -17.20849609375, -16.025390625, -14.84228515625, -13.6591796875, -12.47607421875, -11.29296875, -10.10986328125, -8.9267578125, -7.74365234375, -6.560546875, -5.37744140625, -4.1943359375, -3.01123046875, -1.828125, -0.64501953125, 0.5380859375, 1.72119140625, 2.904296875, 4.08740234375, 5.2705078125, 6.45361328125, 7.63671875, 8.81982421875, 10.0029296875, 11.18603515625, 12.369140625, 13.55224609375, 14.7353515625, 15.91845703125, 17.1015625, 18.28466796875, 19.4677734375, 20.65087890625, 21.833984375, 23.01708984375, 24.2001953125, 25.38330078125, 26.56640625, 27.74951171875, 28.9326171875, 30.11572265625, 31.298828125, 32.48193359375, 33.6650390625, 34.84814453125, 36.03125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 9.0, 6.0, 15.0, 23.0, 14.0, 18.0, 27.0, 49.0, 53.0, 37.0, 76.0, 64.0, 83.0, 81.0, 68.0, 81.0, 58.0, 45.0, 42.0, 30.0, 25.0, 19.0, 7.0, 13.0, 12.0, 8.0, 11.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.001323699951171875, -0.0012825578451156616, -0.0012414157390594482, -0.0012002736330032349, -0.0011591315269470215, -0.001117989420890808, -0.0010768473148345947, -0.0010357052087783813, -0.000994563102722168, -0.0009534209966659546, -0.0009122788906097412, -0.0008711367845535278, -0.0008299946784973145, -0.0007888525724411011, -0.0007477104663848877, -0.0007065683603286743, -0.0006654262542724609, -0.0006242841482162476, -0.0005831420421600342, -0.0005419999361038208, -0.0005008578300476074, -0.00045971572399139404, -0.00041857361793518066, -0.0003774315118789673, -0.0003362894058227539, -0.00029514729976654053, -0.00025400519371032715, -0.00021286308765411377, -0.0001717209815979004, -0.000130578875541687, -8.943676948547363e-05, -4.8294663429260254e-05, -7.152557373046875e-06, 3.3989548683166504e-05, 7.513165473937988e-05, 0.00011627376079559326, 0.00015741586685180664, 0.00019855797290802002, 0.0002397000789642334, 0.0002808421850204468, 0.00032198429107666016, 0.00036312639713287354, 0.0004042685031890869, 0.0004454106092453003, 0.00048655271530151367, 0.000527694821357727, 0.0005688369274139404, 0.0006099790334701538, 0.0006511211395263672, 0.0006922632455825806, 0.0007334053516387939, 0.0007745474576950073, 0.0008156895637512207, 0.0008568316698074341, 0.0008979737758636475, 0.0009391158819198608, 0.0009802579879760742, 0.0010214000940322876, 0.001062542200088501, 0.0011036843061447144, 0.0011448264122009277, 0.0011859685182571411, 0.0012271106243133545, 0.0012682527303695679, 0.0013093948364257812]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 8.0, 7.0, 23.0, 16.0, 21.0, 36.0, 47.0, 74.0, 111.0, 191.0, 309.0, 664.0, 1847.0, 10933.0, 340677.0, 672200.0, 17399.0, 2347.0, 743.0, 325.0, 196.0, 144.0, 67.0, 47.0, 34.0, 24.0, 19.0, 9.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.71875, -31.66650390625, -30.6142578125, -29.56201171875, -28.509765625, -27.45751953125, -26.4052734375, -25.35302734375, -24.30078125, -23.24853515625, -22.1962890625, -21.14404296875, -20.091796875, -19.03955078125, -17.9873046875, -16.93505859375, -15.8828125, -14.83056640625, -13.7783203125, -12.72607421875, -11.673828125, -10.62158203125, -9.5693359375, -8.51708984375, -7.46484375, -6.41259765625, -5.3603515625, -4.30810546875, -3.255859375, -2.20361328125, -1.1513671875, -0.09912109375, 0.953125, 2.00537109375, 3.0576171875, 4.10986328125, 5.162109375, 6.21435546875, 7.2666015625, 8.31884765625, 9.37109375, 10.42333984375, 11.4755859375, 12.52783203125, 13.580078125, 14.63232421875, 15.6845703125, 16.73681640625, 17.7890625, 18.84130859375, 19.8935546875, 20.94580078125, 21.998046875, 23.05029296875, 24.1025390625, 25.15478515625, 26.20703125, 27.25927734375, 28.3115234375, 29.36376953125, 30.416015625, 31.46826171875, 32.5205078125, 33.57275390625, 34.625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 13.0, 12.0, 10.0, 23.0, 43.0, 49.0, 79.0, 124.0, 147.0, 137.0, 97.0, 66.0, 52.0, 30.0, 10.0, 13.0, 11.0, 8.0, 10.0, 5.0, 6.0, 4.0, 3.0, 7.0, 2.0, 1.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.015625, -20.354248046875, -19.69287109375, -19.031494140625, -18.3701171875, -17.708740234375, -17.04736328125, -16.385986328125, -15.724609375, -15.063232421875, -14.40185546875, -13.740478515625, -13.0791015625, -12.417724609375, -11.75634765625, -11.094970703125, -10.43359375, -9.772216796875, -9.11083984375, -8.449462890625, -7.7880859375, -7.126708984375, -6.46533203125, -5.803955078125, -5.142578125, -4.481201171875, -3.81982421875, -3.158447265625, -2.4970703125, -1.835693359375, -1.17431640625, -0.512939453125, 0.1484375, 0.809814453125, 1.47119140625, 2.132568359375, 2.7939453125, 3.455322265625, 4.11669921875, 4.778076171875, 5.439453125, 6.100830078125, 6.76220703125, 7.423583984375, 8.0849609375, 8.746337890625, 9.40771484375, 10.069091796875, 10.73046875, 11.391845703125, 12.05322265625, 12.714599609375, 13.3759765625, 14.037353515625, 14.69873046875, 15.360107421875, 16.021484375, 16.682861328125, 17.34423828125, 18.005615234375, 18.6669921875, 19.328369140625, 19.98974609375, 20.651123046875, 21.3125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 20.0, 101.0, 393.0, 377.0, 90.0, 16.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1009.714599609375, -986.197265625, -962.679931640625, -939.16259765625, -915.645263671875, -892.1278686523438, -868.6105346679688, -845.0932006835938, -821.5758666992188, -798.0585327148438, -774.5411987304688, -751.0238647460938, -727.5064697265625, -703.9891357421875, -680.4718017578125, -656.9544677734375, -633.4371337890625, -609.9197998046875, -586.4024658203125, -562.8851318359375, -539.3677978515625, -515.8504028320312, -492.33306884765625, -468.81573486328125, -445.29840087890625, -421.78106689453125, -398.26373291015625, -374.7463684082031, -351.2290344238281, -327.7117004394531, -304.1943359375, -280.677001953125, -257.15966796875, -233.642333984375, -210.12498474121094, -186.60763549804688, -163.09030151367188, -139.57296752929688, -116.05561828613281, -92.53826904296875, -69.02093505859375, -45.50359344482422, -21.986251831054688, 1.5310897827148438, 25.048431396484375, 48.565773010253906, 72.08311462402344, 95.6004638671875, 119.1177978515625, 142.6351318359375, 166.15248107910156, 189.66983032226562, 213.18716430664062, 236.70449829101562, 260.22186279296875, 283.73919677734375, 307.25653076171875, 330.77386474609375, 354.29119873046875, 377.8085632324219, 401.3258972167969, 424.8432312011719, 448.360595703125, 471.8779296875, 495.395263671875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 10.0, 13.0, 14.0, 27.0, 36.0, 37.0, 39.0, 52.0, 54.0, 56.0, 55.0, 59.0, 72.0, 64.0, 78.0, 65.0, 46.0, 48.0, 42.0, 28.0, 24.0, 22.0, 19.0, 7.0, 8.0, 5.0, 5.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-251.25509643554688, -241.0137481689453, -230.7724151611328, -220.53106689453125, -210.28973388671875, -200.0483856201172, -189.80703735351562, -179.56570434570312, -169.32437133789062, -159.08302307128906, -148.84169006347656, -138.600341796875, -128.3590087890625, -118.11766052246094, -107.8763198852539, -97.63497924804688, -87.39363098144531, -77.15229034423828, -66.91094970703125, -56.66960525512695, -46.42826461791992, -36.18692398071289, -25.945579528808594, -15.704238891601562, -5.462898254394531, 4.778443336486816, 15.019784927368164, 25.261127471923828, 35.50246810913086, 45.74380874633789, 55.98515319824219, 66.22649383544922, 76.46783447265625, 86.70917510986328, 96.95051574707031, 107.19186401367188, 117.43319702148438, 127.67454528808594, 137.9158935546875, 148.1572265625, 158.3985595703125, 168.63990783691406, 178.88124084472656, 189.12258911132812, 199.36392211914062, 209.6052703857422, 219.84661865234375, 230.08795166015625, 240.3292999267578, 250.57064819335938, 260.8119812011719, 271.0533142089844, 281.294677734375, 291.5360107421875, 301.77734375, 312.0186767578125, 322.2600402832031, 332.5013732910156, 342.74273681640625, 352.98406982421875, 363.22540283203125, 373.46673583984375, 383.7080993652344, 393.9494323730469, 404.1907653808594]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 14.0, 40.0, 60.0, 108.0, 254.0, 476.0, 1121.0, 3450.0, 17744.0, 3951801.0, 204647.0, 10220.0, 2542.0, 936.0, 433.0, 187.0, 117.0, 59.0, 36.0, 22.0, 8.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.5, -49.4287109375, -47.357421875, -45.2861328125, -43.21484375, -41.1435546875, -39.072265625, -37.0009765625, -34.9296875, -32.8583984375, -30.787109375, -28.7158203125, -26.64453125, -24.5732421875, -22.501953125, -20.4306640625, -18.359375, -16.2880859375, -14.216796875, -12.1455078125, -10.07421875, -8.0029296875, -5.931640625, -3.8603515625, -1.7890625, 0.2822265625, 2.353515625, 4.4248046875, 6.49609375, 8.5673828125, 10.638671875, 12.7099609375, 14.78125, 16.8525390625, 18.923828125, 20.9951171875, 23.06640625, 25.1376953125, 27.208984375, 29.2802734375, 31.3515625, 33.4228515625, 35.494140625, 37.5654296875, 39.63671875, 41.7080078125, 43.779296875, 45.8505859375, 47.921875, 49.9931640625, 52.064453125, 54.1357421875, 56.20703125, 58.2783203125, 60.349609375, 62.4208984375, 64.4921875, 66.5634765625, 68.634765625, 70.7060546875, 72.77734375, 74.8486328125, 76.919921875, 78.9912109375, 81.0625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 7.0, 13.0, 17.0, 33.0, 61.0, 72.0, 75.0, 107.0, 115.0, 106.0, 107.0, 71.0, 65.0, 63.0, 35.0, 22.0, 17.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.875, -19.139892578125, -18.40478515625, -17.669677734375, -16.9345703125, -16.199462890625, -15.46435546875, -14.729248046875, -13.994140625, -13.259033203125, -12.52392578125, -11.788818359375, -11.0537109375, -10.318603515625, -9.58349609375, -8.848388671875, -8.11328125, -7.378173828125, -6.64306640625, -5.907958984375, -5.1728515625, -4.437744140625, -3.70263671875, -2.967529296875, -2.232421875, -1.497314453125, -0.76220703125, -0.027099609375, 0.7080078125, 1.443115234375, 2.17822265625, 2.913330078125, 3.6484375, 4.383544921875, 5.11865234375, 5.853759765625, 6.5888671875, 7.323974609375, 8.05908203125, 8.794189453125, 9.529296875, 10.264404296875, 10.99951171875, 11.734619140625, 12.4697265625, 13.204833984375, 13.93994140625, 14.675048828125, 15.41015625, 16.145263671875, 16.88037109375, 17.615478515625, 18.3505859375, 19.085693359375, 19.82080078125, 20.555908203125, 21.291015625, 22.026123046875, 22.76123046875, 23.496337890625, 24.2314453125, 24.966552734375, 25.70166015625, 26.436767578125, 27.171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 7.0, 4.0, 13.0, 17.0, 29.0, 37.0, 58.0, 85.0, 141.0, 197.0, 289.0, 491.0, 794.0, 1266.0, 2683.0, 6503.0, 21998.0, 195297.0, 3883290.0, 59791.0, 12149.0, 4437.0, 1917.0, 987.0, 585.0, 386.0, 274.0, 182.0, 116.0, 69.0, 56.0, 42.0, 25.0, 23.0, 7.0, 13.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.984375, -25.126220703125, -24.26806640625, -23.409912109375, -22.5517578125, -21.693603515625, -20.83544921875, -19.977294921875, -19.119140625, -18.260986328125, -17.40283203125, -16.544677734375, -15.6865234375, -14.828369140625, -13.97021484375, -13.112060546875, -12.25390625, -11.395751953125, -10.53759765625, -9.679443359375, -8.8212890625, -7.963134765625, -7.10498046875, -6.246826171875, -5.388671875, -4.530517578125, -3.67236328125, -2.814208984375, -1.9560546875, -1.097900390625, -0.23974609375, 0.618408203125, 1.4765625, 2.334716796875, 3.19287109375, 4.051025390625, 4.9091796875, 5.767333984375, 6.62548828125, 7.483642578125, 8.341796875, 9.199951171875, 10.05810546875, 10.916259765625, 11.7744140625, 12.632568359375, 13.49072265625, 14.348876953125, 15.20703125, 16.065185546875, 16.92333984375, 17.781494140625, 18.6396484375, 19.497802734375, 20.35595703125, 21.214111328125, 22.072265625, 22.930419921875, 23.78857421875, 24.646728515625, 25.5048828125, 26.363037109375, 27.22119140625, 28.079345703125, 28.9375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 13.0, 12.0, 39.0, 74.0, 169.0, 3178.0, 368.0, 101.0, 48.0, 18.0, 13.0, 8.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.8359375, -7.59661865234375, -7.3572998046875, -7.11798095703125, -6.878662109375, -6.63934326171875, -6.4000244140625, -6.16070556640625, -5.92138671875, -5.68206787109375, -5.4427490234375, -5.20343017578125, -4.964111328125, -4.72479248046875, -4.4854736328125, -4.24615478515625, -4.0068359375, -3.76751708984375, -3.5281982421875, -3.28887939453125, -3.049560546875, -2.81024169921875, -2.5709228515625, -2.33160400390625, -2.09228515625, -1.85296630859375, -1.6136474609375, -1.37432861328125, -1.135009765625, -0.89569091796875, -0.6563720703125, -0.41705322265625, -0.177734375, 0.06158447265625, 0.3009033203125, 0.54022216796875, 0.779541015625, 1.01885986328125, 1.2581787109375, 1.49749755859375, 1.73681640625, 1.97613525390625, 2.2154541015625, 2.45477294921875, 2.694091796875, 2.93341064453125, 3.1727294921875, 3.41204833984375, 3.6513671875, 3.89068603515625, 4.1300048828125, 4.36932373046875, 4.608642578125, 4.84796142578125, 5.0872802734375, 5.32659912109375, 5.56591796875, 5.80523681640625, 6.0445556640625, 6.28387451171875, 6.523193359375, 6.76251220703125, 7.0018310546875, 7.24114990234375, 7.48046875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 22.0, 48.0, 99.0, 176.0, 222.0, 205.0, 103.0, 74.0, 18.0, 9.0, 10.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.972572326660156, -42.65672302246094, -41.34087371826172, -40.0250244140625, -38.70917510986328, -37.39332580566406, -36.077476501464844, -34.76162338256836, -33.44577407836914, -32.12992477416992, -30.814075469970703, -29.498226165771484, -28.182374954223633, -26.866525650024414, -25.550676345825195, -24.234825134277344, -22.918977737426758, -21.60312843322754, -20.28727912902832, -18.97142791748047, -17.65557861328125, -16.33972930908203, -15.023880004882812, -13.708029747009277, -12.392180442810059, -11.07633113861084, -9.760480880737305, -8.444631576538086, -7.128781795501709, -5.812932014465332, -4.497082710266113, -3.181232452392578, -1.8653831481933594, -0.549533486366272, 0.7663161754608154, 2.0821657180786133, 3.3980154991149902, 4.713865280151367, 6.029714584350586, 7.345564842224121, 8.66141414642334, 9.977263450622559, 11.293113708496094, 12.608963012695312, 13.924812316894531, 15.240662574768066, 16.55651092529297, 17.87236213684082, 19.18821144104004, 20.504060745239258, 21.819910049438477, 23.135761260986328, 24.451610565185547, 25.767459869384766, 27.083309173583984, 28.399158477783203, 29.715007781982422, 31.03085708618164, 32.34670639038086, 33.66255569458008, 34.9784049987793, 36.29425811767578, 37.610107421875, 38.92595672607422, 40.24180603027344]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 12.0, 12.0, 12.0, 9.0, 10.0, 8.0, 16.0, 17.0, 21.0, 24.0, 33.0, 36.0, 34.0, 39.0, 38.0, 54.0, 48.0, 49.0, 57.0, 56.0, 39.0, 37.0, 33.0, 47.0, 34.0, 21.0, 32.0, 23.0, 28.0, 17.0, 13.0, 15.0, 13.0, 15.0, 6.0, 6.0, 7.0, 6.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.272005081176758, -13.820244789123535, -13.368485450744629, -12.916725158691406, -12.4649658203125, -12.013205528259277, -11.561445236206055, -11.109685897827148, -10.657925605773926, -10.206165313720703, -9.754405975341797, -9.302645683288574, -8.850885391235352, -8.399126052856445, -7.947365760803223, -7.495605945587158, -7.043846130371094, -6.592086315155029, -6.140326499938965, -5.688566207885742, -5.236806392669678, -4.785046577453613, -4.333286285400391, -3.881526470184326, -3.4297666549682617, -2.9780068397521973, -2.5262467861175537, -2.07448673248291, -1.6227269172668457, -1.1709671020507812, -0.7192070484161377, -0.26744699478149414, 0.1843128204345703, 0.6360727548599243, 1.0878326892852783, 1.5395926237106323, 1.9913525581359863, 2.443112373352051, 2.8948724269866943, 3.346632480621338, 3.7983922958374023, 4.250152111053467, 4.701911926269531, 5.153672218322754, 5.605432033538818, 6.057191848754883, 6.5089521408081055, 6.96071195602417, 7.412471771240234, 7.864231586456299, 8.315991401672363, 8.767751693725586, 9.219511032104492, 9.671271324157715, 10.123031616210938, 10.574790954589844, 11.026551246643066, 11.478311538696289, 11.930070877075195, 12.381831169128418, 12.83359146118164, 13.285350799560547, 13.73711109161377, 14.188871383666992, 14.640630722045898]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 6.0, 17.0, 26.0, 51.0, 79.0, 140.0, 323.0, 569.0, 1442.0, 4525.0, 22490.0, 196716.0, 653133.0, 145401.0, 17499.0, 3791.0, 1216.0, 537.0, 259.0, 129.0, 96.0, 40.0, 24.0, 15.0, 11.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5, -37.04345703125, -35.5869140625, -34.13037109375, -32.673828125, -31.21728515625, -29.7607421875, -28.30419921875, -26.84765625, -25.39111328125, -23.9345703125, -22.47802734375, -21.021484375, -19.56494140625, -18.1083984375, -16.65185546875, -15.1953125, -13.73876953125, -12.2822265625, -10.82568359375, -9.369140625, -7.91259765625, -6.4560546875, -4.99951171875, -3.54296875, -2.08642578125, -0.6298828125, 0.82666015625, 2.283203125, 3.73974609375, 5.1962890625, 6.65283203125, 8.109375, 9.56591796875, 11.0224609375, 12.47900390625, 13.935546875, 15.39208984375, 16.8486328125, 18.30517578125, 19.76171875, 21.21826171875, 22.6748046875, 24.13134765625, 25.587890625, 27.04443359375, 28.5009765625, 29.95751953125, 31.4140625, 32.87060546875, 34.3271484375, 35.78369140625, 37.240234375, 38.69677734375, 40.1533203125, 41.60986328125, 43.06640625, 44.52294921875, 45.9794921875, 47.43603515625, 48.892578125, 50.34912109375, 51.8056640625, 53.26220703125, 54.71875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 7.0, 18.0, 20.0, 41.0, 66.0, 71.0, 84.0, 93.0, 116.0, 112.0, 93.0, 66.0, 80.0, 45.0, 37.0, 23.0, 6.0, 12.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.46875, -18.7431640625, -18.017578125, -17.2919921875, -16.56640625, -15.8408203125, -15.115234375, -14.3896484375, -13.6640625, -12.9384765625, -12.212890625, -11.4873046875, -10.76171875, -10.0361328125, -9.310546875, -8.5849609375, -7.859375, -7.1337890625, -6.408203125, -5.6826171875, -4.95703125, -4.2314453125, -3.505859375, -2.7802734375, -2.0546875, -1.3291015625, -0.603515625, 0.1220703125, 0.84765625, 1.5732421875, 2.298828125, 3.0244140625, 3.75, 4.4755859375, 5.201171875, 5.9267578125, 6.65234375, 7.3779296875, 8.103515625, 8.8291015625, 9.5546875, 10.2802734375, 11.005859375, 11.7314453125, 12.45703125, 13.1826171875, 13.908203125, 14.6337890625, 15.359375, 16.0849609375, 16.810546875, 17.5361328125, 18.26171875, 18.9873046875, 19.712890625, 20.4384765625, 21.1640625, 21.8896484375, 22.615234375, 23.3408203125, 24.06640625, 24.7919921875, 25.517578125, 26.2431640625, 26.96875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 1.0, 11.0, 4.0, 5.0, 12.0, 7.0, 13.0, 18.0, 21.0, 40.0, 49.0, 61.0, 111.0, 174.0, 274.0, 484.0, 894.0, 2208.0, 9952.0, 340629.0, 673868.0, 14638.0, 2653.0, 985.0, 573.0, 295.0, 170.0, 105.0, 101.0, 50.0, 37.0, 29.0, 19.0, 20.0, 10.0, 7.0, 4.0, 5.0, 7.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-95.3125, -92.431640625, -89.55078125, -86.669921875, -83.7890625, -80.908203125, -78.02734375, -75.146484375, -72.265625, -69.384765625, -66.50390625, -63.623046875, -60.7421875, -57.861328125, -54.98046875, -52.099609375, -49.21875, -46.337890625, -43.45703125, -40.576171875, -37.6953125, -34.814453125, -31.93359375, -29.052734375, -26.171875, -23.291015625, -20.41015625, -17.529296875, -14.6484375, -11.767578125, -8.88671875, -6.005859375, -3.125, -0.244140625, 2.63671875, 5.517578125, 8.3984375, 11.279296875, 14.16015625, 17.041015625, 19.921875, 22.802734375, 25.68359375, 28.564453125, 31.4453125, 34.326171875, 37.20703125, 40.087890625, 42.96875, 45.849609375, 48.73046875, 51.611328125, 54.4921875, 57.373046875, 60.25390625, 63.134765625, 66.015625, 68.896484375, 71.77734375, 74.658203125, 77.5390625, 80.419921875, 83.30078125, 86.181640625, 89.0625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 11.0, 1.0, 4.0, 4.0, 6.0, 9.0, 19.0, 24.0, 29.0, 39.0, 39.0, 53.0, 62.0, 75.0, 81.0, 91.0, 95.0, 67.0, 56.0, 56.0, 41.0, 30.0, 18.0, 19.0, 9.0, 10.0, 10.0, 7.0, 2.0, 11.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.6875, -90.7900390625, -87.892578125, -84.9951171875, -82.09765625, -79.2001953125, -76.302734375, -73.4052734375, -70.5078125, -67.6103515625, -64.712890625, -61.8154296875, -58.91796875, -56.0205078125, -53.123046875, -50.2255859375, -47.328125, -44.4306640625, -41.533203125, -38.6357421875, -35.73828125, -32.8408203125, -29.943359375, -27.0458984375, -24.1484375, -21.2509765625, -18.353515625, -15.4560546875, -12.55859375, -9.6611328125, -6.763671875, -3.8662109375, -0.96875, 1.9287109375, 4.826171875, 7.7236328125, 10.62109375, 13.5185546875, 16.416015625, 19.3134765625, 22.2109375, 25.1083984375, 28.005859375, 30.9033203125, 33.80078125, 36.6982421875, 39.595703125, 42.4931640625, 45.390625, 48.2880859375, 51.185546875, 54.0830078125, 56.98046875, 59.8779296875, 62.775390625, 65.6728515625, 68.5703125, 71.4677734375, 74.365234375, 77.2626953125, 80.16015625, 83.0576171875, 85.955078125, 88.8525390625, 91.75]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 5.0, 6.0, 8.0, 4.0, 7.0, 11.0, 11.0, 14.0, 22.0, 27.0, 27.0, 38.0, 59.0, 73.0, 115.0, 244.0, 804.0, 9096.0, 923213.0, 111093.0, 2673.0, 460.0, 153.0, 89.0, 60.0, 53.0, 42.0, 20.0, 16.0, 17.0, 17.0, 16.0, 20.0, 15.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-56.34375, -54.45166015625, -52.5595703125, -50.66748046875, -48.775390625, -46.88330078125, -44.9912109375, -43.09912109375, -41.20703125, -39.31494140625, -37.4228515625, -35.53076171875, -33.638671875, -31.74658203125, -29.8544921875, -27.96240234375, -26.0703125, -24.17822265625, -22.2861328125, -20.39404296875, -18.501953125, -16.60986328125, -14.7177734375, -12.82568359375, -10.93359375, -9.04150390625, -7.1494140625, -5.25732421875, -3.365234375, -1.47314453125, 0.4189453125, 2.31103515625, 4.203125, 6.09521484375, 7.9873046875, 9.87939453125, 11.771484375, 13.66357421875, 15.5556640625, 17.44775390625, 19.33984375, 21.23193359375, 23.1240234375, 25.01611328125, 26.908203125, 28.80029296875, 30.6923828125, 32.58447265625, 34.4765625, 36.36865234375, 38.2607421875, 40.15283203125, 42.044921875, 43.93701171875, 45.8291015625, 47.72119140625, 49.61328125, 51.50537109375, 53.3974609375, 55.28955078125, 57.181640625, 59.07373046875, 60.9658203125, 62.85791015625, 64.75]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 9.0, 12.0, 26.0, 37.0, 58.0, 91.0, 148.0, 161.0, 137.0, 97.0, 87.0, 41.0, 31.0, 18.0, 17.0, 8.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002292633056640625, -0.002206563949584961, -0.002120494842529297, -0.002034425735473633, -0.0019483566284179688, -0.0018622875213623047, -0.0017762184143066406, -0.0016901493072509766, -0.0016040802001953125, -0.0015180110931396484, -0.0014319419860839844, -0.0013458728790283203, -0.0012598037719726562, -0.0011737346649169922, -0.0010876655578613281, -0.001001596450805664, -0.00091552734375, -0.0008294582366943359, -0.0007433891296386719, -0.0006573200225830078, -0.0005712509155273438, -0.0004851818084716797, -0.0003991127014160156, -0.00031304359436035156, -0.0002269744873046875, -0.00014090538024902344, -5.4836273193359375e-05, 3.123283386230469e-05, 0.00011730194091796875, 0.0002033710479736328, 0.0002894401550292969, 0.00037550926208496094, 0.000461578369140625, 0.0005476474761962891, 0.0006337165832519531, 0.0007197856903076172, 0.0008058547973632812, 0.0008919239044189453, 0.0009779930114746094, 0.0010640621185302734, 0.0011501312255859375, 0.0012362003326416016, 0.0013222694396972656, 0.0014083385467529297, 0.0014944076538085938, 0.0015804767608642578, 0.0016665458679199219, 0.001752614974975586, 0.00183868408203125, 0.001924753189086914, 0.002010822296142578, 0.002096891403198242, 0.0021829605102539062, 0.0022690296173095703, 0.0023550987243652344, 0.0024411678314208984, 0.0025272369384765625, 0.0026133060455322266, 0.0026993751525878906, 0.0027854442596435547, 0.0028715133666992188, 0.002957582473754883, 0.003043651580810547, 0.003129720687866211, 0.003215789794921875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 13.0, 15.0, 36.0, 66.0, 167.0, 933.0, 67933.0, 977591.0, 1413.0, 218.0, 76.0, 31.0, 16.0, 13.0, 7.0, 5.0, 6.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-182.0, -176.662109375, -171.32421875, -165.986328125, -160.6484375, -155.310546875, -149.97265625, -144.634765625, -139.296875, -133.958984375, -128.62109375, -123.283203125, -117.9453125, -112.607421875, -107.26953125, -101.931640625, -96.59375, -91.255859375, -85.91796875, -80.580078125, -75.2421875, -69.904296875, -64.56640625, -59.228515625, -53.890625, -48.552734375, -43.21484375, -37.876953125, -32.5390625, -27.201171875, -21.86328125, -16.525390625, -11.1875, -5.849609375, -0.51171875, 4.826171875, 10.1640625, 15.501953125, 20.83984375, 26.177734375, 31.515625, 36.853515625, 42.19140625, 47.529296875, 52.8671875, 58.205078125, 63.54296875, 68.880859375, 74.21875, 79.556640625, 84.89453125, 90.232421875, 95.5703125, 100.908203125, 106.24609375, 111.583984375, 116.921875, 122.259765625, 127.59765625, 132.935546875, 138.2734375, 143.611328125, 148.94921875, 154.287109375, 159.625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 13.0, 19.0, 48.0, 267.0, 471.0, 119.0, 29.0, 12.0, 4.0, 4.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.6875, -103.15625, -99.625, -96.09375, -92.5625, -89.03125, -85.5, -81.96875, -78.4375, -74.90625, -71.375, -67.84375, -64.3125, -60.78125, -57.25, -53.71875, -50.1875, -46.65625, -43.125, -39.59375, -36.0625, -32.53125, -29.0, -25.46875, -21.9375, -18.40625, -14.875, -11.34375, -7.8125, -4.28125, -0.75, 2.78125, 6.3125, 9.84375, 13.375, 16.90625, 20.4375, 23.96875, 27.5, 31.03125, 34.5625, 38.09375, 41.625, 45.15625, 48.6875, 52.21875, 55.75, 59.28125, 62.8125, 66.34375, 69.875, 73.40625, 76.9375, 80.46875, 84.0, 87.53125, 91.0625, 94.59375, 98.125, 101.65625, 105.1875, 108.71875, 112.25, 115.78125, 119.3125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 13.0, 73.0, 488.0, 375.0, 45.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1467.86962890625, -1433.62548828125, -1399.3812255859375, -1365.1370849609375, -1330.8929443359375, -1296.648681640625, -1262.404541015625, -1228.160400390625, -1193.916259765625, -1159.672119140625, -1125.4278564453125, -1091.1837158203125, -1056.9395751953125, -1022.6953735351562, -988.451171875, -954.20703125, -919.9627685546875, -885.7185668945312, -851.4744262695312, -817.230224609375, -782.986083984375, -748.7418823242188, -714.4976806640625, -680.2535400390625, -646.0093383789062, -611.76513671875, -577.52099609375, -543.2767944335938, -509.0326232910156, -474.7884521484375, -440.54425048828125, -406.3000793457031, -372.055908203125, -337.8117370605469, -303.56756591796875, -269.3233642578125, -235.07919311523438, -200.83502197265625, -166.59083557128906, -132.34664916992188, -98.10247802734375, -63.858299255371094, -29.614120483398438, 4.630058288574219, 38.874237060546875, 73.118408203125, 107.36259460449219, 141.60678100585938, 175.8509521484375, 210.09512329101562, 244.3393096923828, 278.58349609375, 312.8276672363281, 347.07183837890625, 381.3160400390625, 415.5602111816406, 449.80438232421875, 484.0485534667969, 518.292724609375, 552.5369262695312, 586.7811279296875, 621.0252685546875, 655.2694702148438, 689.513671875, 723.7578125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 15.0, 8.0, 11.0, 13.0, 21.0, 18.0, 18.0, 16.0, 21.0, 33.0, 47.0, 48.0, 57.0, 50.0, 48.0, 51.0, 44.0, 47.0, 38.0, 56.0, 41.0, 48.0, 33.0, 32.0, 29.0, 24.0, 24.0, 19.0, 13.0, 13.0, 13.0, 11.0, 12.0, 2.0, 8.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-232.92453002929688, -223.71653747558594, -214.50856018066406, -205.30056762695312, -196.09259033203125, -186.8845977783203, -177.67660522460938, -168.4686279296875, -159.26063537597656, -150.05264282226562, -140.84466552734375, -131.6366729736328, -122.4286880493164, -113.220703125, -104.01271057128906, -94.80472564697266, -85.59674072265625, -76.38875579833984, -67.18077087402344, -57.9727783203125, -48.764793395996094, -39.55680847167969, -30.348819732666016, -21.140830993652344, -11.932846069335938, -2.7248592376708984, 6.483127593994141, 15.69111442565918, 24.89910125732422, 34.107086181640625, 43.3150749206543, 52.52306365966797, 61.7310791015625, 70.9390640258789, 80.14704895019531, 89.35504150390625, 98.56302642822266, 107.77101135253906, 116.97900390625, 126.1869888305664, 135.3949737548828, 144.60296630859375, 153.81094360351562, 163.01893615722656, 172.2269287109375, 181.43490600585938, 190.6428985595703, 199.85089111328125, 209.05886840820312, 218.26686096191406, 227.47483825683594, 236.68283081054688, 245.89080810546875, 255.0988006591797, 264.3067932128906, 273.5147705078125, 282.7227783203125, 291.9307556152344, 301.1387634277344, 310.34674072265625, 319.5547180175781, 328.7626953125, 337.970703125, 347.1786804199219, 356.38665771484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 0.0, 10.0, 20.0, 20.0, 38.0, 38.0, 75.0, 105.0, 165.0, 278.0, 436.0, 776.0, 1504.0, 3345.0, 9318.0, 40418.0, 3835853.0, 266060.0, 23578.0, 6729.0, 2558.0, 1228.0, 668.0, 406.0, 220.0, 128.0, 95.0, 73.0, 56.0, 31.0, 21.0, 9.0, 9.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.046875, -30.006591796875, -28.96630859375, -27.926025390625, -26.8857421875, -25.845458984375, -24.80517578125, -23.764892578125, -22.724609375, -21.684326171875, -20.64404296875, -19.603759765625, -18.5634765625, -17.523193359375, -16.48291015625, -15.442626953125, -14.40234375, -13.362060546875, -12.32177734375, -11.281494140625, -10.2412109375, -9.200927734375, -8.16064453125, -7.120361328125, -6.080078125, -5.039794921875, -3.99951171875, -2.959228515625, -1.9189453125, -0.878662109375, 0.16162109375, 1.201904296875, 2.2421875, 3.282470703125, 4.32275390625, 5.363037109375, 6.4033203125, 7.443603515625, 8.48388671875, 9.524169921875, 10.564453125, 11.604736328125, 12.64501953125, 13.685302734375, 14.7255859375, 15.765869140625, 16.80615234375, 17.846435546875, 18.88671875, 19.927001953125, 20.96728515625, 22.007568359375, 23.0478515625, 24.088134765625, 25.12841796875, 26.168701171875, 27.208984375, 28.249267578125, 29.28955078125, 30.329833984375, 31.3701171875, 32.410400390625, 33.45068359375, 34.490966796875, 35.53125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 6.0, 17.0, 17.0, 29.0, 59.0, 72.0, 94.0, 99.0, 125.0, 124.0, 106.0, 94.0, 53.0, 48.0, 27.0, 15.0, 6.0, 9.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.5380859375, -20.669921875, -19.8017578125, -18.93359375, -18.0654296875, -17.197265625, -16.3291015625, -15.4609375, -14.5927734375, -13.724609375, -12.8564453125, -11.98828125, -11.1201171875, -10.251953125, -9.3837890625, -8.515625, -7.6474609375, -6.779296875, -5.9111328125, -5.04296875, -4.1748046875, -3.306640625, -2.4384765625, -1.5703125, -0.7021484375, 0.166015625, 1.0341796875, 1.90234375, 2.7705078125, 3.638671875, 4.5068359375, 5.375, 6.2431640625, 7.111328125, 7.9794921875, 8.84765625, 9.7158203125, 10.583984375, 11.4521484375, 12.3203125, 13.1884765625, 14.056640625, 14.9248046875, 15.79296875, 16.6611328125, 17.529296875, 18.3974609375, 19.265625, 20.1337890625, 21.001953125, 21.8701171875, 22.73828125, 23.6064453125, 24.474609375, 25.3427734375, 26.2109375, 27.0791015625, 27.947265625, 28.8154296875, 29.68359375, 30.5517578125, 31.419921875, 32.2880859375, 33.15625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 12.0, 14.0, 16.0, 21.0, 42.0, 39.0, 64.0, 86.0, 116.0, 153.0, 207.0, 312.0, 483.0, 784.0, 1276.0, 2242.0, 4297.0, 9442.0, 23857.0, 96382.0, 3735816.0, 252039.0, 39800.0, 13611.0, 5820.0, 2996.0, 1563.0, 931.0, 572.0, 339.0, 274.0, 183.0, 135.0, 90.0, 60.0, 44.0, 45.0, 33.0, 26.0, 22.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.265625, -17.707275390625, -17.14892578125, -16.590576171875, -16.0322265625, -15.473876953125, -14.91552734375, -14.357177734375, -13.798828125, -13.240478515625, -12.68212890625, -12.123779296875, -11.5654296875, -11.007080078125, -10.44873046875, -9.890380859375, -9.33203125, -8.773681640625, -8.21533203125, -7.656982421875, -7.0986328125, -6.540283203125, -5.98193359375, -5.423583984375, -4.865234375, -4.306884765625, -3.74853515625, -3.190185546875, -2.6318359375, -2.073486328125, -1.51513671875, -0.956787109375, -0.3984375, 0.159912109375, 0.71826171875, 1.276611328125, 1.8349609375, 2.393310546875, 2.95166015625, 3.510009765625, 4.068359375, 4.626708984375, 5.18505859375, 5.743408203125, 6.3017578125, 6.860107421875, 7.41845703125, 7.976806640625, 8.53515625, 9.093505859375, 9.65185546875, 10.210205078125, 10.7685546875, 11.326904296875, 11.88525390625, 12.443603515625, 13.001953125, 13.560302734375, 14.11865234375, 14.677001953125, 15.2353515625, 15.793701171875, 16.35205078125, 16.910400390625, 17.46875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 9.0, 11.0, 13.0, 15.0, 31.0, 51.0, 59.0, 189.0, 2909.0, 506.0, 123.0, 52.0, 28.0, 23.0, 11.0, 9.0, 4.0, 8.0, 5.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8984375, -5.6865234375, -5.474609375, -5.2626953125, -5.05078125, -4.8388671875, -4.626953125, -4.4150390625, -4.203125, -3.9912109375, -3.779296875, -3.5673828125, -3.35546875, -3.1435546875, -2.931640625, -2.7197265625, -2.5078125, -2.2958984375, -2.083984375, -1.8720703125, -1.66015625, -1.4482421875, -1.236328125, -1.0244140625, -0.8125, -0.6005859375, -0.388671875, -0.1767578125, 0.03515625, 0.2470703125, 0.458984375, 0.6708984375, 0.8828125, 1.0947265625, 1.306640625, 1.5185546875, 1.73046875, 1.9423828125, 2.154296875, 2.3662109375, 2.578125, 2.7900390625, 3.001953125, 3.2138671875, 3.42578125, 3.6376953125, 3.849609375, 4.0615234375, 4.2734375, 4.4853515625, 4.697265625, 4.9091796875, 5.12109375, 5.3330078125, 5.544921875, 5.7568359375, 5.96875, 6.1806640625, 6.392578125, 6.6044921875, 6.81640625, 7.0283203125, 7.240234375, 7.4521484375, 7.6640625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 10.0, 18.0, 31.0, 76.0, 156.0, 230.0, 228.0, 164.0, 57.0, 19.0, 9.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.80000305175781, -74.1919937133789, -72.58397674560547, -70.97596740722656, -69.36795806884766, -67.75994873046875, -66.15193176269531, -64.5439224243164, -62.935909271240234, -61.32789611816406, -59.719886779785156, -58.111873626708984, -56.50386428833008, -54.895851135253906, -53.287841796875, -51.67982864379883, -50.071815490722656, -48.463802337646484, -46.85579299926758, -45.247779846191406, -43.6397705078125, -42.03175735473633, -40.423744201660156, -38.81573486328125, -37.207725524902344, -35.59971237182617, -33.991703033447266, -32.383689880371094, -30.775678634643555, -29.167667388916016, -27.559656143188477, -25.951644897460938, -24.343631744384766, -22.735620498657227, -21.127609252929688, -19.519596099853516, -17.911584854125977, -16.303573608398438, -14.695562362670898, -13.087550163269043, -11.479538917541504, -9.871527671813965, -8.26351547241211, -6.65550422668457, -5.047492504119873, -3.439480781555176, -1.8314695358276367, -0.22345733642578125, 1.3845539093017578, 2.992565631866455, 4.600577354431152, 6.208588600158691, 7.816600322723389, 9.424612045288086, 11.032623291015625, 12.64063549041748, 14.24864673614502, 15.856657981872559, 17.464670181274414, 19.072681427001953, 20.680692672729492, 22.28870391845703, 23.896717071533203, 25.504728317260742, 27.11273956298828]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 6.0, 7.0, 3.0, 9.0, 13.0, 11.0, 8.0, 19.0, 20.0, 36.0, 31.0, 29.0, 34.0, 29.0, 44.0, 40.0, 51.0, 48.0, 51.0, 45.0, 34.0, 49.0, 40.0, 31.0, 37.0, 50.0, 44.0, 27.0, 21.0, 26.0, 23.0, 8.0, 22.0, 9.0, 10.0, 6.0, 9.0, 7.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-14.383478164672852, -13.938672065734863, -13.493865966796875, -13.049059867858887, -12.604253768920898, -12.15944766998291, -11.714641571044922, -11.269835472106934, -10.825029373168945, -10.380223274230957, -9.935417175292969, -9.49061107635498, -9.045804977416992, -8.600998878479004, -8.156192779541016, -7.711386680603027, -7.266580581665039, -6.821774482727051, -6.3769683837890625, -5.932162284851074, -5.487356185913086, -5.042550086975098, -4.597743988037109, -4.152937889099121, -3.708131790161133, -3.2633256912231445, -2.8185195922851562, -2.373713493347168, -1.9289073944091797, -1.4841012954711914, -1.0392951965332031, -0.5944890975952148, -0.14968204498291016, 0.2951240539550781, 0.7399301528930664, 1.1847362518310547, 1.629542350769043, 2.0743484497070312, 2.5191545486450195, 2.963960647583008, 3.408766746520996, 3.8535728454589844, 4.298378944396973, 4.743185043334961, 5.187991142272949, 5.6327972412109375, 6.077603340148926, 6.522409439086914, 6.967215538024902, 7.412021636962891, 7.856827735900879, 8.301633834838867, 8.746439933776855, 9.191246032714844, 9.636052131652832, 10.08085823059082, 10.525664329528809, 10.970470428466797, 11.415276527404785, 11.860082626342773, 12.304888725280762, 12.74969482421875, 13.194500923156738, 13.639307022094727, 14.084113121032715]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 17.0, 25.0, 54.0, 53.0, 115.0, 227.0, 396.0, 810.0, 1946.0, 7586.0, 51852.0, 431182.0, 480652.0, 61191.0, 8443.0, 2235.0, 837.0, 425.0, 195.0, 120.0, 80.0, 41.0, 21.0, 17.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.71875, -38.47900390625, -37.2392578125, -35.99951171875, -34.759765625, -33.52001953125, -32.2802734375, -31.04052734375, -29.80078125, -28.56103515625, -27.3212890625, -26.08154296875, -24.841796875, -23.60205078125, -22.3623046875, -21.12255859375, -19.8828125, -18.64306640625, -17.4033203125, -16.16357421875, -14.923828125, -13.68408203125, -12.4443359375, -11.20458984375, -9.96484375, -8.72509765625, -7.4853515625, -6.24560546875, -5.005859375, -3.76611328125, -2.5263671875, -1.28662109375, -0.046875, 1.19287109375, 2.4326171875, 3.67236328125, 4.912109375, 6.15185546875, 7.3916015625, 8.63134765625, 9.87109375, 11.11083984375, 12.3505859375, 13.59033203125, 14.830078125, 16.06982421875, 17.3095703125, 18.54931640625, 19.7890625, 21.02880859375, 22.2685546875, 23.50830078125, 24.748046875, 25.98779296875, 27.2275390625, 28.46728515625, 29.70703125, 30.94677734375, 32.1865234375, 33.42626953125, 34.666015625, 35.90576171875, 37.1455078125, 38.38525390625, 39.625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 14.0, 22.0, 24.0, 54.0, 70.0, 86.0, 106.0, 110.0, 117.0, 118.0, 89.0, 79.0, 49.0, 25.0, 12.0, 14.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -21.81591796875, -20.9443359375, -20.07275390625, -19.201171875, -18.32958984375, -17.4580078125, -16.58642578125, -15.71484375, -14.84326171875, -13.9716796875, -13.10009765625, -12.228515625, -11.35693359375, -10.4853515625, -9.61376953125, -8.7421875, -7.87060546875, -6.9990234375, -6.12744140625, -5.255859375, -4.38427734375, -3.5126953125, -2.64111328125, -1.76953125, -0.89794921875, -0.0263671875, 0.84521484375, 1.716796875, 2.58837890625, 3.4599609375, 4.33154296875, 5.203125, 6.07470703125, 6.9462890625, 7.81787109375, 8.689453125, 9.56103515625, 10.4326171875, 11.30419921875, 12.17578125, 13.04736328125, 13.9189453125, 14.79052734375, 15.662109375, 16.53369140625, 17.4052734375, 18.27685546875, 19.1484375, 20.02001953125, 20.8916015625, 21.76318359375, 22.634765625, 23.50634765625, 24.3779296875, 25.24951171875, 26.12109375, 26.99267578125, 27.8642578125, 28.73583984375, 29.607421875, 30.47900390625, 31.3505859375, 32.22216796875, 33.09375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 6.0, 5.0, 2.0, 7.0, 12.0, 16.0, 24.0, 26.0, 40.0, 53.0, 71.0, 143.0, 248.0, 537.0, 1357.0, 5635.0, 395968.0, 635083.0, 6647.0, 1382.0, 610.0, 256.0, 168.0, 91.0, 46.0, 40.0, 24.0, 17.0, 10.0, 7.0, 5.0, 4.0, 6.0, 4.0, 1.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-163.625, -159.20703125, -154.7890625, -150.37109375, -145.953125, -141.53515625, -137.1171875, -132.69921875, -128.28125, -123.86328125, -119.4453125, -115.02734375, -110.609375, -106.19140625, -101.7734375, -97.35546875, -92.9375, -88.51953125, -84.1015625, -79.68359375, -75.265625, -70.84765625, -66.4296875, -62.01171875, -57.59375, -53.17578125, -48.7578125, -44.33984375, -39.921875, -35.50390625, -31.0859375, -26.66796875, -22.25, -17.83203125, -13.4140625, -8.99609375, -4.578125, -0.16015625, 4.2578125, 8.67578125, 13.09375, 17.51171875, 21.9296875, 26.34765625, 30.765625, 35.18359375, 39.6015625, 44.01953125, 48.4375, 52.85546875, 57.2734375, 61.69140625, 66.109375, 70.52734375, 74.9453125, 79.36328125, 83.78125, 88.19921875, 92.6171875, 97.03515625, 101.453125, 105.87109375, 110.2890625, 114.70703125, 119.125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 2.0, 8.0, 2.0, 8.0, 9.0, 10.0, 13.0, 26.0, 37.0, 38.0, 69.0, 72.0, 83.0, 109.0, 104.0, 98.0, 67.0, 59.0, 43.0, 37.0, 30.0, 15.0, 16.0, 7.0, 7.0, 6.0, 3.0, 3.0, 5.0, 4.0, 4.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.625, -126.275390625, -121.92578125, -117.576171875, -113.2265625, -108.876953125, -104.52734375, -100.177734375, -95.828125, -91.478515625, -87.12890625, -82.779296875, -78.4296875, -74.080078125, -69.73046875, -65.380859375, -61.03125, -56.681640625, -52.33203125, -47.982421875, -43.6328125, -39.283203125, -34.93359375, -30.583984375, -26.234375, -21.884765625, -17.53515625, -13.185546875, -8.8359375, -4.486328125, -0.13671875, 4.212890625, 8.5625, 12.912109375, 17.26171875, 21.611328125, 25.9609375, 30.310546875, 34.66015625, 39.009765625, 43.359375, 47.708984375, 52.05859375, 56.408203125, 60.7578125, 65.107421875, 69.45703125, 73.806640625, 78.15625, 82.505859375, 86.85546875, 91.205078125, 95.5546875, 99.904296875, 104.25390625, 108.603515625, 112.953125, 117.302734375, 121.65234375, 126.001953125, 130.3515625, 134.701171875, 139.05078125, 143.400390625, 147.75]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 4.0, 7.0, 6.0, 15.0, 15.0, 29.0, 27.0, 47.0, 48.0, 96.0, 175.0, 229.0, 428.0, 918.0, 3756.0, 72194.0, 944245.0, 22391.0, 2295.0, 706.0, 315.0, 205.0, 132.0, 94.0, 56.0, 29.0, 23.0, 21.0, 16.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.59375, -44.2265625, -42.859375, -41.4921875, -40.125, -38.7578125, -37.390625, -36.0234375, -34.65625, -33.2890625, -31.921875, -30.5546875, -29.1875, -27.8203125, -26.453125, -25.0859375, -23.71875, -22.3515625, -20.984375, -19.6171875, -18.25, -16.8828125, -15.515625, -14.1484375, -12.78125, -11.4140625, -10.046875, -8.6796875, -7.3125, -5.9453125, -4.578125, -3.2109375, -1.84375, -0.4765625, 0.890625, 2.2578125, 3.625, 4.9921875, 6.359375, 7.7265625, 9.09375, 10.4609375, 11.828125, 13.1953125, 14.5625, 15.9296875, 17.296875, 18.6640625, 20.03125, 21.3984375, 22.765625, 24.1328125, 25.5, 26.8671875, 28.234375, 29.6015625, 30.96875, 32.3359375, 33.703125, 35.0703125, 36.4375, 37.8046875, 39.171875, 40.5390625, 41.90625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 13.0, 12.0, 21.0, 26.0, 38.0, 85.0, 90.0, 120.0, 124.0, 130.0, 108.0, 72.0, 40.0, 38.0, 15.0, 16.0, 8.0, 11.0, 9.0, 3.0, 3.0, 4.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018720626831054688, -0.0017986148595809937, -0.0017251670360565186, -0.0016517192125320435, -0.0015782713890075684, -0.0015048235654830933, -0.0014313757419586182, -0.001357927918434143, -0.001284480094909668, -0.0012110322713851929, -0.0011375844478607178, -0.0010641366243362427, -0.0009906888008117676, -0.0009172409772872925, -0.0008437931537628174, -0.0007703453302383423, -0.0006968975067138672, -0.0006234496831893921, -0.000550001859664917, -0.0004765540361404419, -0.0004031062126159668, -0.0003296583890914917, -0.0002562105655670166, -0.0001827627420425415, -0.0001093149185180664, -3.586709499359131e-05, 3.758072853088379e-05, 0.00011102855205535889, 0.00018447637557983398, 0.0002579241991043091, 0.0003313720226287842, 0.0004048198461532593, 0.0004782676696777344, 0.0005517154932022095, 0.0006251633167266846, 0.0006986111402511597, 0.0007720589637756348, 0.0008455067873001099, 0.000918954610824585, 0.00099240243434906, 0.0010658502578735352, 0.0011392980813980103, 0.0012127459049224854, 0.0012861937284469604, 0.0013596415519714355, 0.0014330893754959106, 0.0015065371990203857, 0.0015799850225448608, 0.001653432846069336, 0.001726880669593811, 0.0018003284931182861, 0.0018737763166427612, 0.0019472241401672363, 0.0020206719636917114, 0.0020941197872161865, 0.0021675676107406616, 0.0022410154342651367, 0.002314463257789612, 0.002387911081314087, 0.002461358904838562, 0.002534806728363037, 0.002608254551887512, 0.0026817023754119873, 0.0027551501989364624, 0.0028285980224609375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 9.0, 9.0, 5.0, 9.0, 14.0, 20.0, 20.0, 46.0, 70.0, 103.0, 178.0, 289.0, 658.0, 1807.0, 10739.0, 701299.0, 322468.0, 7914.0, 1525.0, 607.0, 286.0, 160.0, 106.0, 66.0, 45.0, 26.0, 13.0, 9.0, 13.0, 3.0, 6.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.34375, -33.98095703125, -32.6181640625, -31.25537109375, -29.892578125, -28.52978515625, -27.1669921875, -25.80419921875, -24.44140625, -23.07861328125, -21.7158203125, -20.35302734375, -18.990234375, -17.62744140625, -16.2646484375, -14.90185546875, -13.5390625, -12.17626953125, -10.8134765625, -9.45068359375, -8.087890625, -6.72509765625, -5.3623046875, -3.99951171875, -2.63671875, -1.27392578125, 0.0888671875, 1.45166015625, 2.814453125, 4.17724609375, 5.5400390625, 6.90283203125, 8.265625, 9.62841796875, 10.9912109375, 12.35400390625, 13.716796875, 15.07958984375, 16.4423828125, 17.80517578125, 19.16796875, 20.53076171875, 21.8935546875, 23.25634765625, 24.619140625, 25.98193359375, 27.3447265625, 28.70751953125, 30.0703125, 31.43310546875, 32.7958984375, 34.15869140625, 35.521484375, 36.88427734375, 38.2470703125, 39.60986328125, 40.97265625, 42.33544921875, 43.6982421875, 45.06103515625, 46.423828125, 47.78662109375, 49.1494140625, 50.51220703125, 51.875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 5.0, 1.0, 9.0, 5.0, 9.0, 10.0, 12.0, 19.0, 24.0, 25.0, 49.0, 104.0, 172.0, 190.0, 128.0, 79.0, 40.0, 26.0, 21.0, 12.0, 5.0, 9.0, 9.0, 4.0, 5.0, 3.0, 3.0, 7.0, 2.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.84375, -42.671875, -41.5, -40.328125, -39.15625, -37.984375, -36.8125, -35.640625, -34.46875, -33.296875, -32.125, -30.953125, -29.78125, -28.609375, -27.4375, -26.265625, -25.09375, -23.921875, -22.75, -21.578125, -20.40625, -19.234375, -18.0625, -16.890625, -15.71875, -14.546875, -13.375, -12.203125, -11.03125, -9.859375, -8.6875, -7.515625, -6.34375, -5.171875, -4.0, -2.828125, -1.65625, -0.484375, 0.6875, 1.859375, 3.03125, 4.203125, 5.375, 6.546875, 7.71875, 8.890625, 10.0625, 11.234375, 12.40625, 13.578125, 14.75, 15.921875, 17.09375, 18.265625, 19.4375, 20.609375, 21.78125, 22.953125, 24.125, 25.296875, 26.46875, 27.640625, 28.8125, 29.984375, 31.15625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 10.0, 230.0, 714.0, 49.0, 8.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2713.180908203125, -2658.0625, -2602.9443359375, -2547.825927734375, -2492.70751953125, -2437.589111328125, -2382.470703125, -2327.3525390625, -2272.234130859375, -2217.11572265625, -2161.99755859375, -2106.879150390625, -2051.7607421875, -1996.642333984375, -1941.5240478515625, -1886.40576171875, -1831.287353515625, -1776.1689453125, -1721.0506591796875, -1665.932373046875, -1610.81396484375, -1555.695556640625, -1500.5772705078125, -1445.458984375, -1390.340576171875, -1335.22216796875, -1280.1038818359375, -1224.985595703125, -1169.8671875, -1114.748779296875, -1059.6304931640625, -1004.5121459960938, -949.3936767578125, -894.2753295898438, -839.156982421875, -784.0386352539062, -728.9202880859375, -673.8019409179688, -618.68359375, -563.5652465820312, -508.4468994140625, -453.32855224609375, -398.210205078125, -343.09185791015625, -287.9735107421875, -232.85516357421875, -177.73681640625, -122.61846923828125, -67.5001220703125, -12.38177490234375, 42.736572265625, 97.85491943359375, 152.9732666015625, 208.09161376953125, 263.2099609375, 318.32830810546875, 373.4466552734375, 428.56500244140625, 483.683349609375, 538.8016967773438, 593.9200439453125, 649.0383911132812, 704.15673828125, 759.2750854492188, 814.3934326171875]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 8.0, 8.0, 7.0, 9.0, 13.0, 16.0, 17.0, 19.0, 26.0, 22.0, 33.0, 49.0, 28.0, 38.0, 38.0, 52.0, 59.0, 36.0, 53.0, 51.0, 42.0, 45.0, 41.0, 39.0, 27.0, 36.0, 35.0, 29.0, 16.0, 17.0, 18.0, 15.0, 22.0, 11.0, 6.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-259.5472717285156, -250.4111785888672, -241.2750701904297, -232.13897705078125, -223.00286865234375, -213.8667755126953, -204.73068237304688, -195.59457397460938, -186.45848083496094, -177.3223876953125, -168.186279296875, -159.05018615722656, -149.91409301757812, -140.77798461914062, -131.6418914794922, -122.50579071044922, -113.36968994140625, -104.23358917236328, -95.09748840332031, -85.96139526367188, -76.8252944946289, -67.68919372558594, -58.553096771240234, -49.41699981689453, -40.28089904785156, -31.144800186157227, -22.00870132446289, -12.872602462768555, -3.7365036010742188, 5.39959716796875, 14.535694122314453, 23.671791076660156, 32.80792236328125, 41.94402313232422, 51.08012008666992, 60.216217041015625, 69.3523178100586, 78.48841857910156, 87.62451171875, 96.76061248779297, 105.89671325683594, 115.0328140258789, 124.16891479492188, 133.3050079345703, 142.44110107421875, 151.57720947265625, 160.7133026123047, 169.84939575195312, 178.98550415039062, 188.12159729003906, 197.25770568847656, 206.393798828125, 215.5299072265625, 224.66600036621094, 233.80209350585938, 242.93820190429688, 252.0742950439453, 261.21038818359375, 270.34649658203125, 279.48260498046875, 288.6186828613281, 297.7547912597656, 306.8908996582031, 316.0269775390625, 325.1630859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 9.0, 6.0, 6.0, 18.0, 19.0, 37.0, 72.0, 96.0, 187.0, 290.0, 496.0, 864.0, 1898.0, 5821.0, 36979.0, 4100174.0, 37548.0, 5779.0, 1916.0, 852.0, 498.0, 262.0, 180.0, 117.0, 69.0, 30.0, 26.0, 10.0, 8.0, 9.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.21875, -41.587890625, -39.95703125, -38.326171875, -36.6953125, -35.064453125, -33.43359375, -31.802734375, -30.171875, -28.541015625, -26.91015625, -25.279296875, -23.6484375, -22.017578125, -20.38671875, -18.755859375, -17.125, -15.494140625, -13.86328125, -12.232421875, -10.6015625, -8.970703125, -7.33984375, -5.708984375, -4.078125, -2.447265625, -0.81640625, 0.814453125, 2.4453125, 4.076171875, 5.70703125, 7.337890625, 8.96875, 10.599609375, 12.23046875, 13.861328125, 15.4921875, 17.123046875, 18.75390625, 20.384765625, 22.015625, 23.646484375, 25.27734375, 26.908203125, 28.5390625, 30.169921875, 31.80078125, 33.431640625, 35.0625, 36.693359375, 38.32421875, 39.955078125, 41.5859375, 43.216796875, 44.84765625, 46.478515625, 48.109375, 49.740234375, 51.37109375, 53.001953125, 54.6328125, 56.263671875, 57.89453125, 59.525390625, 61.15625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 9.0, 16.0, 25.0, 25.0, 50.0, 92.0, 104.0, 125.0, 132.0, 110.0, 101.0, 91.0, 50.0, 24.0, 19.0, 14.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.984375, -23.963134765625, -22.94189453125, -21.920654296875, -20.8994140625, -19.878173828125, -18.85693359375, -17.835693359375, -16.814453125, -15.793212890625, -14.77197265625, -13.750732421875, -12.7294921875, -11.708251953125, -10.68701171875, -9.665771484375, -8.64453125, -7.623291015625, -6.60205078125, -5.580810546875, -4.5595703125, -3.538330078125, -2.51708984375, -1.495849609375, -0.474609375, 0.546630859375, 1.56787109375, 2.589111328125, 3.6103515625, 4.631591796875, 5.65283203125, 6.674072265625, 7.6953125, 8.716552734375, 9.73779296875, 10.759033203125, 11.7802734375, 12.801513671875, 13.82275390625, 14.843994140625, 15.865234375, 16.886474609375, 17.90771484375, 18.928955078125, 19.9501953125, 20.971435546875, 21.99267578125, 23.013916015625, 24.03515625, 25.056396484375, 26.07763671875, 27.098876953125, 28.1201171875, 29.141357421875, 30.16259765625, 31.183837890625, 32.205078125, 33.226318359375, 34.24755859375, 35.268798828125, 36.2900390625, 37.311279296875, 38.33251953125, 39.353759765625, 40.375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 16.0, 21.0, 21.0, 26.0, 44.0, 71.0, 94.0, 124.0, 185.0, 297.0, 450.0, 725.0, 1308.0, 3127.0, 9563.0, 57918.0, 4046538.0, 57813.0, 9583.0, 3007.0, 1335.0, 710.0, 451.0, 282.0, 185.0, 111.0, 78.0, 62.0, 30.0, 26.0, 16.0, 21.0, 12.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.796875, -26.821533203125, -25.84619140625, -24.870849609375, -23.8955078125, -22.920166015625, -21.94482421875, -20.969482421875, -19.994140625, -19.018798828125, -18.04345703125, -17.068115234375, -16.0927734375, -15.117431640625, -14.14208984375, -13.166748046875, -12.19140625, -11.216064453125, -10.24072265625, -9.265380859375, -8.2900390625, -7.314697265625, -6.33935546875, -5.364013671875, -4.388671875, -3.413330078125, -2.43798828125, -1.462646484375, -0.4873046875, 0.488037109375, 1.46337890625, 2.438720703125, 3.4140625, 4.389404296875, 5.36474609375, 6.340087890625, 7.3154296875, 8.290771484375, 9.26611328125, 10.241455078125, 11.216796875, 12.192138671875, 13.16748046875, 14.142822265625, 15.1181640625, 16.093505859375, 17.06884765625, 18.044189453125, 19.01953125, 19.994873046875, 20.97021484375, 21.945556640625, 22.9208984375, 23.896240234375, 24.87158203125, 25.846923828125, 26.822265625, 27.797607421875, 28.77294921875, 29.748291015625, 30.7236328125, 31.698974609375, 32.67431640625, 33.649658203125, 34.625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 8.0, 5.0, 10.0, 21.0, 13.0, 59.0, 120.0, 3367.0, 304.0, 65.0, 40.0, 20.0, 13.0, 8.0, 5.0, 8.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4765625, -8.24615478515625, -8.0157470703125, -7.78533935546875, -7.554931640625, -7.32452392578125, -7.0941162109375, -6.86370849609375, -6.63330078125, -6.40289306640625, -6.1724853515625, -5.94207763671875, -5.711669921875, -5.48126220703125, -5.2508544921875, -5.02044677734375, -4.7900390625, -4.55963134765625, -4.3292236328125, -4.09881591796875, -3.868408203125, -3.63800048828125, -3.4075927734375, -3.17718505859375, -2.94677734375, -2.71636962890625, -2.4859619140625, -2.25555419921875, -2.025146484375, -1.79473876953125, -1.5643310546875, -1.33392333984375, -1.103515625, -0.87310791015625, -0.6427001953125, -0.41229248046875, -0.181884765625, 0.04852294921875, 0.2789306640625, 0.50933837890625, 0.73974609375, 0.97015380859375, 1.2005615234375, 1.43096923828125, 1.661376953125, 1.89178466796875, 2.1221923828125, 2.35260009765625, 2.5830078125, 2.81341552734375, 3.0438232421875, 3.27423095703125, 3.504638671875, 3.73504638671875, 3.9654541015625, 4.19586181640625, 4.42626953125, 4.65667724609375, 4.8870849609375, 5.11749267578125, 5.347900390625, 5.57830810546875, 5.8087158203125, 6.03912353515625, 6.26953125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 5.0, 12.0, 21.0, 27.0, 42.0, 81.0, 140.0, 171.0, 159.0, 127.0, 79.0, 44.0, 33.0, 25.0, 15.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.32073974609375, -35.27613830566406, -34.23154067993164, -33.18693923950195, -32.142337799072266, -31.09773826599121, -30.053138732910156, -29.00853729248047, -27.963937759399414, -26.91933822631836, -25.874736785888672, -24.830137252807617, -23.785537719726562, -22.740936279296875, -21.69633674621582, -20.651737213134766, -19.607135772705078, -18.562536239624023, -17.517934799194336, -16.47333526611328, -15.42873477935791, -14.384134292602539, -13.339534759521484, -12.294934272766113, -11.250333786010742, -10.205733299255371, -9.1611328125, -8.116533279418945, -7.071932792663574, -6.027332305908203, -4.98273229598999, -3.9381322860717773, -2.8935279846191406, -1.8489277362823486, -0.8043274879455566, 0.24027276039123535, 1.2848730087280273, 2.3294734954833984, 3.3740735054016113, 4.418673515319824, 5.463274002075195, 6.507874488830566, 7.552474498748779, 8.597074508666992, 9.641674995422363, 10.686275482177734, 11.730875015258789, 12.77547550201416, 13.820075988769531, 14.864676475524902, 15.909276962280273, 16.953876495361328, 17.998477935791016, 19.04307746887207, 20.087677001953125, 21.132278442382812, 22.176877975463867, 23.221477508544922, 24.26607894897461, 25.310678482055664, 26.35527801513672, 27.399879455566406, 28.44447898864746, 29.489078521728516, 30.533679962158203]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 7.0, 9.0, 13.0, 10.0, 17.0, 27.0, 21.0, 31.0, 44.0, 35.0, 49.0, 66.0, 48.0, 55.0, 50.0, 64.0, 60.0, 51.0, 49.0, 58.0, 40.0, 38.0, 33.0, 27.0, 20.0, 19.0, 14.0, 13.0, 2.0, 2.0, 5.0, 9.0, 5.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.431556701660156, -22.84870147705078, -22.265844345092773, -21.6829891204834, -21.10013198852539, -20.517276763916016, -19.934419631958008, -19.351564407348633, -18.768707275390625, -18.18585205078125, -17.602994918823242, -17.020139694213867, -16.43728256225586, -15.854427337646484, -15.271571159362793, -14.688714981079102, -14.105859756469727, -13.523003578186035, -12.940147399902344, -12.357291221618652, -11.774435043334961, -11.191579818725586, -10.608723640441895, -10.025867462158203, -9.443011283874512, -8.86015510559082, -8.277298927307129, -7.694443225860596, -7.111587047576904, -6.528730869293213, -5.94587516784668, -5.363018989562988, -4.78016471862793, -4.197308540344238, -3.614452600479126, -3.0315966606140137, -2.4487404823303223, -1.8658843040466309, -1.2830283641815186, -0.7001724243164062, -0.11731624603271484, 0.465539813041687, 1.0483958721160889, 1.6312519311904907, 2.2141079902648926, 2.796964168548584, 3.3798201084136963, 3.9626760482788086, 4.5455322265625, 5.128388404846191, 5.711244583129883, 6.294100284576416, 6.876956462860107, 7.459812641143799, 8.042668342590332, 8.625524520874023, 9.208380699157715, 9.791236877441406, 10.374093055725098, 10.956949234008789, 11.539804458618164, 12.122661590576172, 12.705516815185547, 13.288372993469238, 13.87122917175293]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 6.0, 7.0, 6.0, 14.0, 13.0, 19.0, 27.0, 35.0, 55.0, 67.0, 99.0, 159.0, 225.0, 359.0, 649.0, 1057.0, 2307.0, 5784.0, 23268.0, 148861.0, 600394.0, 219179.0, 32686.0, 7427.0, 2693.0, 1236.0, 701.0, 443.0, 257.0, 179.0, 91.0, 77.0, 55.0, 35.0, 26.0, 20.0, 17.0, 8.0, 9.0, 2.0, 8.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-44.09375, -42.951416015625, -41.80908203125, -40.666748046875, -39.5244140625, -38.382080078125, -37.23974609375, -36.097412109375, -34.955078125, -33.812744140625, -32.67041015625, -31.528076171875, -30.3857421875, -29.243408203125, -28.10107421875, -26.958740234375, -25.81640625, -24.674072265625, -23.53173828125, -22.389404296875, -21.2470703125, -20.104736328125, -18.96240234375, -17.820068359375, -16.677734375, -15.535400390625, -14.39306640625, -13.250732421875, -12.1083984375, -10.966064453125, -9.82373046875, -8.681396484375, -7.5390625, -6.396728515625, -5.25439453125, -4.112060546875, -2.9697265625, -1.827392578125, -0.68505859375, 0.457275390625, 1.599609375, 2.741943359375, 3.88427734375, 5.026611328125, 6.1689453125, 7.311279296875, 8.45361328125, 9.595947265625, 10.73828125, 11.880615234375, 13.02294921875, 14.165283203125, 15.3076171875, 16.449951171875, 17.59228515625, 18.734619140625, 19.876953125, 21.019287109375, 22.16162109375, 23.303955078125, 24.4462890625, 25.588623046875, 26.73095703125, 27.873291015625, 29.015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 11.0, 14.0, 24.0, 29.0, 47.0, 67.0, 103.0, 121.0, 134.0, 103.0, 129.0, 84.0, 49.0, 37.0, 25.0, 10.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.21875, -24.197265625, -23.17578125, -22.154296875, -21.1328125, -20.111328125, -19.08984375, -18.068359375, -17.046875, -16.025390625, -15.00390625, -13.982421875, -12.9609375, -11.939453125, -10.91796875, -9.896484375, -8.875, -7.853515625, -6.83203125, -5.810546875, -4.7890625, -3.767578125, -2.74609375, -1.724609375, -0.703125, 0.318359375, 1.33984375, 2.361328125, 3.3828125, 4.404296875, 5.42578125, 6.447265625, 7.46875, 8.490234375, 9.51171875, 10.533203125, 11.5546875, 12.576171875, 13.59765625, 14.619140625, 15.640625, 16.662109375, 17.68359375, 18.705078125, 19.7265625, 20.748046875, 21.76953125, 22.791015625, 23.8125, 24.833984375, 25.85546875, 26.876953125, 27.8984375, 28.919921875, 29.94140625, 30.962890625, 31.984375, 33.005859375, 34.02734375, 35.048828125, 36.0703125, 37.091796875, 38.11328125, 39.134765625, 40.15625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 9.0, 10.0, 11.0, 25.0, 28.0, 44.0, 59.0, 95.0, 160.0, 246.0, 505.0, 1215.0, 5013.0, 280087.0, 751798.0, 6598.0, 1359.0, 526.0, 264.0, 156.0, 98.0, 65.0, 53.0, 31.0, 27.0, 22.0, 5.0, 9.0, 4.0, 3.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-192.0, -186.36328125, -180.7265625, -175.08984375, -169.453125, -163.81640625, -158.1796875, -152.54296875, -146.90625, -141.26953125, -135.6328125, -129.99609375, -124.359375, -118.72265625, -113.0859375, -107.44921875, -101.8125, -96.17578125, -90.5390625, -84.90234375, -79.265625, -73.62890625, -67.9921875, -62.35546875, -56.71875, -51.08203125, -45.4453125, -39.80859375, -34.171875, -28.53515625, -22.8984375, -17.26171875, -11.625, -5.98828125, -0.3515625, 5.28515625, 10.921875, 16.55859375, 22.1953125, 27.83203125, 33.46875, 39.10546875, 44.7421875, 50.37890625, 56.015625, 61.65234375, 67.2890625, 72.92578125, 78.5625, 84.19921875, 89.8359375, 95.47265625, 101.109375, 106.74609375, 112.3828125, 118.01953125, 123.65625, 129.29296875, 134.9296875, 140.56640625, 146.203125, 151.83984375, 157.4765625, 163.11328125, 168.75]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 12.0, 15.0, 11.0, 11.0, 36.0, 56.0, 78.0, 151.0, 160.0, 156.0, 116.0, 63.0, 34.0, 22.0, 20.0, 17.0, 11.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-269.75, -260.9375, -252.125, -243.3125, -234.5, -225.6875, -216.875, -208.0625, -199.25, -190.4375, -181.625, -172.8125, -164.0, -155.1875, -146.375, -137.5625, -128.75, -119.9375, -111.125, -102.3125, -93.5, -84.6875, -75.875, -67.0625, -58.25, -49.4375, -40.625, -31.8125, -23.0, -14.1875, -5.375, 3.4375, 12.25, 21.0625, 29.875, 38.6875, 47.5, 56.3125, 65.125, 73.9375, 82.75, 91.5625, 100.375, 109.1875, 118.0, 126.8125, 135.625, 144.4375, 153.25, 162.0625, 170.875, 179.6875, 188.5, 197.3125, 206.125, 214.9375, 223.75, 232.5625, 241.375, 250.1875, 259.0, 267.8125, 276.625, 285.4375, 294.25]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 15.0, 16.0, 29.0, 29.0, 23.0, 57.0, 87.0, 91.0, 173.0, 315.0, 830.0, 6615.0, 1007732.0, 29987.0, 1457.0, 432.0, 204.0, 122.0, 76.0, 62.0, 40.0, 34.0, 23.0, 13.0, 12.0, 10.0, 14.0, 9.0, 12.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.25, -90.1083984375, -86.966796875, -83.8251953125, -80.68359375, -77.5419921875, -74.400390625, -71.2587890625, -68.1171875, -64.9755859375, -61.833984375, -58.6923828125, -55.55078125, -52.4091796875, -49.267578125, -46.1259765625, -42.984375, -39.8427734375, -36.701171875, -33.5595703125, -30.41796875, -27.2763671875, -24.134765625, -20.9931640625, -17.8515625, -14.7099609375, -11.568359375, -8.4267578125, -5.28515625, -2.1435546875, 0.998046875, 4.1396484375, 7.28125, 10.4228515625, 13.564453125, 16.7060546875, 19.84765625, 22.9892578125, 26.130859375, 29.2724609375, 32.4140625, 35.5556640625, 38.697265625, 41.8388671875, 44.98046875, 48.1220703125, 51.263671875, 54.4052734375, 57.546875, 60.6884765625, 63.830078125, 66.9716796875, 70.11328125, 73.2548828125, 76.396484375, 79.5380859375, 82.6796875, 85.8212890625, 88.962890625, 92.1044921875, 95.24609375, 98.3876953125, 101.529296875, 104.6708984375, 107.8125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 10.0, 13.0, 17.0, 34.0, 47.0, 97.0, 158.0, 197.0, 169.0, 95.0, 51.0, 36.0, 23.0, 12.0, 11.0, 6.0, 4.0, 7.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032711029052734375, -0.0031568706035614014, -0.0030426383018493652, -0.002928406000137329, -0.002814173698425293, -0.002699941396713257, -0.0025857090950012207, -0.0024714767932891846, -0.0023572444915771484, -0.0022430121898651123, -0.002128779888153076, -0.00201454758644104, -0.001900315284729004, -0.0017860829830169678, -0.0016718506813049316, -0.0015576183795928955, -0.0014433860778808594, -0.0013291537761688232, -0.0012149214744567871, -0.001100689172744751, -0.0009864568710327148, -0.0008722245693206787, -0.0007579922676086426, -0.0006437599658966064, -0.0005295276641845703, -0.0004152953624725342, -0.00030106306076049805, -0.00018683075904846191, -7.259845733642578e-05, 4.163384437561035e-05, 0.00015586614608764648, 0.0002700984477996826, 0.00038433074951171875, 0.0004985630512237549, 0.000612795352935791, 0.0007270276546478271, 0.0008412599563598633, 0.0009554922580718994, 0.0010697245597839355, 0.0011839568614959717, 0.0012981891632080078, 0.001412421464920044, 0.00152665376663208, 0.0016408860683441162, 0.0017551183700561523, 0.0018693506717681885, 0.0019835829734802246, 0.0020978152751922607, 0.002212047576904297, 0.002326279878616333, 0.002440512180328369, 0.0025547444820404053, 0.0026689767837524414, 0.0027832090854644775, 0.0028974413871765137, 0.00301167368888855, 0.003125905990600586, 0.003240138292312622, 0.003354370594024658, 0.0034686028957366943, 0.0035828351974487305, 0.0036970674991607666, 0.0038112998008728027, 0.003925532102584839, 0.004039764404296875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 7.0, 9.0, 17.0, 23.0, 26.0, 24.0, 72.0, 63.0, 105.0, 149.0, 225.0, 467.0, 1289.0, 6307.0, 361411.0, 668188.0, 7430.0, 1462.0, 545.0, 222.0, 138.0, 100.0, 73.0, 48.0, 43.0, 20.0, 22.0, 13.0, 6.0, 8.0, 11.0, 6.0, 2.0, 1.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.46875, -52.52587890625, -50.5830078125, -48.64013671875, -46.697265625, -44.75439453125, -42.8115234375, -40.86865234375, -38.92578125, -36.98291015625, -35.0400390625, -33.09716796875, -31.154296875, -29.21142578125, -27.2685546875, -25.32568359375, -23.3828125, -21.43994140625, -19.4970703125, -17.55419921875, -15.611328125, -13.66845703125, -11.7255859375, -9.78271484375, -7.83984375, -5.89697265625, -3.9541015625, -2.01123046875, -0.068359375, 1.87451171875, 3.8173828125, 5.76025390625, 7.703125, 9.64599609375, 11.5888671875, 13.53173828125, 15.474609375, 17.41748046875, 19.3603515625, 21.30322265625, 23.24609375, 25.18896484375, 27.1318359375, 29.07470703125, 31.017578125, 32.96044921875, 34.9033203125, 36.84619140625, 38.7890625, 40.73193359375, 42.6748046875, 44.61767578125, 46.560546875, 48.50341796875, 50.4462890625, 52.38916015625, 54.33203125, 56.27490234375, 58.2177734375, 60.16064453125, 62.103515625, 64.04638671875, 65.9892578125, 67.93212890625, 69.875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 14.0, 13.0, 23.0, 27.0, 66.0, 156.0, 311.0, 175.0, 73.0, 32.0, 26.0, 14.0, 9.0, 7.0, 9.0, 8.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-97.0, -94.6630859375, -92.326171875, -89.9892578125, -87.65234375, -85.3154296875, -82.978515625, -80.6416015625, -78.3046875, -75.9677734375, -73.630859375, -71.2939453125, -68.95703125, -66.6201171875, -64.283203125, -61.9462890625, -59.609375, -57.2724609375, -54.935546875, -52.5986328125, -50.26171875, -47.9248046875, -45.587890625, -43.2509765625, -40.9140625, -38.5771484375, -36.240234375, -33.9033203125, -31.56640625, -29.2294921875, -26.892578125, -24.5556640625, -22.21875, -19.8818359375, -17.544921875, -15.2080078125, -12.87109375, -10.5341796875, -8.197265625, -5.8603515625, -3.5234375, -1.1865234375, 1.150390625, 3.4873046875, 5.82421875, 8.1611328125, 10.498046875, 12.8349609375, 15.171875, 17.5087890625, 19.845703125, 22.1826171875, 24.51953125, 26.8564453125, 29.193359375, 31.5302734375, 33.8671875, 36.2041015625, 38.541015625, 40.8779296875, 43.21484375, 45.5517578125, 47.888671875, 50.2255859375, 52.5625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 17.0, 141.0, 624.0, 188.0, 20.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-778.3920288085938, -733.8359985351562, -689.2799682617188, -644.7239379882812, -600.1679077148438, -555.6118774414062, -511.0558776855469, -466.4998474121094, -421.9438171386719, -377.3877868652344, -332.8317565917969, -288.2757568359375, -243.71971130371094, -199.16368103027344, -154.607666015625, -110.0516357421875, -65.49560546875, -20.939579010009766, 23.61644744873047, 68.17247009277344, 112.72850036621094, 157.28453063964844, 201.84054565429688, 246.39657592773438, 290.9526062011719, 335.5086364746094, 380.0646667480469, 424.62066650390625, 469.17669677734375, 513.7327270507812, 558.2887573242188, 602.8447875976562, 647.4007568359375, 691.956787109375, 736.5128173828125, 781.06884765625, 825.6248779296875, 870.180908203125, 914.7369384765625, 959.29296875, 1003.8489990234375, 1048.405029296875, 1092.9610595703125, 1137.51708984375, 1182.0731201171875, 1226.629150390625, 1271.1851806640625, 1315.7412109375, 1360.297119140625, 1404.8531494140625, 1449.4091796875, 1493.9652099609375, 1538.521240234375, 1583.0772705078125, 1627.63330078125, 1672.1893310546875, 1716.745361328125, 1761.3013916015625, 1805.857421875, 1850.4134521484375, 1894.969482421875, 1939.5255126953125, 1984.08154296875, 2028.6375732421875, 2073.193603515625]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 9.0, 29.0, 28.0, 28.0, 49.0, 51.0, 73.0, 92.0, 105.0, 87.0, 73.0, 88.0, 77.0, 50.0, 47.0, 41.0, 30.0, 16.0, 10.0, 10.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-796.7935180664062, -776.0010375976562, -755.20849609375, -734.416015625, -713.6234741210938, -692.8309936523438, -672.0384521484375, -651.2459716796875, -630.4534912109375, -609.6610107421875, -588.8684692382812, -568.0759887695312, -547.283447265625, -526.490966796875, -505.6984558105469, -484.90594482421875, -464.1134033203125, -443.3208923339844, -422.52838134765625, -401.7358703613281, -380.943359375, -360.15087890625, -339.3583679199219, -318.56585693359375, -297.7733459472656, -276.9808349609375, -256.1883239746094, -235.3958282470703, -214.6033172607422, -193.81080627441406, -173.018310546875, -152.22579956054688, -131.433349609375, -110.64083862304688, -89.84833526611328, -69.05583190917969, -48.26332092285156, -27.470809936523438, -6.678306579589844, 14.11419677734375, 34.906707763671875, 55.699214935302734, 76.4917221069336, 97.28422546386719, 118.07673645019531, 138.86924743652344, 159.6617431640625, 180.45425415039062, 201.24676513671875, 222.03927612304688, 242.831787109375, 263.6242980957031, 284.41680908203125, 305.20928955078125, 326.0018005371094, 346.7943115234375, 367.5868225097656, 388.37933349609375, 409.1718444824219, 429.96435546875, 450.7568359375, 471.54937744140625, 492.34185791015625, 513.1343994140625, 533.9268798828125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 19.0, 58.0, 107.0, 386.0, 1631.0, 14854.0, 4116721.0, 56416.0, 3186.0, 609.0, 194.0, 53.0, 17.0, 15.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.9375, -37.6787109375, -35.419921875, -33.1611328125, -30.90234375, -28.6435546875, -26.384765625, -24.1259765625, -21.8671875, -19.6083984375, -17.349609375, -15.0908203125, -12.83203125, -10.5732421875, -8.314453125, -6.0556640625, -3.796875, -1.5380859375, 0.720703125, 2.9794921875, 5.23828125, 7.4970703125, 9.755859375, 12.0146484375, 14.2734375, 16.5322265625, 18.791015625, 21.0498046875, 23.30859375, 25.5673828125, 27.826171875, 30.0849609375, 32.34375, 34.6025390625, 36.861328125, 39.1201171875, 41.37890625, 43.6376953125, 45.896484375, 48.1552734375, 50.4140625, 52.6728515625, 54.931640625, 57.1904296875, 59.44921875, 61.7080078125, 63.966796875, 66.2255859375, 68.484375, 70.7431640625, 73.001953125, 75.2607421875, 77.51953125, 79.7783203125, 82.037109375, 84.2958984375, 86.5546875, 88.8134765625, 91.072265625, 93.3310546875, 95.58984375, 97.8486328125, 100.107421875, 102.3662109375, 104.625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 6.0, 13.0, 15.0, 21.0, 28.0, 34.0, 35.0, 58.0, 54.0, 77.0, 78.0, 90.0, 76.0, 71.0, 57.0, 56.0, 54.0, 33.0, 37.0, 23.0, 20.0, 10.0, 4.0, 13.0, 3.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.1875, -18.4990234375, -17.810546875, -17.1220703125, -16.43359375, -15.7451171875, -15.056640625, -14.3681640625, -13.6796875, -12.9912109375, -12.302734375, -11.6142578125, -10.92578125, -10.2373046875, -9.548828125, -8.8603515625, -8.171875, -7.4833984375, -6.794921875, -6.1064453125, -5.41796875, -4.7294921875, -4.041015625, -3.3525390625, -2.6640625, -1.9755859375, -1.287109375, -0.5986328125, 0.08984375, 0.7783203125, 1.466796875, 2.1552734375, 2.84375, 3.5322265625, 4.220703125, 4.9091796875, 5.59765625, 6.2861328125, 6.974609375, 7.6630859375, 8.3515625, 9.0400390625, 9.728515625, 10.4169921875, 11.10546875, 11.7939453125, 12.482421875, 13.1708984375, 13.859375, 14.5478515625, 15.236328125, 15.9248046875, 16.61328125, 17.3017578125, 17.990234375, 18.6787109375, 19.3671875, 20.0556640625, 20.744140625, 21.4326171875, 22.12109375, 22.8095703125, 23.498046875, 24.1865234375, 24.875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 12.0, 15.0, 21.0, 16.0, 32.0, 45.0, 53.0, 88.0, 109.0, 168.0, 290.0, 524.0, 1193.0, 3371.0, 14355.0, 359055.0, 3785190.0, 22397.0, 4360.0, 1430.0, 584.0, 303.0, 197.0, 140.0, 104.0, 60.0, 46.0, 40.0, 25.0, 16.0, 9.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-37.6875, -36.614013671875, -35.54052734375, -34.467041015625, -33.3935546875, -32.320068359375, -31.24658203125, -30.173095703125, -29.099609375, -28.026123046875, -26.95263671875, -25.879150390625, -24.8056640625, -23.732177734375, -22.65869140625, -21.585205078125, -20.51171875, -19.438232421875, -18.36474609375, -17.291259765625, -16.2177734375, -15.144287109375, -14.07080078125, -12.997314453125, -11.923828125, -10.850341796875, -9.77685546875, -8.703369140625, -7.6298828125, -6.556396484375, -5.48291015625, -4.409423828125, -3.3359375, -2.262451171875, -1.18896484375, -0.115478515625, 0.9580078125, 2.031494140625, 3.10498046875, 4.178466796875, 5.251953125, 6.325439453125, 7.39892578125, 8.472412109375, 9.5458984375, 10.619384765625, 11.69287109375, 12.766357421875, 13.83984375, 14.913330078125, 15.98681640625, 17.060302734375, 18.1337890625, 19.207275390625, 20.28076171875, 21.354248046875, 22.427734375, 23.501220703125, 24.57470703125, 25.648193359375, 26.7216796875, 27.795166015625, 28.86865234375, 29.942138671875, 31.015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 10.0, 13.0, 33.0, 140.0, 3172.0, 564.0, 84.0, 23.0, 22.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15625, -18.46826171875, -17.7802734375, -17.09228515625, -16.404296875, -15.71630859375, -15.0283203125, -14.34033203125, -13.65234375, -12.96435546875, -12.2763671875, -11.58837890625, -10.900390625, -10.21240234375, -9.5244140625, -8.83642578125, -8.1484375, -7.46044921875, -6.7724609375, -6.08447265625, -5.396484375, -4.70849609375, -4.0205078125, -3.33251953125, -2.64453125, -1.95654296875, -1.2685546875, -0.58056640625, 0.107421875, 0.79541015625, 1.4833984375, 2.17138671875, 2.859375, 3.54736328125, 4.2353515625, 4.92333984375, 5.611328125, 6.29931640625, 6.9873046875, 7.67529296875, 8.36328125, 9.05126953125, 9.7392578125, 10.42724609375, 11.115234375, 11.80322265625, 12.4912109375, 13.17919921875, 13.8671875, 14.55517578125, 15.2431640625, 15.93115234375, 16.619140625, 17.30712890625, 17.9951171875, 18.68310546875, 19.37109375, 20.05908203125, 20.7470703125, 21.43505859375, 22.123046875, 22.81103515625, 23.4990234375, 24.18701171875, 24.875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 8.0, 9.0, 25.0, 69.0, 168.0, 239.0, 269.0, 130.0, 51.0, 22.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.85598754882812, -81.0434341430664, -78.23088073730469, -75.41831970214844, -72.60576629638672, -69.793212890625, -66.98065948486328, -64.16810607910156, -61.35554885864258, -58.54299545288086, -55.730438232421875, -52.917884826660156, -50.10533142089844, -47.29277420043945, -44.480220794677734, -41.66766357421875, -38.85511016845703, -36.04255676269531, -33.22999954223633, -30.41744613647461, -27.604890823364258, -24.792335510253906, -21.979782104492188, -19.167226791381836, -16.354671478271484, -13.542116165161133, -10.729561805725098, -7.9170074462890625, -5.104452133178711, -2.2918968200683594, 0.5206565856933594, 3.333211898803711, 6.1457672119140625, 8.958322525024414, 11.77087688446045, 14.583431243896484, 17.395986557006836, 20.208541870117188, 23.021095275878906, 25.833650588989258, 28.64620590209961, 31.45876121520996, 34.27131652832031, 37.08386993408203, 39.89642333984375, 42.708980560302734, 45.52153396606445, 48.33409118652344, 51.146644592285156, 53.959197998046875, 56.77175521850586, 59.58430862426758, 62.39686584472656, 65.20941925048828, 68.02197265625, 70.83452606201172, 73.64707946777344, 76.45963287353516, 79.27218627929688, 82.08474731445312, 84.89730072021484, 87.70985412597656, 90.52240753173828, 93.3349609375, 96.14752197265625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 7.0, 1.0, 9.0, 12.0, 18.0, 20.0, 17.0, 25.0, 38.0, 41.0, 49.0, 45.0, 52.0, 62.0, 60.0, 65.0, 61.0, 72.0, 62.0, 40.0, 48.0, 40.0, 39.0, 26.0, 27.0, 14.0, 16.0, 11.0, 10.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.14964294433594, -32.95511245727539, -31.760578155517578, -30.5660457611084, -29.37151336669922, -28.176982879638672, -26.982450485229492, -25.787918090820312, -24.593385696411133, -23.398853302001953, -22.204320907592773, -21.009788513183594, -19.815258026123047, -18.620723724365234, -17.426193237304688, -16.231660842895508, -15.037128448486328, -13.842596054077148, -12.648063659667969, -11.453532218933105, -10.258999824523926, -9.064467430114746, -7.869935512542725, -6.675403594970703, -5.480871200561523, -4.286338806152344, -3.0918068885803223, -1.8972747325897217, -0.7027425765991211, 0.4917898178100586, 1.68632173538208, 2.8808536529541016, 4.075386047363281, 5.269918441772461, 6.464450359344482, 7.658982276916504, 8.853514671325684, 10.048047065734863, 11.242578506469727, 12.437110900878906, 13.631643295288086, 14.826175689697266, 16.020708084106445, 17.215240478515625, 18.409770965576172, 19.604305267333984, 20.79883575439453, 21.99336814880371, 23.18790054321289, 24.38243293762207, 25.57696533203125, 26.77149772644043, 27.96603012084961, 29.160560607910156, 30.355093002319336, 31.549625396728516, 32.74415588378906, 33.93868637084961, 35.13322067260742, 36.32775115966797, 37.52228546142578, 38.71681594848633, 39.91135025024414, 41.10588073730469, 42.3004150390625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 11.0, 3.0, 14.0, 20.0, 22.0, 41.0, 69.0, 94.0, 170.0, 342.0, 614.0, 1438.0, 4291.0, 21736.0, 257095.0, 685734.0, 64088.0, 8456.0, 2376.0, 904.0, 437.0, 227.0, 133.0, 86.0, 57.0, 32.0, 21.0, 17.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.84375, -51.93701171875, -50.0302734375, -48.12353515625, -46.216796875, -44.31005859375, -42.4033203125, -40.49658203125, -38.58984375, -36.68310546875, -34.7763671875, -32.86962890625, -30.962890625, -29.05615234375, -27.1494140625, -25.24267578125, -23.3359375, -21.42919921875, -19.5224609375, -17.61572265625, -15.708984375, -13.80224609375, -11.8955078125, -9.98876953125, -8.08203125, -6.17529296875, -4.2685546875, -2.36181640625, -0.455078125, 1.45166015625, 3.3583984375, 5.26513671875, 7.171875, 9.07861328125, 10.9853515625, 12.89208984375, 14.798828125, 16.70556640625, 18.6123046875, 20.51904296875, 22.42578125, 24.33251953125, 26.2392578125, 28.14599609375, 30.052734375, 31.95947265625, 33.8662109375, 35.77294921875, 37.6796875, 39.58642578125, 41.4931640625, 43.39990234375, 45.306640625, 47.21337890625, 49.1201171875, 51.02685546875, 52.93359375, 54.84033203125, 56.7470703125, 58.65380859375, 60.560546875, 62.46728515625, 64.3740234375, 66.28076171875, 68.1875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 12.0, 6.0, 14.0, 24.0, 29.0, 37.0, 42.0, 51.0, 55.0, 58.0, 88.0, 90.0, 67.0, 72.0, 53.0, 53.0, 55.0, 48.0, 32.0, 21.0, 27.0, 14.0, 5.0, 7.0, 7.0, 7.0, 4.0, 4.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.125, -18.4423828125, -17.759765625, -17.0771484375, -16.39453125, -15.7119140625, -15.029296875, -14.3466796875, -13.6640625, -12.9814453125, -12.298828125, -11.6162109375, -10.93359375, -10.2509765625, -9.568359375, -8.8857421875, -8.203125, -7.5205078125, -6.837890625, -6.1552734375, -5.47265625, -4.7900390625, -4.107421875, -3.4248046875, -2.7421875, -2.0595703125, -1.376953125, -0.6943359375, -0.01171875, 0.6708984375, 1.353515625, 2.0361328125, 2.71875, 3.4013671875, 4.083984375, 4.7666015625, 5.44921875, 6.1318359375, 6.814453125, 7.4970703125, 8.1796875, 8.8623046875, 9.544921875, 10.2275390625, 10.91015625, 11.5927734375, 12.275390625, 12.9580078125, 13.640625, 14.3232421875, 15.005859375, 15.6884765625, 16.37109375, 17.0537109375, 17.736328125, 18.4189453125, 19.1015625, 19.7841796875, 20.466796875, 21.1494140625, 21.83203125, 22.5146484375, 23.197265625, 23.8798828125, 24.5625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 2.0, 5.0, 6.0, 7.0, 10.0, 19.0, 23.0, 30.0, 38.0, 62.0, 125.0, 205.0, 398.0, 1068.0, 4731.0, 231777.0, 800610.0, 6998.0, 1393.0, 465.0, 223.0, 128.0, 73.0, 34.0, 32.0, 26.0, 17.0, 15.0, 2.0, 9.0, 5.0, 2.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.25, -168.984375, -163.71875, -158.453125, -153.1875, -147.921875, -142.65625, -137.390625, -132.125, -126.859375, -121.59375, -116.328125, -111.0625, -105.796875, -100.53125, -95.265625, -90.0, -84.734375, -79.46875, -74.203125, -68.9375, -63.671875, -58.40625, -53.140625, -47.875, -42.609375, -37.34375, -32.078125, -26.8125, -21.546875, -16.28125, -11.015625, -5.75, -0.484375, 4.78125, 10.046875, 15.3125, 20.578125, 25.84375, 31.109375, 36.375, 41.640625, 46.90625, 52.171875, 57.4375, 62.703125, 67.96875, 73.234375, 78.5, 83.765625, 89.03125, 94.296875, 99.5625, 104.828125, 110.09375, 115.359375, 120.625, 125.890625, 131.15625, 136.421875, 141.6875, 146.953125, 152.21875, 157.484375, 162.75]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 5.0, 10.0, 10.0, 14.0, 33.0, 51.0, 60.0, 82.0, 111.0, 119.0, 125.0, 108.0, 83.0, 65.0, 36.0, 25.0, 20.0, 14.0, 10.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-197.0, -191.5, -186.0, -180.5, -175.0, -169.5, -164.0, -158.5, -153.0, -147.5, -142.0, -136.5, -131.0, -125.5, -120.0, -114.5, -109.0, -103.5, -98.0, -92.5, -87.0, -81.5, -76.0, -70.5, -65.0, -59.5, -54.0, -48.5, -43.0, -37.5, -32.0, -26.5, -21.0, -15.5, -10.0, -4.5, 1.0, 6.5, 12.0, 17.5, 23.0, 28.5, 34.0, 39.5, 45.0, 50.5, 56.0, 61.5, 67.0, 72.5, 78.0, 83.5, 89.0, 94.5, 100.0, 105.5, 111.0, 116.5, 122.0, 127.5, 133.0, 138.5, 144.0, 149.5, 155.0]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 11.0, 9.0, 15.0, 13.0, 23.0, 52.0, 69.0, 104.0, 206.0, 413.0, 1050.0, 4684.0, 76571.0, 943641.0, 17815.0, 2412.0, 742.0, 296.0, 169.0, 101.0, 58.0, 33.0, 25.0, 10.0, 11.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.03125, -42.708984375, -41.38671875, -40.064453125, -38.7421875, -37.419921875, -36.09765625, -34.775390625, -33.453125, -32.130859375, -30.80859375, -29.486328125, -28.1640625, -26.841796875, -25.51953125, -24.197265625, -22.875, -21.552734375, -20.23046875, -18.908203125, -17.5859375, -16.263671875, -14.94140625, -13.619140625, -12.296875, -10.974609375, -9.65234375, -8.330078125, -7.0078125, -5.685546875, -4.36328125, -3.041015625, -1.71875, -0.396484375, 0.92578125, 2.248046875, 3.5703125, 4.892578125, 6.21484375, 7.537109375, 8.859375, 10.181640625, 11.50390625, 12.826171875, 14.1484375, 15.470703125, 16.79296875, 18.115234375, 19.4375, 20.759765625, 22.08203125, 23.404296875, 24.7265625, 26.048828125, 27.37109375, 28.693359375, 30.015625, 31.337890625, 32.66015625, 33.982421875, 35.3046875, 36.626953125, 37.94921875, 39.271484375, 40.59375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 12.0, 3.0, 9.0, 18.0, 24.0, 47.0, 39.0, 62.0, 100.0, 139.0, 172.0, 92.0, 68.0, 58.0, 33.0, 34.0, 16.0, 18.0, 10.0, 6.0, 6.0, 4.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.003055572509765625, -0.0029730796813964844, -0.0028905868530273438, -0.002808094024658203, -0.0027256011962890625, -0.002643108367919922, -0.0025606155395507812, -0.0024781227111816406, -0.0023956298828125, -0.0023131370544433594, -0.0022306442260742188, -0.002148151397705078, -0.0020656585693359375, -0.001983165740966797, -0.0019006729125976562, -0.0018181800842285156, -0.001735687255859375, -0.0016531944274902344, -0.0015707015991210938, -0.0014882087707519531, -0.0014057159423828125, -0.0013232231140136719, -0.0012407302856445312, -0.0011582374572753906, -0.00107574462890625, -0.0009932518005371094, -0.0009107589721679688, -0.0008282661437988281, -0.0007457733154296875, -0.0006632804870605469, -0.0005807876586914062, -0.0004982948303222656, -0.000415802001953125, -0.0003333091735839844, -0.00025081634521484375, -0.00016832351684570312, -8.58306884765625e-05, -3.337860107421875e-06, 7.915496826171875e-05, 0.00016164779663085938, 0.000244140625, 0.0003266334533691406, 0.00040912628173828125, 0.0004916191101074219, 0.0005741119384765625, 0.0006566047668457031, 0.0007390975952148438, 0.0008215904235839844, 0.000904083251953125, 0.0009865760803222656, 0.0010690689086914062, 0.0011515617370605469, 0.0012340545654296875, 0.0013165473937988281, 0.0013990402221679688, 0.0014815330505371094, 0.00156402587890625, 0.0016465187072753906, 0.0017290115356445312, 0.0018115043640136719, 0.0018939971923828125, 0.001976490020751953, 0.0020589828491210938, 0.0021414756774902344, 0.002223968505859375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 9.0, 8.0, 12.0, 14.0, 18.0, 31.0, 54.0, 85.0, 161.0, 309.0, 780.0, 3659.0, 90687.0, 941162.0, 9209.0, 1388.0, 478.0, 200.0, 92.0, 45.0, 35.0, 21.0, 14.0, 5.0, 12.0, 11.0, 6.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.53125, -43.05712890625, -41.5830078125, -40.10888671875, -38.634765625, -37.16064453125, -35.6865234375, -34.21240234375, -32.73828125, -31.26416015625, -29.7900390625, -28.31591796875, -26.841796875, -25.36767578125, -23.8935546875, -22.41943359375, -20.9453125, -19.47119140625, -17.9970703125, -16.52294921875, -15.048828125, -13.57470703125, -12.1005859375, -10.62646484375, -9.15234375, -7.67822265625, -6.2041015625, -4.72998046875, -3.255859375, -1.78173828125, -0.3076171875, 1.16650390625, 2.640625, 4.11474609375, 5.5888671875, 7.06298828125, 8.537109375, 10.01123046875, 11.4853515625, 12.95947265625, 14.43359375, 15.90771484375, 17.3818359375, 18.85595703125, 20.330078125, 21.80419921875, 23.2783203125, 24.75244140625, 26.2265625, 27.70068359375, 29.1748046875, 30.64892578125, 32.123046875, 33.59716796875, 35.0712890625, 36.54541015625, 38.01953125, 39.49365234375, 40.9677734375, 42.44189453125, 43.916015625, 45.39013671875, 46.8642578125, 48.33837890625, 49.8125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 6.0, 7.0, 8.0, 26.0, 45.0, 48.0, 98.0, 138.0, 162.0, 148.0, 117.0, 62.0, 37.0, 22.0, 18.0, 9.0, 6.0, 3.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.796875, -28.857177734375, -27.91748046875, -26.977783203125, -26.0380859375, -25.098388671875, -24.15869140625, -23.218994140625, -22.279296875, -21.339599609375, -20.39990234375, -19.460205078125, -18.5205078125, -17.580810546875, -16.64111328125, -15.701416015625, -14.76171875, -13.822021484375, -12.88232421875, -11.942626953125, -11.0029296875, -10.063232421875, -9.12353515625, -8.183837890625, -7.244140625, -6.304443359375, -5.36474609375, -4.425048828125, -3.4853515625, -2.545654296875, -1.60595703125, -0.666259765625, 0.2734375, 1.213134765625, 2.15283203125, 3.092529296875, 4.0322265625, 4.971923828125, 5.91162109375, 6.851318359375, 7.791015625, 8.730712890625, 9.67041015625, 10.610107421875, 11.5498046875, 12.489501953125, 13.42919921875, 14.368896484375, 15.30859375, 16.248291015625, 17.18798828125, 18.127685546875, 19.0673828125, 20.007080078125, 20.94677734375, 21.886474609375, 22.826171875, 23.765869140625, 24.70556640625, 25.645263671875, 26.5849609375, 27.524658203125, 28.46435546875, 29.404052734375, 30.34375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 75.0, 584.0, 297.0, 35.0, 3.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1130.808349609375, -1083.1214599609375, -1035.4345703125, -987.7477416992188, -940.0609130859375, -892.3740234375, -844.6871337890625, -797.000244140625, -749.3134155273438, -701.6265258789062, -653.939697265625, -606.2528076171875, -558.56591796875, -510.87908935546875, -463.19219970703125, -415.5053405761719, -367.8184814453125, -320.1316223144531, -272.44476318359375, -224.75787353515625, -177.07101440429688, -129.3841552734375, -81.697265625, -34.010406494140625, 13.67645263671875, 61.363319396972656, 109.05018615722656, 156.737060546875, 204.42391967773438, 252.11077880859375, 299.79766845703125, 347.4845275878906, 395.1715087890625, 442.8583679199219, 490.54522705078125, 538.2321166992188, 585.9189453125, 633.6058349609375, 681.292724609375, 728.9796142578125, 776.6664428710938, 824.3533325195312, 872.0401611328125, 919.72705078125, 967.4139404296875, 1015.1007690429688, 1062.78759765625, 1110.4744873046875, 1158.161376953125, 1205.8482666015625, 1253.53515625, 1301.221923828125, 1348.9088134765625, 1396.595703125, 1444.2825927734375, 1491.969482421875, 1539.65625, 1587.3431396484375, 1635.030029296875, 1682.716796875, 1730.4036865234375, 1778.090576171875, 1825.7774658203125, 1873.46435546875, 1921.1512451171875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 11.0, 7.0, 8.0, 18.0, 24.0, 29.0, 19.0, 29.0, 45.0, 35.0, 38.0, 35.0, 37.0, 44.0, 43.0, 45.0, 64.0, 53.0, 41.0, 48.0, 54.0, 36.0, 36.0, 28.0, 37.0, 19.0, 23.0, 16.0, 12.0, 19.0, 6.0, 10.0, 2.0, 2.0, 5.0, 3.0, 2.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-357.4586486816406, -347.0057373046875, -336.5528564453125, -326.0999450683594, -315.64703369140625, -305.19415283203125, -294.7412414550781, -284.288330078125, -273.83544921875, -263.3825378417969, -252.92965698242188, -242.47674560546875, -232.0238494873047, -221.57095336914062, -211.1180419921875, -200.66514587402344, -190.21224975585938, -179.7593536376953, -169.30645751953125, -158.85354614257812, -148.40065002441406, -137.94775390625, -127.4948501586914, -117.04194641113281, -106.58905029296875, -96.13615417480469, -85.6832504272461, -75.2303466796875, -64.77745056152344, -54.32455062866211, -43.87165069580078, -33.41874694824219, -22.965850830078125, -12.512950897216797, -2.0600509643554688, 8.39284896850586, 18.845748901367188, 29.298648834228516, 39.751548767089844, 50.20445251464844, 60.6573486328125, 71.11024475097656, 81.56314849853516, 92.01605224609375, 102.46894836425781, 112.92184448242188, 123.37474822998047, 133.82765197753906, 144.28054809570312, 154.7334442138672, 165.18634033203125, 175.63925170898438, 186.09214782714844, 196.5450439453125, 206.99795532226562, 217.4508514404297, 227.90374755859375, 238.3566436767578, 248.80953979492188, 259.262451171875, 269.71533203125, 280.1682434082031, 290.62115478515625, 301.07403564453125, 311.5269470214844]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 15.0, 12.0, 23.0, 25.0, 76.0, 121.0, 206.0, 462.0, 1016.0, 2721.0, 9488.0, 72748.0, 3666735.0, 413302.0, 20200.0, 4356.0, 1450.0, 633.0, 317.0, 145.0, 81.0, 38.0, 38.0, 23.0, 7.0, 15.0, 5.0, 7.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.84375, -22.693359375, -21.54296875, -20.392578125, -19.2421875, -18.091796875, -16.94140625, -15.791015625, -14.640625, -13.490234375, -12.33984375, -11.189453125, -10.0390625, -8.888671875, -7.73828125, -6.587890625, -5.4375, -4.287109375, -3.13671875, -1.986328125, -0.8359375, 0.314453125, 1.46484375, 2.615234375, 3.765625, 4.916015625, 6.06640625, 7.216796875, 8.3671875, 9.517578125, 10.66796875, 11.818359375, 12.96875, 14.119140625, 15.26953125, 16.419921875, 17.5703125, 18.720703125, 19.87109375, 21.021484375, 22.171875, 23.322265625, 24.47265625, 25.623046875, 26.7734375, 27.923828125, 29.07421875, 30.224609375, 31.375, 32.525390625, 33.67578125, 34.826171875, 35.9765625, 37.126953125, 38.27734375, 39.427734375, 40.578125, 41.728515625, 42.87890625, 44.029296875, 45.1796875, 46.330078125, 47.48046875, 48.630859375, 49.78125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 10.0, 8.0, 10.0, 19.0, 12.0, 28.0, 30.0, 44.0, 59.0, 73.0, 73.0, 86.0, 88.0, 88.0, 60.0, 71.0, 65.0, 52.0, 43.0, 23.0, 18.0, 11.0, 6.0, 3.0, 6.0, 8.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.9375, -22.1318359375, -21.326171875, -20.5205078125, -19.71484375, -18.9091796875, -18.103515625, -17.2978515625, -16.4921875, -15.6865234375, -14.880859375, -14.0751953125, -13.26953125, -12.4638671875, -11.658203125, -10.8525390625, -10.046875, -9.2412109375, -8.435546875, -7.6298828125, -6.82421875, -6.0185546875, -5.212890625, -4.4072265625, -3.6015625, -2.7958984375, -1.990234375, -1.1845703125, -0.37890625, 0.4267578125, 1.232421875, 2.0380859375, 2.84375, 3.6494140625, 4.455078125, 5.2607421875, 6.06640625, 6.8720703125, 7.677734375, 8.4833984375, 9.2890625, 10.0947265625, 10.900390625, 11.7060546875, 12.51171875, 13.3173828125, 14.123046875, 14.9287109375, 15.734375, 16.5400390625, 17.345703125, 18.1513671875, 18.95703125, 19.7626953125, 20.568359375, 21.3740234375, 22.1796875, 22.9853515625, 23.791015625, 24.5966796875, 25.40234375, 26.2080078125, 27.013671875, 27.8193359375, 28.625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 6.0, 10.0, 7.0, 15.0, 20.0, 34.0, 56.0, 115.0, 300.0, 875.0, 2970.0, 16347.0, 332823.0, 3789565.0, 43632.0, 5438.0, 1298.0, 419.0, 132.0, 78.0, 41.0, 24.0, 17.0, 11.0, 8.0, 6.0, 5.0, 6.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-47.03125, -45.61572265625, -44.2001953125, -42.78466796875, -41.369140625, -39.95361328125, -38.5380859375, -37.12255859375, -35.70703125, -34.29150390625, -32.8759765625, -31.46044921875, -30.044921875, -28.62939453125, -27.2138671875, -25.79833984375, -24.3828125, -22.96728515625, -21.5517578125, -20.13623046875, -18.720703125, -17.30517578125, -15.8896484375, -14.47412109375, -13.05859375, -11.64306640625, -10.2275390625, -8.81201171875, -7.396484375, -5.98095703125, -4.5654296875, -3.14990234375, -1.734375, -0.31884765625, 1.0966796875, 2.51220703125, 3.927734375, 5.34326171875, 6.7587890625, 8.17431640625, 9.58984375, 11.00537109375, 12.4208984375, 13.83642578125, 15.251953125, 16.66748046875, 18.0830078125, 19.49853515625, 20.9140625, 22.32958984375, 23.7451171875, 25.16064453125, 26.576171875, 27.99169921875, 29.4072265625, 30.82275390625, 32.23828125, 33.65380859375, 35.0693359375, 36.48486328125, 37.900390625, 39.31591796875, 40.7314453125, 42.14697265625, 43.5625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 9.0, 8.0, 13.0, 14.0, 29.0, 24.0, 37.0, 92.0, 179.0, 494.0, 1506.0, 1092.0, 343.0, 96.0, 46.0, 23.0, 20.0, 8.0, 8.0, 4.0, 5.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.15625, -37.84375, -36.53125, -35.21875, -33.90625, -32.59375, -31.28125, -29.96875, -28.65625, -27.34375, -26.03125, -24.71875, -23.40625, -22.09375, -20.78125, -19.46875, -18.15625, -16.84375, -15.53125, -14.21875, -12.90625, -11.59375, -10.28125, -8.96875, -7.65625, -6.34375, -5.03125, -3.71875, -2.40625, -1.09375, 0.21875, 1.53125, 2.84375, 4.15625, 5.46875, 6.78125, 8.09375, 9.40625, 10.71875, 12.03125, 13.34375, 14.65625, 15.96875, 17.28125, 18.59375, 19.90625, 21.21875, 22.53125, 23.84375, 25.15625, 26.46875, 27.78125, 29.09375, 30.40625, 31.71875, 33.03125, 34.34375, 35.65625, 36.96875, 38.28125, 39.59375, 40.90625, 42.21875, 43.53125, 44.84375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 8.0, 11.0, 27.0, 58.0, 141.0, 327.0, 310.0, 78.0, 22.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-676.4151611328125, -662.9236450195312, -649.4321899414062, -635.940673828125, -622.4491577148438, -608.9576416015625, -595.4661865234375, -581.9746704101562, -568.483154296875, -554.9916381835938, -541.5001831054688, -528.0086669921875, -514.5171508789062, -501.0256652832031, -487.5341491699219, -474.04266357421875, -460.5511474609375, -447.0596618652344, -433.5681457519531, -420.07666015625, -406.58514404296875, -393.0936584472656, -379.6021423339844, -366.11065673828125, -352.6191711425781, -339.127685546875, -325.63616943359375, -312.1446838378906, -298.6531677246094, -285.16168212890625, -271.670166015625, -258.1786804199219, -244.68716430664062, -231.19566345214844, -217.70416259765625, -204.21266174316406, -190.72116088867188, -177.22967529296875, -163.7381591796875, -150.24667358398438, -136.75515747070312, -123.26365661621094, -109.77215576171875, -96.28065490722656, -82.78915405273438, -69.29766082763672, -55.80615997314453, -42.314659118652344, -28.823165893554688, -15.331665992736816, -1.8401660919189453, 11.65133285522461, 25.142833709716797, 38.63433074951172, 52.125831604003906, 65.6173324584961, 79.10883331298828, 92.60033416748047, 106.09183502197266, 119.58332824707031, 133.0748291015625, 146.5663299560547, 160.05783081054688, 173.54933166503906, 187.04083251953125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 10.0, 12.0, 7.0, 14.0, 18.0, 32.0, 24.0, 41.0, 56.0, 63.0, 64.0, 65.0, 73.0, 61.0, 54.0, 67.0, 72.0, 45.0, 49.0, 43.0, 30.0, 19.0, 14.0, 24.0, 10.0, 11.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-232.3013153076172, -225.70785522460938, -219.1143798828125, -212.52090454101562, -205.9274444580078, -199.333984375, -192.74050903320312, -186.14703369140625, -179.55357360839844, -172.96011352539062, -166.36663818359375, -159.77316284179688, -153.17970275878906, -146.58624267578125, -139.99276733398438, -133.3992919921875, -126.80583190917969, -120.21236419677734, -113.618896484375, -107.02542877197266, -100.43196105957031, -93.83849334716797, -87.24502563476562, -80.65155792236328, -74.05809020996094, -67.4646224975586, -60.87115478515625, -54.277687072753906, -47.68421936035156, -41.09075164794922, -34.497283935546875, -27.90381622314453, -21.310333251953125, -14.716865539550781, -8.123397827148438, -1.5299301147460938, 5.06353759765625, 11.657005310058594, 18.250473022460938, 24.84394073486328, 31.437408447265625, 38.03087615966797, 44.62434387207031, 51.217811584472656, 57.811279296875, 64.40474700927734, 70.99821472167969, 77.59168243408203, 84.18515014648438, 90.77861785888672, 97.37208557128906, 103.9655532836914, 110.55902099609375, 117.1524887084961, 123.74595642089844, 130.33941650390625, 136.93289184570312, 143.5263671875, 150.1198272705078, 156.71328735351562, 163.3067626953125, 169.90023803710938, 176.4936981201172, 183.087158203125, 189.68063354492188]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 6.0, 6.0, 5.0, 9.0, 14.0, 19.0, 27.0, 37.0, 53.0, 90.0, 120.0, 239.0, 353.0, 644.0, 1197.0, 2570.0, 6756.0, 23426.0, 113815.0, 619617.0, 223538.0, 38646.0, 10258.0, 3635.0, 1560.0, 721.0, 451.0, 259.0, 153.0, 102.0, 68.0, 44.0, 36.0, 24.0, 17.0, 12.0, 5.0, 10.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.3125, -35.0888671875, -33.865234375, -32.6416015625, -31.41796875, -30.1943359375, -28.970703125, -27.7470703125, -26.5234375, -25.2998046875, -24.076171875, -22.8525390625, -21.62890625, -20.4052734375, -19.181640625, -17.9580078125, -16.734375, -15.5107421875, -14.287109375, -13.0634765625, -11.83984375, -10.6162109375, -9.392578125, -8.1689453125, -6.9453125, -5.7216796875, -4.498046875, -3.2744140625, -2.05078125, -0.8271484375, 0.396484375, 1.6201171875, 2.84375, 4.0673828125, 5.291015625, 6.5146484375, 7.73828125, 8.9619140625, 10.185546875, 11.4091796875, 12.6328125, 13.8564453125, 15.080078125, 16.3037109375, 17.52734375, 18.7509765625, 19.974609375, 21.1982421875, 22.421875, 23.6455078125, 24.869140625, 26.0927734375, 27.31640625, 28.5400390625, 29.763671875, 30.9873046875, 32.2109375, 33.4345703125, 34.658203125, 35.8818359375, 37.10546875, 38.3291015625, 39.552734375, 40.7763671875, 42.0]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 5.0, 18.0, 15.0, 19.0, 20.0, 41.0, 51.0, 74.0, 69.0, 95.0, 92.0, 109.0, 68.0, 66.0, 68.0, 49.0, 46.0, 35.0, 16.0, 12.0, 8.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.28125, -22.4765625, -21.671875, -20.8671875, -20.0625, -19.2578125, -18.453125, -17.6484375, -16.84375, -16.0390625, -15.234375, -14.4296875, -13.625, -12.8203125, -12.015625, -11.2109375, -10.40625, -9.6015625, -8.796875, -7.9921875, -7.1875, -6.3828125, -5.578125, -4.7734375, -3.96875, -3.1640625, -2.359375, -1.5546875, -0.75, 0.0546875, 0.859375, 1.6640625, 2.46875, 3.2734375, 4.078125, 4.8828125, 5.6875, 6.4921875, 7.296875, 8.1015625, 8.90625, 9.7109375, 10.515625, 11.3203125, 12.125, 12.9296875, 13.734375, 14.5390625, 15.34375, 16.1484375, 16.953125, 17.7578125, 18.5625, 19.3671875, 20.171875, 20.9765625, 21.78125, 22.5859375, 23.390625, 24.1953125, 25.0, 25.8046875, 26.609375, 27.4140625, 28.21875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 12.0, 12.0, 18.0, 41.0, 34.0, 67.0, 99.0, 194.0, 389.0, 1350.0, 8918.0, 979397.0, 53767.0, 2939.0, 672.0, 269.0, 126.0, 88.0, 38.0, 34.0, 19.0, 13.0, 13.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-200.375, -194.4375, -188.5, -182.5625, -176.625, -170.6875, -164.75, -158.8125, -152.875, -146.9375, -141.0, -135.0625, -129.125, -123.1875, -117.25, -111.3125, -105.375, -99.4375, -93.5, -87.5625, -81.625, -75.6875, -69.75, -63.8125, -57.875, -51.9375, -46.0, -40.0625, -34.125, -28.1875, -22.25, -16.3125, -10.375, -4.4375, 1.5, 7.4375, 13.375, 19.3125, 25.25, 31.1875, 37.125, 43.0625, 49.0, 54.9375, 60.875, 66.8125, 72.75, 78.6875, 84.625, 90.5625, 96.5, 102.4375, 108.375, 114.3125, 120.25, 126.1875, 132.125, 138.0625, 144.0, 149.9375, 155.875, 161.8125, 167.75, 173.6875, 179.625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 8.0, 4.0, 4.0, 25.0, 21.0, 43.0, 72.0, 107.0, 130.0, 146.0, 128.0, 119.0, 83.0, 46.0, 23.0, 14.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-222.5, -216.587890625, -210.67578125, -204.763671875, -198.8515625, -192.939453125, -187.02734375, -181.115234375, -175.203125, -169.291015625, -163.37890625, -157.466796875, -151.5546875, -145.642578125, -139.73046875, -133.818359375, -127.90625, -121.994140625, -116.08203125, -110.169921875, -104.2578125, -98.345703125, -92.43359375, -86.521484375, -80.609375, -74.697265625, -68.78515625, -62.873046875, -56.9609375, -51.048828125, -45.13671875, -39.224609375, -33.3125, -27.400390625, -21.48828125, -15.576171875, -9.6640625, -3.751953125, 2.16015625, 8.072265625, 13.984375, 19.896484375, 25.80859375, 31.720703125, 37.6328125, 43.544921875, 49.45703125, 55.369140625, 61.28125, 67.193359375, 73.10546875, 79.017578125, 84.9296875, 90.841796875, 96.75390625, 102.666015625, 108.578125, 114.490234375, 120.40234375, 126.314453125, 132.2265625, 138.138671875, 144.05078125, 149.962890625, 155.875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 8.0, 11.0, 13.0, 12.0, 25.0, 30.0, 42.0, 81.0, 141.0, 228.0, 608.0, 2022.0, 14382.0, 988254.0, 38092.0, 3057.0, 793.0, 317.0, 150.0, 86.0, 54.0, 42.0, 29.0, 14.0, 17.0, 7.0, 8.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.875, -62.94677734375, -61.0185546875, -59.09033203125, -57.162109375, -55.23388671875, -53.3056640625, -51.37744140625, -49.44921875, -47.52099609375, -45.5927734375, -43.66455078125, -41.736328125, -39.80810546875, -37.8798828125, -35.95166015625, -34.0234375, -32.09521484375, -30.1669921875, -28.23876953125, -26.310546875, -24.38232421875, -22.4541015625, -20.52587890625, -18.59765625, -16.66943359375, -14.7412109375, -12.81298828125, -10.884765625, -8.95654296875, -7.0283203125, -5.10009765625, -3.171875, -1.24365234375, 0.6845703125, 2.61279296875, 4.541015625, 6.46923828125, 8.3974609375, 10.32568359375, 12.25390625, 14.18212890625, 16.1103515625, 18.03857421875, 19.966796875, 21.89501953125, 23.8232421875, 25.75146484375, 27.6796875, 29.60791015625, 31.5361328125, 33.46435546875, 35.392578125, 37.32080078125, 39.2490234375, 41.17724609375, 43.10546875, 45.03369140625, 46.9619140625, 48.89013671875, 50.818359375, 52.74658203125, 54.6748046875, 56.60302734375, 58.53125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 6.0, 15.0, 23.0, 21.0, 27.0, 35.0, 79.0, 133.0, 242.0, 172.0, 75.0, 41.0, 38.0, 22.0, 15.0, 12.0, 9.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.004375457763671875, -0.004262089729309082, -0.004148721694946289, -0.004035353660583496, -0.003921985626220703, -0.00380861759185791, -0.003695249557495117, -0.0035818815231323242, -0.0034685134887695312, -0.0033551454544067383, -0.0032417774200439453, -0.0031284093856811523, -0.0030150413513183594, -0.0029016733169555664, -0.0027883052825927734, -0.0026749372482299805, -0.0025615692138671875, -0.0024482011795043945, -0.0023348331451416016, -0.0022214651107788086, -0.0021080970764160156, -0.0019947290420532227, -0.0018813610076904297, -0.0017679929733276367, -0.0016546249389648438, -0.0015412569046020508, -0.0014278888702392578, -0.0013145208358764648, -0.0012011528015136719, -0.001087784767150879, -0.0009744167327880859, -0.000861048698425293, -0.0007476806640625, -0.000634312629699707, -0.0005209445953369141, -0.0004075765609741211, -0.0002942085266113281, -0.00018084049224853516, -6.747245788574219e-05, 4.589557647705078e-05, 0.00015926361083984375, 0.0002726316452026367, 0.0003859996795654297, 0.0004993677139282227, 0.0006127357482910156, 0.0007261037826538086, 0.0008394718170166016, 0.0009528398513793945, 0.0010662078857421875, 0.0011795759201049805, 0.0012929439544677734, 0.0014063119888305664, 0.0015196800231933594, 0.0016330480575561523, 0.0017464160919189453, 0.0018597841262817383, 0.0019731521606445312, 0.0020865201950073242, 0.002199888229370117, 0.00231325626373291, 0.002426624298095703, 0.002539992332458496, 0.002653360366821289, 0.002766728401184082, 0.002880096435546875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 9.0, 5.0, 12.0, 27.0, 30.0, 39.0, 50.0, 55.0, 101.0, 154.0, 267.0, 503.0, 1326.0, 5466.0, 87583.0, 935833.0, 13127.0, 2249.0, 777.0, 356.0, 195.0, 111.0, 64.0, 58.0, 33.0, 29.0, 20.0, 16.0, 13.0, 8.0, 11.0, 3.0, 4.0, 3.0, 0.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.3125, -41.830078125, -40.34765625, -38.865234375, -37.3828125, -35.900390625, -34.41796875, -32.935546875, -31.453125, -29.970703125, -28.48828125, -27.005859375, -25.5234375, -24.041015625, -22.55859375, -21.076171875, -19.59375, -18.111328125, -16.62890625, -15.146484375, -13.6640625, -12.181640625, -10.69921875, -9.216796875, -7.734375, -6.251953125, -4.76953125, -3.287109375, -1.8046875, -0.322265625, 1.16015625, 2.642578125, 4.125, 5.607421875, 7.08984375, 8.572265625, 10.0546875, 11.537109375, 13.01953125, 14.501953125, 15.984375, 17.466796875, 18.94921875, 20.431640625, 21.9140625, 23.396484375, 24.87890625, 26.361328125, 27.84375, 29.326171875, 30.80859375, 32.291015625, 33.7734375, 35.255859375, 36.73828125, 38.220703125, 39.703125, 41.185546875, 42.66796875, 44.150390625, 45.6328125, 47.115234375, 48.59765625, 50.080078125, 51.5625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 6.0, 4.0, 10.0, 14.0, 13.0, 30.0, 53.0, 96.0, 191.0, 228.0, 140.0, 74.0, 44.0, 18.0, 13.0, 10.0, 13.0, 13.0, 3.0, 5.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.25, -35.09326171875, -33.9365234375, -32.77978515625, -31.623046875, -30.46630859375, -29.3095703125, -28.15283203125, -26.99609375, -25.83935546875, -24.6826171875, -23.52587890625, -22.369140625, -21.21240234375, -20.0556640625, -18.89892578125, -17.7421875, -16.58544921875, -15.4287109375, -14.27197265625, -13.115234375, -11.95849609375, -10.8017578125, -9.64501953125, -8.48828125, -7.33154296875, -6.1748046875, -5.01806640625, -3.861328125, -2.70458984375, -1.5478515625, -0.39111328125, 0.765625, 1.92236328125, 3.0791015625, 4.23583984375, 5.392578125, 6.54931640625, 7.7060546875, 8.86279296875, 10.01953125, 11.17626953125, 12.3330078125, 13.48974609375, 14.646484375, 15.80322265625, 16.9599609375, 18.11669921875, 19.2734375, 20.43017578125, 21.5869140625, 22.74365234375, 23.900390625, 25.05712890625, 26.2138671875, 27.37060546875, 28.52734375, 29.68408203125, 30.8408203125, 31.99755859375, 33.154296875, 34.31103515625, 35.4677734375, 36.62451171875, 37.78125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 28.0, 203.0, 483.0, 211.0, 36.0, 11.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-652.607666015625, -624.6851196289062, -596.7625732421875, -568.8400268554688, -540.91748046875, -512.9949340820312, -485.0724182128906, -457.1498718261719, -429.2273254394531, -401.3047790527344, -373.3822326660156, -345.459716796875, -317.53717041015625, -289.6146240234375, -261.69207763671875, -233.76953125, -205.84698486328125, -177.9244384765625, -150.00189208984375, -122.07936096191406, -94.15681457519531, -66.23426818847656, -38.311737060546875, -10.389190673828125, 17.533355712890625, 45.45589828491211, 73.3784408569336, 101.30097961425781, 129.22352600097656, 157.1460723876953, 185.068603515625, 212.99114990234375, 240.9136962890625, 268.83624267578125, 296.7587890625, 324.68133544921875, 352.6038818359375, 380.52642822265625, 408.4489440917969, 436.3714904785156, 464.2940368652344, 492.2165832519531, 520.1390991210938, 548.0616455078125, 575.9841918945312, 603.90673828125, 631.8292846679688, 659.7518310546875, 687.6743774414062, 715.596923828125, 743.5194702148438, 771.4420166015625, 799.3645629882812, 827.287109375, 855.2095947265625, 883.1322021484375, 911.0546875, 938.9772338867188, 966.8997802734375, 994.8223266601562, 1022.744873046875, 1050.6673583984375, 1078.5899658203125, 1106.512451171875, 1134.43505859375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 6.0, 15.0, 9.0, 18.0, 22.0, 26.0, 26.0, 27.0, 39.0, 30.0, 39.0, 44.0, 35.0, 33.0, 62.0, 57.0, 60.0, 57.0, 59.0, 52.0, 35.0, 45.0, 30.0, 27.0, 25.0, 28.0, 7.0, 11.0, 17.0, 11.0, 6.0, 5.0, 7.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-281.2420349121094, -271.57293701171875, -261.90380859375, -252.23471069335938, -242.56561279296875, -232.89651489257812, -223.22740173339844, -213.55828857421875, -203.88919067382812, -194.2200927734375, -184.5509796142578, -174.88186645507812, -165.2127685546875, -155.54367065429688, -145.8745574951172, -136.2054443359375, -126.53634643554688, -116.86724090576172, -107.19813537597656, -97.5290298461914, -87.85992431640625, -78.1908187866211, -68.52171325683594, -58.85260772705078, -49.183502197265625, -39.51439666748047, -29.845291137695312, -20.176185607910156, -10.507080078125, -0.8379745483398438, 8.831130981445312, 18.50023651123047, 28.16937255859375, 37.838478088378906, 47.50758361816406, 57.17668914794922, 66.84579467773438, 76.51490020751953, 86.18400573730469, 95.85311126708984, 105.522216796875, 115.19132232666016, 124.86042785644531, 134.529541015625, 144.19863891601562, 153.86773681640625, 163.53684997558594, 173.20596313476562, 182.87506103515625, 192.54415893554688, 202.21327209472656, 211.88238525390625, 221.55148315429688, 231.2205810546875, 240.8896942138672, 250.55880737304688, 260.2279052734375, 269.8970031738281, 279.56610107421875, 289.2352294921875, 298.9043273925781, 308.57342529296875, 318.2425537109375, 327.9116516113281, 337.58074951171875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 10.0, 11.0, 22.0, 41.0, 81.0, 190.0, 487.0, 1362.0, 4516.0, 26114.0, 3121207.0, 1018680.0, 16430.0, 3283.0, 1030.0, 423.0, 182.0, 99.0, 38.0, 32.0, 19.0, 11.0, 14.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-44.78125, -43.5341796875, -42.287109375, -41.0400390625, -39.79296875, -38.5458984375, -37.298828125, -36.0517578125, -34.8046875, -33.5576171875, -32.310546875, -31.0634765625, -29.81640625, -28.5693359375, -27.322265625, -26.0751953125, -24.828125, -23.5810546875, -22.333984375, -21.0869140625, -19.83984375, -18.5927734375, -17.345703125, -16.0986328125, -14.8515625, -13.6044921875, -12.357421875, -11.1103515625, -9.86328125, -8.6162109375, -7.369140625, -6.1220703125, -4.875, -3.6279296875, -2.380859375, -1.1337890625, 0.11328125, 1.3603515625, 2.607421875, 3.8544921875, 5.1015625, 6.3486328125, 7.595703125, 8.8427734375, 10.08984375, 11.3369140625, 12.583984375, 13.8310546875, 15.078125, 16.3251953125, 17.572265625, 18.8193359375, 20.06640625, 21.3134765625, 22.560546875, 23.8076171875, 25.0546875, 26.3017578125, 27.548828125, 28.7958984375, 30.04296875, 31.2900390625, 32.537109375, 33.7841796875, 35.03125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 8.0, 8.0, 12.0, 17.0, 11.0, 26.0, 38.0, 47.0, 46.0, 59.0, 67.0, 65.0, 76.0, 81.0, 70.0, 64.0, 43.0, 51.0, 53.0, 40.0, 25.0, 18.0, 21.0, 14.0, 11.0, 3.0, 5.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.125, -13.54150390625, -12.9580078125, -12.37451171875, -11.791015625, -11.20751953125, -10.6240234375, -10.04052734375, -9.45703125, -8.87353515625, -8.2900390625, -7.70654296875, -7.123046875, -6.53955078125, -5.9560546875, -5.37255859375, -4.7890625, -4.20556640625, -3.6220703125, -3.03857421875, -2.455078125, -1.87158203125, -1.2880859375, -0.70458984375, -0.12109375, 0.46240234375, 1.0458984375, 1.62939453125, 2.212890625, 2.79638671875, 3.3798828125, 3.96337890625, 4.546875, 5.13037109375, 5.7138671875, 6.29736328125, 6.880859375, 7.46435546875, 8.0478515625, 8.63134765625, 9.21484375, 9.79833984375, 10.3818359375, 10.96533203125, 11.548828125, 12.13232421875, 12.7158203125, 13.29931640625, 13.8828125, 14.46630859375, 15.0498046875, 15.63330078125, 16.216796875, 16.80029296875, 17.3837890625, 17.96728515625, 18.55078125, 19.13427734375, 19.7177734375, 20.30126953125, 20.884765625, 21.46826171875, 22.0517578125, 22.63525390625, 23.21875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 9.0, 12.0, 16.0, 32.0, 64.0, 134.0, 294.0, 735.0, 2084.0, 7545.0, 45121.0, 3242508.0, 862942.0, 25316.0, 4924.0, 1561.0, 570.0, 219.0, 87.0, 53.0, 18.0, 12.0, 3.0, 8.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.875, -36.847900390625, -35.82080078125, -34.793701171875, -33.7666015625, -32.739501953125, -31.71240234375, -30.685302734375, -29.658203125, -28.631103515625, -27.60400390625, -26.576904296875, -25.5498046875, -24.522705078125, -23.49560546875, -22.468505859375, -21.44140625, -20.414306640625, -19.38720703125, -18.360107421875, -17.3330078125, -16.305908203125, -15.27880859375, -14.251708984375, -13.224609375, -12.197509765625, -11.17041015625, -10.143310546875, -9.1162109375, -8.089111328125, -7.06201171875, -6.034912109375, -5.0078125, -3.980712890625, -2.95361328125, -1.926513671875, -0.8994140625, 0.127685546875, 1.15478515625, 2.181884765625, 3.208984375, 4.236083984375, 5.26318359375, 6.290283203125, 7.3173828125, 8.344482421875, 9.37158203125, 10.398681640625, 11.42578125, 12.452880859375, 13.47998046875, 14.507080078125, 15.5341796875, 16.561279296875, 17.58837890625, 18.615478515625, 19.642578125, 20.669677734375, 21.69677734375, 22.723876953125, 23.7509765625, 24.778076171875, 25.80517578125, 26.832275390625, 27.859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 9.0, 8.0, 5.0, 18.0, 19.0, 47.0, 104.0, 272.0, 795.0, 1473.0, 811.0, 251.0, 111.0, 47.0, 35.0, 22.0, 11.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.65625, -35.65478515625, -34.6533203125, -33.65185546875, -32.650390625, -31.64892578125, -30.6474609375, -29.64599609375, -28.64453125, -27.64306640625, -26.6416015625, -25.64013671875, -24.638671875, -23.63720703125, -22.6357421875, -21.63427734375, -20.6328125, -19.63134765625, -18.6298828125, -17.62841796875, -16.626953125, -15.62548828125, -14.6240234375, -13.62255859375, -12.62109375, -11.61962890625, -10.6181640625, -9.61669921875, -8.615234375, -7.61376953125, -6.6123046875, -5.61083984375, -4.609375, -3.60791015625, -2.6064453125, -1.60498046875, -0.603515625, 0.39794921875, 1.3994140625, 2.40087890625, 3.40234375, 4.40380859375, 5.4052734375, 6.40673828125, 7.408203125, 8.40966796875, 9.4111328125, 10.41259765625, 11.4140625, 12.41552734375, 13.4169921875, 14.41845703125, 15.419921875, 16.42138671875, 17.4228515625, 18.42431640625, 19.42578125, 20.42724609375, 21.4287109375, 22.43017578125, 23.431640625, 24.43310546875, 25.4345703125, 26.43603515625, 27.4375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 4.0, 9.0, 28.0, 34.0, 124.0, 235.0, 282.0, 168.0, 67.0, 21.0, 7.0, 8.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-300.57952880859375, -292.78155517578125, -284.9836120605469, -277.1856384277344, -269.3876647949219, -261.5897216796875, -253.791748046875, -245.99378967285156, -238.19583129882812, -230.3978729248047, -222.5998992919922, -214.80194091796875, -207.0039825439453, -199.20602416992188, -191.40805053710938, -183.61009216308594, -175.81211853027344, -168.01416015625, -160.2161865234375, -152.41822814941406, -144.62026977539062, -136.82229614257812, -129.0243377685547, -121.22637939453125, -113.42841339111328, -105.63044738769531, -97.83248901367188, -90.0345230102539, -82.23655700683594, -74.4385986328125, -66.64063262939453, -58.84267044067383, -51.04472351074219, -43.246761322021484, -35.44879913330078, -27.650833129882812, -19.85287094116211, -12.054908752441406, -4.2569427490234375, 3.5410194396972656, 11.338981628417969, 19.136943817138672, 26.934907913208008, 34.732872009277344, 42.53083419799805, 50.32879638671875, 58.12676239013672, 65.92472839355469, 73.72268676757812, 81.5206527709961, 89.31861114501953, 97.1165771484375, 104.91453552246094, 112.7125015258789, 120.51046752929688, 128.3084259033203, 136.10638427734375, 143.9043426513672, 151.7023162841797, 159.50027465820312, 167.29823303222656, 175.09619140625, 182.8941650390625, 190.69212341308594, 198.49009704589844]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 2.0, 2.0, 9.0, 10.0, 18.0, 12.0, 18.0, 23.0, 23.0, 31.0, 37.0, 42.0, 52.0, 46.0, 53.0, 45.0, 63.0, 54.0, 65.0, 67.0, 48.0, 50.0, 48.0, 39.0, 36.0, 19.0, 18.0, 13.0, 11.0, 12.0, 5.0, 5.0, 6.0, 5.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-140.1543426513672, -135.87466430664062, -131.59500122070312, -127.31532287597656, -123.03565216064453, -118.7559814453125, -114.47630310058594, -110.1966323852539, -105.91696166992188, -101.63729095458984, -97.35761260986328, -93.07794189453125, -88.79827117919922, -84.51860046386719, -80.23892211914062, -75.9592514038086, -71.67957305908203, -67.39990234375, -63.1202278137207, -58.840553283691406, -54.560882568359375, -50.28120803833008, -46.00153350830078, -41.72186279296875, -37.44218826293945, -33.162513732910156, -28.882843017578125, -24.603168487548828, -20.323495864868164, -16.0438232421875, -11.764148712158203, -7.484476089477539, -3.204803466796875, 1.0748696327209473, 5.3545427322387695, 9.63421630859375, 13.913888931274414, 18.193561553955078, 22.473236083984375, 26.75290870666504, 31.032581329345703, 35.312255859375, 39.59192657470703, 43.87160110473633, 48.151275634765625, 52.430946350097656, 56.71062088012695, 60.99029541015625, 65.26996612548828, 69.54963684082031, 73.82931518554688, 78.1089859008789, 82.38865661621094, 86.6683349609375, 90.94800567626953, 95.22767639160156, 99.50735473632812, 103.78702545166016, 108.06670379638672, 112.34637451171875, 116.62604522705078, 120.90571594238281, 125.18539428710938, 129.46507263183594, 133.74473571777344]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 6.0, 6.0, 8.0, 15.0, 23.0, 26.0, 37.0, 40.0, 66.0, 107.0, 173.0, 245.0, 431.0, 835.0, 1737.0, 4306.0, 12966.0, 51363.0, 291896.0, 547653.0, 102197.0, 22615.0, 6688.0, 2457.0, 1091.0, 579.0, 350.0, 194.0, 150.0, 77.0, 68.0, 42.0, 29.0, 20.0, 18.0, 14.0, 3.0, 9.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-31.171875, -30.28662109375, -29.4013671875, -28.51611328125, -27.630859375, -26.74560546875, -25.8603515625, -24.97509765625, -24.08984375, -23.20458984375, -22.3193359375, -21.43408203125, -20.548828125, -19.66357421875, -18.7783203125, -17.89306640625, -17.0078125, -16.12255859375, -15.2373046875, -14.35205078125, -13.466796875, -12.58154296875, -11.6962890625, -10.81103515625, -9.92578125, -9.04052734375, -8.1552734375, -7.27001953125, -6.384765625, -5.49951171875, -4.6142578125, -3.72900390625, -2.84375, -1.95849609375, -1.0732421875, -0.18798828125, 0.697265625, 1.58251953125, 2.4677734375, 3.35302734375, 4.23828125, 5.12353515625, 6.0087890625, 6.89404296875, 7.779296875, 8.66455078125, 9.5498046875, 10.43505859375, 11.3203125, 12.20556640625, 13.0908203125, 13.97607421875, 14.861328125, 15.74658203125, 16.6318359375, 17.51708984375, 18.40234375, 19.28759765625, 20.1728515625, 21.05810546875, 21.943359375, 22.82861328125, 23.7138671875, 24.59912109375, 25.484375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 10.0, 10.0, 5.0, 13.0, 15.0, 17.0, 31.0, 45.0, 39.0, 48.0, 51.0, 61.0, 63.0, 60.0, 73.0, 68.0, 64.0, 61.0, 60.0, 42.0, 47.0, 24.0, 16.0, 20.0, 14.0, 14.0, 4.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.4921875, -12.9346923828125, -12.377197265625, -11.8197021484375, -11.26220703125, -10.7047119140625, -10.147216796875, -9.5897216796875, -9.0322265625, -8.4747314453125, -7.917236328125, -7.3597412109375, -6.80224609375, -6.2447509765625, -5.687255859375, -5.1297607421875, -4.572265625, -4.0147705078125, -3.457275390625, -2.8997802734375, -2.34228515625, -1.7847900390625, -1.227294921875, -0.6697998046875, -0.1123046875, 0.4451904296875, 1.002685546875, 1.5601806640625, 2.11767578125, 2.6751708984375, 3.232666015625, 3.7901611328125, 4.34765625, 4.9051513671875, 5.462646484375, 6.0201416015625, 6.57763671875, 7.1351318359375, 7.692626953125, 8.2501220703125, 8.8076171875, 9.3651123046875, 9.922607421875, 10.4801025390625, 11.03759765625, 11.5950927734375, 12.152587890625, 12.7100830078125, 13.267578125, 13.8250732421875, 14.382568359375, 14.9400634765625, 15.49755859375, 16.0550537109375, 16.612548828125, 17.1700439453125, 17.7275390625, 18.2850341796875, 18.842529296875, 19.4000244140625, 19.95751953125, 20.5150146484375, 21.072509765625, 21.6300048828125, 22.1875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 6.0, 5.0, 7.0, 6.0, 17.0, 16.0, 26.0, 31.0, 55.0, 79.0, 160.0, 226.0, 466.0, 1040.0, 3498.0, 19828.0, 726895.0, 279090.0, 12607.0, 2649.0, 872.0, 415.0, 182.0, 127.0, 76.0, 55.0, 36.0, 32.0, 15.0, 12.0, 7.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.375, -69.205078125, -67.03515625, -64.865234375, -62.6953125, -60.525390625, -58.35546875, -56.185546875, -54.015625, -51.845703125, -49.67578125, -47.505859375, -45.3359375, -43.166015625, -40.99609375, -38.826171875, -36.65625, -34.486328125, -32.31640625, -30.146484375, -27.9765625, -25.806640625, -23.63671875, -21.466796875, -19.296875, -17.126953125, -14.95703125, -12.787109375, -10.6171875, -8.447265625, -6.27734375, -4.107421875, -1.9375, 0.232421875, 2.40234375, 4.572265625, 6.7421875, 8.912109375, 11.08203125, 13.251953125, 15.421875, 17.591796875, 19.76171875, 21.931640625, 24.1015625, 26.271484375, 28.44140625, 30.611328125, 32.78125, 34.951171875, 37.12109375, 39.291015625, 41.4609375, 43.630859375, 45.80078125, 47.970703125, 50.140625, 52.310546875, 54.48046875, 56.650390625, 58.8203125, 60.990234375, 63.16015625, 65.330078125, 67.5]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 6.0, 7.0, 15.0, 9.0, 12.0, 23.0, 16.0, 37.0, 41.0, 45.0, 61.0, 61.0, 68.0, 77.0, 66.0, 67.0, 76.0, 62.0, 50.0, 39.0, 34.0, 32.0, 24.0, 18.0, 16.0, 13.0, 10.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.0, -62.748046875, -60.49609375, -58.244140625, -55.9921875, -53.740234375, -51.48828125, -49.236328125, -46.984375, -44.732421875, -42.48046875, -40.228515625, -37.9765625, -35.724609375, -33.47265625, -31.220703125, -28.96875, -26.716796875, -24.46484375, -22.212890625, -19.9609375, -17.708984375, -15.45703125, -13.205078125, -10.953125, -8.701171875, -6.44921875, -4.197265625, -1.9453125, 0.306640625, 2.55859375, 4.810546875, 7.0625, 9.314453125, 11.56640625, 13.818359375, 16.0703125, 18.322265625, 20.57421875, 22.826171875, 25.078125, 27.330078125, 29.58203125, 31.833984375, 34.0859375, 36.337890625, 38.58984375, 40.841796875, 43.09375, 45.345703125, 47.59765625, 49.849609375, 52.1015625, 54.353515625, 56.60546875, 58.857421875, 61.109375, 63.361328125, 65.61328125, 67.865234375, 70.1171875, 72.369140625, 74.62109375, 76.873046875, 79.125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 6.0, 6.0, 8.0, 15.0, 24.0, 55.0, 71.0, 162.0, 665.0, 5262.0, 1011060.0, 29058.0, 1589.0, 333.0, 106.0, 49.0, 25.0, 21.0, 4.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.125, -70.10595703125, -68.0869140625, -66.06787109375, -64.048828125, -62.02978515625, -60.0107421875, -57.99169921875, -55.97265625, -53.95361328125, -51.9345703125, -49.91552734375, -47.896484375, -45.87744140625, -43.8583984375, -41.83935546875, -39.8203125, -37.80126953125, -35.7822265625, -33.76318359375, -31.744140625, -29.72509765625, -27.7060546875, -25.68701171875, -23.66796875, -21.64892578125, -19.6298828125, -17.61083984375, -15.591796875, -13.57275390625, -11.5537109375, -9.53466796875, -7.515625, -5.49658203125, -3.4775390625, -1.45849609375, 0.560546875, 2.57958984375, 4.5986328125, 6.61767578125, 8.63671875, 10.65576171875, 12.6748046875, 14.69384765625, 16.712890625, 18.73193359375, 20.7509765625, 22.77001953125, 24.7890625, 26.80810546875, 28.8271484375, 30.84619140625, 32.865234375, 34.88427734375, 36.9033203125, 38.92236328125, 40.94140625, 42.96044921875, 44.9794921875, 46.99853515625, 49.017578125, 51.03662109375, 53.0556640625, 55.07470703125, 57.09375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 11.0, 15.0, 14.0, 23.0, 24.0, 50.0, 94.0, 169.0, 228.0, 139.0, 72.0, 46.0, 23.0, 18.0, 14.0, 12.0, 11.0, 7.0, 9.0, 2.0, 3.0, 1.0, 1.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00281524658203125, -0.0027283430099487305, -0.002641439437866211, -0.0025545358657836914, -0.002467632293701172, -0.0023807287216186523, -0.002293825149536133, -0.0022069215774536133, -0.0021200180053710938, -0.0020331144332885742, -0.0019462108612060547, -0.0018593072891235352, -0.0017724037170410156, -0.001685500144958496, -0.0015985965728759766, -0.001511693000793457, -0.0014247894287109375, -0.001337885856628418, -0.0012509822845458984, -0.001164078712463379, -0.0010771751403808594, -0.0009902715682983398, -0.0009033679962158203, -0.0008164644241333008, -0.0007295608520507812, -0.0006426572799682617, -0.0005557537078857422, -0.00046885013580322266, -0.0003819465637207031, -0.0002950429916381836, -0.00020813941955566406, -0.00012123584747314453, -3.4332275390625e-05, 5.257129669189453e-05, 0.00013947486877441406, 0.0002263784408569336, 0.0003132820129394531, 0.00040018558502197266, 0.0004870891571044922, 0.0005739927291870117, 0.0006608963012695312, 0.0007477998733520508, 0.0008347034454345703, 0.0009216070175170898, 0.0010085105895996094, 0.001095414161682129, 0.0011823177337646484, 0.001269221305847168, 0.0013561248779296875, 0.001443028450012207, 0.0015299320220947266, 0.001616835594177246, 0.0017037391662597656, 0.0017906427383422852, 0.0018775463104248047, 0.0019644498825073242, 0.0020513534545898438, 0.0021382570266723633, 0.002225160598754883, 0.0023120641708374023, 0.002398967742919922, 0.0024858713150024414, 0.002572774887084961, 0.0026596784591674805, 0.00274658203125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 6.0, 3.0, 5.0, 17.0, 20.0, 28.0, 51.0, 87.0, 128.0, 249.0, 475.0, 1162.0, 3948.0, 24939.0, 925235.0, 82410.0, 6720.0, 1742.0, 598.0, 314.0, 161.0, 81.0, 67.0, 38.0, 18.0, 15.0, 8.0, 9.0, 6.0, 8.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.84375, -30.025146484375, -29.20654296875, -28.387939453125, -27.5693359375, -26.750732421875, -25.93212890625, -25.113525390625, -24.294921875, -23.476318359375, -22.65771484375, -21.839111328125, -21.0205078125, -20.201904296875, -19.38330078125, -18.564697265625, -17.74609375, -16.927490234375, -16.10888671875, -15.290283203125, -14.4716796875, -13.653076171875, -12.83447265625, -12.015869140625, -11.197265625, -10.378662109375, -9.56005859375, -8.741455078125, -7.9228515625, -7.104248046875, -6.28564453125, -5.467041015625, -4.6484375, -3.829833984375, -3.01123046875, -2.192626953125, -1.3740234375, -0.555419921875, 0.26318359375, 1.081787109375, 1.900390625, 2.718994140625, 3.53759765625, 4.356201171875, 5.1748046875, 5.993408203125, 6.81201171875, 7.630615234375, 8.44921875, 9.267822265625, 10.08642578125, 10.905029296875, 11.7236328125, 12.542236328125, 13.36083984375, 14.179443359375, 14.998046875, 15.816650390625, 16.63525390625, 17.453857421875, 18.2724609375, 19.091064453125, 19.90966796875, 20.728271484375, 21.546875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 7.0, 12.0, 11.0, 32.0, 64.0, 94.0, 153.0, 200.0, 164.0, 100.0, 66.0, 31.0, 19.0, 15.0, 8.0, 6.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.140625, -23.39990234375, -22.6591796875, -21.91845703125, -21.177734375, -20.43701171875, -19.6962890625, -18.95556640625, -18.21484375, -17.47412109375, -16.7333984375, -15.99267578125, -15.251953125, -14.51123046875, -13.7705078125, -13.02978515625, -12.2890625, -11.54833984375, -10.8076171875, -10.06689453125, -9.326171875, -8.58544921875, -7.8447265625, -7.10400390625, -6.36328125, -5.62255859375, -4.8818359375, -4.14111328125, -3.400390625, -2.65966796875, -1.9189453125, -1.17822265625, -0.4375, 0.30322265625, 1.0439453125, 1.78466796875, 2.525390625, 3.26611328125, 4.0068359375, 4.74755859375, 5.48828125, 6.22900390625, 6.9697265625, 7.71044921875, 8.451171875, 9.19189453125, 9.9326171875, 10.67333984375, 11.4140625, 12.15478515625, 12.8955078125, 13.63623046875, 14.376953125, 15.11767578125, 15.8583984375, 16.59912109375, 17.33984375, 18.08056640625, 18.8212890625, 19.56201171875, 20.302734375, 21.04345703125, 21.7841796875, 22.52490234375, 23.265625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 8.0, 5.0, 14.0, 67.0, 224.0, 381.0, 209.0, 48.0, 13.0, 5.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-292.90435791015625, -277.8301086425781, -262.7558898925781, -247.681640625, -232.60740661621094, -217.53317260742188, -202.45892333984375, -187.3846893310547, -172.31045532226562, -157.23622131347656, -142.1619873046875, -127.08773803710938, -112.01350402832031, -96.93927001953125, -81.86502838134766, -66.79078674316406, -51.716552734375, -36.64231491088867, -21.568077087402344, -6.493839263916016, 8.580398559570312, 23.654632568359375, 38.72887420654297, 53.80311584472656, 68.87734985351562, 83.95158386230469, 99.02582550048828, 114.10006713867188, 129.17430114746094, 144.24853515625, 159.32278442382812, 174.3970184326172, 189.47125244140625, 204.5454864501953, 219.61972045898438, 234.6939697265625, 249.76820373535156, 264.8424377441406, 279.91668701171875, 294.99090576171875, 310.0651550292969, 325.139404296875, 340.213623046875, 355.2878723144531, 370.36212158203125, 385.43634033203125, 400.5105895996094, 415.5848388671875, 430.6590576171875, 445.7333068847656, 460.8075256347656, 475.88177490234375, 490.95599365234375, 506.0302429199219, 521.1044921875, 536.1787109375, 551.2529296875, 566.3271484375, 581.4014282226562, 596.4756469726562, 611.5498657226562, 626.6241455078125, 641.6983642578125, 656.7725830078125, 671.8468627929688]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 7.0, 9.0, 17.0, 8.0, 17.0, 25.0, 26.0, 30.0, 38.0, 34.0, 42.0, 51.0, 42.0, 62.0, 63.0, 67.0, 62.0, 54.0, 54.0, 40.0, 40.0, 41.0, 30.0, 26.0, 22.0, 21.0, 11.0, 11.0, 10.0, 7.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.97264099121094, -185.02105712890625, -177.0694580078125, -169.11785888671875, -161.16627502441406, -153.21469116210938, -145.26309204101562, -137.31149291992188, -129.3599090576172, -121.40831756591797, -113.45672607421875, -105.50513458251953, -97.55354309082031, -89.6019515991211, -81.65036010742188, -73.69876861572266, -65.74717712402344, -57.79558563232422, -49.843994140625, -41.89240264892578, -33.94081115722656, -25.989219665527344, -18.037628173828125, -10.086036682128906, -2.1344451904296875, 5.817146301269531, 13.76873779296875, 21.72032928466797, 29.671920776367188, 37.623512268066406, 45.575103759765625, 53.526695251464844, 61.478271484375, 69.42986297607422, 77.38145446777344, 85.33304595947266, 93.28463745117188, 101.2362289428711, 109.18782043457031, 117.13941192626953, 125.09100341796875, 133.0426025390625, 140.9941864013672, 148.94577026367188, 156.89736938476562, 164.84896850585938, 172.80055236816406, 180.75213623046875, 188.7037353515625, 196.65533447265625, 204.60691833496094, 212.55850219726562, 220.51010131835938, 228.46170043945312, 236.4132843017578, 244.3648681640625, 252.31646728515625, 260.26806640625, 268.21966552734375, 276.1712341308594, 284.1228332519531, 292.0744323730469, 300.0260009765625, 307.97760009765625, 315.92919921875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 8.0, 17.0, 13.0, 29.0, 47.0, 60.0, 93.0, 186.0, 282.0, 430.0, 767.0, 1412.0, 3092.0, 7475.0, 21660.0, 100062.0, 1035664.0, 2674870.0, 287741.0, 40499.0, 10985.0, 4217.0, 1993.0, 1025.0, 601.0, 329.0, 226.0, 141.0, 83.0, 77.0, 46.0, 36.0, 28.0, 25.0, 13.0, 8.0, 8.0, 7.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0], "bins": [-17.796875, -17.2919921875, -16.787109375, -16.2822265625, -15.77734375, -15.2724609375, -14.767578125, -14.2626953125, -13.7578125, -13.2529296875, -12.748046875, -12.2431640625, -11.73828125, -11.2333984375, -10.728515625, -10.2236328125, -9.71875, -9.2138671875, -8.708984375, -8.2041015625, -7.69921875, -7.1943359375, -6.689453125, -6.1845703125, -5.6796875, -5.1748046875, -4.669921875, -4.1650390625, -3.66015625, -3.1552734375, -2.650390625, -2.1455078125, -1.640625, -1.1357421875, -0.630859375, -0.1259765625, 0.37890625, 0.8837890625, 1.388671875, 1.8935546875, 2.3984375, 2.9033203125, 3.408203125, 3.9130859375, 4.41796875, 4.9228515625, 5.427734375, 5.9326171875, 6.4375, 6.9423828125, 7.447265625, 7.9521484375, 8.45703125, 8.9619140625, 9.466796875, 9.9716796875, 10.4765625, 10.9814453125, 11.486328125, 11.9912109375, 12.49609375, 13.0009765625, 13.505859375, 14.0107421875, 14.515625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 6.0, 11.0, 6.0, 10.0, 15.0, 22.0, 28.0, 42.0, 51.0, 42.0, 64.0, 67.0, 76.0, 83.0, 69.0, 75.0, 52.0, 53.0, 31.0, 46.0, 30.0, 31.0, 20.0, 22.0, 13.0, 14.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.5836181640625, -11.081298828125, -10.5789794921875, -10.07666015625, -9.5743408203125, -9.072021484375, -8.5697021484375, -8.0673828125, -7.5650634765625, -7.062744140625, -6.5604248046875, -6.05810546875, -5.5557861328125, -5.053466796875, -4.5511474609375, -4.048828125, -3.5465087890625, -3.044189453125, -2.5418701171875, -2.03955078125, -1.5372314453125, -1.034912109375, -0.5325927734375, -0.0302734375, 0.4720458984375, 0.974365234375, 1.4766845703125, 1.97900390625, 2.4813232421875, 2.983642578125, 3.4859619140625, 3.98828125, 4.4906005859375, 4.992919921875, 5.4952392578125, 5.99755859375, 6.4998779296875, 7.002197265625, 7.5045166015625, 8.0068359375, 8.5091552734375, 9.011474609375, 9.5137939453125, 10.01611328125, 10.5184326171875, 11.020751953125, 11.5230712890625, 12.025390625, 12.5277099609375, 13.030029296875, 13.5323486328125, 14.03466796875, 14.5369873046875, 15.039306640625, 15.5416259765625, 16.0439453125, 16.5462646484375, 17.048583984375, 17.5509033203125, 18.05322265625, 18.5555419921875, 19.057861328125, 19.5601806640625, 20.0625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 8.0, 13.0, 24.0, 58.0, 141.0, 323.0, 659.0, 3265.0, 113342.0, 4029940.0, 43593.0, 2227.0, 433.0, 140.0, 63.0, 29.0, 15.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.90625, -45.310546875, -43.71484375, -42.119140625, -40.5234375, -38.927734375, -37.33203125, -35.736328125, -34.140625, -32.544921875, -30.94921875, -29.353515625, -27.7578125, -26.162109375, -24.56640625, -22.970703125, -21.375, -19.779296875, -18.18359375, -16.587890625, -14.9921875, -13.396484375, -11.80078125, -10.205078125, -8.609375, -7.013671875, -5.41796875, -3.822265625, -2.2265625, -0.630859375, 0.96484375, 2.560546875, 4.15625, 5.751953125, 7.34765625, 8.943359375, 10.5390625, 12.134765625, 13.73046875, 15.326171875, 16.921875, 18.517578125, 20.11328125, 21.708984375, 23.3046875, 24.900390625, 26.49609375, 28.091796875, 29.6875, 31.283203125, 32.87890625, 34.474609375, 36.0703125, 37.666015625, 39.26171875, 40.857421875, 42.453125, 44.048828125, 45.64453125, 47.240234375, 48.8359375, 50.431640625, 52.02734375, 53.623046875, 55.21875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 6.0, 7.0, 12.0, 25.0, 39.0, 70.0, 152.0, 455.0, 1229.0, 1224.0, 489.0, 179.0, 97.0, 41.0, 17.0, 12.0, 8.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.8125, -54.45361328125, -53.0947265625, -51.73583984375, -50.376953125, -49.01806640625, -47.6591796875, -46.30029296875, -44.94140625, -43.58251953125, -42.2236328125, -40.86474609375, -39.505859375, -38.14697265625, -36.7880859375, -35.42919921875, -34.0703125, -32.71142578125, -31.3525390625, -29.99365234375, -28.634765625, -27.27587890625, -25.9169921875, -24.55810546875, -23.19921875, -21.84033203125, -20.4814453125, -19.12255859375, -17.763671875, -16.40478515625, -15.0458984375, -13.68701171875, -12.328125, -10.96923828125, -9.6103515625, -8.25146484375, -6.892578125, -5.53369140625, -4.1748046875, -2.81591796875, -1.45703125, -0.09814453125, 1.2607421875, 2.61962890625, 3.978515625, 5.33740234375, 6.6962890625, 8.05517578125, 9.4140625, 10.77294921875, 12.1318359375, 13.49072265625, 14.849609375, 16.20849609375, 17.5673828125, 18.92626953125, 20.28515625, 21.64404296875, 23.0029296875, 24.36181640625, 25.720703125, 27.07958984375, 28.4384765625, 29.79736328125, 31.15625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 5.0, 3.0, 8.0, 16.0, 41.0, 107.0, 180.0, 237.0, 203.0, 110.0, 43.0, 20.0, 7.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-294.5251159667969, -286.91607666015625, -279.3070068359375, -271.6979675292969, -264.08892822265625, -256.4798889160156, -248.87083435058594, -241.26177978515625, -233.65274047851562, -226.04368591308594, -218.4346466064453, -210.82559204101562, -203.216552734375, -195.6074981689453, -187.9984588623047, -180.389404296875, -172.78036499023438, -165.1713104248047, -157.56227111816406, -149.95321655273438, -142.34417724609375, -134.73512268066406, -127.12608337402344, -119.51702880859375, -111.90797424316406, -104.2989273071289, -96.68988037109375, -89.0808334350586, -81.47178649902344, -73.86273193359375, -66.25369262695312, -58.6446418762207, -51.03559875488281, -43.426551818847656, -35.8175048828125, -28.20845603942871, -20.599409103393555, -12.990360260009766, -5.381313323974609, 2.227733612060547, 9.836780548095703, 17.44582748413086, 25.054874420166016, 32.66392517089844, 40.272972106933594, 47.88201904296875, 55.491065979003906, 63.10011291503906, 70.70915985107422, 78.31820678710938, 85.92725372314453, 93.53630065917969, 101.14534759521484, 108.75439453125, 116.36344909667969, 123.97248840332031, 131.58154296875, 139.1905975341797, 146.7996368408203, 154.40869140625, 162.01773071289062, 169.6267852783203, 177.23582458496094, 184.84487915039062, 192.45391845703125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 6.0, 11.0, 14.0, 18.0, 14.0, 18.0, 23.0, 22.0, 38.0, 49.0, 51.0, 44.0, 44.0, 59.0, 73.0, 56.0, 49.0, 47.0, 62.0, 56.0, 44.0, 41.0, 33.0, 27.0, 16.0, 23.0, 13.0, 6.0, 10.0, 6.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-162.22637939453125, -157.39866638183594, -152.5709686279297, -147.74325561523438, -142.91555786132812, -138.0878448486328, -133.2601318359375, -128.43243408203125, -123.60472106933594, -118.77701568603516, -113.94931030273438, -109.12159729003906, -104.29389190673828, -99.4661865234375, -94.63847351074219, -89.8107681274414, -84.98306274414062, -80.15535736083984, -75.32765197753906, -70.49993896484375, -65.67223358154297, -60.84452819824219, -56.01681900024414, -51.189109802246094, -46.36140441894531, -41.53369903564453, -36.705989837646484, -31.87828254699707, -27.050575256347656, -22.222867965698242, -17.395160675048828, -12.567451477050781, -7.73974609375, -2.912038803100586, 1.9156684875488281, 6.743375778198242, 11.571083068847656, 16.39879035949707, 21.226497650146484, 26.05420684814453, 30.881912231445312, 35.709617614746094, 40.53732681274414, 45.36503601074219, 50.19274139404297, 55.02044677734375, 59.8481559753418, 64.67586517333984, 69.50357055664062, 74.3312759399414, 79.15898132324219, 83.9866943359375, 88.81439971923828, 93.64210510253906, 98.46981811523438, 103.29752349853516, 108.12522888183594, 112.95293426513672, 117.7806396484375, 122.60835266113281, 127.4360580444336, 132.26376342773438, 137.0914764404297, 141.919189453125, 146.74688720703125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 7.0, 13.0, 8.0, 15.0, 16.0, 26.0, 44.0, 87.0, 133.0, 279.0, 578.0, 1483.0, 5339.0, 38307.0, 536955.0, 427513.0, 30505.0, 4796.0, 1371.0, 517.0, 250.0, 123.0, 59.0, 44.0, 33.0, 13.0, 11.0, 8.0, 9.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.0625, -56.4912109375, -54.919921875, -53.3486328125, -51.77734375, -50.2060546875, -48.634765625, -47.0634765625, -45.4921875, -43.9208984375, -42.349609375, -40.7783203125, -39.20703125, -37.6357421875, -36.064453125, -34.4931640625, -32.921875, -31.3505859375, -29.779296875, -28.2080078125, -26.63671875, -25.0654296875, -23.494140625, -21.9228515625, -20.3515625, -18.7802734375, -17.208984375, -15.6376953125, -14.06640625, -12.4951171875, -10.923828125, -9.3525390625, -7.78125, -6.2099609375, -4.638671875, -3.0673828125, -1.49609375, 0.0751953125, 1.646484375, 3.2177734375, 4.7890625, 6.3603515625, 7.931640625, 9.5029296875, 11.07421875, 12.6455078125, 14.216796875, 15.7880859375, 17.359375, 18.9306640625, 20.501953125, 22.0732421875, 23.64453125, 25.2158203125, 26.787109375, 28.3583984375, 29.9296875, 31.5009765625, 33.072265625, 34.6435546875, 36.21484375, 37.7861328125, 39.357421875, 40.9287109375, 42.5]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 9.0, 11.0, 14.0, 10.0, 25.0, 32.0, 35.0, 51.0, 42.0, 62.0, 71.0, 69.0, 57.0, 68.0, 81.0, 63.0, 57.0, 51.0, 38.0, 37.0, 35.0, 19.0, 20.0, 11.0, 10.0, 10.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.28125, -10.79248046875, -10.3037109375, -9.81494140625, -9.326171875, -8.83740234375, -8.3486328125, -7.85986328125, -7.37109375, -6.88232421875, -6.3935546875, -5.90478515625, -5.416015625, -4.92724609375, -4.4384765625, -3.94970703125, -3.4609375, -2.97216796875, -2.4833984375, -1.99462890625, -1.505859375, -1.01708984375, -0.5283203125, -0.03955078125, 0.44921875, 0.93798828125, 1.4267578125, 1.91552734375, 2.404296875, 2.89306640625, 3.3818359375, 3.87060546875, 4.359375, 4.84814453125, 5.3369140625, 5.82568359375, 6.314453125, 6.80322265625, 7.2919921875, 7.78076171875, 8.26953125, 8.75830078125, 9.2470703125, 9.73583984375, 10.224609375, 10.71337890625, 11.2021484375, 11.69091796875, 12.1796875, 12.66845703125, 13.1572265625, 13.64599609375, 14.134765625, 14.62353515625, 15.1123046875, 15.60107421875, 16.08984375, 16.57861328125, 17.0673828125, 17.55615234375, 18.044921875, 18.53369140625, 19.0224609375, 19.51123046875, 20.0]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 7.0, 3.0, 5.0, 11.0, 20.0, 30.0, 34.0, 63.0, 114.0, 206.0, 411.0, 1122.0, 4246.0, 87517.0, 940754.0, 10728.0, 1929.0, 687.0, 276.0, 148.0, 86.0, 56.0, 40.0, 18.0, 15.0, 8.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-145.5, -141.4833984375, -137.466796875, -133.4501953125, -129.43359375, -125.4169921875, -121.400390625, -117.3837890625, -113.3671875, -109.3505859375, -105.333984375, -101.3173828125, -97.30078125, -93.2841796875, -89.267578125, -85.2509765625, -81.234375, -77.2177734375, -73.201171875, -69.1845703125, -65.16796875, -61.1513671875, -57.134765625, -53.1181640625, -49.1015625, -45.0849609375, -41.068359375, -37.0517578125, -33.03515625, -29.0185546875, -25.001953125, -20.9853515625, -16.96875, -12.9521484375, -8.935546875, -4.9189453125, -0.90234375, 3.1142578125, 7.130859375, 11.1474609375, 15.1640625, 19.1806640625, 23.197265625, 27.2138671875, 31.23046875, 35.2470703125, 39.263671875, 43.2802734375, 47.296875, 51.3134765625, 55.330078125, 59.3466796875, 63.36328125, 67.3798828125, 71.396484375, 75.4130859375, 79.4296875, 83.4462890625, 87.462890625, 91.4794921875, 95.49609375, 99.5126953125, 103.529296875, 107.5458984375, 111.5625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 14.0, 10.0, 13.0, 26.0, 28.0, 33.0, 51.0, 58.0, 82.0, 58.0, 74.0, 64.0, 72.0, 70.0, 47.0, 56.0, 47.0, 43.0, 31.0, 26.0, 16.0, 16.0, 15.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-82.375, -80.24365234375, -78.1123046875, -75.98095703125, -73.849609375, -71.71826171875, -69.5869140625, -67.45556640625, -65.32421875, -63.19287109375, -61.0615234375, -58.93017578125, -56.798828125, -54.66748046875, -52.5361328125, -50.40478515625, -48.2734375, -46.14208984375, -44.0107421875, -41.87939453125, -39.748046875, -37.61669921875, -35.4853515625, -33.35400390625, -31.22265625, -29.09130859375, -26.9599609375, -24.82861328125, -22.697265625, -20.56591796875, -18.4345703125, -16.30322265625, -14.171875, -12.04052734375, -9.9091796875, -7.77783203125, -5.646484375, -3.51513671875, -1.3837890625, 0.74755859375, 2.87890625, 5.01025390625, 7.1416015625, 9.27294921875, 11.404296875, 13.53564453125, 15.6669921875, 17.79833984375, 19.9296875, 22.06103515625, 24.1923828125, 26.32373046875, 28.455078125, 30.58642578125, 32.7177734375, 34.84912109375, 36.98046875, 39.11181640625, 41.2431640625, 43.37451171875, 45.505859375, 47.63720703125, 49.7685546875, 51.89990234375, 54.03125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 11.0, 16.0, 14.0, 19.0, 34.0, 36.0, 49.0, 100.0, 115.0, 220.0, 483.0, 1582.0, 8168.0, 261947.0, 760973.0, 11503.0, 1954.0, 564.0, 266.0, 157.0, 82.0, 52.0, 52.0, 35.0, 23.0, 11.0, 18.0, 10.0, 9.0, 6.0, 3.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.484375, -25.573486328125, -24.66259765625, -23.751708984375, -22.8408203125, -21.929931640625, -21.01904296875, -20.108154296875, -19.197265625, -18.286376953125, -17.37548828125, -16.464599609375, -15.5537109375, -14.642822265625, -13.73193359375, -12.821044921875, -11.91015625, -10.999267578125, -10.08837890625, -9.177490234375, -8.2666015625, -7.355712890625, -6.44482421875, -5.533935546875, -4.623046875, -3.712158203125, -2.80126953125, -1.890380859375, -0.9794921875, -0.068603515625, 0.84228515625, 1.753173828125, 2.6640625, 3.574951171875, 4.48583984375, 5.396728515625, 6.3076171875, 7.218505859375, 8.12939453125, 9.040283203125, 9.951171875, 10.862060546875, 11.77294921875, 12.683837890625, 13.5947265625, 14.505615234375, 15.41650390625, 16.327392578125, 17.23828125, 18.149169921875, 19.06005859375, 19.970947265625, 20.8818359375, 21.792724609375, 22.70361328125, 23.614501953125, 24.525390625, 25.436279296875, 26.34716796875, 27.258056640625, 28.1689453125, 29.079833984375, 29.99072265625, 30.901611328125, 31.8125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 3.0, 7.0, 7.0, 11.0, 12.0, 19.0, 19.0, 26.0, 30.0, 57.0, 69.0, 139.0, 186.0, 120.0, 83.0, 53.0, 30.0, 36.0, 26.0, 16.0, 13.0, 16.0, 8.0, 3.0, 1.0, 8.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003078460693359375, -0.002986311912536621, -0.002894163131713867, -0.0028020143508911133, -0.0027098655700683594, -0.0026177167892456055, -0.0025255680084228516, -0.0024334192276000977, -0.0023412704467773438, -0.00224912166595459, -0.002156972885131836, -0.002064824104309082, -0.001972675323486328, -0.0018805265426635742, -0.0017883777618408203, -0.0016962289810180664, -0.0016040802001953125, -0.0015119314193725586, -0.0014197826385498047, -0.0013276338577270508, -0.0012354850769042969, -0.001143336296081543, -0.001051187515258789, -0.0009590387344360352, -0.0008668899536132812, -0.0007747411727905273, -0.0006825923919677734, -0.0005904436111450195, -0.0004982948303222656, -0.0004061460494995117, -0.0003139972686767578, -0.0002218484878540039, -0.00012969970703125, -3.7550926208496094e-05, 5.459785461425781e-05, 0.00014674663543701172, 0.00023889541625976562, 0.00033104419708251953, 0.00042319297790527344, 0.0005153417587280273, 0.0006074905395507812, 0.0006996393203735352, 0.0007917881011962891, 0.000883936882019043, 0.0009760856628417969, 0.0010682344436645508, 0.0011603832244873047, 0.0012525320053100586, 0.0013446807861328125, 0.0014368295669555664, 0.0015289783477783203, 0.0016211271286010742, 0.0017132759094238281, 0.001805424690246582, 0.001897573471069336, 0.00198972225189209, 0.0020818710327148438, 0.0021740198135375977, 0.0022661685943603516, 0.0023583173751831055, 0.0024504661560058594, 0.0025426149368286133, 0.002634763717651367, 0.002726912498474121, 0.002819061279296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 0.0, 4.0, 6.0, 4.0, 6.0, 8.0, 9.0, 12.0, 19.0, 25.0, 32.0, 38.0, 50.0, 89.0, 155.0, 211.0, 378.0, 891.0, 2802.0, 14229.0, 831851.0, 185017.0, 9110.0, 1973.0, 707.0, 366.0, 186.0, 120.0, 68.0, 52.0, 38.0, 27.0, 18.0, 7.0, 5.0, 10.0, 9.0, 6.0, 4.0, 1.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.890625, -28.037841796875, -27.18505859375, -26.332275390625, -25.4794921875, -24.626708984375, -23.77392578125, -22.921142578125, -22.068359375, -21.215576171875, -20.36279296875, -19.510009765625, -18.6572265625, -17.804443359375, -16.95166015625, -16.098876953125, -15.24609375, -14.393310546875, -13.54052734375, -12.687744140625, -11.8349609375, -10.982177734375, -10.12939453125, -9.276611328125, -8.423828125, -7.571044921875, -6.71826171875, -5.865478515625, -5.0126953125, -4.159912109375, -3.30712890625, -2.454345703125, -1.6015625, -0.748779296875, 0.10400390625, 0.956787109375, 1.8095703125, 2.662353515625, 3.51513671875, 4.367919921875, 5.220703125, 6.073486328125, 6.92626953125, 7.779052734375, 8.6318359375, 9.484619140625, 10.33740234375, 11.190185546875, 12.04296875, 12.895751953125, 13.74853515625, 14.601318359375, 15.4541015625, 16.306884765625, 17.15966796875, 18.012451171875, 18.865234375, 19.718017578125, 20.57080078125, 21.423583984375, 22.2763671875, 23.129150390625, 23.98193359375, 24.834716796875, 25.6875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 14.0, 10.0, 22.0, 42.0, 44.0, 71.0, 115.0, 170.0, 184.0, 117.0, 80.0, 33.0, 30.0, 17.0, 5.0, 9.0, 6.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.609375, -14.00146484375, -13.3935546875, -12.78564453125, -12.177734375, -11.56982421875, -10.9619140625, -10.35400390625, -9.74609375, -9.13818359375, -8.5302734375, -7.92236328125, -7.314453125, -6.70654296875, -6.0986328125, -5.49072265625, -4.8828125, -4.27490234375, -3.6669921875, -3.05908203125, -2.451171875, -1.84326171875, -1.2353515625, -0.62744140625, -0.01953125, 0.58837890625, 1.1962890625, 1.80419921875, 2.412109375, 3.02001953125, 3.6279296875, 4.23583984375, 4.84375, 5.45166015625, 6.0595703125, 6.66748046875, 7.275390625, 7.88330078125, 8.4912109375, 9.09912109375, 9.70703125, 10.31494140625, 10.9228515625, 11.53076171875, 12.138671875, 12.74658203125, 13.3544921875, 13.96240234375, 14.5703125, 15.17822265625, 15.7861328125, 16.39404296875, 17.001953125, 17.60986328125, 18.2177734375, 18.82568359375, 19.43359375, 20.04150390625, 20.6494140625, 21.25732421875, 21.865234375, 22.47314453125, 23.0810546875, 23.68896484375, 24.296875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 8.0, 22.0, 73.0, 182.0, 404.0, 204.0, 59.0, 19.0, 2.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-518.3729248046875, -504.5660705566406, -490.7591857910156, -476.95233154296875, -463.14544677734375, -449.3385925292969, -435.53173828125, -421.724853515625, -407.9179992675781, -394.11114501953125, -380.30426025390625, -366.4974060058594, -352.6905517578125, -338.8836669921875, -325.0768127441406, -311.26995849609375, -297.46307373046875, -283.6562194824219, -269.8493347167969, -256.04248046875, -242.23561096191406, -228.42874145507812, -214.62188720703125, -200.8150177001953, -187.00814819335938, -173.20127868652344, -159.3944091796875, -145.58755493164062, -131.7806854248047, -117.97381591796875, -104.16695404052734, -90.36009216308594, -76.55319213867188, -62.7463264465332, -48.93946075439453, -35.13259506225586, -21.325729370117188, -7.51885986328125, 6.288002014160156, 20.094863891601562, 33.9017333984375, 47.70859909057617, 61.515464782714844, 75.32232666015625, 89.12919616699219, 102.93606567382812, 116.74292755126953, 130.54978942871094, 144.35665893554688, 158.1635284423828, 171.97039794921875, 185.77725219726562, 199.58412170410156, 213.3909912109375, 227.19784545898438, 241.0047149658203, 254.81158447265625, 268.6184387207031, 282.4253234863281, 296.232177734375, 310.0390625, 323.8459167480469, 337.65277099609375, 351.45965576171875, 365.2665100097656]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 10.0, 4.0, 11.0, 7.0, 8.0, 14.0, 21.0, 10.0, 20.0, 22.0, 20.0, 20.0, 25.0, 32.0, 26.0, 22.0, 29.0, 37.0, 56.0, 56.0, 58.0, 61.0, 50.0, 36.0, 39.0, 35.0, 35.0, 36.0, 27.0, 23.0, 24.0, 19.0, 20.0, 14.0, 15.0, 8.0, 9.0, 7.0, 9.0, 5.0, 9.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-146.6016082763672, -141.68582153320312, -136.77003479003906, -131.85426330566406, -126.9384765625, -122.02268981933594, -117.10690307617188, -112.19111633300781, -107.27533721923828, -102.35955047607422, -97.44377136230469, -92.52798461914062, -87.61219787597656, -82.69641876220703, -77.78063201904297, -72.86485290527344, -67.94906616210938, -63.03328323364258, -58.11750030517578, -53.20171356201172, -48.28593063354492, -43.370147705078125, -38.45436096191406, -33.538578033447266, -28.62279510498047, -23.707012176513672, -18.791227340698242, -13.875443458557129, -8.959659576416016, -4.043876647949219, 0.8719081878662109, 5.787693023681641, 10.7034912109375, 15.619275093078613, 20.535058975219727, 25.450843811035156, 30.366626739501953, 35.28240966796875, 40.19819641113281, 45.11397933959961, 50.029762268066406, 54.9455451965332, 59.861328125, 64.77711486816406, 69.69290161132812, 74.60868072509766, 79.52446746826172, 84.44024658203125, 89.35603332519531, 94.27182006835938, 99.1875991821289, 104.10338592529297, 109.0191650390625, 113.93495178222656, 118.85073852539062, 123.76652526855469, 128.68231201171875, 133.5980987548828, 138.51388549804688, 143.42965698242188, 148.34544372558594, 153.26123046875, 158.17701721191406, 163.09280395507812, 168.00857543945312]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 4.0, 4.0, 10.0, 18.0, 24.0, 34.0, 62.0, 98.0, 175.0, 321.0, 660.0, 1633.0, 5187.0, 23972.0, 632558.0, 3424947.0, 90542.0, 9407.0, 2566.0, 971.0, 464.0, 235.0, 142.0, 81.0, 64.0, 29.0, 17.0, 20.0, 9.0, 1.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.1875, -27.41015625, -26.6328125, -25.85546875, -25.078125, -24.30078125, -23.5234375, -22.74609375, -21.96875, -21.19140625, -20.4140625, -19.63671875, -18.859375, -18.08203125, -17.3046875, -16.52734375, -15.75, -14.97265625, -14.1953125, -13.41796875, -12.640625, -11.86328125, -11.0859375, -10.30859375, -9.53125, -8.75390625, -7.9765625, -7.19921875, -6.421875, -5.64453125, -4.8671875, -4.08984375, -3.3125, -2.53515625, -1.7578125, -0.98046875, -0.203125, 0.57421875, 1.3515625, 2.12890625, 2.90625, 3.68359375, 4.4609375, 5.23828125, 6.015625, 6.79296875, 7.5703125, 8.34765625, 9.125, 9.90234375, 10.6796875, 11.45703125, 12.234375, 13.01171875, 13.7890625, 14.56640625, 15.34375, 16.12109375, 16.8984375, 17.67578125, 18.453125, 19.23046875, 20.0078125, 20.78515625, 21.5625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 12.0, 5.0, 10.0, 15.0, 22.0, 30.0, 43.0, 56.0, 60.0, 112.0, 90.0, 82.0, 97.0, 79.0, 74.0, 68.0, 51.0, 43.0, 16.0, 25.0, 7.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8203125, -14.1951904296875, -13.570068359375, -12.9449462890625, -12.31982421875, -11.6947021484375, -11.069580078125, -10.4444580078125, -9.8193359375, -9.1942138671875, -8.569091796875, -7.9439697265625, -7.31884765625, -6.6937255859375, -6.068603515625, -5.4434814453125, -4.818359375, -4.1932373046875, -3.568115234375, -2.9429931640625, -2.31787109375, -1.6927490234375, -1.067626953125, -0.4425048828125, 0.1826171875, 0.8077392578125, 1.432861328125, 2.0579833984375, 2.68310546875, 3.3082275390625, 3.933349609375, 4.5584716796875, 5.18359375, 5.8087158203125, 6.433837890625, 7.0589599609375, 7.68408203125, 8.3092041015625, 8.934326171875, 9.5594482421875, 10.1845703125, 10.8096923828125, 11.434814453125, 12.0599365234375, 12.68505859375, 13.3101806640625, 13.935302734375, 14.5604248046875, 15.185546875, 15.8106689453125, 16.435791015625, 17.0609130859375, 17.68603515625, 18.3111572265625, 18.936279296875, 19.5614013671875, 20.1865234375, 20.8116455078125, 21.436767578125, 22.0618896484375, 22.68701171875, 23.3121337890625, 23.937255859375, 24.5623779296875, 25.1875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 14.0, 18.0, 43.0, 60.0, 135.0, 284.0, 571.0, 1123.0, 2923.0, 14443.0, 276135.0, 3813310.0, 74151.0, 7504.0, 1853.0, 716.0, 356.0, 238.0, 129.0, 92.0, 63.0, 27.0, 25.0, 18.0, 8.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.484375, -20.522705078125, -19.56103515625, -18.599365234375, -17.6376953125, -16.676025390625, -15.71435546875, -14.752685546875, -13.791015625, -12.829345703125, -11.86767578125, -10.906005859375, -9.9443359375, -8.982666015625, -8.02099609375, -7.059326171875, -6.09765625, -5.135986328125, -4.17431640625, -3.212646484375, -2.2509765625, -1.289306640625, -0.32763671875, 0.634033203125, 1.595703125, 2.557373046875, 3.51904296875, 4.480712890625, 5.4423828125, 6.404052734375, 7.36572265625, 8.327392578125, 9.2890625, 10.250732421875, 11.21240234375, 12.174072265625, 13.1357421875, 14.097412109375, 15.05908203125, 16.020751953125, 16.982421875, 17.944091796875, 18.90576171875, 19.867431640625, 20.8291015625, 21.790771484375, 22.75244140625, 23.714111328125, 24.67578125, 25.637451171875, 26.59912109375, 27.560791015625, 28.5224609375, 29.484130859375, 30.44580078125, 31.407470703125, 32.369140625, 33.330810546875, 34.29248046875, 35.254150390625, 36.2158203125, 37.177490234375, 38.13916015625, 39.100830078125, 40.0625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 8.0, 7.0, 7.0, 22.0, 18.0, 42.0, 67.0, 144.0, 430.0, 997.0, 1362.0, 607.0, 198.0, 64.0, 41.0, 22.0, 15.0, 8.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.21875, -33.0869140625, -31.955078125, -30.8232421875, -29.69140625, -28.5595703125, -27.427734375, -26.2958984375, -25.1640625, -24.0322265625, -22.900390625, -21.7685546875, -20.63671875, -19.5048828125, -18.373046875, -17.2412109375, -16.109375, -14.9775390625, -13.845703125, -12.7138671875, -11.58203125, -10.4501953125, -9.318359375, -8.1865234375, -7.0546875, -5.9228515625, -4.791015625, -3.6591796875, -2.52734375, -1.3955078125, -0.263671875, 0.8681640625, 2.0, 3.1318359375, 4.263671875, 5.3955078125, 6.52734375, 7.6591796875, 8.791015625, 9.9228515625, 11.0546875, 12.1865234375, 13.318359375, 14.4501953125, 15.58203125, 16.7138671875, 17.845703125, 18.9775390625, 20.109375, 21.2412109375, 22.373046875, 23.5048828125, 24.63671875, 25.7685546875, 26.900390625, 28.0322265625, 29.1640625, 30.2958984375, 31.427734375, 32.5595703125, 33.69140625, 34.8232421875, 35.955078125, 37.0869140625, 38.21875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 10.0, 18.0, 76.0, 348.0, 399.0, 106.0, 18.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-390.8502197265625, -378.28790283203125, -365.7255859375, -353.16326904296875, -340.6009216308594, -328.0386047363281, -315.4762878417969, -302.9139709472656, -290.35162353515625, -277.789306640625, -265.22698974609375, -252.66465759277344, -240.10232543945312, -227.54000854492188, -214.97769165039062, -202.41537475585938, -189.85305786132812, -177.29074096679688, -164.72840881347656, -152.1660919189453, -139.603759765625, -127.04144287109375, -114.4791259765625, -101.91680145263672, -89.35447692871094, -76.79215240478516, -64.22982788085938, -51.667510986328125, -39.105186462402344, -26.542861938476562, -13.980545043945312, -1.4182205200195312, 11.144134521484375, 23.706457138061523, 36.26877975463867, 48.83110046386719, 61.39342498779297, 73.95574951171875, 86.51806640625, 99.08039093017578, 111.64271545410156, 124.20503997802734, 136.76736450195312, 149.32968139648438, 161.89199829101562, 174.45433044433594, 187.0166473388672, 199.5789794921875, 212.14129638671875, 224.70361328125, 237.2659454345703, 249.82826232910156, 262.3905944824219, 274.9529113769531, 287.5152282714844, 300.0775451660156, 312.639892578125, 325.20220947265625, 337.7645263671875, 350.32684326171875, 362.8891906738281, 375.4515075683594, 388.0138244628906, 400.5761413574219, 413.1384582519531]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 8.0, 14.0, 13.0, 30.0, 17.0, 36.0, 36.0, 79.0, 71.0, 83.0, 77.0, 95.0, 81.0, 84.0, 80.0, 46.0, 42.0, 35.0, 20.0, 15.0, 16.0, 7.0, 10.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.0839385986328, -241.26461791992188, -235.44529724121094, -229.6259765625, -223.80667114257812, -217.9873504638672, -212.16802978515625, -206.3487091064453, -200.52938842773438, -194.71006774902344, -188.8907470703125, -183.07144165039062, -177.2521209716797, -171.43280029296875, -165.6134796142578, -159.79415893554688, -153.974853515625, -148.15553283691406, -142.33621215820312, -136.51690673828125, -130.6975860595703, -124.87826538085938, -119.05894470214844, -113.2396240234375, -107.42030334472656, -101.60098266601562, -95.78166961669922, -89.96234893798828, -84.14302825927734, -78.32371520996094, -72.50439453125, -66.68507385253906, -60.865760803222656, -55.046443939208984, -49.22712326049805, -43.407806396484375, -37.58848571777344, -31.769168853759766, -25.949851989746094, -20.130531311035156, -14.311214447021484, -8.49189567565918, -2.6725778579711914, 3.146739959716797, 8.966058731079102, 14.785377502441406, 20.604694366455078, 26.424015045166016, 32.24333190917969, 38.06264877319336, 43.8819694519043, 49.70128631591797, 55.520606994628906, 61.33992385864258, 67.15924072265625, 72.97856140136719, 78.79788208007812, 84.61720275878906, 90.43651580810547, 96.2558364868164, 102.07515716552734, 107.89447021484375, 113.71379089355469, 119.53311157226562, 125.35242462158203]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 5.0, 10.0, 9.0, 17.0, 14.0, 18.0, 22.0, 28.0, 50.0, 51.0, 75.0, 129.0, 185.0, 298.0, 513.0, 1167.0, 3099.0, 11483.0, 66380.0, 635630.0, 286480.0, 32044.0, 6679.0, 2105.0, 857.0, 439.0, 239.0, 158.0, 88.0, 68.0, 46.0, 42.0, 26.0, 17.0, 18.0, 12.0, 6.0, 12.0, 10.0, 6.0, 4.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-32.125, -31.04736328125, -29.9697265625, -28.89208984375, -27.814453125, -26.73681640625, -25.6591796875, -24.58154296875, -23.50390625, -22.42626953125, -21.3486328125, -20.27099609375, -19.193359375, -18.11572265625, -17.0380859375, -15.96044921875, -14.8828125, -13.80517578125, -12.7275390625, -11.64990234375, -10.572265625, -9.49462890625, -8.4169921875, -7.33935546875, -6.26171875, -5.18408203125, -4.1064453125, -3.02880859375, -1.951171875, -0.87353515625, 0.2041015625, 1.28173828125, 2.359375, 3.43701171875, 4.5146484375, 5.59228515625, 6.669921875, 7.74755859375, 8.8251953125, 9.90283203125, 10.98046875, 12.05810546875, 13.1357421875, 14.21337890625, 15.291015625, 16.36865234375, 17.4462890625, 18.52392578125, 19.6015625, 20.67919921875, 21.7568359375, 22.83447265625, 23.912109375, 24.98974609375, 26.0673828125, 27.14501953125, 28.22265625, 29.30029296875, 30.3779296875, 31.45556640625, 32.533203125, 33.61083984375, 34.6884765625, 35.76611328125, 36.84375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 6.0, 6.0, 12.0, 14.0, 10.0, 24.0, 31.0, 45.0, 60.0, 68.0, 73.0, 74.0, 86.0, 85.0, 77.0, 67.0, 70.0, 57.0, 33.0, 41.0, 20.0, 13.0, 10.0, 6.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.4453125, -13.9268798828125, -13.408447265625, -12.8900146484375, -12.37158203125, -11.8531494140625, -11.334716796875, -10.8162841796875, -10.2978515625, -9.7794189453125, -9.260986328125, -8.7425537109375, -8.22412109375, -7.7056884765625, -7.187255859375, -6.6688232421875, -6.150390625, -5.6319580078125, -5.113525390625, -4.5950927734375, -4.07666015625, -3.5582275390625, -3.039794921875, -2.5213623046875, -2.0029296875, -1.4844970703125, -0.966064453125, -0.4476318359375, 0.07080078125, 0.5892333984375, 1.107666015625, 1.6260986328125, 2.14453125, 2.6629638671875, 3.181396484375, 3.6998291015625, 4.21826171875, 4.7366943359375, 5.255126953125, 5.7735595703125, 6.2919921875, 6.8104248046875, 7.328857421875, 7.8472900390625, 8.36572265625, 8.8841552734375, 9.402587890625, 9.9210205078125, 10.439453125, 10.9578857421875, 11.476318359375, 11.9947509765625, 12.51318359375, 13.0316162109375, 13.550048828125, 14.0684814453125, 14.5869140625, 15.1053466796875, 15.623779296875, 16.1422119140625, 16.66064453125, 17.1790771484375, 17.697509765625, 18.2159423828125, 18.734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 4.0, 2.0, 0.0, 5.0, 7.0, 7.0, 16.0, 17.0, 20.0, 27.0, 41.0, 74.0, 91.0, 204.0, 393.0, 966.0, 2995.0, 20987.0, 964083.0, 51804.0, 4435.0, 1295.0, 492.0, 236.0, 113.0, 64.0, 45.0, 39.0, 25.0, 16.0, 14.0, 11.0, 4.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-90.0625, -87.21484375, -84.3671875, -81.51953125, -78.671875, -75.82421875, -72.9765625, -70.12890625, -67.28125, -64.43359375, -61.5859375, -58.73828125, -55.890625, -53.04296875, -50.1953125, -47.34765625, -44.5, -41.65234375, -38.8046875, -35.95703125, -33.109375, -30.26171875, -27.4140625, -24.56640625, -21.71875, -18.87109375, -16.0234375, -13.17578125, -10.328125, -7.48046875, -4.6328125, -1.78515625, 1.0625, 3.91015625, 6.7578125, 9.60546875, 12.453125, 15.30078125, 18.1484375, 20.99609375, 23.84375, 26.69140625, 29.5390625, 32.38671875, 35.234375, 38.08203125, 40.9296875, 43.77734375, 46.625, 49.47265625, 52.3203125, 55.16796875, 58.015625, 60.86328125, 63.7109375, 66.55859375, 69.40625, 72.25390625, 75.1015625, 77.94921875, 80.796875, 83.64453125, 86.4921875, 89.33984375, 92.1875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 14.0, 18.0, 26.0, 34.0, 45.0, 48.0, 60.0, 84.0, 94.0, 86.0, 83.0, 77.0, 72.0, 60.0, 42.0, 32.0, 28.0, 23.0, 11.0, 15.0, 6.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.5, -69.3671875, -67.234375, -65.1015625, -62.96875, -60.8359375, -58.703125, -56.5703125, -54.4375, -52.3046875, -50.171875, -48.0390625, -45.90625, -43.7734375, -41.640625, -39.5078125, -37.375, -35.2421875, -33.109375, -30.9765625, -28.84375, -26.7109375, -24.578125, -22.4453125, -20.3125, -18.1796875, -16.046875, -13.9140625, -11.78125, -9.6484375, -7.515625, -5.3828125, -3.25, -1.1171875, 1.015625, 3.1484375, 5.28125, 7.4140625, 9.546875, 11.6796875, 13.8125, 15.9453125, 18.078125, 20.2109375, 22.34375, 24.4765625, 26.609375, 28.7421875, 30.875, 33.0078125, 35.140625, 37.2734375, 39.40625, 41.5390625, 43.671875, 45.8046875, 47.9375, 50.0703125, 52.203125, 54.3359375, 56.46875, 58.6015625, 60.734375, 62.8671875, 65.0]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 10.0, 7.0, 14.0, 19.0, 22.0, 29.0, 35.0, 59.0, 91.0, 108.0, 211.0, 385.0, 920.0, 2598.0, 11814.0, 866088.0, 154510.0, 7954.0, 2044.0, 706.0, 306.0, 220.0, 104.0, 74.0, 54.0, 38.0, 34.0, 22.0, 8.0, 13.0, 8.0, 10.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.25, -29.30126953125, -28.3525390625, -27.40380859375, -26.455078125, -25.50634765625, -24.5576171875, -23.60888671875, -22.66015625, -21.71142578125, -20.7626953125, -19.81396484375, -18.865234375, -17.91650390625, -16.9677734375, -16.01904296875, -15.0703125, -14.12158203125, -13.1728515625, -12.22412109375, -11.275390625, -10.32666015625, -9.3779296875, -8.42919921875, -7.48046875, -6.53173828125, -5.5830078125, -4.63427734375, -3.685546875, -2.73681640625, -1.7880859375, -0.83935546875, 0.109375, 1.05810546875, 2.0068359375, 2.95556640625, 3.904296875, 4.85302734375, 5.8017578125, 6.75048828125, 7.69921875, 8.64794921875, 9.5966796875, 10.54541015625, 11.494140625, 12.44287109375, 13.3916015625, 14.34033203125, 15.2890625, 16.23779296875, 17.1865234375, 18.13525390625, 19.083984375, 20.03271484375, 20.9814453125, 21.93017578125, 22.87890625, 23.82763671875, 24.7763671875, 25.72509765625, 26.673828125, 27.62255859375, 28.5712890625, 29.52001953125, 30.46875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 5.0, 10.0, 22.0, 43.0, 69.0, 157.0, 351.0, 185.0, 57.0, 25.0, 16.0, 20.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.003997802734375, -0.003852665424346924, -0.0037075281143188477, -0.0035623908042907715, -0.0034172534942626953, -0.003272116184234619, -0.003126978874206543, -0.002981841564178467, -0.0028367042541503906, -0.0026915669441223145, -0.0025464296340942383, -0.002401292324066162, -0.002256155014038086, -0.0021110177040100098, -0.0019658803939819336, -0.0018207430839538574, -0.0016756057739257812, -0.001530468463897705, -0.001385331153869629, -0.0012401938438415527, -0.0010950565338134766, -0.0009499192237854004, -0.0008047819137573242, -0.000659644603729248, -0.0005145072937011719, -0.0003693699836730957, -0.00022423267364501953, -7.909536361694336e-05, 6.604194641113281e-05, 0.00021117925643920898, 0.00035631656646728516, 0.0005014538764953613, 0.0006465911865234375, 0.0007917284965515137, 0.0009368658065795898, 0.001082003116607666, 0.0012271404266357422, 0.0013722777366638184, 0.0015174150466918945, 0.0016625523567199707, 0.0018076896667480469, 0.001952826976776123, 0.0020979642868041992, 0.0022431015968322754, 0.0023882389068603516, 0.0025333762168884277, 0.002678513526916504, 0.00282365083694458, 0.0029687881469726562, 0.0031139254570007324, 0.0032590627670288086, 0.0034042000770568848, 0.003549337387084961, 0.003694474697113037, 0.0038396120071411133, 0.0039847493171691895, 0.004129886627197266, 0.004275023937225342, 0.004420161247253418, 0.004565298557281494, 0.00471043586730957, 0.0048555731773376465, 0.005000710487365723, 0.005145847797393799, 0.005290985107421875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 11.0, 22.0, 32.0, 58.0, 79.0, 132.0, 294.0, 648.0, 2993.0, 30300.0, 991404.0, 19266.0, 2120.0, 612.0, 230.0, 125.0, 77.0, 50.0, 32.0, 17.0, 13.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.375, -33.43115234375, -32.4873046875, -31.54345703125, -30.599609375, -29.65576171875, -28.7119140625, -27.76806640625, -26.82421875, -25.88037109375, -24.9365234375, -23.99267578125, -23.048828125, -22.10498046875, -21.1611328125, -20.21728515625, -19.2734375, -18.32958984375, -17.3857421875, -16.44189453125, -15.498046875, -14.55419921875, -13.6103515625, -12.66650390625, -11.72265625, -10.77880859375, -9.8349609375, -8.89111328125, -7.947265625, -7.00341796875, -6.0595703125, -5.11572265625, -4.171875, -3.22802734375, -2.2841796875, -1.34033203125, -0.396484375, 0.54736328125, 1.4912109375, 2.43505859375, 3.37890625, 4.32275390625, 5.2666015625, 6.21044921875, 7.154296875, 8.09814453125, 9.0419921875, 9.98583984375, 10.9296875, 11.87353515625, 12.8173828125, 13.76123046875, 14.705078125, 15.64892578125, 16.5927734375, 17.53662109375, 18.48046875, 19.42431640625, 20.3681640625, 21.31201171875, 22.255859375, 23.19970703125, 24.1435546875, 25.08740234375, 26.03125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 6.0, 6.0, 8.0, 4.0, 9.0, 13.0, 32.0, 69.0, 189.0, 315.0, 189.0, 72.0, 31.0, 11.0, 14.0, 5.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.078125, -21.39892578125, -20.7197265625, -20.04052734375, -19.361328125, -18.68212890625, -18.0029296875, -17.32373046875, -16.64453125, -15.96533203125, -15.2861328125, -14.60693359375, -13.927734375, -13.24853515625, -12.5693359375, -11.89013671875, -11.2109375, -10.53173828125, -9.8525390625, -9.17333984375, -8.494140625, -7.81494140625, -7.1357421875, -6.45654296875, -5.77734375, -5.09814453125, -4.4189453125, -3.73974609375, -3.060546875, -2.38134765625, -1.7021484375, -1.02294921875, -0.34375, 0.33544921875, 1.0146484375, 1.69384765625, 2.373046875, 3.05224609375, 3.7314453125, 4.41064453125, 5.08984375, 5.76904296875, 6.4482421875, 7.12744140625, 7.806640625, 8.48583984375, 9.1650390625, 9.84423828125, 10.5234375, 11.20263671875, 11.8818359375, 12.56103515625, 13.240234375, 13.91943359375, 14.5986328125, 15.27783203125, 15.95703125, 16.63623046875, 17.3154296875, 17.99462890625, 18.673828125, 19.35302734375, 20.0322265625, 20.71142578125, 21.390625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 9.0, 46.0, 340.0, 504.0, 66.0, 12.0, 3.0, 5.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-575.5166015625, -552.5615234375, -529.6063842773438, -506.65130615234375, -483.69622802734375, -460.7411193847656, -437.7860107421875, -414.8309326171875, -391.8758239746094, -368.92071533203125, -345.96563720703125, -323.0105285644531, -300.055419921875, -277.100341796875, -254.14523315429688, -231.1901397705078, -208.23504638671875, -185.2799530029297, -162.32485961914062, -139.3697509765625, -116.41465759277344, -93.45956420898438, -70.50445556640625, -47.54936218261719, -24.594268798828125, -1.6391716003417969, 21.31592559814453, 44.271026611328125, 67.22611999511719, 90.18121337890625, 113.13632202148438, 136.09141540527344, 159.0465087890625, 182.00160217285156, 204.95669555664062, 227.91180419921875, 250.8668975830078, 273.8219909667969, 296.777099609375, 319.732177734375, 342.6872863769531, 365.64239501953125, 388.59747314453125, 411.5525817871094, 434.5076904296875, 457.4627685546875, 480.4178771972656, 503.37298583984375, 526.3280639648438, 549.2831420898438, 572.23828125, 595.193359375, 618.1484375, 641.103515625, 664.0586547851562, 687.0137329101562, 709.9688720703125, 732.9239501953125, 755.8790893554688, 778.8341674804688, 801.7892456054688, 824.744384765625, 847.699462890625, 870.654541015625, 893.609619140625]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 8.0, 9.0, 15.0, 11.0, 22.0, 14.0, 20.0, 22.0, 34.0, 39.0, 48.0, 35.0, 55.0, 67.0, 81.0, 58.0, 83.0, 61.0, 41.0, 41.0, 34.0, 28.0, 32.0, 25.0, 25.0, 14.0, 17.0, 7.0, 9.0, 10.0, 6.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-167.3512420654297, -161.45753479003906, -155.5638427734375, -149.67013549804688, -143.7764434814453, -137.8827362060547, -131.98904418945312, -126.0953369140625, -120.2016372680664, -114.30793762207031, -108.41423797607422, -102.52053833007812, -96.6268310546875, -90.73313903808594, -84.83943176269531, -78.94573211669922, -73.05203247070312, -67.15833282470703, -61.26463317871094, -55.37092971801758, -49.477230072021484, -43.58353042602539, -37.68982696533203, -31.796127319335938, -25.902427673339844, -20.00872802734375, -14.115026473999023, -8.221324920654297, -2.327625274658203, 3.5660743713378906, 9.45977783203125, 15.353477478027344, 21.247177124023438, 27.14087677001953, 33.034576416015625, 38.928279876708984, 44.82197952270508, 50.71567916870117, 56.60938262939453, 62.503082275390625, 68.39678192138672, 74.29048156738281, 80.1841812133789, 86.077880859375, 91.97158813476562, 97.86528015136719, 103.75898742675781, 109.6526870727539, 115.54638671875, 121.4400863647461, 127.33378601074219, 133.2274932861328, 139.12118530273438, 145.014892578125, 150.90859985351562, 156.8022918701172, 162.69598388671875, 168.58969116210938, 174.48338317871094, 180.37709045410156, 186.27078247070312, 192.16448974609375, 198.05819702148438, 203.95188903808594, 209.84559631347656]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 6.0, 9.0, 23.0, 15.0, 25.0, 56.0, 102.0, 187.0, 695.0, 2310.0, 14514.0, 3124510.0, 1038999.0, 9751.0, 1955.0, 621.0, 225.0, 95.0, 64.0, 35.0, 23.0, 18.0, 6.0, 7.0, 6.0, 0.0, 6.0, 2.0, 0.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.21875, -43.80224609375, -42.3857421875, -40.96923828125, -39.552734375, -38.13623046875, -36.7197265625, -35.30322265625, -33.88671875, -32.47021484375, -31.0537109375, -29.63720703125, -28.220703125, -26.80419921875, -25.3876953125, -23.97119140625, -22.5546875, -21.13818359375, -19.7216796875, -18.30517578125, -16.888671875, -15.47216796875, -14.0556640625, -12.63916015625, -11.22265625, -9.80615234375, -8.3896484375, -6.97314453125, -5.556640625, -4.14013671875, -2.7236328125, -1.30712890625, 0.109375, 1.52587890625, 2.9423828125, 4.35888671875, 5.775390625, 7.19189453125, 8.6083984375, 10.02490234375, 11.44140625, 12.85791015625, 14.2744140625, 15.69091796875, 17.107421875, 18.52392578125, 19.9404296875, 21.35693359375, 22.7734375, 24.18994140625, 25.6064453125, 27.02294921875, 28.439453125, 29.85595703125, 31.2724609375, 32.68896484375, 34.10546875, 35.52197265625, 36.9384765625, 38.35498046875, 39.771484375, 41.18798828125, 42.6044921875, 44.02099609375, 45.4375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 16.0, 27.0, 66.0, 104.0, 135.0, 164.0, 163.0, 125.0, 100.0, 52.0, 28.0, 11.0, 6.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.65625, -31.6650390625, -30.673828125, -29.6826171875, -28.69140625, -27.7001953125, -26.708984375, -25.7177734375, -24.7265625, -23.7353515625, -22.744140625, -21.7529296875, -20.76171875, -19.7705078125, -18.779296875, -17.7880859375, -16.796875, -15.8056640625, -14.814453125, -13.8232421875, -12.83203125, -11.8408203125, -10.849609375, -9.8583984375, -8.8671875, -7.8759765625, -6.884765625, -5.8935546875, -4.90234375, -3.9111328125, -2.919921875, -1.9287109375, -0.9375, 0.0537109375, 1.044921875, 2.0361328125, 3.02734375, 4.0185546875, 5.009765625, 6.0009765625, 6.9921875, 7.9833984375, 8.974609375, 9.9658203125, 10.95703125, 11.9482421875, 12.939453125, 13.9306640625, 14.921875, 15.9130859375, 16.904296875, 17.8955078125, 18.88671875, 19.8779296875, 20.869140625, 21.8603515625, 22.8515625, 23.8427734375, 24.833984375, 25.8251953125, 26.81640625, 27.8076171875, 28.798828125, 29.7900390625, 30.78125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 0.0, 2.0, 6.0, 13.0, 15.0, 16.0, 39.0, 40.0, 98.0, 158.0, 254.0, 522.0, 992.0, 1838.0, 3879.0, 16746.0, 3936742.0, 221046.0, 7307.0, 2372.0, 1098.0, 522.0, 258.0, 108.0, 78.0, 52.0, 29.0, 21.0, 6.0, 12.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.46875, -37.87744140625, -36.2861328125, -34.69482421875, -33.103515625, -31.51220703125, -29.9208984375, -28.32958984375, -26.73828125, -25.14697265625, -23.5556640625, -21.96435546875, -20.373046875, -18.78173828125, -17.1904296875, -15.59912109375, -14.0078125, -12.41650390625, -10.8251953125, -9.23388671875, -7.642578125, -6.05126953125, -4.4599609375, -2.86865234375, -1.27734375, 0.31396484375, 1.9052734375, 3.49658203125, 5.087890625, 6.67919921875, 8.2705078125, 9.86181640625, 11.453125, 13.04443359375, 14.6357421875, 16.22705078125, 17.818359375, 19.40966796875, 21.0009765625, 22.59228515625, 24.18359375, 25.77490234375, 27.3662109375, 28.95751953125, 30.548828125, 32.14013671875, 33.7314453125, 35.32275390625, 36.9140625, 38.50537109375, 40.0966796875, 41.68798828125, 43.279296875, 44.87060546875, 46.4619140625, 48.05322265625, 49.64453125, 51.23583984375, 52.8271484375, 54.41845703125, 56.009765625, 57.60107421875, 59.1923828125, 60.78369140625, 62.375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 6.0, 8.0, 23.0, 32.0, 208.0, 1489.0, 1908.0, 271.0, 74.0, 19.0, 13.0, 7.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.0, -74.05810546875, -72.1162109375, -70.17431640625, -68.232421875, -66.29052734375, -64.3486328125, -62.40673828125, -60.46484375, -58.52294921875, -56.5810546875, -54.63916015625, -52.697265625, -50.75537109375, -48.8134765625, -46.87158203125, -44.9296875, -42.98779296875, -41.0458984375, -39.10400390625, -37.162109375, -35.22021484375, -33.2783203125, -31.33642578125, -29.39453125, -27.45263671875, -25.5107421875, -23.56884765625, -21.626953125, -19.68505859375, -17.7431640625, -15.80126953125, -13.859375, -11.91748046875, -9.9755859375, -8.03369140625, -6.091796875, -4.14990234375, -2.2080078125, -0.26611328125, 1.67578125, 3.61767578125, 5.5595703125, 7.50146484375, 9.443359375, 11.38525390625, 13.3271484375, 15.26904296875, 17.2109375, 19.15283203125, 21.0947265625, 23.03662109375, 24.978515625, 26.92041015625, 28.8623046875, 30.80419921875, 32.74609375, 34.68798828125, 36.6298828125, 38.57177734375, 40.513671875, 42.45556640625, 44.3974609375, 46.33935546875, 48.28125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 11.0, 11.0, 30.0, 267.0, 590.0, 60.0, 15.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-927.4464111328125, -908.6227416992188, -889.7991333007812, -870.9754638671875, -852.15185546875, -833.3281860351562, -814.5045166015625, -795.680908203125, -776.8572387695312, -758.0335693359375, -739.2099609375, -720.3862915039062, -701.5626220703125, -682.739013671875, -663.9153442382812, -645.0916748046875, -626.26806640625, -607.4443969726562, -588.6207885742188, -569.797119140625, -550.9735107421875, -532.1498413085938, -513.326171875, -494.5025329589844, -475.67889404296875, -456.8552551269531, -438.0316162109375, -419.20794677734375, -400.3843078613281, -381.5606689453125, -362.73699951171875, -343.9133605957031, -325.08966064453125, -306.2660217285156, -287.4423828125, -268.61871337890625, -249.79507446289062, -230.971435546875, -212.1477813720703, -193.32412719726562, -174.50048828125, -155.67684936523438, -136.8531951904297, -118.02954864501953, -99.20590209960938, -80.38225555419922, -61.55860900878906, -42.734954833984375, -23.91131591796875, -5.087669372558594, 13.735977172851562, 32.55962371826172, 51.383270263671875, 70.20691680908203, 89.03056335449219, 107.85421752929688, 126.6778564453125, 145.50149536132812, 164.3251495361328, 183.1488037109375, 201.97244262695312, 220.79608154296875, 239.61973571777344, 258.4433898925781, 277.26702880859375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 11.0, 26.0, 30.0, 78.0, 75.0, 130.0, 137.0, 133.0, 132.0, 101.0, 63.0, 40.0, 21.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-261.275390625, -252.9762725830078, -244.6771697998047, -236.3780517578125, -228.0789337158203, -219.77981567382812, -211.480712890625, -203.1815948486328, -194.88247680664062, -186.58335876464844, -178.2842559814453, -169.98513793945312, -161.68601989746094, -153.38690185546875, -145.08779907226562, -136.78868103027344, -128.4895782470703, -120.19046783447266, -111.89134979248047, -103.59223937988281, -95.29312133789062, -86.99401092529297, -78.69490051269531, -70.39578247070312, -62.09667205810547, -53.79755783081055, -45.498443603515625, -37.19933319091797, -28.900218963623047, -20.601104736328125, -12.301994323730469, -4.002880096435547, 4.296234130859375, 12.59534740447998, 20.894460678100586, 29.193572998046875, 37.4926872253418, 45.79180145263672, 54.090911865234375, 62.3900260925293, 70.68914031982422, 78.98825073242188, 87.28736877441406, 95.58647918701172, 103.88558959960938, 112.18470764160156, 120.48381805419922, 128.78292846679688, 137.08204650878906, 145.38116455078125, 153.68026733398438, 161.97938537597656, 170.27850341796875, 178.57760620117188, 186.87672424316406, 195.17584228515625, 203.47494506835938, 211.77406311035156, 220.0731658935547, 228.37228393554688, 236.67140197753906, 244.97052001953125, 253.26962280273438, 261.5687255859375, 269.86785888671875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 4.0, 4.0, 11.0, 13.0, 11.0, 16.0, 27.0, 53.0, 84.0, 168.0, 298.0, 552.0, 1579.0, 10603.0, 358202.0, 655853.0, 17634.0, 2075.0, 663.0, 277.0, 154.0, 90.0, 76.0, 24.0, 21.0, 15.0, 13.0, 16.0, 6.0, 2.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.0625, -44.75, -43.4375, -42.125, -40.8125, -39.5, -38.1875, -36.875, -35.5625, -34.25, -32.9375, -31.625, -30.3125, -29.0, -27.6875, -26.375, -25.0625, -23.75, -22.4375, -21.125, -19.8125, -18.5, -17.1875, -15.875, -14.5625, -13.25, -11.9375, -10.625, -9.3125, -8.0, -6.6875, -5.375, -4.0625, -2.75, -1.4375, -0.125, 1.1875, 2.5, 3.8125, 5.125, 6.4375, 7.75, 9.0625, 10.375, 11.6875, 13.0, 14.3125, 15.625, 16.9375, 18.25, 19.5625, 20.875, 22.1875, 23.5, 24.8125, 26.125, 27.4375, 28.75, 30.0625, 31.375, 32.6875, 34.0, 35.3125, 36.625, 37.9375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 7.0, 27.0, 35.0, 70.0, 106.0, 156.0, 142.0, 155.0, 124.0, 85.0, 49.0, 26.0, 13.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.046875, -26.104736328125, -25.16259765625, -24.220458984375, -23.2783203125, -22.336181640625, -21.39404296875, -20.451904296875, -19.509765625, -18.567626953125, -17.62548828125, -16.683349609375, -15.7412109375, -14.799072265625, -13.85693359375, -12.914794921875, -11.97265625, -11.030517578125, -10.08837890625, -9.146240234375, -8.2041015625, -7.261962890625, -6.31982421875, -5.377685546875, -4.435546875, -3.493408203125, -2.55126953125, -1.609130859375, -0.6669921875, 0.275146484375, 1.21728515625, 2.159423828125, 3.1015625, 4.043701171875, 4.98583984375, 5.927978515625, 6.8701171875, 7.812255859375, 8.75439453125, 9.696533203125, 10.638671875, 11.580810546875, 12.52294921875, 13.465087890625, 14.4072265625, 15.349365234375, 16.29150390625, 17.233642578125, 18.17578125, 19.117919921875, 20.06005859375, 21.002197265625, 21.9443359375, 22.886474609375, 23.82861328125, 24.770751953125, 25.712890625, 26.655029296875, 27.59716796875, 28.539306640625, 29.4814453125, 30.423583984375, 31.36572265625, 32.307861328125, 33.25]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 10.0, 7.0, 16.0, 26.0, 25.0, 50.0, 91.0, 169.0, 382.0, 1055.0, 4184.0, 32903.0, 704183.0, 283897.0, 17211.0, 2882.0, 785.0, 298.0, 160.0, 75.0, 51.0, 24.0, 23.0, 13.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.79736328125, -29.8603515625, -28.92333984375, -27.986328125, -27.04931640625, -26.1123046875, -25.17529296875, -24.23828125, -23.30126953125, -22.3642578125, -21.42724609375, -20.490234375, -19.55322265625, -18.6162109375, -17.67919921875, -16.7421875, -15.80517578125, -14.8681640625, -13.93115234375, -12.994140625, -12.05712890625, -11.1201171875, -10.18310546875, -9.24609375, -8.30908203125, -7.3720703125, -6.43505859375, -5.498046875, -4.56103515625, -3.6240234375, -2.68701171875, -1.75, -0.81298828125, 0.1240234375, 1.06103515625, 1.998046875, 2.93505859375, 3.8720703125, 4.80908203125, 5.74609375, 6.68310546875, 7.6201171875, 8.55712890625, 9.494140625, 10.43115234375, 11.3681640625, 12.30517578125, 13.2421875, 14.17919921875, 15.1162109375, 16.05322265625, 16.990234375, 17.92724609375, 18.8642578125, 19.80126953125, 20.73828125, 21.67529296875, 22.6123046875, 23.54931640625, 24.486328125, 25.42333984375, 26.3603515625, 27.29736328125, 28.234375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 11.0, 10.0, 19.0, 18.0, 17.0, 22.0, 31.0, 36.0, 34.0, 35.0, 55.0, 52.0, 52.0, 46.0, 58.0, 50.0, 54.0, 52.0, 48.0, 53.0, 38.0, 37.0, 31.0, 26.0, 17.0, 24.0, 11.0, 13.0, 9.0, 7.0, 8.0, 5.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.71875, -39.598876953125, -38.47900390625, -37.359130859375, -36.2392578125, -35.119384765625, -33.99951171875, -32.879638671875, -31.759765625, -30.639892578125, -29.52001953125, -28.400146484375, -27.2802734375, -26.160400390625, -25.04052734375, -23.920654296875, -22.80078125, -21.680908203125, -20.56103515625, -19.441162109375, -18.3212890625, -17.201416015625, -16.08154296875, -14.961669921875, -13.841796875, -12.721923828125, -11.60205078125, -10.482177734375, -9.3623046875, -8.242431640625, -7.12255859375, -6.002685546875, -4.8828125, -3.762939453125, -2.64306640625, -1.523193359375, -0.4033203125, 0.716552734375, 1.83642578125, 2.956298828125, 4.076171875, 5.196044921875, 6.31591796875, 7.435791015625, 8.5556640625, 9.675537109375, 10.79541015625, 11.915283203125, 13.03515625, 14.155029296875, 15.27490234375, 16.394775390625, 17.5146484375, 18.634521484375, 19.75439453125, 20.874267578125, 21.994140625, 23.114013671875, 24.23388671875, 25.353759765625, 26.4736328125, 27.593505859375, 28.71337890625, 29.833251953125, 30.953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 8.0, 7.0, 12.0, 19.0, 17.0, 38.0, 56.0, 81.0, 185.0, 443.0, 1053.0, 3716.0, 18730.0, 227191.0, 744782.0, 42864.0, 6448.0, 1676.0, 560.0, 272.0, 132.0, 75.0, 46.0, 28.0, 14.0, 21.0, 12.0, 8.0, 9.0, 5.0, 9.0, 7.0, 8.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.6640625, -6.443359375, -6.22265625, -6.001953125, -5.78125, -5.560546875, -5.33984375, -5.119140625, -4.8984375, -4.677734375, -4.45703125, -4.236328125, -4.015625, -3.794921875, -3.57421875, -3.353515625, -3.1328125, -2.912109375, -2.69140625, -2.470703125, -2.25, -2.029296875, -1.80859375, -1.587890625, -1.3671875, -1.146484375, -0.92578125, -0.705078125, -0.484375, -0.263671875, -0.04296875, 0.177734375, 0.3984375, 0.619140625, 0.83984375, 1.060546875, 1.28125, 1.501953125, 1.72265625, 1.943359375, 2.1640625, 2.384765625, 2.60546875, 2.826171875, 3.046875, 3.267578125, 3.48828125, 3.708984375, 3.9296875, 4.150390625, 4.37109375, 4.591796875, 4.8125, 5.033203125, 5.25390625, 5.474609375, 5.6953125, 5.916015625, 6.13671875, 6.357421875, 6.578125, 6.798828125, 7.01953125, 7.240234375, 7.4609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 11.0, 15.0, 22.0, 30.0, 30.0, 50.0, 65.0, 126.0, 146.0, 154.0, 115.0, 77.0, 44.0, 35.0, 18.0, 11.0, 8.0, 5.0, 9.0, 3.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012359619140625, -0.0011984705924987793, -0.0011609792709350586, -0.0011234879493713379, -0.0010859966278076172, -0.0010485053062438965, -0.0010110139846801758, -0.0009735226631164551, -0.0009360313415527344, -0.0008985400199890137, -0.000861048698425293, -0.0008235573768615723, -0.0007860660552978516, -0.0007485747337341309, -0.0007110834121704102, -0.0006735920906066895, -0.0006361007690429688, -0.000598609447479248, -0.0005611181259155273, -0.0005236268043518066, -0.00048613548278808594, -0.00044864416122436523, -0.00041115283966064453, -0.00037366151809692383, -0.0003361701965332031, -0.0002986788749694824, -0.0002611875534057617, -0.00022369623184204102, -0.0001862049102783203, -0.0001487135887145996, -0.0001112222671508789, -7.37309455871582e-05, -3.62396240234375e-05, 1.2516975402832031e-06, 3.8743019104003906e-05, 7.623434066772461e-05, 0.00011372566223144531, 0.00015121698379516602, 0.00018870830535888672, 0.00022619962692260742, 0.0002636909484863281, 0.00030118227005004883, 0.00033867359161376953, 0.00037616491317749023, 0.00041365623474121094, 0.00045114755630493164, 0.0004886388778686523, 0.000526130199432373, 0.0005636215209960938, 0.0006011128425598145, 0.0006386041641235352, 0.0006760954856872559, 0.0007135868072509766, 0.0007510781288146973, 0.000788569450378418, 0.0008260607719421387, 0.0008635520935058594, 0.0009010434150695801, 0.0009385347366333008, 0.0009760260581970215, 0.0010135173797607422, 0.0010510087013244629, 0.0010885000228881836, 0.0011259913444519043, 0.001163482666015625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 8.0, 9.0, 11.0, 13.0, 32.0, 48.0, 87.0, 121.0, 273.0, 564.0, 1496.0, 4340.0, 18328.0, 201375.0, 760562.0, 48945.0, 8116.0, 2477.0, 908.0, 408.0, 166.0, 92.0, 49.0, 28.0, 24.0, 21.0, 10.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.37890625, -7.1500244140625, -6.921142578125, -6.6922607421875, -6.46337890625, -6.2344970703125, -6.005615234375, -5.7767333984375, -5.5478515625, -5.3189697265625, -5.090087890625, -4.8612060546875, -4.63232421875, -4.4034423828125, -4.174560546875, -3.9456787109375, -3.716796875, -3.4879150390625, -3.259033203125, -3.0301513671875, -2.80126953125, -2.5723876953125, -2.343505859375, -2.1146240234375, -1.8857421875, -1.6568603515625, -1.427978515625, -1.1990966796875, -0.97021484375, -0.7413330078125, -0.512451171875, -0.2835693359375, -0.0546875, 0.1741943359375, 0.403076171875, 0.6319580078125, 0.86083984375, 1.0897216796875, 1.318603515625, 1.5474853515625, 1.7763671875, 2.0052490234375, 2.234130859375, 2.4630126953125, 2.69189453125, 2.9207763671875, 3.149658203125, 3.3785400390625, 3.607421875, 3.8363037109375, 4.065185546875, 4.2940673828125, 4.52294921875, 4.7518310546875, 4.980712890625, 5.2095947265625, 5.4384765625, 5.6673583984375, 5.896240234375, 6.1251220703125, 6.35400390625, 6.5828857421875, 6.811767578125, 7.0406494140625, 7.26953125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 6.0, 7.0, 10.0, 18.0, 20.0, 33.0, 46.0, 71.0, 73.0, 107.0, 107.0, 116.0, 105.0, 70.0, 55.0, 39.0, 32.0, 28.0, 17.0, 8.0, 5.0, 5.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9375, -4.75408935546875, -4.5706787109375, -4.38726806640625, -4.203857421875, -4.02044677734375, -3.8370361328125, -3.65362548828125, -3.47021484375, -3.28680419921875, -3.1033935546875, -2.91998291015625, -2.736572265625, -2.55316162109375, -2.3697509765625, -2.18634033203125, -2.0029296875, -1.81951904296875, -1.6361083984375, -1.45269775390625, -1.269287109375, -1.08587646484375, -0.9024658203125, -0.71905517578125, -0.53564453125, -0.35223388671875, -0.1688232421875, 0.01458740234375, 0.197998046875, 0.38140869140625, 0.5648193359375, 0.74822998046875, 0.931640625, 1.11505126953125, 1.2984619140625, 1.48187255859375, 1.665283203125, 1.84869384765625, 2.0321044921875, 2.21551513671875, 2.39892578125, 2.58233642578125, 2.7657470703125, 2.94915771484375, 3.132568359375, 3.31597900390625, 3.4993896484375, 3.68280029296875, 3.8662109375, 4.04962158203125, 4.2330322265625, 4.41644287109375, 4.599853515625, 4.78326416015625, 4.9666748046875, 5.15008544921875, 5.33349609375, 5.51690673828125, 5.7003173828125, 5.88372802734375, 6.067138671875, 6.25054931640625, 6.4339599609375, 6.61737060546875, 6.80078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 12.0, 16.0, 149.0, 570.0, 197.0, 35.0, 10.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-261.16143798828125, -249.56187438964844, -237.96231079101562, -226.36276245117188, -214.76318359375, -203.16363525390625, -191.56407165527344, -179.96450805664062, -168.3649444580078, -156.765380859375, -145.1658172607422, -133.56625366210938, -121.9666976928711, -110.36713409423828, -98.767578125, -87.16801452636719, -75.56845092773438, -63.96888732910156, -52.369327545166016, -40.76976776123047, -29.170204162597656, -17.570640563964844, -5.9710845947265625, 5.62847900390625, 17.228042602539062, 28.827604293823242, 40.42716598510742, 52.02672576904297, 63.62628936767578, 75.2258529663086, 86.82540893554688, 98.42497253417969, 110.0245361328125, 121.62409973144531, 133.22366333007812, 144.82321166992188, 156.42279052734375, 168.0223388671875, 179.6219024658203, 191.22146606445312, 202.82102966308594, 214.42059326171875, 226.02015686035156, 237.61972045898438, 249.21926879882812, 260.81884765625, 272.41839599609375, 284.0179443359375, 295.6175231933594, 307.2170715332031, 318.816650390625, 330.41619873046875, 342.0157775878906, 353.6153259277344, 365.21490478515625, 376.814453125, 388.41400146484375, 400.0135498046875, 411.6131286621094, 423.2126770019531, 434.812255859375, 446.41180419921875, 458.0113525390625, 469.6109313964844, 481.21051025390625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 12.0, 14.0, 19.0, 15.0, 37.0, 38.0, 53.0, 51.0, 60.0, 92.0, 147.0, 113.0, 71.0, 45.0, 60.0, 37.0, 35.0, 24.0, 27.0, 14.0, 7.0, 15.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-184.95297241210938, -178.7249298095703, -172.4968719482422, -166.26882934570312, -160.04078674316406, -153.81272888183594, -147.58468627929688, -141.35662841796875, -135.1285858154297, -128.90054321289062, -122.67249298095703, -116.44444274902344, -110.21639251708984, -103.98834228515625, -97.76029968261719, -91.5322494506836, -85.30420684814453, -79.07615661621094, -72.84811401367188, -66.62006378173828, -60.39201354980469, -54.16396713256836, -47.93592071533203, -41.70787048339844, -35.47982406616211, -29.25177574157715, -23.023727416992188, -16.79568099975586, -10.567632675170898, -4.3395843505859375, 1.8884620666503906, 8.116512298583984, 14.344558715820312, 20.572607040405273, 26.800655364990234, 33.02870178222656, 39.256752014160156, 45.484798431396484, 51.71284484863281, 57.940895080566406, 64.1689453125, 70.3969955444336, 76.62503814697266, 82.85308837890625, 89.08113861083984, 95.30918884277344, 101.5372314453125, 107.7652816772461, 113.99332427978516, 120.22137451171875, 126.44941711425781, 132.67745971679688, 138.905517578125, 145.13356018066406, 151.36160278320312, 157.58966064453125, 163.8177032470703, 170.04574584960938, 176.2738037109375, 182.50184631347656, 188.72988891601562, 194.95794677734375, 201.1859893798828, 207.41403198242188, 213.64208984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 16.0, 20.0, 29.0, 48.0, 97.0, 151.0, 327.0, 620.0, 1386.0, 3357.0, 11404.0, 166375.0, 3812491.0, 184554.0, 9539.0, 2240.0, 846.0, 364.0, 184.0, 89.0, 38.0, 29.0, 21.0, 14.0, 7.0, 4.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.84375, -13.168701171875, -12.49365234375, -11.818603515625, -11.1435546875, -10.468505859375, -9.79345703125, -9.118408203125, -8.443359375, -7.768310546875, -7.09326171875, -6.418212890625, -5.7431640625, -5.068115234375, -4.39306640625, -3.718017578125, -3.04296875, -2.367919921875, -1.69287109375, -1.017822265625, -0.3427734375, 0.332275390625, 1.00732421875, 1.682373046875, 2.357421875, 3.032470703125, 3.70751953125, 4.382568359375, 5.0576171875, 5.732666015625, 6.40771484375, 7.082763671875, 7.7578125, 8.432861328125, 9.10791015625, 9.782958984375, 10.4580078125, 11.133056640625, 11.80810546875, 12.483154296875, 13.158203125, 13.833251953125, 14.50830078125, 15.183349609375, 15.8583984375, 16.533447265625, 17.20849609375, 17.883544921875, 18.55859375, 19.233642578125, 19.90869140625, 20.583740234375, 21.2587890625, 21.933837890625, 22.60888671875, 23.283935546875, 23.958984375, 24.634033203125, 25.30908203125, 25.984130859375, 26.6591796875, 27.334228515625, 28.00927734375, 28.684326171875, 29.359375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 10.0, 18.0, 48.0, 56.0, 90.0, 119.0, 125.0, 135.0, 120.0, 125.0, 75.0, 38.0, 18.0, 16.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5390625, -13.7840576171875, -13.029052734375, -12.2740478515625, -11.51904296875, -10.7640380859375, -10.009033203125, -9.2540283203125, -8.4990234375, -7.7440185546875, -6.989013671875, -6.2340087890625, -5.47900390625, -4.7239990234375, -3.968994140625, -3.2139892578125, -2.458984375, -1.7039794921875, -0.948974609375, -0.1939697265625, 0.56103515625, 1.3160400390625, 2.071044921875, 2.8260498046875, 3.5810546875, 4.3360595703125, 5.091064453125, 5.8460693359375, 6.60107421875, 7.3560791015625, 8.111083984375, 8.8660888671875, 9.62109375, 10.3760986328125, 11.131103515625, 11.8861083984375, 12.64111328125, 13.3961181640625, 14.151123046875, 14.9061279296875, 15.6611328125, 16.4161376953125, 17.171142578125, 17.9261474609375, 18.68115234375, 19.4361572265625, 20.191162109375, 20.9461669921875, 21.701171875, 22.4561767578125, 23.211181640625, 23.9661865234375, 24.72119140625, 25.4761962890625, 26.231201171875, 26.9862060546875, 27.7412109375, 28.4962158203125, 29.251220703125, 30.0062255859375, 30.76123046875, 31.5162353515625, 32.271240234375, 33.0262451171875, 33.78125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 3.0, 7.0, 10.0, 10.0, 19.0, 26.0, 31.0, 51.0, 103.0, 198.0, 564.0, 1861.0, 8956.0, 92127.0, 3744105.0, 325019.0, 16807.0, 2915.0, 849.0, 289.0, 114.0, 70.0, 42.0, 31.0, 24.0, 8.0, 8.0, 7.0, 11.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-22.671875, -22.08544921875, -21.4990234375, -20.91259765625, -20.326171875, -19.73974609375, -19.1533203125, -18.56689453125, -17.98046875, -17.39404296875, -16.8076171875, -16.22119140625, -15.634765625, -15.04833984375, -14.4619140625, -13.87548828125, -13.2890625, -12.70263671875, -12.1162109375, -11.52978515625, -10.943359375, -10.35693359375, -9.7705078125, -9.18408203125, -8.59765625, -8.01123046875, -7.4248046875, -6.83837890625, -6.251953125, -5.66552734375, -5.0791015625, -4.49267578125, -3.90625, -3.31982421875, -2.7333984375, -2.14697265625, -1.560546875, -0.97412109375, -0.3876953125, 0.19873046875, 0.78515625, 1.37158203125, 1.9580078125, 2.54443359375, 3.130859375, 3.71728515625, 4.3037109375, 4.89013671875, 5.4765625, 6.06298828125, 6.6494140625, 7.23583984375, 7.822265625, 8.40869140625, 8.9951171875, 9.58154296875, 10.16796875, 10.75439453125, 11.3408203125, 11.92724609375, 12.513671875, 13.10009765625, 13.6865234375, 14.27294921875, 14.859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 7.0, 6.0, 11.0, 9.0, 13.0, 15.0, 27.0, 40.0, 75.0, 174.0, 268.0, 494.0, 692.0, 792.0, 576.0, 363.0, 184.0, 102.0, 64.0, 41.0, 31.0, 20.0, 20.0, 15.0, 8.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2265625, -12.7896728515625, -12.352783203125, -11.9158935546875, -11.47900390625, -11.0421142578125, -10.605224609375, -10.1683349609375, -9.7314453125, -9.2945556640625, -8.857666015625, -8.4207763671875, -7.98388671875, -7.5469970703125, -7.110107421875, -6.6732177734375, -6.236328125, -5.7994384765625, -5.362548828125, -4.9256591796875, -4.48876953125, -4.0518798828125, -3.614990234375, -3.1781005859375, -2.7412109375, -2.3043212890625, -1.867431640625, -1.4305419921875, -0.99365234375, -0.5567626953125, -0.119873046875, 0.3170166015625, 0.75390625, 1.1907958984375, 1.627685546875, 2.0645751953125, 2.50146484375, 2.9383544921875, 3.375244140625, 3.8121337890625, 4.2490234375, 4.6859130859375, 5.122802734375, 5.5596923828125, 5.99658203125, 6.4334716796875, 6.870361328125, 7.3072509765625, 7.744140625, 8.1810302734375, 8.617919921875, 9.0548095703125, 9.49169921875, 9.9285888671875, 10.365478515625, 10.8023681640625, 11.2392578125, 11.6761474609375, 12.113037109375, 12.5499267578125, 12.98681640625, 13.4237060546875, 13.860595703125, 14.2974853515625, 14.734375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 11.0, 45.0, 310.0, 503.0, 114.0, 15.0, 11.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.47637939453125, -191.0307159423828, -181.58506774902344, -172.139404296875, -162.69375610351562, -153.2480926513672, -143.80242919921875, -134.35678100585938, -124.91112518310547, -115.46546936035156, -106.01981353759766, -96.57415771484375, -87.12849426269531, -77.68284606933594, -68.2371826171875, -58.791526794433594, -49.34587097167969, -39.90021514892578, -30.454557418823242, -21.008899688720703, -11.563243865966797, -2.1175880432128906, 7.328071594238281, 16.773727416992188, 26.219383239746094, 35.6650390625, 45.110694885253906, 54.55635452270508, 64.00201416015625, 73.44766235351562, 82.89332580566406, 92.33898162841797, 101.78463745117188, 111.23029327392578, 120.67594909667969, 130.12161254882812, 139.5672607421875, 149.01292419433594, 158.45858764648438, 167.90423583984375, 177.34988403320312, 186.79554748535156, 196.24119567871094, 205.68685913085938, 215.13250732421875, 224.5781707763672, 234.02383422851562, 243.469482421875, 252.91514587402344, 262.3608093261719, 271.80645751953125, 281.2521057128906, 290.6977844238281, 300.1434326171875, 309.5890808105469, 319.03472900390625, 328.48040771484375, 337.9260559082031, 347.3717346191406, 356.8173828125, 366.2630310058594, 375.70867919921875, 385.15435791015625, 394.6000061035156, 404.045654296875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 5.0, 7.0, 4.0, 8.0, 9.0, 15.0, 22.0, 18.0, 26.0, 31.0, 31.0, 42.0, 41.0, 44.0, 55.0, 47.0, 46.0, 50.0, 58.0, 48.0, 47.0, 54.0, 37.0, 37.0, 38.0, 40.0, 23.0, 16.0, 23.0, 27.0, 9.0, 14.0, 10.0, 3.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.53143310546875, -57.66530227661133, -55.79916763305664, -53.93303680419922, -52.06690216064453, -50.20077133178711, -48.33464050292969, -46.468505859375, -44.60237503051758, -42.736244201660156, -40.87010955810547, -39.00397872924805, -37.13784408569336, -35.27171325683594, -33.40557861328125, -31.539447784423828, -29.673315048217773, -27.80718231201172, -25.941049575805664, -24.07491683959961, -22.208786010742188, -20.342653274536133, -18.476520538330078, -16.610389709472656, -14.744256019592285, -12.87812328338623, -11.011991500854492, -9.145858764648438, -7.279726505279541, -5.4135942459106445, -3.54746150970459, -1.6813297271728516, 0.18480300903320312, 2.0509352684020996, 3.917067766189575, 5.783200263977051, 7.649332523345947, 9.515464782714844, 11.381597518920898, 13.247729301452637, 15.113862037658691, 16.97999382019043, 18.846126556396484, 20.71225929260254, 22.578392028808594, 24.444522857666016, 26.310657501220703, 28.176788330078125, 30.04292106628418, 31.909053802490234, 33.775184631347656, 35.641319274902344, 37.507450103759766, 39.37358093261719, 41.239715576171875, 43.1058464050293, 44.971981048583984, 46.838111877441406, 48.704246520996094, 50.570377349853516, 52.4365119934082, 54.302642822265625, 56.16877746582031, 58.034908294677734, 59.901039123535156]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 11.0, 8.0, 19.0, 18.0, 24.0, 42.0, 48.0, 84.0, 140.0, 254.0, 499.0, 1398.0, 6419.0, 87060.0, 872321.0, 72132.0, 5708.0, 1315.0, 450.0, 227.0, 128.0, 84.0, 55.0, 29.0, 13.0, 18.0, 13.0, 10.0, 8.0, 6.0, 3.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.765625, -27.718505859375, -26.67138671875, -25.624267578125, -24.5771484375, -23.530029296875, -22.48291015625, -21.435791015625, -20.388671875, -19.341552734375, -18.29443359375, -17.247314453125, -16.2001953125, -15.153076171875, -14.10595703125, -13.058837890625, -12.01171875, -10.964599609375, -9.91748046875, -8.870361328125, -7.8232421875, -6.776123046875, -5.72900390625, -4.681884765625, -3.634765625, -2.587646484375, -1.54052734375, -0.493408203125, 0.5537109375, 1.600830078125, 2.64794921875, 3.695068359375, 4.7421875, 5.789306640625, 6.83642578125, 7.883544921875, 8.9306640625, 9.977783203125, 11.02490234375, 12.072021484375, 13.119140625, 14.166259765625, 15.21337890625, 16.260498046875, 17.3076171875, 18.354736328125, 19.40185546875, 20.448974609375, 21.49609375, 22.543212890625, 23.59033203125, 24.637451171875, 25.6845703125, 26.731689453125, 27.77880859375, 28.825927734375, 29.873046875, 30.920166015625, 31.96728515625, 33.014404296875, 34.0615234375, 35.108642578125, 36.15576171875, 37.202880859375, 38.25]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 13.0, 25.0, 43.0, 48.0, 91.0, 119.0, 134.0, 143.0, 115.0, 101.0, 72.0, 52.0, 21.0, 13.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5625, -13.80615234375, -13.0498046875, -12.29345703125, -11.537109375, -10.78076171875, -10.0244140625, -9.26806640625, -8.51171875, -7.75537109375, -6.9990234375, -6.24267578125, -5.486328125, -4.72998046875, -3.9736328125, -3.21728515625, -2.4609375, -1.70458984375, -0.9482421875, -0.19189453125, 0.564453125, 1.32080078125, 2.0771484375, 2.83349609375, 3.58984375, 4.34619140625, 5.1025390625, 5.85888671875, 6.615234375, 7.37158203125, 8.1279296875, 8.88427734375, 9.640625, 10.39697265625, 11.1533203125, 11.90966796875, 12.666015625, 13.42236328125, 14.1787109375, 14.93505859375, 15.69140625, 16.44775390625, 17.2041015625, 17.96044921875, 18.716796875, 19.47314453125, 20.2294921875, 20.98583984375, 21.7421875, 22.49853515625, 23.2548828125, 24.01123046875, 24.767578125, 25.52392578125, 26.2802734375, 27.03662109375, 27.79296875, 28.54931640625, 29.3056640625, 30.06201171875, 30.818359375, 31.57470703125, 32.3310546875, 33.08740234375, 33.84375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 8.0, 8.0, 8.0, 1.0, 7.0, 8.0, 7.0, 17.0, 18.0, 29.0, 31.0, 47.0, 80.0, 118.0, 211.0, 501.0, 1365.0, 5417.0, 71528.0, 931744.0, 31546.0, 3783.0, 1083.0, 426.0, 206.0, 118.0, 75.0, 32.0, 30.0, 30.0, 17.0, 12.0, 11.0, 10.0, 6.0, 4.0, 5.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.125, -37.83740234375, -36.5498046875, -35.26220703125, -33.974609375, -32.68701171875, -31.3994140625, -30.11181640625, -28.82421875, -27.53662109375, -26.2490234375, -24.96142578125, -23.673828125, -22.38623046875, -21.0986328125, -19.81103515625, -18.5234375, -17.23583984375, -15.9482421875, -14.66064453125, -13.373046875, -12.08544921875, -10.7978515625, -9.51025390625, -8.22265625, -6.93505859375, -5.6474609375, -4.35986328125, -3.072265625, -1.78466796875, -0.4970703125, 0.79052734375, 2.078125, 3.36572265625, 4.6533203125, 5.94091796875, 7.228515625, 8.51611328125, 9.8037109375, 11.09130859375, 12.37890625, 13.66650390625, 14.9541015625, 16.24169921875, 17.529296875, 18.81689453125, 20.1044921875, 21.39208984375, 22.6796875, 23.96728515625, 25.2548828125, 26.54248046875, 27.830078125, 29.11767578125, 30.4052734375, 31.69287109375, 32.98046875, 34.26806640625, 35.5556640625, 36.84326171875, 38.130859375, 39.41845703125, 40.7060546875, 41.99365234375, 43.28125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 1.0, 6.0, 4.0, 10.0, 11.0, 11.0, 11.0, 16.0, 23.0, 29.0, 32.0, 42.0, 45.0, 41.0, 45.0, 70.0, 57.0, 52.0, 56.0, 49.0, 44.0, 50.0, 44.0, 37.0, 36.0, 28.0, 25.0, 22.0, 17.0, 15.0, 15.0, 14.0, 9.0, 8.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.0625, -33.9638671875, -32.865234375, -31.7666015625, -30.66796875, -29.5693359375, -28.470703125, -27.3720703125, -26.2734375, -25.1748046875, -24.076171875, -22.9775390625, -21.87890625, -20.7802734375, -19.681640625, -18.5830078125, -17.484375, -16.3857421875, -15.287109375, -14.1884765625, -13.08984375, -11.9912109375, -10.892578125, -9.7939453125, -8.6953125, -7.5966796875, -6.498046875, -5.3994140625, -4.30078125, -3.2021484375, -2.103515625, -1.0048828125, 0.09375, 1.1923828125, 2.291015625, 3.3896484375, 4.48828125, 5.5869140625, 6.685546875, 7.7841796875, 8.8828125, 9.9814453125, 11.080078125, 12.1787109375, 13.27734375, 14.3759765625, 15.474609375, 16.5732421875, 17.671875, 18.7705078125, 19.869140625, 20.9677734375, 22.06640625, 23.1650390625, 24.263671875, 25.3623046875, 26.4609375, 27.5595703125, 28.658203125, 29.7568359375, 30.85546875, 31.9541015625, 33.052734375, 34.1513671875, 35.25]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 4.0, 13.0, 9.0, 6.0, 15.0, 26.0, 25.0, 26.0, 57.0, 96.0, 163.0, 385.0, 926.0, 2693.0, 12179.0, 907826.0, 114416.0, 6597.0, 1755.0, 651.0, 268.0, 138.0, 84.0, 48.0, 39.0, 22.0, 22.0, 13.0, 14.0, 4.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-15.484375, -15.0638427734375, -14.643310546875, -14.2227783203125, -13.80224609375, -13.3817138671875, -12.961181640625, -12.5406494140625, -12.1201171875, -11.6995849609375, -11.279052734375, -10.8585205078125, -10.43798828125, -10.0174560546875, -9.596923828125, -9.1763916015625, -8.755859375, -8.3353271484375, -7.914794921875, -7.4942626953125, -7.07373046875, -6.6531982421875, -6.232666015625, -5.8121337890625, -5.3916015625, -4.9710693359375, -4.550537109375, -4.1300048828125, -3.70947265625, -3.2889404296875, -2.868408203125, -2.4478759765625, -2.02734375, -1.6068115234375, -1.186279296875, -0.7657470703125, -0.34521484375, 0.0753173828125, 0.495849609375, 0.9163818359375, 1.3369140625, 1.7574462890625, 2.177978515625, 2.5985107421875, 3.01904296875, 3.4395751953125, 3.860107421875, 4.2806396484375, 4.701171875, 5.1217041015625, 5.542236328125, 5.9627685546875, 6.38330078125, 6.8038330078125, 7.224365234375, 7.6448974609375, 8.0654296875, 8.4859619140625, 8.906494140625, 9.3270263671875, 9.74755859375, 10.1680908203125, 10.588623046875, 11.0091552734375, 11.4296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 8.0, 10.0, 21.0, 30.0, 78.0, 230.0, 338.0, 142.0, 61.0, 22.0, 19.0, 13.0, 6.0, 4.0, 5.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00201416015625, -0.0019429028034210205, -0.001871645450592041, -0.0018003880977630615, -0.001729130744934082, -0.0016578733921051025, -0.001586616039276123, -0.0015153586864471436, -0.001444101333618164, -0.0013728439807891846, -0.001301586627960205, -0.0012303292751312256, -0.001159071922302246, -0.0010878145694732666, -0.0010165572166442871, -0.0009452998638153076, -0.0008740425109863281, -0.0008027851581573486, -0.0007315278053283691, -0.0006602704524993896, -0.0005890130996704102, -0.0005177557468414307, -0.00044649839401245117, -0.0003752410411834717, -0.0003039836883544922, -0.0002327263355255127, -0.0001614689826965332, -9.021162986755371e-05, -1.895427703857422e-05, 5.2303075790405273e-05, 0.00012356042861938477, 0.00019481778144836426, 0.00026607513427734375, 0.00033733248710632324, 0.00040858983993530273, 0.0004798471927642822, 0.0005511045455932617, 0.0006223618984222412, 0.0006936192512512207, 0.0007648766040802002, 0.0008361339569091797, 0.0009073913097381592, 0.0009786486625671387, 0.0010499060153961182, 0.0011211633682250977, 0.0011924207210540771, 0.0012636780738830566, 0.0013349354267120361, 0.0014061927795410156, 0.0014774501323699951, 0.0015487074851989746, 0.001619964838027954, 0.0016912221908569336, 0.001762479543685913, 0.0018337368965148926, 0.001904994249343872, 0.0019762516021728516, 0.002047508955001831, 0.0021187663078308105, 0.00219002366065979, 0.0022612810134887695, 0.002332538366317749, 0.0024037957191467285, 0.002475053071975708, 0.0025463104248046875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 7.0, 6.0, 8.0, 8.0, 12.0, 15.0, 24.0, 16.0, 23.0, 38.0, 49.0, 99.0, 125.0, 224.0, 404.0, 768.0, 1477.0, 3584.0, 11454.0, 112349.0, 870315.0, 35550.0, 6906.0, 2552.0, 1133.0, 553.0, 286.0, 190.0, 113.0, 60.0, 48.0, 46.0, 27.0, 14.0, 19.0, 11.0, 10.0, 9.0, 7.0, 8.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.6015625, -7.3507080078125, -7.099853515625, -6.8489990234375, -6.59814453125, -6.3472900390625, -6.096435546875, -5.8455810546875, -5.5947265625, -5.3438720703125, -5.093017578125, -4.8421630859375, -4.59130859375, -4.3404541015625, -4.089599609375, -3.8387451171875, -3.587890625, -3.3370361328125, -3.086181640625, -2.8353271484375, -2.58447265625, -2.3336181640625, -2.082763671875, -1.8319091796875, -1.5810546875, -1.3302001953125, -1.079345703125, -0.8284912109375, -0.57763671875, -0.3267822265625, -0.075927734375, 0.1749267578125, 0.42578125, 0.6766357421875, 0.927490234375, 1.1783447265625, 1.42919921875, 1.6800537109375, 1.930908203125, 2.1817626953125, 2.4326171875, 2.6834716796875, 2.934326171875, 3.1851806640625, 3.43603515625, 3.6868896484375, 3.937744140625, 4.1885986328125, 4.439453125, 4.6903076171875, 4.941162109375, 5.1920166015625, 5.44287109375, 5.6937255859375, 5.944580078125, 6.1954345703125, 6.4462890625, 6.6971435546875, 6.947998046875, 7.1988525390625, 7.44970703125, 7.7005615234375, 7.951416015625, 8.2022705078125, 8.453125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 1.0, 0.0, 5.0, 2.0, 10.0, 36.0, 82.0, 358.0, 359.0, 92.0, 27.0, 13.0, 7.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.65625, -24.9619140625, -24.267578125, -23.5732421875, -22.87890625, -22.1845703125, -21.490234375, -20.7958984375, -20.1015625, -19.4072265625, -18.712890625, -18.0185546875, -17.32421875, -16.6298828125, -15.935546875, -15.2412109375, -14.546875, -13.8525390625, -13.158203125, -12.4638671875, -11.76953125, -11.0751953125, -10.380859375, -9.6865234375, -8.9921875, -8.2978515625, -7.603515625, -6.9091796875, -6.21484375, -5.5205078125, -4.826171875, -4.1318359375, -3.4375, -2.7431640625, -2.048828125, -1.3544921875, -0.66015625, 0.0341796875, 0.728515625, 1.4228515625, 2.1171875, 2.8115234375, 3.505859375, 4.2001953125, 4.89453125, 5.5888671875, 6.283203125, 6.9775390625, 7.671875, 8.3662109375, 9.060546875, 9.7548828125, 10.44921875, 11.1435546875, 11.837890625, 12.5322265625, 13.2265625, 13.9208984375, 14.615234375, 15.3095703125, 16.00390625, 16.6982421875, 17.392578125, 18.0869140625, 18.78125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 1.0, 10.0, 31.0, 78.0, 412.0, 355.0, 78.0, 12.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-403.9385070800781, -393.5765686035156, -383.2146301269531, -372.85272216796875, -362.49078369140625, -352.12884521484375, -341.76690673828125, -331.40496826171875, -321.0430603027344, -310.6811218261719, -300.3191833496094, -289.957275390625, -279.5953369140625, -269.2333984375, -258.8714599609375, -248.50953674316406, -238.14759826660156, -227.78565979003906, -217.42373657226562, -207.06179809570312, -196.6998748779297, -186.3379364013672, -175.97601318359375, -165.61407470703125, -155.25213623046875, -144.89019775390625, -134.5282745361328, -124.16633605957031, -113.80441284179688, -103.44247436523438, -93.0805435180664, -82.71861267089844, -72.356689453125, -61.99475860595703, -51.63282775878906, -41.27089309692383, -30.90896224975586, -20.54703140258789, -10.185096740722656, 0.1768341064453125, 10.538764953613281, 20.90069580078125, 31.26262855529785, 41.62456130981445, 51.98649215698242, 62.34842300415039, 72.71035766601562, 83.0722885131836, 93.43421936035156, 103.79615020751953, 114.1580810546875, 124.52001953125, 134.88194274902344, 145.24388122558594, 155.60580444335938, 165.96774291992188, 176.32968139648438, 186.69161987304688, 197.0535430908203, 207.4154815673828, 217.77740478515625, 228.13934326171875, 238.50128173828125, 248.8632049560547, 259.2251281738281]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 11.0, 11.0, 24.0, 26.0, 22.0, 25.0, 36.0, 37.0, 41.0, 52.0, 54.0, 141.0, 113.0, 84.0, 67.0, 39.0, 44.0, 34.0, 38.0, 26.0, 17.0, 10.0, 19.0, 10.0, 4.0, 8.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.90231323242188, -174.29664611816406, -168.69097900390625, -163.08531188964844, -157.47964477539062, -151.8739776611328, -146.268310546875, -140.66265869140625, -135.05697631835938, -129.45130920410156, -123.84564208984375, -118.23997497558594, -112.63430786132812, -107.02864074707031, -101.42298126220703, -95.81731414794922, -90.21165466308594, -84.60598754882812, -79.00032043457031, -73.3946533203125, -67.78898620605469, -62.18332290649414, -56.577659606933594, -50.97199249267578, -45.36632537841797, -39.760658264160156, -34.154991149902344, -28.549327850341797, -22.943660736083984, -17.337993621826172, -11.732330322265625, -6.1266632080078125, -0.52099609375, 5.084670066833496, 10.690336227416992, 16.296001434326172, 21.901668548583984, 27.507335662841797, 33.112998962402344, 38.718666076660156, 44.32433319091797, 49.93000030517578, 55.535667419433594, 61.14133071899414, 66.74699401855469, 72.3526611328125, 77.95832824707031, 83.56399536132812, 89.16966247558594, 94.77532958984375, 100.38099670410156, 105.98666381835938, 111.59233093261719, 117.197998046875, 122.80365753173828, 128.40933227539062, 134.01498413085938, 139.6206512451172, 145.226318359375, 150.8319854736328, 156.43765258789062, 162.04331970214844, 167.64898681640625, 173.254638671875, 178.86032104492188]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 12.0, 10.0, 13.0, 3.0, 21.0, 25.0, 50.0, 76.0, 130.0, 158.0, 308.0, 464.0, 800.0, 1334.0, 2605.0, 6486.0, 24880.0, 290221.0, 3248684.0, 576112.0, 31850.0, 6115.0, 2075.0, 789.0, 428.0, 233.0, 116.0, 81.0, 58.0, 46.0, 21.0, 22.0, 6.0, 13.0, 5.0, 6.0, 9.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.390625, -13.9351806640625, -13.479736328125, -13.0242919921875, -12.56884765625, -12.1134033203125, -11.657958984375, -11.2025146484375, -10.7470703125, -10.2916259765625, -9.836181640625, -9.3807373046875, -8.92529296875, -8.4698486328125, -8.014404296875, -7.5589599609375, -7.103515625, -6.6480712890625, -6.192626953125, -5.7371826171875, -5.28173828125, -4.8262939453125, -4.370849609375, -3.9154052734375, -3.4599609375, -3.0045166015625, -2.549072265625, -2.0936279296875, -1.63818359375, -1.1827392578125, -0.727294921875, -0.2718505859375, 0.18359375, 0.6390380859375, 1.094482421875, 1.5499267578125, 2.00537109375, 2.4608154296875, 2.916259765625, 3.3717041015625, 3.8271484375, 4.2825927734375, 4.738037109375, 5.1934814453125, 5.64892578125, 6.1043701171875, 6.559814453125, 7.0152587890625, 7.470703125, 7.9261474609375, 8.381591796875, 8.8370361328125, 9.29248046875, 9.7479248046875, 10.203369140625, 10.6588134765625, 11.1142578125, 11.5697021484375, 12.025146484375, 12.4805908203125, 12.93603515625, 13.3914794921875, 13.846923828125, 14.3023681640625, 14.7578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 11.0, 23.0, 34.0, 44.0, 54.0, 95.0, 104.0, 96.0, 105.0, 119.0, 105.0, 61.0, 49.0, 47.0, 23.0, 12.0, 11.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.5546875, -11.9388427734375, -11.322998046875, -10.7071533203125, -10.09130859375, -9.4754638671875, -8.859619140625, -8.2437744140625, -7.6279296875, -7.0120849609375, -6.396240234375, -5.7803955078125, -5.16455078125, -4.5487060546875, -3.932861328125, -3.3170166015625, -2.701171875, -2.0853271484375, -1.469482421875, -0.8536376953125, -0.23779296875, 0.3780517578125, 0.993896484375, 1.6097412109375, 2.2255859375, 2.8414306640625, 3.457275390625, 4.0731201171875, 4.68896484375, 5.3048095703125, 5.920654296875, 6.5364990234375, 7.15234375, 7.7681884765625, 8.384033203125, 8.9998779296875, 9.61572265625, 10.2315673828125, 10.847412109375, 11.4632568359375, 12.0791015625, 12.6949462890625, 13.310791015625, 13.9266357421875, 14.54248046875, 15.1583251953125, 15.774169921875, 16.3900146484375, 17.005859375, 17.6217041015625, 18.237548828125, 18.8533935546875, 19.46923828125, 20.0850830078125, 20.700927734375, 21.3167724609375, 21.9326171875, 22.5484619140625, 23.164306640625, 23.7801513671875, 24.39599609375, 25.0118408203125, 25.627685546875, 26.2435302734375, 26.859375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 6.0, 13.0, 6.0, 17.0, 24.0, 22.0, 59.0, 78.0, 164.0, 328.0, 892.0, 3734.0, 20887.0, 610998.0, 3483403.0, 63503.0, 7290.0, 1787.0, 482.0, 235.0, 116.0, 74.0, 37.0, 31.0, 26.0, 18.0, 7.0, 11.0, 5.0, 8.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.4375, -19.857177734375, -19.27685546875, -18.696533203125, -18.1162109375, -17.535888671875, -16.95556640625, -16.375244140625, -15.794921875, -15.214599609375, -14.63427734375, -14.053955078125, -13.4736328125, -12.893310546875, -12.31298828125, -11.732666015625, -11.15234375, -10.572021484375, -9.99169921875, -9.411376953125, -8.8310546875, -8.250732421875, -7.67041015625, -7.090087890625, -6.509765625, -5.929443359375, -5.34912109375, -4.768798828125, -4.1884765625, -3.608154296875, -3.02783203125, -2.447509765625, -1.8671875, -1.286865234375, -0.70654296875, -0.126220703125, 0.4541015625, 1.034423828125, 1.61474609375, 2.195068359375, 2.775390625, 3.355712890625, 3.93603515625, 4.516357421875, 5.0966796875, 5.677001953125, 6.25732421875, 6.837646484375, 7.41796875, 7.998291015625, 8.57861328125, 9.158935546875, 9.7392578125, 10.319580078125, 10.89990234375, 11.480224609375, 12.060546875, 12.640869140625, 13.22119140625, 13.801513671875, 14.3818359375, 14.962158203125, 15.54248046875, 16.122802734375, 16.703125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 7.0, 5.0, 19.0, 17.0, 31.0, 40.0, 72.0, 105.0, 213.0, 387.0, 662.0, 827.0, 645.0, 456.0, 240.0, 117.0, 72.0, 39.0, 29.0, 23.0, 16.0, 12.0, 5.0, 9.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-19.25, -18.7645263671875, -18.279052734375, -17.7935791015625, -17.30810546875, -16.8226318359375, -16.337158203125, -15.8516845703125, -15.3662109375, -14.8807373046875, -14.395263671875, -13.9097900390625, -13.42431640625, -12.9388427734375, -12.453369140625, -11.9678955078125, -11.482421875, -10.9969482421875, -10.511474609375, -10.0260009765625, -9.54052734375, -9.0550537109375, -8.569580078125, -8.0841064453125, -7.5986328125, -7.1131591796875, -6.627685546875, -6.1422119140625, -5.65673828125, -5.1712646484375, -4.685791015625, -4.2003173828125, -3.71484375, -3.2293701171875, -2.743896484375, -2.2584228515625, -1.77294921875, -1.2874755859375, -0.802001953125, -0.3165283203125, 0.1689453125, 0.6544189453125, 1.139892578125, 1.6253662109375, 2.11083984375, 2.5963134765625, 3.081787109375, 3.5672607421875, 4.052734375, 4.5382080078125, 5.023681640625, 5.5091552734375, 5.99462890625, 6.4801025390625, 6.965576171875, 7.4510498046875, 7.9365234375, 8.4219970703125, 8.907470703125, 9.3929443359375, 9.87841796875, 10.3638916015625, 10.849365234375, 11.3348388671875, 11.8203125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 8.0, 7.0, 15.0, 34.0, 70.0, 129.0, 180.0, 209.0, 162.0, 86.0, 35.0, 23.0, 15.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-134.03045654296875, -130.5371856689453, -127.04390716552734, -123.5506362915039, -120.05736541748047, -116.5640869140625, -113.07081604003906, -109.57754516601562, -106.08427429199219, -102.59100341796875, -99.09772491455078, -95.60445404052734, -92.1111831665039, -88.61790466308594, -85.1246337890625, -81.63136291503906, -78.13809204101562, -74.64482116699219, -71.15154266357422, -67.65827178955078, -64.16500091552734, -60.67172622680664, -57.17845153808594, -53.6851806640625, -50.19190216064453, -46.69862747192383, -43.20535659790039, -39.71208190917969, -36.21881103515625, -32.72553634643555, -29.232263565063477, -25.738990783691406, -22.24571990966797, -18.7524471282959, -15.259174346923828, -11.765900611877441, -8.272627830505371, -4.779354095458984, -1.286081314086914, 2.2071914672851562, 5.700464248657227, 9.193737030029297, 12.687009811401367, 16.180282592773438, 19.67355728149414, 23.16683006286621, 26.66010284423828, 30.15337562561035, 33.64664840698242, 37.139923095703125, 40.63319396972656, 44.126468658447266, 47.6197395324707, 51.113014221191406, 54.606285095214844, 58.09955978393555, 61.59283447265625, 65.08610534667969, 68.57938385009766, 72.0726547241211, 75.56592559814453, 79.0592041015625, 82.55247497558594, 86.04574584960938, 89.53901672363281]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 9.0, 13.0, 9.0, 10.0, 12.0, 13.0, 21.0, 22.0, 22.0, 33.0, 32.0, 37.0, 36.0, 28.0, 29.0, 53.0, 41.0, 41.0, 35.0, 57.0, 37.0, 46.0, 41.0, 36.0, 39.0, 32.0, 36.0, 26.0, 25.0, 23.0, 16.0, 18.0, 7.0, 9.0, 14.0, 6.0, 8.0, 6.0, 5.0, 2.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0], "bins": [-53.862239837646484, -52.25047302246094, -50.63870620727539, -49.026939392089844, -47.41516876220703, -45.80340576171875, -44.19163513183594, -42.57986831665039, -40.968101501464844, -39.3563346862793, -37.74456787109375, -36.1328010559082, -34.521034240722656, -32.909263610839844, -31.297496795654297, -29.68572998046875, -28.073963165283203, -26.462196350097656, -24.85042953491211, -23.23866081237793, -21.626893997192383, -20.015127182006836, -18.403358459472656, -16.79159164428711, -15.179824829101562, -13.568058013916016, -11.956290245056152, -10.344522476196289, -8.732755661010742, -7.120988845825195, -5.509221076965332, -3.8974533081054688, -2.2856826782226562, -0.6739153861999512, 0.9378519058227539, 2.549619197845459, 4.161386489868164, 5.773153305053711, 7.384921073913574, 8.996688842773438, 10.608455657958984, 12.220222473144531, 13.831990242004395, 15.443758010864258, 17.055524826049805, 18.66729164123535, 20.27906036376953, 21.890827178955078, 23.502593994140625, 25.114360809326172, 26.72612762451172, 28.3378963470459, 29.949663162231445, 31.561429977416992, 33.17319869995117, 34.78496551513672, 36.396732330322266, 38.00849914550781, 39.62026596069336, 41.232032775878906, 42.84380340576172, 44.45556640625, 46.06733703613281, 47.67910385131836, 49.290870666503906]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 10.0, 16.0, 19.0, 29.0, 51.0, 106.0, 175.0, 310.0, 798.0, 2921.0, 23544.0, 610054.0, 390748.0, 16206.0, 2256.0, 652.0, 264.0, 156.0, 69.0, 56.0, 41.0, 25.0, 11.0, 12.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.75, -37.60791015625, -36.4658203125, -35.32373046875, -34.181640625, -33.03955078125, -31.8974609375, -30.75537109375, -29.61328125, -28.47119140625, -27.3291015625, -26.18701171875, -25.044921875, -23.90283203125, -22.7607421875, -21.61865234375, -20.4765625, -19.33447265625, -18.1923828125, -17.05029296875, -15.908203125, -14.76611328125, -13.6240234375, -12.48193359375, -11.33984375, -10.19775390625, -9.0556640625, -7.91357421875, -6.771484375, -5.62939453125, -4.4873046875, -3.34521484375, -2.203125, -1.06103515625, 0.0810546875, 1.22314453125, 2.365234375, 3.50732421875, 4.6494140625, 5.79150390625, 6.93359375, 8.07568359375, 9.2177734375, 10.35986328125, 11.501953125, 12.64404296875, 13.7861328125, 14.92822265625, 16.0703125, 17.21240234375, 18.3544921875, 19.49658203125, 20.638671875, 21.78076171875, 22.9228515625, 24.06494140625, 25.20703125, 26.34912109375, 27.4912109375, 28.63330078125, 29.775390625, 30.91748046875, 32.0595703125, 33.20166015625, 34.34375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 15.0, 23.0, 35.0, 37.0, 68.0, 72.0, 104.0, 113.0, 106.0, 114.0, 95.0, 69.0, 43.0, 51.0, 29.0, 14.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.5546875, -11.9388427734375, -11.322998046875, -10.7071533203125, -10.09130859375, -9.4754638671875, -8.859619140625, -8.2437744140625, -7.6279296875, -7.0120849609375, -6.396240234375, -5.7803955078125, -5.16455078125, -4.5487060546875, -3.932861328125, -3.3170166015625, -2.701171875, -2.0853271484375, -1.469482421875, -0.8536376953125, -0.23779296875, 0.3780517578125, 0.993896484375, 1.6097412109375, 2.2255859375, 2.8414306640625, 3.457275390625, 4.0731201171875, 4.68896484375, 5.3048095703125, 5.920654296875, 6.5364990234375, 7.15234375, 7.7681884765625, 8.384033203125, 8.9998779296875, 9.61572265625, 10.2315673828125, 10.847412109375, 11.4632568359375, 12.0791015625, 12.6949462890625, 13.310791015625, 13.9266357421875, 14.54248046875, 15.1583251953125, 15.774169921875, 16.3900146484375, 17.005859375, 17.6217041015625, 18.237548828125, 18.8533935546875, 19.46923828125, 20.0850830078125, 20.700927734375, 21.3167724609375, 21.9326171875, 22.5484619140625, 23.164306640625, 23.7801513671875, 24.39599609375, 25.0118408203125, 25.627685546875, 26.2435302734375, 26.859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 15.0, 4.0, 6.0, 15.0, 21.0, 27.0, 32.0, 24.0, 32.0, 46.0, 79.0, 132.0, 162.0, 325.0, 504.0, 885.0, 1914.0, 4653.0, 19236.0, 256342.0, 724006.0, 29251.0, 5977.0, 2158.0, 1079.0, 579.0, 360.0, 231.0, 143.0, 77.0, 75.0, 44.0, 23.0, 24.0, 15.0, 9.0, 6.0, 9.0, 6.0, 8.0, 1.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-26.9375, -26.071533203125, -25.20556640625, -24.339599609375, -23.4736328125, -22.607666015625, -21.74169921875, -20.875732421875, -20.009765625, -19.143798828125, -18.27783203125, -17.411865234375, -16.5458984375, -15.679931640625, -14.81396484375, -13.947998046875, -13.08203125, -12.216064453125, -11.35009765625, -10.484130859375, -9.6181640625, -8.752197265625, -7.88623046875, -7.020263671875, -6.154296875, -5.288330078125, -4.42236328125, -3.556396484375, -2.6904296875, -1.824462890625, -0.95849609375, -0.092529296875, 0.7734375, 1.639404296875, 2.50537109375, 3.371337890625, 4.2373046875, 5.103271484375, 5.96923828125, 6.835205078125, 7.701171875, 8.567138671875, 9.43310546875, 10.299072265625, 11.1650390625, 12.031005859375, 12.89697265625, 13.762939453125, 14.62890625, 15.494873046875, 16.36083984375, 17.226806640625, 18.0927734375, 18.958740234375, 19.82470703125, 20.690673828125, 21.556640625, 22.422607421875, 23.28857421875, 24.154541015625, 25.0205078125, 25.886474609375, 26.75244140625, 27.618408203125, 28.484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 19.0, 11.0, 31.0, 29.0, 52.0, 73.0, 95.0, 94.0, 128.0, 94.0, 87.0, 77.0, 70.0, 44.0, 22.0, 19.0, 19.0, 7.0, 9.0, 8.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.375, -63.3125, -61.25, -59.1875, -57.125, -55.0625, -53.0, -50.9375, -48.875, -46.8125, -44.75, -42.6875, -40.625, -38.5625, -36.5, -34.4375, -32.375, -30.3125, -28.25, -26.1875, -24.125, -22.0625, -20.0, -17.9375, -15.875, -13.8125, -11.75, -9.6875, -7.625, -5.5625, -3.5, -1.4375, 0.625, 2.6875, 4.75, 6.8125, 8.875, 10.9375, 13.0, 15.0625, 17.125, 19.1875, 21.25, 23.3125, 25.375, 27.4375, 29.5, 31.5625, 33.625, 35.6875, 37.75, 39.8125, 41.875, 43.9375, 46.0, 48.0625, 50.125, 52.1875, 54.25, 56.3125, 58.375, 60.4375, 62.5, 64.5625, 66.625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 4.0, 15.0, 16.0, 13.0, 28.0, 44.0, 59.0, 65.0, 123.0, 199.0, 411.0, 945.0, 2899.0, 10773.0, 909701.0, 113041.0, 6558.0, 2097.0, 754.0, 301.0, 178.0, 112.0, 65.0, 35.0, 34.0, 20.0, 11.0, 11.0, 8.0, 8.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6875, -12.276123046875, -11.86474609375, -11.453369140625, -11.0419921875, -10.630615234375, -10.21923828125, -9.807861328125, -9.396484375, -8.985107421875, -8.57373046875, -8.162353515625, -7.7509765625, -7.339599609375, -6.92822265625, -6.516845703125, -6.10546875, -5.694091796875, -5.28271484375, -4.871337890625, -4.4599609375, -4.048583984375, -3.63720703125, -3.225830078125, -2.814453125, -2.403076171875, -1.99169921875, -1.580322265625, -1.1689453125, -0.757568359375, -0.34619140625, 0.065185546875, 0.4765625, 0.887939453125, 1.29931640625, 1.710693359375, 2.1220703125, 2.533447265625, 2.94482421875, 3.356201171875, 3.767578125, 4.178955078125, 4.59033203125, 5.001708984375, 5.4130859375, 5.824462890625, 6.23583984375, 6.647216796875, 7.05859375, 7.469970703125, 7.88134765625, 8.292724609375, 8.7041015625, 9.115478515625, 9.52685546875, 9.938232421875, 10.349609375, 10.760986328125, 11.17236328125, 11.583740234375, 11.9951171875, 12.406494140625, 12.81787109375, 13.229248046875, 13.640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 6.0, 14.0, 19.0, 33.0, 78.0, 206.0, 323.0, 140.0, 62.0, 32.0, 15.0, 12.0, 14.0, 3.0, 7.0, 4.0, 3.0, 0.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026149749755859375, -0.0025449544191360474, -0.0024749338626861572, -0.002404913306236267, -0.002334892749786377, -0.002264872193336487, -0.0021948516368865967, -0.0021248310804367065, -0.0020548105239868164, -0.0019847899675369263, -0.0019147694110870361, -0.001844748854637146, -0.0017747282981872559, -0.0017047077417373657, -0.0016346871852874756, -0.0015646666288375854, -0.0014946460723876953, -0.0014246255159378052, -0.001354604959487915, -0.001284584403038025, -0.0012145638465881348, -0.0011445432901382446, -0.0010745227336883545, -0.0010045021772384644, -0.0009344816207885742, -0.0008644610643386841, -0.0007944405078887939, -0.0007244199514389038, -0.0006543993949890137, -0.0005843788385391235, -0.0005143582820892334, -0.00044433772563934326, -0.0003743171691894531, -0.000304296612739563, -0.00023427605628967285, -0.00016425549983978271, -9.423494338989258e-05, -2.421438694000244e-05, 4.5806169509887695e-05, 0.00011582672595977783, 0.00018584728240966797, 0.0002558678388595581, 0.00032588839530944824, 0.0003959089517593384, 0.0004659295082092285, 0.0005359500646591187, 0.0006059706211090088, 0.0006759911775588989, 0.0007460117340087891, 0.0008160322904586792, 0.0008860528469085693, 0.0009560734033584595, 0.0010260939598083496, 0.0010961145162582397, 0.0011661350727081299, 0.00123615562915802, 0.0013061761856079102, 0.0013761967420578003, 0.0014462172985076904, 0.0015162378549575806, 0.0015862584114074707, 0.0016562789678573608, 0.001726299524307251, 0.0017963200807571411, 0.0018663406372070312]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 0.0, 9.0, 3.0, 9.0, 10.0, 11.0, 14.0, 16.0, 23.0, 39.0, 45.0, 63.0, 107.0, 158.0, 252.0, 439.0, 896.0, 1983.0, 5036.0, 18330.0, 798459.0, 203342.0, 12015.0, 3786.0, 1644.0, 736.0, 378.0, 234.0, 141.0, 84.0, 57.0, 47.0, 41.0, 36.0, 27.0, 24.0, 13.0, 12.0, 10.0, 3.0, 3.0, 2.0, 3.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.359375, -8.1051025390625, -7.850830078125, -7.5965576171875, -7.34228515625, -7.0880126953125, -6.833740234375, -6.5794677734375, -6.3251953125, -6.0709228515625, -5.816650390625, -5.5623779296875, -5.30810546875, -5.0538330078125, -4.799560546875, -4.5452880859375, -4.291015625, -4.0367431640625, -3.782470703125, -3.5281982421875, -3.27392578125, -3.0196533203125, -2.765380859375, -2.5111083984375, -2.2568359375, -2.0025634765625, -1.748291015625, -1.4940185546875, -1.23974609375, -0.9854736328125, -0.731201171875, -0.4769287109375, -0.22265625, 0.0316162109375, 0.285888671875, 0.5401611328125, 0.79443359375, 1.0487060546875, 1.302978515625, 1.5572509765625, 1.8115234375, 2.0657958984375, 2.320068359375, 2.5743408203125, 2.82861328125, 3.0828857421875, 3.337158203125, 3.5914306640625, 3.845703125, 4.0999755859375, 4.354248046875, 4.6085205078125, 4.86279296875, 5.1170654296875, 5.371337890625, 5.6256103515625, 5.8798828125, 6.1341552734375, 6.388427734375, 6.6427001953125, 6.89697265625, 7.1512451171875, 7.405517578125, 7.6597900390625, 7.9140625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 9.0, 7.0, 10.0, 14.0, 19.0, 41.0, 54.0, 86.0, 160.0, 169.0, 131.0, 93.0, 59.0, 36.0, 33.0, 18.0, 14.0, 14.0, 10.0, 7.0, 5.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.109375, -4.892822265625, -4.67626953125, -4.459716796875, -4.2431640625, -4.026611328125, -3.81005859375, -3.593505859375, -3.376953125, -3.160400390625, -2.94384765625, -2.727294921875, -2.5107421875, -2.294189453125, -2.07763671875, -1.861083984375, -1.64453125, -1.427978515625, -1.21142578125, -0.994873046875, -0.7783203125, -0.561767578125, -0.34521484375, -0.128662109375, 0.087890625, 0.304443359375, 0.52099609375, 0.737548828125, 0.9541015625, 1.170654296875, 1.38720703125, 1.603759765625, 1.8203125, 2.036865234375, 2.25341796875, 2.469970703125, 2.6865234375, 2.903076171875, 3.11962890625, 3.336181640625, 3.552734375, 3.769287109375, 3.98583984375, 4.202392578125, 4.4189453125, 4.635498046875, 4.85205078125, 5.068603515625, 5.28515625, 5.501708984375, 5.71826171875, 5.934814453125, 6.1513671875, 6.367919921875, 6.58447265625, 6.801025390625, 7.017578125, 7.234130859375, 7.45068359375, 7.667236328125, 7.8837890625, 8.100341796875, 8.31689453125, 8.533447265625, 8.75]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 23.0, 136.0, 760.0, 62.0, 10.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-793.3284912109375, -770.2240600585938, -747.11962890625, -724.0151977539062, -700.9107666015625, -677.8062744140625, -654.7018432617188, -631.597412109375, -608.4929809570312, -585.3885498046875, -562.2841186523438, -539.1796875, -516.0751953125, -492.9707946777344, -469.8663330078125, -446.76190185546875, -423.657470703125, -400.55303955078125, -377.4486083984375, -354.3441467285156, -331.2397155761719, -308.1352844238281, -285.03082275390625, -261.9263916015625, -238.82196044921875, -215.717529296875, -192.6130828857422, -169.50863647460938, -146.40420532226562, -123.29976654052734, -100.19532775878906, -77.09088134765625, -53.98651123046875, -30.88207244873047, -7.7776336669921875, 15.326805114746094, 38.431243896484375, 61.535682678222656, 84.64012145996094, 107.74456787109375, 130.8489990234375, 153.95343017578125, 177.05787658691406, 200.16232299804688, 223.26675415039062, 246.37118530273438, 269.47564697265625, 292.580078125, 315.68450927734375, 338.7889404296875, 361.89337158203125, 384.9978332519531, 408.1022644042969, 431.2066955566406, 454.3111572265625, 477.41558837890625, 500.52001953125, 523.6244506835938, 546.7288818359375, 569.8333129882812, 592.937744140625, 616.042236328125, 639.1466674804688, 662.2510986328125, 685.3555297851562]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 10.0, 20.0, 13.0, 31.0, 20.0, 44.0, 50.0, 43.0, 64.0, 112.0, 162.0, 103.0, 61.0, 49.0, 29.0, 32.0, 30.0, 37.0, 18.0, 25.0, 13.0, 8.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0], "bins": [-259.38421630859375, -253.55169677734375, -247.71917724609375, -241.88665771484375, -236.05413818359375, -230.2216339111328, -224.3891143798828, -218.5565948486328, -212.7240753173828, -206.8915557861328, -201.0590362548828, -195.2265167236328, -189.39401245117188, -183.56149291992188, -177.72897338867188, -171.89645385742188, -166.06393432617188, -160.23141479492188, -154.39889526367188, -148.56637573242188, -142.73385620117188, -136.90135192871094, -131.06883239746094, -125.23631286621094, -119.40379333496094, -113.57127380371094, -107.73875427246094, -101.90624237060547, -96.07372283935547, -90.24120330810547, -84.40869140625, -78.576171875, -72.74366760253906, -66.91114807128906, -61.07863235473633, -55.246116638183594, -49.413597106933594, -43.581077575683594, -37.74856185913086, -31.916046142578125, -26.083526611328125, -20.251008987426758, -14.41849136352539, -8.585973739624023, -2.7534561157226562, 3.079061508178711, 8.911579132080078, 14.744094848632812, 20.576614379882812, 26.40913200378418, 32.24164962768555, 38.07416534423828, 43.90668487548828, 49.73920440673828, 55.571720123291016, 61.40423583984375, 67.23675537109375, 73.06927490234375, 78.90179443359375, 84.73430633544922, 90.56682586669922, 96.39934539794922, 102.23185729980469, 108.06437683105469, 113.89689636230469]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 6.0, 10.0, 18.0, 17.0, 34.0, 75.0, 140.0, 380.0, 1221.0, 4177.0, 23946.0, 2748309.0, 1398306.0, 14035.0, 2351.0, 708.0, 252.0, 114.0, 64.0, 33.0, 28.0, 13.0, 10.0, 11.0, 9.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.8125, -26.41650390625, -25.0205078125, -23.62451171875, -22.228515625, -20.83251953125, -19.4365234375, -18.04052734375, -16.64453125, -15.24853515625, -13.8525390625, -12.45654296875, -11.060546875, -9.66455078125, -8.2685546875, -6.87255859375, -5.4765625, -4.08056640625, -2.6845703125, -1.28857421875, 0.107421875, 1.50341796875, 2.8994140625, 4.29541015625, 5.69140625, 7.08740234375, 8.4833984375, 9.87939453125, 11.275390625, 12.67138671875, 14.0673828125, 15.46337890625, 16.859375, 18.25537109375, 19.6513671875, 21.04736328125, 22.443359375, 23.83935546875, 25.2353515625, 26.63134765625, 28.02734375, 29.42333984375, 30.8193359375, 32.21533203125, 33.611328125, 35.00732421875, 36.4033203125, 37.79931640625, 39.1953125, 40.59130859375, 41.9873046875, 43.38330078125, 44.779296875, 46.17529296875, 47.5712890625, 48.96728515625, 50.36328125, 51.75927734375, 53.1552734375, 54.55126953125, 55.947265625, 57.34326171875, 58.7392578125, 60.13525390625, 61.53125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 9.0, 15.0, 26.0, 33.0, 69.0, 65.0, 109.0, 101.0, 113.0, 115.0, 107.0, 77.0, 58.0, 41.0, 35.0, 19.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.890625, -11.287109375, -10.68359375, -10.080078125, -9.4765625, -8.873046875, -8.26953125, -7.666015625, -7.0625, -6.458984375, -5.85546875, -5.251953125, -4.6484375, -4.044921875, -3.44140625, -2.837890625, -2.234375, -1.630859375, -1.02734375, -0.423828125, 0.1796875, 0.783203125, 1.38671875, 1.990234375, 2.59375, 3.197265625, 3.80078125, 4.404296875, 5.0078125, 5.611328125, 6.21484375, 6.818359375, 7.421875, 8.025390625, 8.62890625, 9.232421875, 9.8359375, 10.439453125, 11.04296875, 11.646484375, 12.25, 12.853515625, 13.45703125, 14.060546875, 14.6640625, 15.267578125, 15.87109375, 16.474609375, 17.078125, 17.681640625, 18.28515625, 18.888671875, 19.4921875, 20.095703125, 20.69921875, 21.302734375, 21.90625, 22.509765625, 23.11328125, 23.716796875, 24.3203125, 24.923828125, 25.52734375, 26.130859375, 26.734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 2.0, 5.0, 6.0, 7.0, 9.0, 17.0, 32.0, 69.0, 112.0, 271.0, 892.0, 3909.0, 112026.0, 4065676.0, 8894.0, 1551.0, 430.0, 166.0, 75.0, 49.0, 31.0, 19.0, 14.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.4375, -70.833984375, -68.23046875, -65.626953125, -63.0234375, -60.419921875, -57.81640625, -55.212890625, -52.609375, -50.005859375, -47.40234375, -44.798828125, -42.1953125, -39.591796875, -36.98828125, -34.384765625, -31.78125, -29.177734375, -26.57421875, -23.970703125, -21.3671875, -18.763671875, -16.16015625, -13.556640625, -10.953125, -8.349609375, -5.74609375, -3.142578125, -0.5390625, 2.064453125, 4.66796875, 7.271484375, 9.875, 12.478515625, 15.08203125, 17.685546875, 20.2890625, 22.892578125, 25.49609375, 28.099609375, 30.703125, 33.306640625, 35.91015625, 38.513671875, 41.1171875, 43.720703125, 46.32421875, 48.927734375, 51.53125, 54.134765625, 56.73828125, 59.341796875, 61.9453125, 64.548828125, 67.15234375, 69.755859375, 72.359375, 74.962890625, 77.56640625, 80.169921875, 82.7734375, 85.376953125, 87.98046875, 90.583984375, 93.1875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 8.0, 8.0, 15.0, 20.0, 47.0, 70.0, 160.0, 351.0, 780.0, 1296.0, 757.0, 291.0, 142.0, 61.0, 20.0, 22.0, 9.0, 8.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-63.5625, -62.068359375, -60.57421875, -59.080078125, -57.5859375, -56.091796875, -54.59765625, -53.103515625, -51.609375, -50.115234375, -48.62109375, -47.126953125, -45.6328125, -44.138671875, -42.64453125, -41.150390625, -39.65625, -38.162109375, -36.66796875, -35.173828125, -33.6796875, -32.185546875, -30.69140625, -29.197265625, -27.703125, -26.208984375, -24.71484375, -23.220703125, -21.7265625, -20.232421875, -18.73828125, -17.244140625, -15.75, -14.255859375, -12.76171875, -11.267578125, -9.7734375, -8.279296875, -6.78515625, -5.291015625, -3.796875, -2.302734375, -0.80859375, 0.685546875, 2.1796875, 3.673828125, 5.16796875, 6.662109375, 8.15625, 9.650390625, 11.14453125, 12.638671875, 14.1328125, 15.626953125, 17.12109375, 18.615234375, 20.109375, 21.603515625, 23.09765625, 24.591796875, 26.0859375, 27.580078125, 29.07421875, 30.568359375, 32.0625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 11.0, 21.0, 29.0, 73.0, 168.0, 309.0, 201.0, 80.0, 44.0, 15.0, 10.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-437.33099365234375, -425.4548034667969, -413.5786437988281, -401.70245361328125, -389.8262939453125, -377.9501037597656, -366.07391357421875, -354.19775390625, -342.3215637207031, -330.44537353515625, -318.5692138671875, -306.6930236816406, -294.8168640136719, -282.940673828125, -271.06451416015625, -259.1883239746094, -247.31214904785156, -235.43597412109375, -223.55979919433594, -211.68362426757812, -199.80743408203125, -187.93125915527344, -176.05508422851562, -164.17889404296875, -152.302734375, -140.4265594482422, -128.55038452148438, -116.67420196533203, -104.79801940917969, -92.92184448242188, -81.04566955566406, -69.16948699951172, -57.293304443359375, -45.4171257019043, -33.54094696044922, -21.664772033691406, -9.788593292236328, 2.08758544921875, 13.963760375976562, 25.839942932128906, 37.71611785888672, 49.5922966003418, 61.468475341796875, 73.34465026855469, 85.2208251953125, 97.09700775146484, 108.97318267822266, 120.849365234375, 132.7255401611328, 144.60171508789062, 156.47789001464844, 168.35406494140625, 180.23025512695312, 192.10643005371094, 203.98260498046875, 215.85879516601562, 227.73495483398438, 239.6111297607422, 251.4873046875, 263.3634948730469, 275.2396545410156, 287.1158447265625, 298.99200439453125, 310.8681945800781, 322.744384765625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 1.0, 6.0, 10.0, 23.0, 38.0, 34.0, 56.0, 63.0, 80.0, 94.0, 104.0, 114.0, 73.0, 72.0, 69.0, 42.0, 25.0, 34.0, 20.0, 21.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-253.4017333984375, -245.37399291992188, -237.34625244140625, -229.3185272216797, -221.29078674316406, -213.26304626464844, -205.23532104492188, -197.20758056640625, -189.17984008789062, -181.152099609375, -173.12435913085938, -165.0966339111328, -157.0688934326172, -149.04115295410156, -141.013427734375, -132.98568725585938, -124.95794677734375, -116.93020629882812, -108.90247344970703, -100.87474060058594, -92.84700012207031, -84.81925964355469, -76.7915267944336, -68.7637939453125, -60.736053466796875, -52.708316802978516, -44.680580139160156, -36.6528434753418, -28.625106811523438, -20.597370147705078, -12.569633483886719, -4.541896820068359, 3.48583984375, 11.51357650756836, 19.54131317138672, 27.569049835205078, 35.59678649902344, 43.6245231628418, 51.652259826660156, 59.679996490478516, 67.70773315429688, 75.7354736328125, 83.7632064819336, 91.79093933105469, 99.81867980957031, 107.84642028808594, 115.87415313720703, 123.90188598632812, 131.92962646484375, 139.95736694335938, 147.985107421875, 156.01283264160156, 164.0405731201172, 172.0683135986328, 180.09603881835938, 188.123779296875, 196.15151977539062, 204.17926025390625, 212.20700073242188, 220.23472595214844, 228.26246643066406, 236.2902069091797, 244.31793212890625, 252.34567260742188, 260.3734130859375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 17.0, 15.0, 28.0, 28.0, 45.0, 69.0, 111.0, 192.0, 353.0, 762.0, 1713.0, 5656.0, 27772.0, 407978.0, 560774.0, 33072.0, 6440.0, 1958.0, 732.0, 341.0, 174.0, 127.0, 63.0, 31.0, 21.0, 13.0, 22.0, 13.0, 3.0, 8.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.46875, -25.691162109375, -24.91357421875, -24.135986328125, -23.3583984375, -22.580810546875, -21.80322265625, -21.025634765625, -20.248046875, -19.470458984375, -18.69287109375, -17.915283203125, -17.1376953125, -16.360107421875, -15.58251953125, -14.804931640625, -14.02734375, -13.249755859375, -12.47216796875, -11.694580078125, -10.9169921875, -10.139404296875, -9.36181640625, -8.584228515625, -7.806640625, -7.029052734375, -6.25146484375, -5.473876953125, -4.6962890625, -3.918701171875, -3.14111328125, -2.363525390625, -1.5859375, -0.808349609375, -0.03076171875, 0.746826171875, 1.5244140625, 2.302001953125, 3.07958984375, 3.857177734375, 4.634765625, 5.412353515625, 6.18994140625, 6.967529296875, 7.7451171875, 8.522705078125, 9.30029296875, 10.077880859375, 10.85546875, 11.633056640625, 12.41064453125, 13.188232421875, 13.9658203125, 14.743408203125, 15.52099609375, 16.298583984375, 17.076171875, 17.853759765625, 18.63134765625, 19.408935546875, 20.1865234375, 20.964111328125, 21.74169921875, 22.519287109375, 23.296875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 10.0, 10.0, 22.0, 22.0, 31.0, 50.0, 79.0, 74.0, 108.0, 82.0, 92.0, 120.0, 71.0, 68.0, 51.0, 40.0, 29.0, 17.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.859375, -11.2724609375, -10.685546875, -10.0986328125, -9.51171875, -8.9248046875, -8.337890625, -7.7509765625, -7.1640625, -6.5771484375, -5.990234375, -5.4033203125, -4.81640625, -4.2294921875, -3.642578125, -3.0556640625, -2.46875, -1.8818359375, -1.294921875, -0.7080078125, -0.12109375, 0.4658203125, 1.052734375, 1.6396484375, 2.2265625, 2.8134765625, 3.400390625, 3.9873046875, 4.57421875, 5.1611328125, 5.748046875, 6.3349609375, 6.921875, 7.5087890625, 8.095703125, 8.6826171875, 9.26953125, 9.8564453125, 10.443359375, 11.0302734375, 11.6171875, 12.2041015625, 12.791015625, 13.3779296875, 13.96484375, 14.5517578125, 15.138671875, 15.7255859375, 16.3125, 16.8994140625, 17.486328125, 18.0732421875, 18.66015625, 19.2470703125, 19.833984375, 20.4208984375, 21.0078125, 21.5947265625, 22.181640625, 22.7685546875, 23.35546875, 23.9423828125, 24.529296875, 25.1162109375, 25.703125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 14.0, 11.0, 13.0, 16.0, 23.0, 42.0, 48.0, 66.0, 113.0, 148.0, 248.0, 352.0, 673.0, 1499.0, 5408.0, 41395.0, 912727.0, 74064.0, 7833.0, 1972.0, 712.0, 348.0, 264.0, 145.0, 109.0, 71.0, 54.0, 54.0, 29.0, 20.0, 24.0, 14.0, 10.0, 6.0, 7.0, 2.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.71875, -22.042724609375, -21.36669921875, -20.690673828125, -20.0146484375, -19.338623046875, -18.66259765625, -17.986572265625, -17.310546875, -16.634521484375, -15.95849609375, -15.282470703125, -14.6064453125, -13.930419921875, -13.25439453125, -12.578369140625, -11.90234375, -11.226318359375, -10.55029296875, -9.874267578125, -9.1982421875, -8.522216796875, -7.84619140625, -7.170166015625, -6.494140625, -5.818115234375, -5.14208984375, -4.466064453125, -3.7900390625, -3.114013671875, -2.43798828125, -1.761962890625, -1.0859375, -0.409912109375, 0.26611328125, 0.942138671875, 1.6181640625, 2.294189453125, 2.97021484375, 3.646240234375, 4.322265625, 4.998291015625, 5.67431640625, 6.350341796875, 7.0263671875, 7.702392578125, 8.37841796875, 9.054443359375, 9.73046875, 10.406494140625, 11.08251953125, 11.758544921875, 12.4345703125, 13.110595703125, 13.78662109375, 14.462646484375, 15.138671875, 15.814697265625, 16.49072265625, 17.166748046875, 17.8427734375, 18.518798828125, 19.19482421875, 19.870849609375, 20.546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 8.0, 2.0, 14.0, 8.0, 18.0, 14.0, 16.0, 18.0, 22.0, 29.0, 31.0, 44.0, 43.0, 53.0, 66.0, 63.0, 94.0, 67.0, 59.0, 64.0, 42.0, 33.0, 43.0, 29.0, 17.0, 18.0, 21.0, 15.0, 6.0, 9.0, 7.0, 8.0, 10.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-43.28125, -41.95458984375, -40.6279296875, -39.30126953125, -37.974609375, -36.64794921875, -35.3212890625, -33.99462890625, -32.66796875, -31.34130859375, -30.0146484375, -28.68798828125, -27.361328125, -26.03466796875, -24.7080078125, -23.38134765625, -22.0546875, -20.72802734375, -19.4013671875, -18.07470703125, -16.748046875, -15.42138671875, -14.0947265625, -12.76806640625, -11.44140625, -10.11474609375, -8.7880859375, -7.46142578125, -6.134765625, -4.80810546875, -3.4814453125, -2.15478515625, -0.828125, 0.49853515625, 1.8251953125, 3.15185546875, 4.478515625, 5.80517578125, 7.1318359375, 8.45849609375, 9.78515625, 11.11181640625, 12.4384765625, 13.76513671875, 15.091796875, 16.41845703125, 17.7451171875, 19.07177734375, 20.3984375, 21.72509765625, 23.0517578125, 24.37841796875, 25.705078125, 27.03173828125, 28.3583984375, 29.68505859375, 31.01171875, 32.33837890625, 33.6650390625, 34.99169921875, 36.318359375, 37.64501953125, 38.9716796875, 40.29833984375, 41.625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 10.0, 15.0, 13.0, 9.0, 16.0, 37.0, 55.0, 86.0, 162.0, 337.0, 1040.0, 3808.0, 29048.0, 953670.0, 52785.0, 5240.0, 1286.0, 455.0, 203.0, 105.0, 47.0, 45.0, 20.0, 20.0, 11.0, 12.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.0535888671875, -3.911865234375, -3.7701416015625, -3.62841796875, -3.4866943359375, -3.344970703125, -3.2032470703125, -3.0615234375, -2.9197998046875, -2.778076171875, -2.6363525390625, -2.49462890625, -2.3529052734375, -2.211181640625, -2.0694580078125, -1.927734375, -1.7860107421875, -1.644287109375, -1.5025634765625, -1.36083984375, -1.2191162109375, -1.077392578125, -0.9356689453125, -0.7939453125, -0.6522216796875, -0.510498046875, -0.3687744140625, -0.22705078125, -0.0853271484375, 0.056396484375, 0.1981201171875, 0.33984375, 0.4815673828125, 0.623291015625, 0.7650146484375, 0.90673828125, 1.0484619140625, 1.190185546875, 1.3319091796875, 1.4736328125, 1.6153564453125, 1.757080078125, 1.8988037109375, 2.04052734375, 2.1822509765625, 2.323974609375, 2.4656982421875, 2.607421875, 2.7491455078125, 2.890869140625, 3.0325927734375, 3.17431640625, 3.3160400390625, 3.457763671875, 3.5994873046875, 3.7412109375, 3.8829345703125, 4.024658203125, 4.1663818359375, 4.30810546875, 4.4498291015625, 4.591552734375, 4.7332763671875, 4.875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 6.0, 6.0, 9.0, 4.0, 10.0, 9.0, 14.0, 17.0, 18.0, 17.0, 17.0, 30.0, 50.0, 76.0, 87.0, 94.0, 107.0, 92.0, 72.0, 54.0, 50.0, 32.0, 23.0, 22.0, 14.0, 13.0, 7.0, 5.0, 9.0, 7.0, 8.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.0005636215209960938, -0.0005484633147716522, -0.0005333051085472107, -0.0005181469023227692, -0.0005029886960983276, -0.0004878304898738861, -0.0004726722836494446, -0.00045751407742500305, -0.0004423558712005615, -0.00042719766497612, -0.00041203945875167847, -0.00039688125252723694, -0.0003817230463027954, -0.0003665648400783539, -0.00035140663385391235, -0.0003362484276294708, -0.0003210902214050293, -0.00030593201518058777, -0.00029077380895614624, -0.0002756156027317047, -0.0002604573965072632, -0.00024529919028282166, -0.00023014098405838013, -0.0002149827778339386, -0.00019982457160949707, -0.00018466636538505554, -0.00016950815916061401, -0.00015434995293617249, -0.00013919174671173096, -0.00012403354048728943, -0.0001088753342628479, -9.371712803840637e-05, -7.855892181396484e-05, -6.340071558952332e-05, -4.824250936508179e-05, -3.308430314064026e-05, -1.792609691619873e-05, -2.767890691757202e-06, 1.2390315532684326e-05, 2.7548521757125854e-05, 4.270672798156738e-05, 5.786493420600891e-05, 7.302314043045044e-05, 8.818134665489197e-05, 0.0001033395528793335, 0.00011849775910377502, 0.00013365596532821655, 0.00014881417155265808, 0.0001639723777770996, 0.00017913058400154114, 0.00019428879022598267, 0.0002094469964504242, 0.00022460520267486572, 0.00023976340889930725, 0.0002549216151237488, 0.0002700798213481903, 0.00028523802757263184, 0.00030039623379707336, 0.0003155544400215149, 0.0003307126462459564, 0.00034587085247039795, 0.0003610290586948395, 0.000376187264919281, 0.00039134547114372253, 0.00040650367736816406]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 12.0, 11.0, 36.0, 28.0, 66.0, 150.0, 286.0, 659.0, 1964.0, 8422.0, 69181.0, 915431.0, 43523.0, 6081.0, 1606.0, 534.0, 232.0, 132.0, 66.0, 51.0, 26.0, 20.0, 9.0, 12.0, 1.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -1.99700927734375, -1.8885498046875, -1.78009033203125, -1.671630859375, -1.56317138671875, -1.4547119140625, -1.34625244140625, -1.23779296875, -1.12933349609375, -1.0208740234375, -0.91241455078125, -0.803955078125, -0.69549560546875, -0.5870361328125, -0.47857666015625, -0.3701171875, -0.26165771484375, -0.1531982421875, -0.04473876953125, 0.063720703125, 0.17218017578125, 0.2806396484375, 0.38909912109375, 0.49755859375, 0.60601806640625, 0.7144775390625, 0.82293701171875, 0.931396484375, 1.03985595703125, 1.1483154296875, 1.25677490234375, 1.365234375, 1.47369384765625, 1.5821533203125, 1.69061279296875, 1.799072265625, 1.90753173828125, 2.0159912109375, 2.12445068359375, 2.23291015625, 2.34136962890625, 2.4498291015625, 2.55828857421875, 2.666748046875, 2.77520751953125, 2.8836669921875, 2.99212646484375, 3.1005859375, 3.20904541015625, 3.3175048828125, 3.42596435546875, 3.534423828125, 3.64288330078125, 3.7513427734375, 3.85980224609375, 3.96826171875, 4.07672119140625, 4.1851806640625, 4.29364013671875, 4.402099609375, 4.51055908203125, 4.6190185546875, 4.72747802734375, 4.8359375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 5.0, 4.0, 6.0, 2.0, 8.0, 6.0, 6.0, 15.0, 20.0, 16.0, 22.0, 20.0, 34.0, 52.0, 72.0, 87.0, 119.0, 104.0, 103.0, 68.0, 53.0, 19.0, 30.0, 28.0, 15.0, 13.0, 16.0, 11.0, 5.0, 9.0, 8.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.73046875, -3.62127685546875, -3.5120849609375, -3.40289306640625, -3.293701171875, -3.18450927734375, -3.0753173828125, -2.96612548828125, -2.85693359375, -2.74774169921875, -2.6385498046875, -2.52935791015625, -2.420166015625, -2.31097412109375, -2.2017822265625, -2.09259033203125, -1.9833984375, -1.87420654296875, -1.7650146484375, -1.65582275390625, -1.546630859375, -1.43743896484375, -1.3282470703125, -1.21905517578125, -1.10986328125, -1.00067138671875, -0.8914794921875, -0.78228759765625, -0.673095703125, -0.56390380859375, -0.4547119140625, -0.34552001953125, -0.236328125, -0.12713623046875, -0.0179443359375, 0.09124755859375, 0.200439453125, 0.30963134765625, 0.4188232421875, 0.52801513671875, 0.63720703125, 0.74639892578125, 0.8555908203125, 0.96478271484375, 1.073974609375, 1.18316650390625, 1.2923583984375, 1.40155029296875, 1.5107421875, 1.61993408203125, 1.7291259765625, 1.83831787109375, 1.947509765625, 2.05670166015625, 2.1658935546875, 2.27508544921875, 2.38427734375, 2.49346923828125, 2.6026611328125, 2.71185302734375, 2.821044921875, 2.93023681640625, 3.0394287109375, 3.14862060546875, 3.2578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 15.0, 37.0, 117.0, 602.0, 131.0, 54.0, 27.0, 10.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.75347900390625, -281.3962097167969, -273.0389404296875, -264.681640625, -256.3243713378906, -247.96710205078125, -239.60983276367188, -231.2525634765625, -222.89527893066406, -214.5380096435547, -206.18072509765625, -197.82345581054688, -189.4661865234375, -181.10890197753906, -172.7516326904297, -164.39434814453125, -156.03707885742188, -147.6798095703125, -139.32252502441406, -130.9652557373047, -122.60797882080078, -114.25070190429688, -105.8934326171875, -97.5361557006836, -89.17887878417969, -80.82160186767578, -72.46432495117188, -64.1070556640625, -55.749778747558594, -47.39250183105469, -39.03522872924805, -30.677955627441406, -22.3206787109375, -13.963403701782227, -5.606128692626953, 2.7511463165283203, 11.108421325683594, 19.4656982421875, 27.82297134399414, 36.18024444580078, 44.53752136230469, 52.894798278808594, 61.252071380615234, 69.60934448242188, 77.96662139892578, 86.32389831542969, 94.68116760253906, 103.03844451904297, 111.39572143554688, 119.75299835205078, 128.1102752685547, 136.46754455566406, 144.8248291015625, 153.18209838867188, 161.53936767578125, 169.89663696289062, 178.25392150878906, 186.61119079589844, 194.96847534179688, 203.32574462890625, 211.68301391601562, 220.04029846191406, 228.39756774902344, 236.75485229492188, 245.11212158203125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 14.0, 19.0, 29.0, 38.0, 55.0, 49.0, 66.0, 369.0, 151.0, 63.0, 50.0, 35.0, 16.0, 14.0, 17.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-133.61251831054688, -125.6063461303711, -117.60017395019531, -109.593994140625, -101.58782196044922, -93.58164978027344, -85.57546997070312, -77.56929779052734, -69.56312561035156, -61.55695343017578, -53.550777435302734, -45.54460144042969, -37.538429260253906, -29.532257080078125, -21.526081085205078, -13.519905090332031, -5.51373291015625, 2.492441177368164, 10.498615264892578, 18.504789352416992, 26.510963439941406, 34.51713562011719, 42.523311614990234, 50.52948760986328, 58.53565979003906, 66.54183197021484, 74.54800415039062, 82.55418395996094, 90.56035614013672, 98.5665283203125, 106.57270812988281, 114.5788803100586, 122.5850830078125, 130.5912628173828, 138.59742736816406, 146.60360717773438, 154.60977172851562, 162.61595153808594, 170.62213134765625, 178.6282958984375, 186.6344757080078, 194.64065551757812, 202.64682006835938, 210.6529998779297, 218.6591796875, 226.66534423828125, 234.67152404785156, 242.67770385742188, 250.68386840820312, 258.6900329589844, 266.69622802734375, 274.702392578125, 282.70855712890625, 290.7147216796875, 298.7209167480469, 306.7270812988281, 314.7332763671875, 322.73944091796875, 330.7456359863281, 338.7518005371094, 346.7579650878906, 354.76416015625, 362.77032470703125, 370.7764892578125, 378.78265380859375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 6.0, 4.0, 10.0, 15.0, 24.0, 19.0, 40.0, 50.0, 47.0, 77.0, 177.0, 312.0, 52.0, 54.0, 35.0, 36.0, 19.0, 9.0, 4.0, 8.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.177734375, -10.62109375, -10.064453125, -9.5078125, -8.951171875, -8.39453125, -7.837890625, -7.28125, -6.724609375, -6.16796875, -5.611328125, -5.0546875, -4.498046875, -3.94140625, -3.384765625, -2.828125, -2.271484375, -1.71484375, -1.158203125, -0.6015625, -0.044921875, 0.51171875, 1.068359375, 1.625, 2.181640625, 2.73828125, 3.294921875, 3.8515625, 4.408203125, 4.96484375, 5.521484375, 6.078125, 6.634765625, 7.19140625, 7.748046875, 8.3046875, 8.861328125, 9.41796875, 9.974609375, 10.53125, 11.087890625, 11.64453125, 12.201171875, 12.7578125, 13.314453125, 13.87109375, 14.427734375, 14.984375, 15.541015625, 16.09765625, 16.654296875, 17.2109375, 17.767578125, 18.32421875, 18.880859375, 19.4375, 19.994140625, 20.55078125, 21.107421875, 21.6640625, 22.220703125, 22.77734375, 23.333984375, 23.890625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 2.0, 5.0, 3.0, 7.0, 17.0, 15.0, 10.0, 15.0, 20.0, 45.0, 53.0, 145.0, 283.0, 1177.0, 25972.0, 8357535.0, 2387.0, 472.0, 169.0, 66.0, 54.0, 28.0, 12.0, 26.0, 13.0, 1.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-240.01898193359375, -232.9963836669922, -225.97378540039062, -218.951171875, -211.92857360839844, -204.90597534179688, -197.8833770751953, -190.86077880859375, -183.8381805419922, -176.81558227539062, -169.79298400878906, -162.7703857421875, -155.74777221679688, -148.7251739501953, -141.70257568359375, -134.6799774169922, -127.6573715209961, -120.63477325439453, -113.61216735839844, -106.58956909179688, -99.56697082519531, -92.54437255859375, -85.52176666259766, -78.4991683959961, -71.4765625, -64.45396423339844, -57.43136215209961, -50.40876007080078, -43.38616180419922, -36.36355972290039, -29.340957641601562, -22.318359375, -15.295761108398438, -8.273160934448242, -1.2505598068237305, 5.772041320800781, 12.794641494750977, 19.817241668701172, 26.83984375, 33.86244201660156, 40.88504409790039, 47.90764617919922, 54.93024444580078, 61.95284652709961, 68.97544860839844, 75.998046875, 83.02064514160156, 90.04324340820312, 97.06584930419922, 104.08844757080078, 111.11105346679688, 118.13365173339844, 125.15625, 132.17884826660156, 139.20144653320312, 146.22406005859375, 153.2466583251953, 160.26925659179688, 167.29185485839844, 174.314453125, 181.33706665039062, 188.3596649169922, 195.38226318359375, 202.4048614501953, 209.42745971679688]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 5.0, 12.0, 7.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-395.9598083496094, -386.100830078125, -376.2418518066406, -366.38287353515625, -356.52386474609375, -346.6648864746094, -336.805908203125, -326.9469299316406, -317.08795166015625, -307.2289733886719, -297.3699951171875, -287.5110168457031, -277.65203857421875, -267.79302978515625, -257.9340515136719, -248.0750732421875, -238.21609497070312, -228.35711669921875, -218.49813842773438, -208.63914489746094, -198.78016662597656, -188.9211883544922, -179.06219482421875, -169.20321655273438, -159.34423828125, -149.48526000976562, -139.62628173828125, -129.7672882080078, -119.90830993652344, -110.04933166503906, -100.19034576416016, -90.33135986328125, -80.472412109375, -70.61343383789062, -60.75444793701172, -50.89546585083008, -41.03648376464844, -31.177501678466797, -21.318519592285156, -11.45953369140625, -1.600555419921875, 8.258426666259766, 18.117408752441406, 27.976390838623047, 37.83537292480469, 47.69435501098633, 57.55333709716797, 67.41232299804688, 77.27130126953125, 87.13027954101562, 96.98926544189453, 106.84825134277344, 116.70722961425781, 126.56620788574219, 136.42520141601562, 146.2841796875, 156.14315795898438, 166.00213623046875, 175.86111450195312, 185.72010803222656, 195.57908630371094, 205.4380645751953, 215.29705810546875, 225.15603637695312, 235.0150146484375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 6.0, 2.0, 3.0, 4.0, 11.0, 12.0, 19.0, 25.0, 28.0, 41.0, 88.0, 125.0, 239.0, 454.0, 1087.0, 3568.0, 14954.0, 80272.0, 286764.0, 107935.0, 20454.0, 4985.0, 1615.0, 695.0, 311.0, 185.0, 130.0, 59.0, 56.0, 34.0, 23.0, 19.0, 18.0, 10.0, 11.0, 8.0, 12.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.375, -73.5009765625, -70.626953125, -67.7529296875, -64.87890625, -62.0048828125, -59.130859375, -56.2568359375, -53.3828125, -50.5087890625, -47.634765625, -44.7607421875, -41.88671875, -39.0126953125, -36.138671875, -33.2646484375, -30.390625, -27.5166015625, -24.642578125, -21.7685546875, -18.89453125, -16.0205078125, -13.146484375, -10.2724609375, -7.3984375, -4.5244140625, -1.650390625, 1.2236328125, 4.09765625, 6.9716796875, 9.845703125, 12.7197265625, 15.59375, 18.4677734375, 21.341796875, 24.2158203125, 27.08984375, 29.9638671875, 32.837890625, 35.7119140625, 38.5859375, 41.4599609375, 44.333984375, 47.2080078125, 50.08203125, 52.9560546875, 55.830078125, 58.7041015625, 61.578125, 64.4521484375, 67.326171875, 70.2001953125, 73.07421875, 75.9482421875, 78.822265625, 81.6962890625, 84.5703125, 87.4443359375, 90.318359375, 93.1923828125, 96.06640625, 98.9404296875, 101.814453125, 104.6884765625, 107.5625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 9.0, 17.0, 38.0, 36.0, 60.0, 86.0, 112.0, 125.0, 129.0, 103.0, 80.0, 57.0, 35.0, 32.0, 24.0, 16.0, 13.0, 13.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3046875, -10.5943603515625, -9.884033203125, -9.1737060546875, -8.46337890625, -7.7530517578125, -7.042724609375, -6.3323974609375, -5.6220703125, -4.9117431640625, -4.201416015625, -3.4910888671875, -2.78076171875, -2.0704345703125, -1.360107421875, -0.6497802734375, 0.060546875, 0.7708740234375, 1.481201171875, 2.1915283203125, 2.90185546875, 3.6121826171875, 4.322509765625, 5.0328369140625, 5.7431640625, 6.4534912109375, 7.163818359375, 7.8741455078125, 8.58447265625, 9.2947998046875, 10.005126953125, 10.7154541015625, 11.42578125, 12.1361083984375, 12.846435546875, 13.5567626953125, 14.26708984375, 14.9774169921875, 15.687744140625, 16.3980712890625, 17.1083984375, 17.8187255859375, 18.529052734375, 19.2393798828125, 19.94970703125, 20.6600341796875, 21.370361328125, 22.0806884765625, 22.791015625, 23.5013427734375, 24.211669921875, 24.9219970703125, 25.63232421875, 26.3426513671875, 27.052978515625, 27.7633056640625, 28.4736328125, 29.1839599609375, 29.894287109375, 30.6046142578125, 31.31494140625, 32.0252685546875, 32.735595703125, 33.4459228515625, 34.15625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 25.0, 30.0, 64.0, 78.0, 93.0, 77.0, 50.0, 23.0, 10.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.19784545898438, -118.62834930419922, -115.05884552001953, -111.48934936523438, -107.91985321044922, -104.35035705566406, -100.78085327148438, -97.21135711669922, -93.64186096191406, -90.0723648071289, -86.50286102294922, -82.93336486816406, -79.3638687133789, -75.79437255859375, -72.22486877441406, -68.6553726196289, -65.08587646484375, -61.51637649536133, -57.94688034057617, -54.37738037109375, -50.807884216308594, -47.23838424682617, -43.66888427734375, -40.099388122558594, -36.529884338378906, -32.960384368896484, -29.390888214111328, -25.821388244628906, -22.25189208984375, -18.682392120361328, -15.112894058227539, -11.54339599609375, -7.973899841308594, -4.404401779174805, -0.8349032402038574, 2.73459529876709, 6.304093360900879, 9.873592376708984, 13.443090438842773, 17.012588500976562, 20.58208656311035, 24.15158462524414, 27.72108268737793, 31.29058074951172, 34.86008071899414, 38.42958068847656, 41.99907684326172, 45.568572998046875, 49.1380729675293, 52.70757293701172, 56.277069091796875, 59.8465690612793, 63.41606521606445, 66.98556518554688, 70.55506134033203, 74.12455749511719, 77.69406127929688, 81.26355743408203, 84.83306121826172, 88.40255737304688, 91.97205352783203, 95.54154968261719, 99.11105346679688, 102.68054962158203, 106.25004577636719]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 13.0, 16.0, 28.0, 48.0, 74.0, 85.0, 67.0, 49.0, 21.0, 13.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.279029846191406, -60.375274658203125, -58.471519470214844, -56.56776428222656, -54.66400909423828, -52.76025390625, -50.85649871826172, -48.95274353027344, -47.048988342285156, -45.145233154296875, -43.241477966308594, -41.33772277832031, -39.43396759033203, -37.53021240234375, -35.62645721435547, -33.72270202636719, -31.818946838378906, -29.915191650390625, -28.011436462402344, -26.107681274414062, -24.20392608642578, -22.3001708984375, -20.39641571044922, -18.492660522460938, -16.588905334472656, -14.685150146484375, -12.781394958496094, -10.877639770507812, -8.973884582519531, -7.07012939453125, -5.166374206542969, -3.2626190185546875, -1.3588676452636719, 0.5448875427246094, 2.4486427307128906, 4.352397918701172, 6.256153106689453, 8.159908294677734, 10.063663482666016, 11.967418670654297, 13.871173858642578, 15.77492904663086, 17.67868423461914, 19.582439422607422, 21.486194610595703, 23.389949798583984, 25.293704986572266, 27.197460174560547, 29.101215362548828, 31.00497055053711, 32.90872573852539, 34.81248092651367, 36.71623611450195, 38.619991302490234, 40.523746490478516, 42.4275016784668, 44.33125686645508, 46.23501205444336, 48.13876724243164, 50.04252243041992, 51.9462776184082, 53.850032806396484, 55.753787994384766, 57.65754318237305, 59.56129837036133]}, "eval/loss": 5.7725830078125, "eval/wer": 0.7927852848383833, "eval/runtime": 1037.3103, "eval/samples_per_second": 2.547, "eval/steps_per_second": 0.319, "train/train_runtime": 29013.0161, "train/train_samples_per_second": 4.918, "train/train_steps_per_second": 0.154, "train/total_flos": 0.0, "train/train_loss": 6.2593836770463955, "_wandb": {"runtime": 30422}} \ No newline at end of file