diff --git "a/wandb/run-20220308_102248-3h7e1p8o/files/wandb-summary.json" "b/wandb/run-20220308_102248-3h7e1p8o/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220308_102248-3h7e1p8o/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 5.7093, "train/learning_rate": 2.5664739884393065e-05, "train/epoch": 6.73, "train/global_step": 1500, "_runtime": 28375, "_timestamp": 1646763343, "_step": 1500, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 13.0, 15.0, 9.0, 244.0, 40.0, 27136.0, 2951.0, 47.0, 25.0, 12.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.5625, -64.2626953125, -59.962890625, -55.6630859375, -51.36328125, -47.0634765625, -42.763671875, -38.4638671875, -34.1640625, -29.8642578125, -25.564453125, -21.2646484375, -16.96484375, -12.6650390625, -8.365234375, -4.0654296875, 0.234375, 4.5341796875, 8.833984375, 13.1337890625, 17.43359375, 21.7333984375, 26.033203125, 30.3330078125, 34.6328125, 38.9326171875, 43.232421875, 47.5322265625, 51.83203125, 56.1318359375, 60.431640625, 64.7314453125, 69.03125, 73.3310546875, 77.630859375, 81.9306640625, 86.23046875, 90.5302734375, 94.830078125, 99.1298828125, 103.4296875, 107.7294921875, 112.029296875, 116.3291015625, 120.62890625, 124.9287109375, 129.228515625, 133.5283203125, 137.828125, 142.1279296875, 146.427734375, 150.7275390625, 155.02734375, 159.3271484375, 163.626953125, 167.9267578125, 172.2265625, 176.5263671875, 180.826171875, 185.1259765625, 189.42578125, 193.7255859375, 198.025390625, 202.3251953125, 206.625]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 3.0, 6.0, 4.0, 9.0, 16.0, 17.0, 17.0, 18.0, 27.0, 20.0, 37.0, 31.0, 41.0, 49.0, 77.0, 59.0, 52.0, 58.0, 68.0, 55.0, 55.0, 62.0, 44.0, 42.0, 42.0, 23.0, 19.0, 12.0, 17.0, 3.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.291805267333984, -29.244800567626953, -28.197795867919922, -27.15079116821289, -26.10378646850586, -25.056781768798828, -24.009775161743164, -22.962770462036133, -21.9157657623291, -20.86876106262207, -19.82175636291504, -18.774751663208008, -17.727745056152344, -16.680740356445312, -15.633735656738281, -14.58673095703125, -13.539726257324219, -12.492721557617188, -11.445716857910156, -10.398711204528809, -9.351706504821777, -8.304701805114746, -7.257696628570557, -6.210691452026367, -5.163686752319336, -4.116682052612305, -3.0696768760681152, -2.022671937942505, -0.9756669998168945, 0.07133769989013672, 1.1183428764343262, 2.1653480529785156, 3.2123565673828125, 4.259361267089844, 5.306366443634033, 6.353371620178223, 7.400376319885254, 8.447381019592285, 9.494386672973633, 10.541391372680664, 11.588396072387695, 12.635400772094727, 13.682405471801758, 14.729411125183105, 15.776415824890137, 16.823421478271484, 17.870426177978516, 18.917430877685547, 19.964435577392578, 21.01144027709961, 22.05844497680664, 23.105449676513672, 24.152454376220703, 25.199459075927734, 26.2464656829834, 27.29347038269043, 28.34047508239746, 29.387479782104492, 30.434484481811523, 31.481489181518555, 32.52849578857422, 33.57550048828125, 34.62250518798828, 35.66950988769531, 36.716514587402344]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 5.0, 4.0, 5.0, 7.0, 14.0, 7.0, 18.0, 24.0, 18.0, 20.0, 32.0, 22.0, 29.0, 33.0, 44.0, 31.0, 32.0, 47.0, 36.0, 36.0, 44.0, 49.0, 37.0, 45.0, 22.0, 38.0, 31.0, 33.0, 32.0, 32.0, 26.0, 19.0, 14.0, 18.0, 10.0, 9.0, 10.0, 16.0, 9.0, 2.0, 6.0, 9.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-22.69486427307129, -21.952890396118164, -21.21091651916504, -20.468942642211914, -19.726970672607422, -18.984996795654297, -18.243022918701172, -17.501049041748047, -16.759075164794922, -16.017101287841797, -15.275127410888672, -14.533154487609863, -13.791180610656738, -13.049206733703613, -12.307233810424805, -11.56525993347168, -10.823286056518555, -10.08131217956543, -9.339338302612305, -8.597365379333496, -7.855391502380371, -7.113417625427246, -6.371444225311279, -5.6294708251953125, -4.8874969482421875, -4.1455230712890625, -3.4035496711730957, -2.66157603263855, -1.919602394104004, -1.177628755569458, -0.4356551170349121, 0.3063182830810547, 1.0482940673828125, 1.7902677059173584, 2.5322413444519043, 3.27421498298645, 4.016188621520996, 4.758162498474121, 5.500135898590088, 6.242109298706055, 6.98408317565918, 7.726057052612305, 8.46803092956543, 9.210003852844238, 9.951977729797363, 10.693951606750488, 11.435924530029297, 12.177898406982422, 12.919872283935547, 13.661846160888672, 14.403820037841797, 15.145792961120605, 15.88776683807373, 16.62973976135254, 17.371713638305664, 18.11368751525879, 18.855661392211914, 19.59763526916504, 20.339609146118164, 21.08158302307129, 21.82355499267578, 22.565528869628906, 23.30750274658203, 24.049476623535156, 24.79145050048828]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 5.0, 5.0, 13.0, 11.0, 12.0, 18.0, 30.0, 45.0, 95.0, 128.0, 214.0, 307.0, 472.0, 817.0, 1241.0, 1966.0, 2978.0, 4589.0, 7071.0, 10674.0, 16132.0, 23439.0, 34011.0, 48862.0, 69436.0, 97987.0, 137587.0, 164800.0, 129012.0, 91466.0, 64009.0, 45135.0, 31320.0, 21784.0, 14853.0, 9870.0, 6491.0, 4257.0, 2617.0, 1762.0, 1086.0, 688.0, 455.0, 300.0, 197.0, 127.0, 62.0, 42.0, 30.0, 22.0, 20.0, 10.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.4375, -62.3173828125, -60.197265625, -58.0771484375, -55.95703125, -53.8369140625, -51.716796875, -49.5966796875, -47.4765625, -45.3564453125, -43.236328125, -41.1162109375, -38.99609375, -36.8759765625, -34.755859375, -32.6357421875, -30.515625, -28.3955078125, -26.275390625, -24.1552734375, -22.03515625, -19.9150390625, -17.794921875, -15.6748046875, -13.5546875, -11.4345703125, -9.314453125, -7.1943359375, -5.07421875, -2.9541015625, -0.833984375, 1.2861328125, 3.40625, 5.5263671875, 7.646484375, 9.7666015625, 11.88671875, 14.0068359375, 16.126953125, 18.2470703125, 20.3671875, 22.4873046875, 24.607421875, 26.7275390625, 28.84765625, 30.9677734375, 33.087890625, 35.2080078125, 37.328125, 39.4482421875, 41.568359375, 43.6884765625, 45.80859375, 47.9287109375, 50.048828125, 52.1689453125, 54.2890625, 56.4091796875, 58.529296875, 60.6494140625, 62.76953125, 64.8896484375, 67.009765625, 69.1298828125, 71.25]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 0.0, 4.0, 4.0, 5.0, 4.0, 5.0, 8.0, 9.0, 13.0, 17.0, 18.0, 16.0, 33.0, 27.0, 37.0, 45.0, 52.0, 48.0, 67.0, 68.0, 80.0, 68.0, 47.0, 42.0, 37.0, 41.0, 28.0, 39.0, 21.0, 25.0, 7.0, 16.0, 14.0, 15.0, 8.0, 5.0, 4.0, 9.0, 2.0, 3.0, 2.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.0625, -34.95361328125, -33.8447265625, -32.73583984375, -31.626953125, -30.51806640625, -29.4091796875, -28.30029296875, -27.19140625, -26.08251953125, -24.9736328125, -23.86474609375, -22.755859375, -21.64697265625, -20.5380859375, -19.42919921875, -18.3203125, -17.21142578125, -16.1025390625, -14.99365234375, -13.884765625, -12.77587890625, -11.6669921875, -10.55810546875, -9.44921875, -8.34033203125, -7.2314453125, -6.12255859375, -5.013671875, -3.90478515625, -2.7958984375, -1.68701171875, -0.578125, 0.53076171875, 1.6396484375, 2.74853515625, 3.857421875, 4.96630859375, 6.0751953125, 7.18408203125, 8.29296875, 9.40185546875, 10.5107421875, 11.61962890625, 12.728515625, 13.83740234375, 14.9462890625, 16.05517578125, 17.1640625, 18.27294921875, 19.3818359375, 20.49072265625, 21.599609375, 22.70849609375, 23.8173828125, 24.92626953125, 26.03515625, 27.14404296875, 28.2529296875, 29.36181640625, 30.470703125, 31.57958984375, 32.6884765625, 33.79736328125, 34.90625]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 9.0, 5.0, 9.0, 12.0, 19.0, 17.0, 28.0, 20.0, 27.0, 31.0, 32.0, 60.0, 48.0, 54.0, 58.0, 55.0, 46.0, 53.0, 38.0, 52.0, 47.0, 35.0, 36.0, 30.0, 29.0, 26.0, 23.0, 21.0, 16.0, 17.0, 5.0, 6.0, 8.0, 3.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.149961471557617, -17.51326560974121, -16.876569747924805, -16.2398738861084, -15.603178024291992, -14.966482162475586, -14.32978630065918, -13.693090438842773, -13.056394577026367, -12.419698715209961, -11.783002853393555, -11.146306991577148, -10.509611129760742, -9.872915267944336, -9.23621940612793, -8.599523544311523, -7.962827682495117, -7.326131820678711, -6.689435958862305, -6.052740097045898, -5.416044235229492, -4.779348373413086, -4.14265251159668, -3.5059566497802734, -2.869260787963867, -2.232564926147461, -1.5958690643310547, -0.9591732025146484, -0.3224773406982422, 0.31421852111816406, 0.9509143829345703, 1.5876102447509766, 2.224306106567383, 2.861001968383789, 3.4976978302001953, 4.134393692016602, 4.771089553833008, 5.407785415649414, 6.04448127746582, 6.681177139282227, 7.317873001098633, 7.954568862915039, 8.591264724731445, 9.227960586547852, 9.864656448364258, 10.501352310180664, 11.13804817199707, 11.774744033813477, 12.411439895629883, 13.048135757446289, 13.684831619262695, 14.321527481079102, 14.958223342895508, 15.594919204711914, 16.23161506652832, 16.868310928344727, 17.505006790161133, 18.14170265197754, 18.778398513793945, 19.41509437561035, 20.051790237426758, 20.688486099243164, 21.32518196105957, 21.961877822875977, 22.598573684692383]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 7.0, 4.0, 6.0, 8.0, 7.0, 6.0, 15.0, 11.0, 14.0, 10.0, 20.0, 24.0, 26.0, 27.0, 30.0, 23.0, 43.0, 28.0, 40.0, 44.0, 42.0, 45.0, 37.0, 47.0, 40.0, 31.0, 40.0, 36.0, 28.0, 34.0, 36.0, 27.0, 31.0, 25.0, 17.0, 16.0, 14.0, 9.0, 8.0, 10.0, 2.0, 11.0, 3.0, 5.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.773460388183594, -16.20166015625, -15.629859924316406, -15.058059692382812, -14.486259460449219, -13.914459228515625, -13.342658042907715, -12.770857810974121, -12.199057579040527, -11.627257347106934, -11.05545711517334, -10.483656883239746, -9.911855697631836, -9.340055465698242, -8.768255233764648, -8.196455001831055, -7.624654769897461, -7.052854537963867, -6.481054306030273, -5.9092535972595215, -5.337453365325928, -4.765653133392334, -4.193852424621582, -3.6220521926879883, -3.0502519607543945, -2.478451728820801, -1.906651258468628, -1.3348509073257446, -0.7630505561828613, -0.19125032424926758, 0.3805501461029053, 0.9523506164550781, 1.5241508483886719, 2.0959510803222656, 2.6677515506744385, 3.2395520210266113, 3.811352252960205, 4.383152484893799, 4.954953193664551, 5.5267534255981445, 6.098553657531738, 6.670353889465332, 7.242154121398926, 7.813954830169678, 8.38575553894043, 8.957555770874023, 9.529356002807617, 10.101156234741211, 10.672956466674805, 11.244756698608398, 11.816556930541992, 12.388357162475586, 12.96015739440918, 13.531957626342773, 14.103758811950684, 14.675559043884277, 15.247359275817871, 15.819159507751465, 16.390960693359375, 16.96276092529297, 17.534561157226562, 18.106361389160156, 18.67816162109375, 19.249961853027344, 19.821762084960938]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 15.0, 18.0, 25.0, 44.0, 64.0, 93.0, 166.0, 259.0, 387.0, 673.0, 1025.0, 1689.0, 2615.0, 4149.0, 6668.0, 10444.0, 16358.0, 25725.0, 39449.0, 60532.0, 92171.0, 136125.0, 197779.0, 276681.0, 366166.0, 448933.0, 496552.0, 486740.0, 423620.0, 333668.0, 245964.0, 175212.0, 119320.0, 80335.0, 52387.0, 33632.0, 21645.0, 13825.0, 8544.0, 5479.0, 3455.0, 2147.0, 1345.0, 819.0, 528.0, 324.0, 193.0, 121.0, 76.0, 38.0, 20.0, 20.0, 11.0, 5.0, 3.0, 0.0, 3.0, 3.0], "bins": [-14.140625, -13.7095947265625, -13.278564453125, -12.8475341796875, -12.41650390625, -11.9854736328125, -11.554443359375, -11.1234130859375, -10.6923828125, -10.2613525390625, -9.830322265625, -9.3992919921875, -8.96826171875, -8.5372314453125, -8.106201171875, -7.6751708984375, -7.244140625, -6.8131103515625, -6.382080078125, -5.9510498046875, -5.52001953125, -5.0889892578125, -4.657958984375, -4.2269287109375, -3.7958984375, -3.3648681640625, -2.933837890625, -2.5028076171875, -2.07177734375, -1.6407470703125, -1.209716796875, -0.7786865234375, -0.34765625, 0.0833740234375, 0.514404296875, 0.9454345703125, 1.37646484375, 1.8074951171875, 2.238525390625, 2.6695556640625, 3.1005859375, 3.5316162109375, 3.962646484375, 4.3936767578125, 4.82470703125, 5.2557373046875, 5.686767578125, 6.1177978515625, 6.548828125, 6.9798583984375, 7.410888671875, 7.8419189453125, 8.27294921875, 8.7039794921875, 9.135009765625, 9.5660400390625, 9.9970703125, 10.4281005859375, 10.859130859375, 11.2901611328125, 11.72119140625, 12.1522216796875, 12.583251953125, 13.0142822265625, 13.4453125]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 5.0, 13.0, 7.0, 3.0, 9.0, 10.0, 8.0, 15.0, 16.0, 16.0, 17.0, 19.0, 22.0, 24.0, 23.0, 31.0, 46.0, 38.0, 38.0, 39.0, 42.0, 42.0, 45.0, 38.0, 44.0, 41.0, 36.0, 27.0, 36.0, 26.0, 39.0, 16.0, 29.0, 21.0, 13.0, 21.0, 12.0, 11.0, 9.0, 4.0, 12.0, 6.0, 12.0, 6.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9609375, -12.526123046875, -12.09130859375, -11.656494140625, -11.2216796875, -10.786865234375, -10.35205078125, -9.917236328125, -9.482421875, -9.047607421875, -8.61279296875, -8.177978515625, -7.7431640625, -7.308349609375, -6.87353515625, -6.438720703125, -6.00390625, -5.569091796875, -5.13427734375, -4.699462890625, -4.2646484375, -3.829833984375, -3.39501953125, -2.960205078125, -2.525390625, -2.090576171875, -1.65576171875, -1.220947265625, -0.7861328125, -0.351318359375, 0.08349609375, 0.518310546875, 0.953125, 1.387939453125, 1.82275390625, 2.257568359375, 2.6923828125, 3.127197265625, 3.56201171875, 3.996826171875, 4.431640625, 4.866455078125, 5.30126953125, 5.736083984375, 6.1708984375, 6.605712890625, 7.04052734375, 7.475341796875, 7.91015625, 8.344970703125, 8.77978515625, 9.214599609375, 9.6494140625, 10.084228515625, 10.51904296875, 10.953857421875, 11.388671875, 11.823486328125, 12.25830078125, 12.693115234375, 13.1279296875, 13.562744140625, 13.99755859375, 14.432373046875, 14.8671875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 14.0, 13.0, 18.0, 31.0, 56.0, 97.0, 139.0, 226.0, 378.0, 562.0, 972.0, 1509.0, 2462.0, 4103.0, 6685.0, 11068.0, 17368.0, 27170.0, 42260.0, 63734.0, 93910.0, 133610.0, 183842.0, 244301.0, 308607.0, 368848.0, 414735.0, 428020.0, 406584.0, 358289.0, 295129.0, 231374.0, 173626.0, 123943.0, 87170.0, 58512.0, 38970.0, 24737.0, 15667.0, 9800.0, 6041.0, 3880.0, 2276.0, 1321.0, 810.0, 567.0, 329.0, 183.0, 123.0, 89.0, 63.0, 39.0, 15.0, 9.0, 3.0, 0.0, 0.0, 2.0], "bins": [-13.0703125, -12.678955078125, -12.28759765625, -11.896240234375, -11.5048828125, -11.113525390625, -10.72216796875, -10.330810546875, -9.939453125, -9.548095703125, -9.15673828125, -8.765380859375, -8.3740234375, -7.982666015625, -7.59130859375, -7.199951171875, -6.80859375, -6.417236328125, -6.02587890625, -5.634521484375, -5.2431640625, -4.851806640625, -4.46044921875, -4.069091796875, -3.677734375, -3.286376953125, -2.89501953125, -2.503662109375, -2.1123046875, -1.720947265625, -1.32958984375, -0.938232421875, -0.546875, -0.155517578125, 0.23583984375, 0.627197265625, 1.0185546875, 1.409912109375, 1.80126953125, 2.192626953125, 2.583984375, 2.975341796875, 3.36669921875, 3.758056640625, 4.1494140625, 4.540771484375, 4.93212890625, 5.323486328125, 5.71484375, 6.106201171875, 6.49755859375, 6.888916015625, 7.2802734375, 7.671630859375, 8.06298828125, 8.454345703125, 8.845703125, 9.237060546875, 9.62841796875, 10.019775390625, 10.4111328125, 10.802490234375, 11.19384765625, 11.585205078125, 11.9765625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 3.0, 4.0, 8.0, 9.0, 4.0, 11.0, 16.0, 13.0, 14.0, 22.0, 30.0, 43.0, 55.0, 52.0, 61.0, 68.0, 83.0, 94.0, 125.0, 112.0, 158.0, 162.0, 180.0, 188.0, 216.0, 207.0, 198.0, 213.0, 200.0, 202.0, 184.0, 181.0, 149.0, 123.0, 103.0, 83.0, 92.0, 87.0, 60.0, 42.0, 50.0, 40.0, 26.0, 16.0, 13.0, 21.0, 18.0, 10.0, 5.0, 5.0, 7.0, 4.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3203125, -6.1033935546875, -5.886474609375, -5.6695556640625, -5.45263671875, -5.2357177734375, -5.018798828125, -4.8018798828125, -4.5849609375, -4.3680419921875, -4.151123046875, -3.9342041015625, -3.71728515625, -3.5003662109375, -3.283447265625, -3.0665283203125, -2.849609375, -2.6326904296875, -2.415771484375, -2.1988525390625, -1.98193359375, -1.7650146484375, -1.548095703125, -1.3311767578125, -1.1142578125, -0.8973388671875, -0.680419921875, -0.4635009765625, -0.24658203125, -0.0296630859375, 0.187255859375, 0.4041748046875, 0.62109375, 0.8380126953125, 1.054931640625, 1.2718505859375, 1.48876953125, 1.7056884765625, 1.922607421875, 2.1395263671875, 2.3564453125, 2.5733642578125, 2.790283203125, 3.0072021484375, 3.22412109375, 3.4410400390625, 3.657958984375, 3.8748779296875, 4.091796875, 4.3087158203125, 4.525634765625, 4.7425537109375, 4.95947265625, 5.1763916015625, 5.393310546875, 5.6102294921875, 5.8271484375, 6.0440673828125, 6.260986328125, 6.4779052734375, 6.69482421875, 6.9117431640625, 7.128662109375, 7.3455810546875, 7.5625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 2.0, 7.0, 2.0, 9.0, 8.0, 13.0, 11.0, 7.0, 19.0, 24.0, 28.0, 22.0, 22.0, 36.0, 33.0, 31.0, 41.0, 38.0, 35.0, 40.0, 37.0, 55.0, 40.0, 31.0, 43.0, 38.0, 26.0, 33.0, 31.0, 33.0, 30.0, 28.0, 13.0, 22.0, 11.0, 18.0, 18.0, 11.0, 11.0, 6.0, 5.0, 4.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-14.633525848388672, -14.15636920928955, -13.679213523864746, -13.202056884765625, -12.72490119934082, -12.2477445602417, -11.770587921142578, -11.293432235717773, -10.816275596618652, -10.339118957519531, -9.861963272094727, -9.384806632995605, -8.9076509475708, -8.43049430847168, -7.953338146209717, -7.476181983947754, -6.999025821685791, -6.521869659423828, -6.044713497161865, -5.567557334899902, -5.090400695800781, -4.613244533538818, -4.1360883712768555, -3.6589319705963135, -3.1817758083343506, -2.7046196460723877, -2.2274632453918457, -1.7503070831298828, -1.2731508016586304, -0.7959945201873779, -0.31883835792541504, 0.15831804275512695, 0.6354742050170898, 1.1126304864883423, 1.5897867679595947, 2.0669429302215576, 2.5440993309020996, 3.0212554931640625, 3.4984116554260254, 3.9755680561065674, 4.452724456787109, 4.929880619049072, 5.407036781311035, 5.884193420410156, 6.361349582672119, 6.838505744934082, 7.315661907196045, 7.792818069458008, 8.269973754882812, 8.747130393981934, 9.224286079406738, 9.70144271850586, 10.178598403930664, 10.655755043029785, 11.132911682128906, 11.610067367553711, 12.087224006652832, 12.564380645751953, 13.041536331176758, 13.518692970275879, 13.995848655700684, 14.473005294799805, 14.95016098022461, 15.42731761932373, 15.904474258422852]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 12.0, 15.0, 14.0, 11.0, 19.0, 21.0, 22.0, 27.0, 26.0, 21.0, 33.0, 34.0, 30.0, 30.0, 36.0, 37.0, 43.0, 47.0, 52.0, 37.0, 39.0, 20.0, 36.0, 28.0, 28.0, 44.0, 28.0, 18.0, 19.0, 18.0, 24.0, 23.0, 8.0, 19.0, 8.0, 8.0, 8.0, 11.0, 5.0, 7.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-17.379621505737305, -16.850271224975586, -16.3209228515625, -15.791572570800781, -15.262222290039062, -14.732872009277344, -14.203522682189941, -13.674173355102539, -13.14482307434082, -12.615472793579102, -12.0861234664917, -11.556774139404297, -11.027423858642578, -10.49807357788086, -9.968724250793457, -9.439374923706055, -8.910024642944336, -8.380674362182617, -7.851325035095215, -7.321975231170654, -6.792625427246094, -6.263275623321533, -5.733925819396973, -5.204576015472412, -4.675226211547852, -4.145876407623291, -3.6165266036987305, -3.08717679977417, -2.5578269958496094, -2.028477191925049, -1.4991273880004883, -0.9697775840759277, -0.4404258728027344, 0.08892393112182617, 0.6182737350463867, 1.1476235389709473, 1.6769733428955078, 2.2063231468200684, 2.735672950744629, 3.2650227546691895, 3.79437255859375, 4.3237223625183105, 4.853072166442871, 5.382421970367432, 5.911771774291992, 6.441121578216553, 6.970471382141113, 7.499821186065674, 8.029170989990234, 8.558521270751953, 9.087870597839355, 9.617219924926758, 10.146570205688477, 10.675920486450195, 11.205269813537598, 11.734619140625, 12.263969421386719, 12.793319702148438, 13.32266902923584, 13.852018356323242, 14.381368637084961, 14.91071891784668, 15.440068244934082, 15.969417572021484, 16.498767852783203]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 9.0, 12.0, 15.0, 22.0, 28.0, 57.0, 63.0, 110.0, 140.0, 239.0, 388.0, 568.0, 939.0, 1490.0, 2484.0, 4137.0, 7024.0, 11984.0, 21221.0, 37564.0, 66760.0, 117512.0, 189360.0, 217222.0, 156735.0, 91576.0, 52084.0, 28673.0, 16713.0, 9371.0, 5452.0, 3265.0, 2005.0, 1215.0, 752.0, 469.0, 318.0, 181.0, 146.0, 70.0, 51.0, 29.0, 31.0, 19.0, 11.0, 13.0, 7.0, 2.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-11.84375, -11.465087890625, -11.08642578125, -10.707763671875, -10.3291015625, -9.950439453125, -9.57177734375, -9.193115234375, -8.814453125, -8.435791015625, -8.05712890625, -7.678466796875, -7.2998046875, -6.921142578125, -6.54248046875, -6.163818359375, -5.78515625, -5.406494140625, -5.02783203125, -4.649169921875, -4.2705078125, -3.891845703125, -3.51318359375, -3.134521484375, -2.755859375, -2.377197265625, -1.99853515625, -1.619873046875, -1.2412109375, -0.862548828125, -0.48388671875, -0.105224609375, 0.2734375, 0.652099609375, 1.03076171875, 1.409423828125, 1.7880859375, 2.166748046875, 2.54541015625, 2.924072265625, 3.302734375, 3.681396484375, 4.06005859375, 4.438720703125, 4.8173828125, 5.196044921875, 5.57470703125, 5.953369140625, 6.33203125, 6.710693359375, 7.08935546875, 7.468017578125, 7.8466796875, 8.225341796875, 8.60400390625, 8.982666015625, 9.361328125, 9.739990234375, 10.11865234375, 10.497314453125, 10.8759765625, 11.254638671875, 11.63330078125, 12.011962890625, 12.390625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 0.0, 5.0, 4.0, 4.0, 2.0, 3.0, 4.0, 8.0, 13.0, 11.0, 15.0, 23.0, 17.0, 20.0, 21.0, 21.0, 20.0, 29.0, 29.0, 34.0, 34.0, 30.0, 41.0, 37.0, 36.0, 39.0, 48.0, 32.0, 47.0, 39.0, 26.0, 32.0, 25.0, 38.0, 28.0, 33.0, 20.0, 17.0, 15.0, 12.0, 20.0, 19.0, 11.0, 6.0, 11.0, 6.0, 6.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.9140625, -15.3829345703125, -14.851806640625, -14.3206787109375, -13.78955078125, -13.2584228515625, -12.727294921875, -12.1961669921875, -11.6650390625, -11.1339111328125, -10.602783203125, -10.0716552734375, -9.54052734375, -9.0093994140625, -8.478271484375, -7.9471435546875, -7.416015625, -6.8848876953125, -6.353759765625, -5.8226318359375, -5.29150390625, -4.7603759765625, -4.229248046875, -3.6981201171875, -3.1669921875, -2.6358642578125, -2.104736328125, -1.5736083984375, -1.04248046875, -0.5113525390625, 0.019775390625, 0.5509033203125, 1.08203125, 1.6131591796875, 2.144287109375, 2.6754150390625, 3.20654296875, 3.7376708984375, 4.268798828125, 4.7999267578125, 5.3310546875, 5.8621826171875, 6.393310546875, 6.9244384765625, 7.45556640625, 7.9866943359375, 8.517822265625, 9.0489501953125, 9.580078125, 10.1112060546875, 10.642333984375, 11.1734619140625, 11.70458984375, 12.2357177734375, 12.766845703125, 13.2979736328125, 13.8291015625, 14.3602294921875, 14.891357421875, 15.4224853515625, 15.95361328125, 16.4847412109375, 17.015869140625, 17.5469970703125, 18.078125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 6.0, 2.0, 6.0, 10.0, 13.0, 9.0, 10.0, 26.0, 34.0, 46.0, 68.0, 111.0, 200.0, 319.0, 593.0, 1160.0, 2352.0, 5131.0, 11936.0, 29128.0, 76099.0, 210708.0, 387292.0, 200859.0, 73256.0, 27843.0, 11510.0, 5016.0, 2326.0, 1064.0, 563.0, 344.0, 167.0, 102.0, 84.0, 50.0, 29.0, 24.0, 17.0, 14.0, 17.0, 3.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-17.25, -16.7896728515625, -16.329345703125, -15.8690185546875, -15.40869140625, -14.9483642578125, -14.488037109375, -14.0277099609375, -13.5673828125, -13.1070556640625, -12.646728515625, -12.1864013671875, -11.72607421875, -11.2657470703125, -10.805419921875, -10.3450927734375, -9.884765625, -9.4244384765625, -8.964111328125, -8.5037841796875, -8.04345703125, -7.5831298828125, -7.122802734375, -6.6624755859375, -6.2021484375, -5.7418212890625, -5.281494140625, -4.8211669921875, -4.36083984375, -3.9005126953125, -3.440185546875, -2.9798583984375, -2.51953125, -2.0592041015625, -1.598876953125, -1.1385498046875, -0.67822265625, -0.2178955078125, 0.242431640625, 0.7027587890625, 1.1630859375, 1.6234130859375, 2.083740234375, 2.5440673828125, 3.00439453125, 3.4647216796875, 3.925048828125, 4.3853759765625, 4.845703125, 5.3060302734375, 5.766357421875, 6.2266845703125, 6.68701171875, 7.1473388671875, 7.607666015625, 8.0679931640625, 8.5283203125, 8.9886474609375, 9.448974609375, 9.9093017578125, 10.36962890625, 10.8299560546875, 11.290283203125, 11.7506103515625, 12.2109375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 6.0, 5.0, 8.0, 12.0, 14.0, 10.0, 13.0, 12.0, 23.0, 25.0, 30.0, 29.0, 34.0, 29.0, 42.0, 45.0, 47.0, 55.0, 44.0, 46.0, 41.0, 33.0, 48.0, 38.0, 32.0, 26.0, 36.0, 20.0, 36.0, 26.0, 21.0, 22.0, 12.0, 12.0, 16.0, 8.0, 10.0, 15.0, 7.0, 5.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.328125, -11.9072265625, -11.486328125, -11.0654296875, -10.64453125, -10.2236328125, -9.802734375, -9.3818359375, -8.9609375, -8.5400390625, -8.119140625, -7.6982421875, -7.27734375, -6.8564453125, -6.435546875, -6.0146484375, -5.59375, -5.1728515625, -4.751953125, -4.3310546875, -3.91015625, -3.4892578125, -3.068359375, -2.6474609375, -2.2265625, -1.8056640625, -1.384765625, -0.9638671875, -0.54296875, -0.1220703125, 0.298828125, 0.7197265625, 1.140625, 1.5615234375, 1.982421875, 2.4033203125, 2.82421875, 3.2451171875, 3.666015625, 4.0869140625, 4.5078125, 4.9287109375, 5.349609375, 5.7705078125, 6.19140625, 6.6123046875, 7.033203125, 7.4541015625, 7.875, 8.2958984375, 8.716796875, 9.1376953125, 9.55859375, 9.9794921875, 10.400390625, 10.8212890625, 11.2421875, 11.6630859375, 12.083984375, 12.5048828125, 12.92578125, 13.3466796875, 13.767578125, 14.1884765625, 14.609375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 7.0, 8.0, 14.0, 13.0, 21.0, 22.0, 35.0, 59.0, 90.0, 116.0, 148.0, 210.0, 309.0, 496.0, 1137.0, 3343.0, 12524.0, 79186.0, 647749.0, 262064.0, 30704.0, 6296.0, 1991.0, 737.0, 396.0, 236.0, 169.0, 117.0, 118.0, 58.0, 58.0, 39.0, 25.0, 19.0, 12.0, 9.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.921875, -14.436767578125, -13.95166015625, -13.466552734375, -12.9814453125, -12.496337890625, -12.01123046875, -11.526123046875, -11.041015625, -10.555908203125, -10.07080078125, -9.585693359375, -9.1005859375, -8.615478515625, -8.13037109375, -7.645263671875, -7.16015625, -6.675048828125, -6.18994140625, -5.704833984375, -5.2197265625, -4.734619140625, -4.24951171875, -3.764404296875, -3.279296875, -2.794189453125, -2.30908203125, -1.823974609375, -1.3388671875, -0.853759765625, -0.36865234375, 0.116455078125, 0.6015625, 1.086669921875, 1.57177734375, 2.056884765625, 2.5419921875, 3.027099609375, 3.51220703125, 3.997314453125, 4.482421875, 4.967529296875, 5.45263671875, 5.937744140625, 6.4228515625, 6.907958984375, 7.39306640625, 7.878173828125, 8.36328125, 8.848388671875, 9.33349609375, 9.818603515625, 10.3037109375, 10.788818359375, 11.27392578125, 11.759033203125, 12.244140625, 12.729248046875, 13.21435546875, 13.699462890625, 14.1845703125, 14.669677734375, 15.15478515625, 15.639892578125, 16.125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 6.0, 12.0, 6.0, 21.0, 25.0, 42.0, 58.0, 77.0, 115.0, 140.0, 141.0, 89.0, 77.0, 63.0, 27.0, 30.0, 17.0, 13.0, 13.0, 6.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007505416870117188, -0.0007296130061149597, -0.0007086843252182007, -0.0006877556443214417, -0.0006668269634246826, -0.0006458982825279236, -0.0006249696016311646, -0.0006040409207344055, -0.0005831122398376465, -0.0005621835589408875, -0.0005412548780441284, -0.0005203261971473694, -0.0004993975162506104, -0.0004784688353538513, -0.0004575401544570923, -0.00043661147356033325, -0.0004156827926635742, -0.0003947541117668152, -0.00037382543087005615, -0.0003528967499732971, -0.0003319680690765381, -0.00031103938817977905, -0.00029011070728302, -0.000269182026386261, -0.00024825334548950195, -0.00022732466459274292, -0.0002063959836959839, -0.00018546730279922485, -0.00016453862190246582, -0.0001436099410057068, -0.00012268126010894775, -0.00010175257921218872, -8.082389831542969e-05, -5.9895217418670654e-05, -3.896653652191162e-05, -1.8037855625152588e-05, 2.8908252716064453e-06, 2.381950616836548e-05, 4.474818706512451e-05, 6.567686796188354e-05, 8.660554885864258e-05, 0.00010753422975540161, 0.00012846291065216064, 0.00014939159154891968, 0.0001703202724456787, 0.00019124895334243774, 0.00021217763423919678, 0.0002331063151359558, 0.00025403499603271484, 0.0002749636769294739, 0.0002958923578262329, 0.00031682103872299194, 0.000337749719619751, 0.00035867840051651, 0.00037960708141326904, 0.0004005357623100281, 0.0004214644432067871, 0.00044239312410354614, 0.0004633218050003052, 0.0004842504858970642, 0.0005051791667938232, 0.0005261078476905823, 0.0005470365285873413, 0.0005679652094841003, 0.0005888938903808594]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 11.0, 5.0, 10.0, 12.0, 10.0, 35.0, 40.0, 46.0, 61.0, 91.0, 113.0, 165.0, 198.0, 362.0, 507.0, 820.0, 1360.0, 2303.0, 4333.0, 8510.0, 17698.0, 37128.0, 80280.0, 177611.0, 319243.0, 213451.0, 96586.0, 44644.0, 20731.0, 10048.0, 5235.0, 2687.0, 1449.0, 931.0, 558.0, 371.0, 256.0, 183.0, 131.0, 102.0, 61.0, 56.0, 37.0, 21.0, 24.0, 16.0, 4.0, 8.0, 4.0, 5.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.4453125, -11.1048583984375, -10.764404296875, -10.4239501953125, -10.08349609375, -9.7430419921875, -9.402587890625, -9.0621337890625, -8.7216796875, -8.3812255859375, -8.040771484375, -7.7003173828125, -7.35986328125, -7.0194091796875, -6.678955078125, -6.3385009765625, -5.998046875, -5.6575927734375, -5.317138671875, -4.9766845703125, -4.63623046875, -4.2957763671875, -3.955322265625, -3.6148681640625, -3.2744140625, -2.9339599609375, -2.593505859375, -2.2530517578125, -1.91259765625, -1.5721435546875, -1.231689453125, -0.8912353515625, -0.55078125, -0.2103271484375, 0.130126953125, 0.4705810546875, 0.81103515625, 1.1514892578125, 1.491943359375, 1.8323974609375, 2.1728515625, 2.5133056640625, 2.853759765625, 3.1942138671875, 3.53466796875, 3.8751220703125, 4.215576171875, 4.5560302734375, 4.896484375, 5.2369384765625, 5.577392578125, 5.9178466796875, 6.25830078125, 6.5987548828125, 6.939208984375, 7.2796630859375, 7.6201171875, 7.9605712890625, 8.301025390625, 8.6414794921875, 8.98193359375, 9.3223876953125, 9.662841796875, 10.0032958984375, 10.34375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 6.0, 18.0, 15.0, 17.0, 17.0, 26.0, 27.0, 42.0, 39.0, 51.0, 54.0, 80.0, 44.0, 51.0, 70.0, 65.0, 59.0, 51.0, 49.0, 38.0, 32.0, 29.0, 26.0, 23.0, 18.0, 9.0, 7.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.39453125, -3.27288818359375, -3.1512451171875, -3.02960205078125, -2.907958984375, -2.78631591796875, -2.6646728515625, -2.54302978515625, -2.42138671875, -2.29974365234375, -2.1781005859375, -2.05645751953125, -1.934814453125, -1.81317138671875, -1.6915283203125, -1.56988525390625, -1.4482421875, -1.32659912109375, -1.2049560546875, -1.08331298828125, -0.961669921875, -0.84002685546875, -0.7183837890625, -0.59674072265625, -0.47509765625, -0.35345458984375, -0.2318115234375, -0.11016845703125, 0.011474609375, 0.13311767578125, 0.2547607421875, 0.37640380859375, 0.498046875, 0.61968994140625, 0.7413330078125, 0.86297607421875, 0.984619140625, 1.10626220703125, 1.2279052734375, 1.34954833984375, 1.47119140625, 1.59283447265625, 1.7144775390625, 1.83612060546875, 1.957763671875, 2.07940673828125, 2.2010498046875, 2.32269287109375, 2.4443359375, 2.56597900390625, 2.6876220703125, 2.80926513671875, 2.930908203125, 3.05255126953125, 3.1741943359375, 3.29583740234375, 3.41748046875, 3.53912353515625, 3.6607666015625, 3.78240966796875, 3.904052734375, 4.02569580078125, 4.1473388671875, 4.26898193359375, 4.390625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 4.0, 1.0, 8.0, 7.0, 8.0, 8.0, 8.0, 14.0, 24.0, 18.0, 27.0, 28.0, 21.0, 35.0, 27.0, 39.0, 31.0, 44.0, 54.0, 49.0, 46.0, 35.0, 41.0, 39.0, 46.0, 39.0, 31.0, 30.0, 26.0, 36.0, 32.0, 26.0, 17.0, 16.0, 19.0, 18.0, 7.0, 11.0, 5.0, 4.0, 6.0, 6.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-15.191408157348633, -14.68614673614502, -14.180885314941406, -13.675623893737793, -13.17036247253418, -12.665101051330566, -12.159839630126953, -11.65457820892334, -11.149316787719727, -10.644055366516113, -10.1387939453125, -9.633532524108887, -9.128271102905273, -8.62300968170166, -8.117748260498047, -7.612486839294434, -7.10722541809082, -6.601963996887207, -6.096702575683594, -5.5914411544799805, -5.086179733276367, -4.580918312072754, -4.075656890869141, -3.5703954696655273, -3.065134048461914, -2.559872627258301, -2.0546112060546875, -1.5493497848510742, -1.044088363647461, -0.5388269424438477, -0.033565521240234375, 0.4716958999633789, 0.9769554138183594, 1.4822168350219727, 1.987478256225586, 2.492739677429199, 2.9980010986328125, 3.503262519836426, 4.008523941040039, 4.513785362243652, 5.019046783447266, 5.524308204650879, 6.029569625854492, 6.5348310470581055, 7.040092468261719, 7.545353889465332, 8.050615310668945, 8.555876731872559, 9.061138153076172, 9.566399574279785, 10.071660995483398, 10.576922416687012, 11.082183837890625, 11.587445259094238, 12.092706680297852, 12.597968101501465, 13.103229522705078, 13.608490943908691, 14.113752365112305, 14.619013786315918, 15.124275207519531, 15.629536628723145, 16.134798049926758, 16.640060424804688, 17.145320892333984]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 8.0, 11.0, 9.0, 13.0, 12.0, 5.0, 23.0, 17.0, 17.0, 25.0, 19.0, 31.0, 25.0, 26.0, 26.0, 36.0, 29.0, 40.0, 43.0, 39.0, 45.0, 36.0, 47.0, 41.0, 29.0, 44.0, 24.0, 29.0, 25.0, 27.0, 26.0, 28.0, 11.0, 25.0, 19.0, 19.0, 12.0, 7.0, 9.0, 15.0, 7.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-18.01759910583496, -17.4824275970459, -16.94725799560547, -16.412086486816406, -15.876914978027344, -15.341743469238281, -14.806572914123535, -14.271402359008789, -13.736230850219727, -13.201059341430664, -12.665888786315918, -12.130718231201172, -11.59554672241211, -11.060375213623047, -10.5252046585083, -9.990034103393555, -9.454862594604492, -8.91969108581543, -8.384520530700684, -7.849349498748779, -7.314178466796875, -6.779007434844971, -6.243836402893066, -5.708665370941162, -5.173494338989258, -4.6383233070373535, -4.103152275085449, -3.567981243133545, -3.0328102111816406, -2.4976391792297363, -1.962468147277832, -1.4272971153259277, -0.8921241760253906, -0.35695314407348633, 0.17821788787841797, 0.7133889198303223, 1.2485599517822266, 1.7837309837341309, 2.318902015686035, 2.8540730476379395, 3.3892440795898438, 3.924415111541748, 4.459586143493652, 4.994757175445557, 5.529928207397461, 6.065099239349365, 6.6002702713012695, 7.135441303253174, 7.670612335205078, 8.20578384399414, 8.740954399108887, 9.276124954223633, 9.811296463012695, 10.346467971801758, 10.881638526916504, 11.41680908203125, 11.951980590820312, 12.487152099609375, 13.022322654724121, 13.557493209838867, 14.09266471862793, 14.627836227416992, 15.163006782531738, 15.698177337646484, 16.233348846435547]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 8.0, 17.0, 25.0, 42.0, 75.0, 134.0, 208.0, 302.0, 520.0, 850.0, 1348.0, 2232.0, 3681.0, 5773.0, 9318.0, 14244.0, 22334.0, 32840.0, 47672.0, 65535.0, 85746.0, 103319.0, 115348.0, 115367.0, 106494.0, 89810.0, 70233.0, 51480.0, 36157.0, 24276.0, 16065.0, 10145.0, 6491.0, 4068.0, 2467.0, 1583.0, 953.0, 556.0, 327.0, 205.0, 127.0, 80.0, 41.0, 20.0, 18.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.5546875, -15.0703125, -14.5859375, -14.1015625, -13.6171875, -13.1328125, -12.6484375, -12.1640625, -11.6796875, -11.1953125, -10.7109375, -10.2265625, -9.7421875, -9.2578125, -8.7734375, -8.2890625, -7.8046875, -7.3203125, -6.8359375, -6.3515625, -5.8671875, -5.3828125, -4.8984375, -4.4140625, -3.9296875, -3.4453125, -2.9609375, -2.4765625, -1.9921875, -1.5078125, -1.0234375, -0.5390625, -0.0546875, 0.4296875, 0.9140625, 1.3984375, 1.8828125, 2.3671875, 2.8515625, 3.3359375, 3.8203125, 4.3046875, 4.7890625, 5.2734375, 5.7578125, 6.2421875, 6.7265625, 7.2109375, 7.6953125, 8.1796875, 8.6640625, 9.1484375, 9.6328125, 10.1171875, 10.6015625, 11.0859375, 11.5703125, 12.0546875, 12.5390625, 13.0234375, 13.5078125, 13.9921875, 14.4765625, 14.9609375, 15.4453125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 7.0, 5.0, 9.0, 8.0, 9.0, 15.0, 16.0, 15.0, 24.0, 18.0, 25.0, 24.0, 26.0, 22.0, 25.0, 26.0, 28.0, 31.0, 46.0, 39.0, 38.0, 36.0, 43.0, 31.0, 48.0, 40.0, 29.0, 34.0, 26.0, 23.0, 19.0, 29.0, 24.0, 20.0, 17.0, 20.0, 16.0, 17.0, 22.0, 15.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.859375, -15.359375, -14.859375, -14.359375, -13.859375, -13.359375, -12.859375, -12.359375, -11.859375, -11.359375, -10.859375, -10.359375, -9.859375, -9.359375, -8.859375, -8.359375, -7.859375, -7.359375, -6.859375, -6.359375, -5.859375, -5.359375, -4.859375, -4.359375, -3.859375, -3.359375, -2.859375, -2.359375, -1.859375, -1.359375, -0.859375, -0.359375, 0.140625, 0.640625, 1.140625, 1.640625, 2.140625, 2.640625, 3.140625, 3.640625, 4.140625, 4.640625, 5.140625, 5.640625, 6.140625, 6.640625, 7.140625, 7.640625, 8.140625, 8.640625, 9.140625, 9.640625, 10.140625, 10.640625, 11.140625, 11.640625, 12.140625, 12.640625, 13.140625, 13.640625, 14.140625, 14.640625, 15.140625, 15.640625, 16.140625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 18.0, 28.0, 41.0, 63.0, 92.0, 149.0, 220.0, 324.0, 506.0, 769.0, 1162.0, 1838.0, 2857.0, 4306.0, 6860.0, 10459.0, 15960.0, 24485.0, 35644.0, 51018.0, 69939.0, 90208.0, 107619.0, 117135.0, 114920.0, 102712.0, 84996.0, 64003.0, 46405.0, 32207.0, 21478.0, 14071.0, 9044.0, 6065.0, 3904.0, 2519.0, 1589.0, 1018.0, 646.0, 432.0, 281.0, 172.0, 136.0, 88.0, 64.0, 36.0, 28.0, 17.0, 6.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.0, -16.46630859375, -15.9326171875, -15.39892578125, -14.865234375, -14.33154296875, -13.7978515625, -13.26416015625, -12.73046875, -12.19677734375, -11.6630859375, -11.12939453125, -10.595703125, -10.06201171875, -9.5283203125, -8.99462890625, -8.4609375, -7.92724609375, -7.3935546875, -6.85986328125, -6.326171875, -5.79248046875, -5.2587890625, -4.72509765625, -4.19140625, -3.65771484375, -3.1240234375, -2.59033203125, -2.056640625, -1.52294921875, -0.9892578125, -0.45556640625, 0.078125, 0.61181640625, 1.1455078125, 1.67919921875, 2.212890625, 2.74658203125, 3.2802734375, 3.81396484375, 4.34765625, 4.88134765625, 5.4150390625, 5.94873046875, 6.482421875, 7.01611328125, 7.5498046875, 8.08349609375, 8.6171875, 9.15087890625, 9.6845703125, 10.21826171875, 10.751953125, 11.28564453125, 11.8193359375, 12.35302734375, 12.88671875, 13.42041015625, 13.9541015625, 14.48779296875, 15.021484375, 15.55517578125, 16.0888671875, 16.62255859375, 17.15625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 2.0, 6.0, 7.0, 10.0, 9.0, 7.0, 21.0, 16.0, 22.0, 23.0, 18.0, 30.0, 34.0, 29.0, 24.0, 38.0, 40.0, 19.0, 40.0, 39.0, 43.0, 37.0, 41.0, 35.0, 44.0, 36.0, 32.0, 26.0, 32.0, 35.0, 21.0, 21.0, 19.0, 17.0, 31.0, 15.0, 14.0, 11.0, 8.0, 8.0, 5.0, 10.0, 4.0, 5.0, 1.0, 3.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4765625, -11.086669921875, -10.69677734375, -10.306884765625, -9.9169921875, -9.527099609375, -9.13720703125, -8.747314453125, -8.357421875, -7.967529296875, -7.57763671875, -7.187744140625, -6.7978515625, -6.407958984375, -6.01806640625, -5.628173828125, -5.23828125, -4.848388671875, -4.45849609375, -4.068603515625, -3.6787109375, -3.288818359375, -2.89892578125, -2.509033203125, -2.119140625, -1.729248046875, -1.33935546875, -0.949462890625, -0.5595703125, -0.169677734375, 0.22021484375, 0.610107421875, 1.0, 1.389892578125, 1.77978515625, 2.169677734375, 2.5595703125, 2.949462890625, 3.33935546875, 3.729248046875, 4.119140625, 4.509033203125, 4.89892578125, 5.288818359375, 5.6787109375, 6.068603515625, 6.45849609375, 6.848388671875, 7.23828125, 7.628173828125, 8.01806640625, 8.407958984375, 8.7978515625, 9.187744140625, 9.57763671875, 9.967529296875, 10.357421875, 10.747314453125, 11.13720703125, 11.527099609375, 11.9169921875, 12.306884765625, 12.69677734375, 13.086669921875, 13.4765625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 5.0, 5.0, 13.0, 13.0, 18.0, 24.0, 27.0, 31.0, 50.0, 65.0, 121.0, 177.0, 268.0, 329.0, 555.0, 862.0, 1515.0, 2622.0, 5241.0, 10409.0, 24149.0, 61650.0, 171397.0, 329506.0, 263102.0, 105373.0, 38638.0, 16120.0, 7422.0, 3641.0, 1993.0, 1124.0, 733.0, 417.0, 283.0, 195.0, 137.0, 80.0, 58.0, 57.0, 41.0, 17.0, 27.0, 14.0, 9.0, 11.0, 3.0, 3.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.625, -24.8427734375, -24.060546875, -23.2783203125, -22.49609375, -21.7138671875, -20.931640625, -20.1494140625, -19.3671875, -18.5849609375, -17.802734375, -17.0205078125, -16.23828125, -15.4560546875, -14.673828125, -13.8916015625, -13.109375, -12.3271484375, -11.544921875, -10.7626953125, -9.98046875, -9.1982421875, -8.416015625, -7.6337890625, -6.8515625, -6.0693359375, -5.287109375, -4.5048828125, -3.72265625, -2.9404296875, -2.158203125, -1.3759765625, -0.59375, 0.1884765625, 0.970703125, 1.7529296875, 2.53515625, 3.3173828125, 4.099609375, 4.8818359375, 5.6640625, 6.4462890625, 7.228515625, 8.0107421875, 8.79296875, 9.5751953125, 10.357421875, 11.1396484375, 11.921875, 12.7041015625, 13.486328125, 14.2685546875, 15.05078125, 15.8330078125, 16.615234375, 17.3974609375, 18.1796875, 18.9619140625, 19.744140625, 20.5263671875, 21.30859375, 22.0908203125, 22.873046875, 23.6552734375, 24.4375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 15.0, 17.0, 23.0, 38.0, 69.0, 77.0, 133.0, 104.0, 103.0, 113.0, 80.0, 67.0, 37.0, 31.0, 19.0, 13.0, 12.0, 3.0, 7.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00255584716796875, -0.002475738525390625, -0.0023956298828125, -0.002315521240234375, -0.00223541259765625, -0.002155303955078125, -0.0020751953125, -0.001995086669921875, -0.00191497802734375, -0.001834869384765625, -0.0017547607421875, -0.001674652099609375, -0.00159454345703125, -0.001514434814453125, -0.001434326171875, -0.001354217529296875, -0.00127410888671875, -0.001194000244140625, -0.0011138916015625, -0.001033782958984375, -0.00095367431640625, -0.000873565673828125, -0.00079345703125, -0.000713348388671875, -0.00063323974609375, -0.000553131103515625, -0.0004730224609375, -0.000392913818359375, -0.00031280517578125, -0.000232696533203125, -0.000152587890625, -7.2479248046875e-05, 7.62939453125e-06, 8.7738037109375e-05, 0.0001678466796875, 0.000247955322265625, 0.00032806396484375, 0.000408172607421875, 0.00048828125, 0.000568389892578125, 0.00064849853515625, 0.000728607177734375, 0.0008087158203125, 0.000888824462890625, 0.00096893310546875, 0.001049041748046875, 0.001129150390625, 0.001209259033203125, 0.00128936767578125, 0.001369476318359375, 0.0014495849609375, 0.001529693603515625, 0.00160980224609375, 0.001689910888671875, 0.00177001953125, 0.001850128173828125, 0.00193023681640625, 0.002010345458984375, 0.0020904541015625, 0.002170562744140625, 0.00225067138671875, 0.002330780029296875, 0.002410888671875, 0.002490997314453125, 0.00257110595703125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 9.0, 17.0, 13.0, 23.0, 41.0, 63.0, 89.0, 127.0, 149.0, 263.0, 400.0, 593.0, 876.0, 1447.0, 2127.0, 3512.0, 5854.0, 10181.0, 18229.0, 33745.0, 61770.0, 104284.0, 155482.0, 184208.0, 170090.0, 122938.0, 75888.0, 42212.0, 22685.0, 12529.0, 7075.0, 4365.0, 2517.0, 1613.0, 1045.0, 685.0, 463.0, 309.0, 205.0, 136.0, 87.0, 71.0, 49.0, 30.0, 23.0, 13.0, 10.0, 10.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2578125, -10.8785400390625, -10.499267578125, -10.1199951171875, -9.74072265625, -9.3614501953125, -8.982177734375, -8.6029052734375, -8.2236328125, -7.8443603515625, -7.465087890625, -7.0858154296875, -6.70654296875, -6.3272705078125, -5.947998046875, -5.5687255859375, -5.189453125, -4.8101806640625, -4.430908203125, -4.0516357421875, -3.67236328125, -3.2930908203125, -2.913818359375, -2.5345458984375, -2.1552734375, -1.7760009765625, -1.396728515625, -1.0174560546875, -0.63818359375, -0.2589111328125, 0.120361328125, 0.4996337890625, 0.87890625, 1.2581787109375, 1.637451171875, 2.0167236328125, 2.39599609375, 2.7752685546875, 3.154541015625, 3.5338134765625, 3.9130859375, 4.2923583984375, 4.671630859375, 5.0509033203125, 5.43017578125, 5.8094482421875, 6.188720703125, 6.5679931640625, 6.947265625, 7.3265380859375, 7.705810546875, 8.0850830078125, 8.46435546875, 8.8436279296875, 9.222900390625, 9.6021728515625, 9.9814453125, 10.3607177734375, 10.739990234375, 11.1192626953125, 11.49853515625, 11.8778076171875, 12.257080078125, 12.6363525390625, 13.015625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 4.0, 7.0, 5.0, 9.0, 12.0, 22.0, 22.0, 25.0, 36.0, 36.0, 51.0, 55.0, 60.0, 64.0, 73.0, 68.0, 61.0, 53.0, 68.0, 53.0, 55.0, 30.0, 29.0, 21.0, 17.0, 16.0, 7.0, 7.0, 7.0, 8.0, 5.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.81365966796875, -5.6429443359375, -5.47222900390625, -5.301513671875, -5.13079833984375, -4.9600830078125, -4.78936767578125, -4.61865234375, -4.44793701171875, -4.2772216796875, -4.10650634765625, -3.935791015625, -3.76507568359375, -3.5943603515625, -3.42364501953125, -3.2529296875, -3.08221435546875, -2.9114990234375, -2.74078369140625, -2.570068359375, -2.39935302734375, -2.2286376953125, -2.05792236328125, -1.88720703125, -1.71649169921875, -1.5457763671875, -1.37506103515625, -1.204345703125, -1.03363037109375, -0.8629150390625, -0.69219970703125, -0.521484375, -0.35076904296875, -0.1800537109375, -0.00933837890625, 0.161376953125, 0.33209228515625, 0.5028076171875, 0.67352294921875, 0.84423828125, 1.01495361328125, 1.1856689453125, 1.35638427734375, 1.527099609375, 1.69781494140625, 1.8685302734375, 2.03924560546875, 2.2099609375, 2.38067626953125, 2.5513916015625, 2.72210693359375, 2.892822265625, 3.06353759765625, 3.2342529296875, 3.40496826171875, 3.57568359375, 3.74639892578125, 3.9171142578125, 4.08782958984375, 4.258544921875, 4.42926025390625, 4.5999755859375, 4.77069091796875, 4.94140625]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 6.0, 13.0, 5.0, 8.0, 11.0, 4.0, 5.0, 16.0, 20.0, 22.0, 20.0, 17.0, 20.0, 32.0, 28.0, 34.0, 35.0, 34.0, 38.0, 29.0, 52.0, 35.0, 35.0, 42.0, 40.0, 50.0, 45.0, 27.0, 28.0, 29.0, 38.0, 29.0, 17.0, 13.0, 13.0, 13.0, 18.0, 10.0, 14.0, 11.0, 11.0, 12.0, 2.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.307159423828125, -14.824515342712402, -14.34187126159668, -13.859227180480957, -13.376583099365234, -12.893939018249512, -12.411294937133789, -11.928650856018066, -11.446006774902344, -10.963362693786621, -10.480718612670898, -9.998074531555176, -9.515430450439453, -9.03278636932373, -8.550142288208008, -8.067498207092285, -7.584853649139404, -7.102209568023682, -6.619565486907959, -6.136921405792236, -5.654277324676514, -5.171632766723633, -4.68898868560791, -4.2063446044921875, -3.723700761795044, -3.2410566806793213, -2.7584125995635986, -2.275768280029297, -1.7931243181228638, -1.3104801177978516, -0.8278360366821289, -0.34519195556640625, 0.1374521255493164, 0.6200962066650391, 1.1027402877807617, 1.585384488105774, 2.068028450012207, 2.550672769546509, 3.0333168506622314, 3.515960931777954, 3.9986050128936768, 4.4812493324279785, 4.963893413543701, 5.446537494659424, 5.9291815757751465, 6.411825656890869, 6.894469738006592, 7.3771138191223145, 7.859757900238037, 8.342402458190918, 8.82504653930664, 9.307690620422363, 9.790334701538086, 10.272978782653809, 10.755622863769531, 11.238266944885254, 11.720911026000977, 12.2035551071167, 12.686199188232422, 13.168843269348145, 13.651487350463867, 14.13413143157959, 14.616775512695312, 15.099419593811035, 15.582063674926758]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 9.0, 1.0, 13.0, 10.0, 9.0, 14.0, 12.0, 23.0, 14.0, 27.0, 26.0, 33.0, 25.0, 31.0, 44.0, 40.0, 49.0, 39.0, 47.0, 45.0, 48.0, 42.0, 37.0, 31.0, 44.0, 42.0, 39.0, 38.0, 31.0, 20.0, 20.0, 22.0, 19.0, 15.0, 14.0, 8.0, 7.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.076461791992188, -18.39020538330078, -17.703948974609375, -17.01769256591797, -16.331436157226562, -15.645180702209473, -14.958925247192383, -14.272668838500977, -13.58641242980957, -12.900156021118164, -12.213899612426758, -11.527644157409668, -10.841387748718262, -10.155131340026855, -9.468875885009766, -8.78261947631836, -8.096363067626953, -7.410106658935547, -6.723850727081299, -6.037594795227051, -5.3513383865356445, -4.665081977844238, -3.9788260459899902, -3.292570114135742, -2.606313705444336, -1.9200575351715088, -1.2338013648986816, -0.5475451946258545, 0.13871097564697266, 0.8249671459197998, 1.511223316192627, 2.197479248046875, 2.8837356567382812, 3.5699918270111084, 4.2562479972839355, 4.942503929138184, 5.62876033782959, 6.315016746520996, 7.001272678375244, 7.687528610229492, 8.373785018920898, 9.060041427612305, 9.746297836303711, 10.4325532913208, 11.118809700012207, 11.805066108703613, 12.491321563720703, 13.17757797241211, 13.863834381103516, 14.550090789794922, 15.236347198486328, 15.922602653503418, 16.60886001586914, 17.295114517211914, 17.98137092590332, 18.667627334594727, 19.353883743286133, 20.04014015197754, 20.726396560668945, 21.41265296936035, 22.098907470703125, 22.78516387939453, 23.471420288085938, 24.157676696777344, 24.84393310546875]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 3.0, 9.0, 13.0, 21.0, 33.0, 55.0, 105.0, 150.0, 255.0, 362.0, 582.0, 914.0, 1415.0, 2164.0, 3632.0, 5642.0, 8974.0, 13668.0, 21232.0, 32938.0, 50126.0, 74998.0, 110886.0, 158930.0, 223181.0, 300388.0, 381633.0, 451580.0, 482308.0, 455739.0, 390037.0, 306778.0, 228894.0, 164119.0, 112403.0, 76349.0, 49517.0, 31853.0, 20132.0, 12485.0, 7719.0, 4752.0, 2876.0, 1748.0, 1048.0, 665.0, 417.0, 193.0, 155.0, 89.0, 46.0, 29.0, 20.0, 16.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-16.09375, -15.582763671875, -15.07177734375, -14.560791015625, -14.0498046875, -13.538818359375, -13.02783203125, -12.516845703125, -12.005859375, -11.494873046875, -10.98388671875, -10.472900390625, -9.9619140625, -9.450927734375, -8.93994140625, -8.428955078125, -7.91796875, -7.406982421875, -6.89599609375, -6.385009765625, -5.8740234375, -5.363037109375, -4.85205078125, -4.341064453125, -3.830078125, -3.319091796875, -2.80810546875, -2.297119140625, -1.7861328125, -1.275146484375, -0.76416015625, -0.253173828125, 0.2578125, 0.768798828125, 1.27978515625, 1.790771484375, 2.3017578125, 2.812744140625, 3.32373046875, 3.834716796875, 4.345703125, 4.856689453125, 5.36767578125, 5.878662109375, 6.3896484375, 6.900634765625, 7.41162109375, 7.922607421875, 8.43359375, 8.944580078125, 9.45556640625, 9.966552734375, 10.4775390625, 10.988525390625, 11.49951171875, 12.010498046875, 12.521484375, 13.032470703125, 13.54345703125, 14.054443359375, 14.5654296875, 15.076416015625, 15.58740234375, 16.098388671875, 16.609375]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 8.0, 8.0, 7.0, 9.0, 10.0, 14.0, 14.0, 19.0, 28.0, 24.0, 26.0, 32.0, 30.0, 37.0, 47.0, 36.0, 41.0, 46.0, 47.0, 38.0, 49.0, 56.0, 38.0, 39.0, 46.0, 29.0, 33.0, 31.0, 32.0, 23.0, 26.0, 10.0, 14.0, 14.0, 13.0, 3.0, 7.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.359375, -17.765869140625, -17.17236328125, -16.578857421875, -15.9853515625, -15.391845703125, -14.79833984375, -14.204833984375, -13.611328125, -13.017822265625, -12.42431640625, -11.830810546875, -11.2373046875, -10.643798828125, -10.05029296875, -9.456787109375, -8.86328125, -8.269775390625, -7.67626953125, -7.082763671875, -6.4892578125, -5.895751953125, -5.30224609375, -4.708740234375, -4.115234375, -3.521728515625, -2.92822265625, -2.334716796875, -1.7412109375, -1.147705078125, -0.55419921875, 0.039306640625, 0.6328125, 1.226318359375, 1.81982421875, 2.413330078125, 3.0068359375, 3.600341796875, 4.19384765625, 4.787353515625, 5.380859375, 5.974365234375, 6.56787109375, 7.161376953125, 7.7548828125, 8.348388671875, 8.94189453125, 9.535400390625, 10.12890625, 10.722412109375, 11.31591796875, 11.909423828125, 12.5029296875, 13.096435546875, 13.68994140625, 14.283447265625, 14.876953125, 15.470458984375, 16.06396484375, 16.657470703125, 17.2509765625, 17.844482421875, 18.43798828125, 19.031494140625, 19.625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 4.0, 12.0, 13.0, 29.0, 54.0, 69.0, 111.0, 167.0, 307.0, 451.0, 731.0, 1215.0, 1954.0, 3183.0, 5256.0, 8240.0, 13806.0, 21694.0, 35273.0, 55550.0, 85371.0, 128439.0, 183807.0, 251364.0, 327328.0, 399074.0, 453339.0, 465420.0, 430268.0, 365590.0, 290187.0, 217664.0, 154479.0, 105709.0, 70043.0, 44498.0, 28240.0, 17433.0, 10649.0, 6708.0, 4020.0, 2479.0, 1535.0, 1022.0, 577.0, 362.0, 214.0, 135.0, 85.0, 52.0, 25.0, 26.0, 8.0, 10.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.140625, -15.607177734375, -15.07373046875, -14.540283203125, -14.0068359375, -13.473388671875, -12.93994140625, -12.406494140625, -11.873046875, -11.339599609375, -10.80615234375, -10.272705078125, -9.7392578125, -9.205810546875, -8.67236328125, -8.138916015625, -7.60546875, -7.072021484375, -6.53857421875, -6.005126953125, -5.4716796875, -4.938232421875, -4.40478515625, -3.871337890625, -3.337890625, -2.804443359375, -2.27099609375, -1.737548828125, -1.2041015625, -0.670654296875, -0.13720703125, 0.396240234375, 0.9296875, 1.463134765625, 1.99658203125, 2.530029296875, 3.0634765625, 3.596923828125, 4.13037109375, 4.663818359375, 5.197265625, 5.730712890625, 6.26416015625, 6.797607421875, 7.3310546875, 7.864501953125, 8.39794921875, 8.931396484375, 9.46484375, 9.998291015625, 10.53173828125, 11.065185546875, 11.5986328125, 12.132080078125, 12.66552734375, 13.198974609375, 13.732421875, 14.265869140625, 14.79931640625, 15.332763671875, 15.8662109375, 16.399658203125, 16.93310546875, 17.466552734375, 18.0]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 9.0, 17.0, 9.0, 21.0, 17.0, 34.0, 35.0, 31.0, 47.0, 61.0, 60.0, 78.0, 84.0, 101.0, 107.0, 147.0, 154.0, 181.0, 163.0, 172.0, 183.0, 199.0, 209.0, 176.0, 208.0, 177.0, 176.0, 176.0, 135.0, 121.0, 124.0, 105.0, 92.0, 67.0, 68.0, 53.0, 49.0, 40.0, 36.0, 24.0, 32.0, 19.0, 21.0, 20.0, 7.0, 8.0, 6.0, 4.0, 4.0, 4.0, 1.0], "bins": [-10.3671875, -10.075439453125, -9.78369140625, -9.491943359375, -9.2001953125, -8.908447265625, -8.61669921875, -8.324951171875, -8.033203125, -7.741455078125, -7.44970703125, -7.157958984375, -6.8662109375, -6.574462890625, -6.28271484375, -5.990966796875, -5.69921875, -5.407470703125, -5.11572265625, -4.823974609375, -4.5322265625, -4.240478515625, -3.94873046875, -3.656982421875, -3.365234375, -3.073486328125, -2.78173828125, -2.489990234375, -2.1982421875, -1.906494140625, -1.61474609375, -1.322998046875, -1.03125, -0.739501953125, -0.44775390625, -0.156005859375, 0.1357421875, 0.427490234375, 0.71923828125, 1.010986328125, 1.302734375, 1.594482421875, 1.88623046875, 2.177978515625, 2.4697265625, 2.761474609375, 3.05322265625, 3.344970703125, 3.63671875, 3.928466796875, 4.22021484375, 4.511962890625, 4.8037109375, 5.095458984375, 5.38720703125, 5.678955078125, 5.970703125, 6.262451171875, 6.55419921875, 6.845947265625, 7.1376953125, 7.429443359375, 7.72119140625, 8.012939453125, 8.3046875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 7.0, 8.0, 10.0, 10.0, 16.0, 12.0, 19.0, 29.0, 27.0, 26.0, 26.0, 42.0, 36.0, 43.0, 44.0, 46.0, 45.0, 46.0, 50.0, 28.0, 40.0, 38.0, 39.0, 45.0, 39.0, 33.0, 26.0, 31.0, 26.0, 20.0, 19.0, 10.0, 11.0, 7.0, 6.0, 14.0, 2.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.349048614501953, -19.656740188598633, -18.96442985534668, -18.27212142944336, -17.57981300354004, -16.88750457763672, -16.195194244384766, -15.502885818481445, -14.810576438903809, -14.118267059326172, -13.425958633422852, -12.733649253845215, -12.041339874267578, -11.349031448364258, -10.656722068786621, -9.964412689208984, -9.272104263305664, -8.579794883728027, -7.887486457824707, -7.19517707824707, -6.502868175506592, -5.810559272766113, -5.118249893188477, -4.425940990447998, -3.7336320877075195, -3.041323184967041, -2.3490140438079834, -1.6567049026489258, -0.9643959999084473, -0.27208709716796875, 0.42022228240966797, 1.1125311851501465, 1.804840087890625, 2.4971489906311035, 3.189458131790161, 3.8817672729492188, 4.574076175689697, 5.266385078430176, 5.9586944580078125, 6.651003360748291, 7.3433122634887695, 8.035621643066406, 8.727930068969727, 9.420239448547363, 10.112548828125, 10.80485725402832, 11.497166633605957, 12.189476013183594, 12.881784439086914, 13.57409381866455, 14.266402244567871, 14.958711624145508, 15.651020050048828, 16.34333038330078, 17.0356388092041, 17.727947235107422, 18.420257568359375, 19.112565994262695, 19.80487632751465, 20.49718475341797, 21.18949317932129, 21.88180160522461, 22.574111938476562, 23.266420364379883, 23.958728790283203]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 3.0, 5.0, 7.0, 13.0, 6.0, 12.0, 8.0, 14.0, 20.0, 20.0, 28.0, 32.0, 39.0, 45.0, 29.0, 51.0, 45.0, 48.0, 43.0, 54.0, 39.0, 46.0, 39.0, 42.0, 49.0, 39.0, 42.0, 35.0, 26.0, 20.0, 25.0, 25.0, 16.0, 8.0, 14.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.64008712768555, -34.61390686035156, -33.58772659301758, -32.561546325683594, -31.535367965698242, -30.509187698364258, -29.483007431030273, -28.45682716369629, -27.430648803710938, -26.404468536376953, -25.37828826904297, -24.352108001708984, -23.325929641723633, -22.29974937438965, -21.273569107055664, -20.24738883972168, -19.221208572387695, -18.19502830505371, -17.168848037719727, -16.142669677734375, -15.11648941040039, -14.090309143066406, -13.064128875732422, -12.037948608398438, -11.01176929473877, -9.985589027404785, -8.959409713745117, -7.933229446411133, -6.907049655914307, -5.8808698654174805, -4.854689598083496, -3.82850980758667, -2.8023319244384766, -1.7761520147323608, -0.7499721050262451, 0.27620792388916016, 1.3023877143859863, 2.3285675048828125, 3.354747772216797, 4.380927562713623, 5.407107353210449, 6.433287143707275, 7.459466934204102, 8.485647201538086, 9.51182746887207, 10.538006782531738, 11.564187049865723, 12.59036636352539, 13.616546630859375, 14.64272689819336, 15.668906211853027, 16.695087432861328, 17.72126579284668, 18.747446060180664, 19.77362632751465, 20.799806594848633, 21.825984954833984, 22.85216522216797, 23.878345489501953, 24.904525756835938, 25.93070411682129, 26.956884384155273, 27.983064651489258, 29.009244918823242, 30.035425186157227]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 3.0, 11.0, 13.0, 24.0, 37.0, 60.0, 79.0, 117.0, 184.0, 303.0, 414.0, 635.0, 991.0, 1568.0, 2398.0, 3939.0, 6359.0, 10383.0, 17874.0, 30677.0, 53537.0, 95294.0, 169925.0, 232654.0, 179130.0, 103383.0, 57551.0, 32520.0, 18910.0, 11354.0, 6827.0, 4181.0, 2541.0, 1672.0, 1028.0, 681.0, 478.0, 253.0, 198.0, 129.0, 78.0, 49.0, 37.0, 31.0, 19.0, 11.0, 3.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-18.109375, -17.55322265625, -16.9970703125, -16.44091796875, -15.884765625, -15.32861328125, -14.7724609375, -14.21630859375, -13.66015625, -13.10400390625, -12.5478515625, -11.99169921875, -11.435546875, -10.87939453125, -10.3232421875, -9.76708984375, -9.2109375, -8.65478515625, -8.0986328125, -7.54248046875, -6.986328125, -6.43017578125, -5.8740234375, -5.31787109375, -4.76171875, -4.20556640625, -3.6494140625, -3.09326171875, -2.537109375, -1.98095703125, -1.4248046875, -0.86865234375, -0.3125, 0.24365234375, 0.7998046875, 1.35595703125, 1.912109375, 2.46826171875, 3.0244140625, 3.58056640625, 4.13671875, 4.69287109375, 5.2490234375, 5.80517578125, 6.361328125, 6.91748046875, 7.4736328125, 8.02978515625, 8.5859375, 9.14208984375, 9.6982421875, 10.25439453125, 10.810546875, 11.36669921875, 11.9228515625, 12.47900390625, 13.03515625, 13.59130859375, 14.1474609375, 14.70361328125, 15.259765625, 15.81591796875, 16.3720703125, 16.92822265625, 17.484375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 1.0, 7.0, 11.0, 3.0, 11.0, 10.0, 17.0, 14.0, 26.0, 25.0, 31.0, 36.0, 24.0, 39.0, 50.0, 45.0, 52.0, 58.0, 42.0, 52.0, 44.0, 45.0, 48.0, 40.0, 36.0, 38.0, 32.0, 33.0, 28.0, 28.0, 16.0, 13.0, 19.0, 10.0, 4.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.40625, -34.32958984375, -33.2529296875, -32.17626953125, -31.099609375, -30.02294921875, -28.9462890625, -27.86962890625, -26.79296875, -25.71630859375, -24.6396484375, -23.56298828125, -22.486328125, -21.40966796875, -20.3330078125, -19.25634765625, -18.1796875, -17.10302734375, -16.0263671875, -14.94970703125, -13.873046875, -12.79638671875, -11.7197265625, -10.64306640625, -9.56640625, -8.48974609375, -7.4130859375, -6.33642578125, -5.259765625, -4.18310546875, -3.1064453125, -2.02978515625, -0.953125, 0.12353515625, 1.2001953125, 2.27685546875, 3.353515625, 4.43017578125, 5.5068359375, 6.58349609375, 7.66015625, 8.73681640625, 9.8134765625, 10.89013671875, 11.966796875, 13.04345703125, 14.1201171875, 15.19677734375, 16.2734375, 17.35009765625, 18.4267578125, 19.50341796875, 20.580078125, 21.65673828125, 22.7333984375, 23.81005859375, 24.88671875, 25.96337890625, 27.0400390625, 28.11669921875, 29.193359375, 30.27001953125, 31.3466796875, 32.42333984375, 33.5]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 4.0, 6.0, 12.0, 9.0, 14.0, 20.0, 30.0, 40.0, 89.0, 97.0, 120.0, 195.0, 297.0, 418.0, 739.0, 1179.0, 2026.0, 3648.0, 6755.0, 12763.0, 27388.0, 64928.0, 167935.0, 365349.0, 233305.0, 88984.0, 36230.0, 16743.0, 8341.0, 4497.0, 2444.0, 1483.0, 859.0, 562.0, 346.0, 221.0, 151.0, 92.0, 66.0, 58.0, 36.0, 19.0, 15.0, 12.0, 8.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-19.625, -18.963623046875, -18.30224609375, -17.640869140625, -16.9794921875, -16.318115234375, -15.65673828125, -14.995361328125, -14.333984375, -13.672607421875, -13.01123046875, -12.349853515625, -11.6884765625, -11.027099609375, -10.36572265625, -9.704345703125, -9.04296875, -8.381591796875, -7.72021484375, -7.058837890625, -6.3974609375, -5.736083984375, -5.07470703125, -4.413330078125, -3.751953125, -3.090576171875, -2.42919921875, -1.767822265625, -1.1064453125, -0.445068359375, 0.21630859375, 0.877685546875, 1.5390625, 2.200439453125, 2.86181640625, 3.523193359375, 4.1845703125, 4.845947265625, 5.50732421875, 6.168701171875, 6.830078125, 7.491455078125, 8.15283203125, 8.814208984375, 9.4755859375, 10.136962890625, 10.79833984375, 11.459716796875, 12.12109375, 12.782470703125, 13.44384765625, 14.105224609375, 14.7666015625, 15.427978515625, 16.08935546875, 16.750732421875, 17.412109375, 18.073486328125, 18.73486328125, 19.396240234375, 20.0576171875, 20.718994140625, 21.38037109375, 22.041748046875, 22.703125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 3.0, 8.0, 9.0, 7.0, 12.0, 20.0, 12.0, 18.0, 10.0, 15.0, 19.0, 26.0, 27.0, 29.0, 43.0, 26.0, 50.0, 36.0, 37.0, 45.0, 41.0, 45.0, 38.0, 43.0, 53.0, 41.0, 37.0, 27.0, 30.0, 39.0, 27.0, 19.0, 27.0, 9.0, 14.0, 9.0, 4.0, 9.0, 9.0, 3.0, 4.0, 8.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.578125, -17.954345703125, -17.33056640625, -16.706787109375, -16.0830078125, -15.459228515625, -14.83544921875, -14.211669921875, -13.587890625, -12.964111328125, -12.34033203125, -11.716552734375, -11.0927734375, -10.468994140625, -9.84521484375, -9.221435546875, -8.59765625, -7.973876953125, -7.35009765625, -6.726318359375, -6.1025390625, -5.478759765625, -4.85498046875, -4.231201171875, -3.607421875, -2.983642578125, -2.35986328125, -1.736083984375, -1.1123046875, -0.488525390625, 0.13525390625, 0.759033203125, 1.3828125, 2.006591796875, 2.63037109375, 3.254150390625, 3.8779296875, 4.501708984375, 5.12548828125, 5.749267578125, 6.373046875, 6.996826171875, 7.62060546875, 8.244384765625, 8.8681640625, 9.491943359375, 10.11572265625, 10.739501953125, 11.36328125, 11.987060546875, 12.61083984375, 13.234619140625, 13.8583984375, 14.482177734375, 15.10595703125, 15.729736328125, 16.353515625, 16.977294921875, 17.60107421875, 18.224853515625, 18.8486328125, 19.472412109375, 20.09619140625, 20.719970703125, 21.34375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 8.0, 3.0, 7.0, 12.0, 10.0, 12.0, 30.0, 38.0, 66.0, 107.0, 155.0, 254.0, 416.0, 740.0, 1622.0, 3947.0, 12323.0, 55687.0, 531729.0, 381372.0, 43142.0, 10158.0, 3372.0, 1510.0, 686.0, 432.0, 255.0, 158.0, 93.0, 72.0, 45.0, 37.0, 14.0, 15.0, 10.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-31.609375, -30.79736328125, -29.9853515625, -29.17333984375, -28.361328125, -27.54931640625, -26.7373046875, -25.92529296875, -25.11328125, -24.30126953125, -23.4892578125, -22.67724609375, -21.865234375, -21.05322265625, -20.2412109375, -19.42919921875, -18.6171875, -17.80517578125, -16.9931640625, -16.18115234375, -15.369140625, -14.55712890625, -13.7451171875, -12.93310546875, -12.12109375, -11.30908203125, -10.4970703125, -9.68505859375, -8.873046875, -8.06103515625, -7.2490234375, -6.43701171875, -5.625, -4.81298828125, -4.0009765625, -3.18896484375, -2.376953125, -1.56494140625, -0.7529296875, 0.05908203125, 0.87109375, 1.68310546875, 2.4951171875, 3.30712890625, 4.119140625, 4.93115234375, 5.7431640625, 6.55517578125, 7.3671875, 8.17919921875, 8.9912109375, 9.80322265625, 10.615234375, 11.42724609375, 12.2392578125, 13.05126953125, 13.86328125, 14.67529296875, 15.4873046875, 16.29931640625, 17.111328125, 17.92333984375, 18.7353515625, 19.54736328125, 20.359375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 9.0, 9.0, 20.0, 14.0, 27.0, 25.0, 43.0, 51.0, 73.0, 80.0, 110.0, 99.0, 99.0, 87.0, 57.0, 52.0, 44.0, 27.0, 25.0, 9.0, 9.0, 5.0, 1.0, 3.0, 6.0, 1.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0008516311645507812, -0.0008299797773361206, -0.00080832839012146, -0.0007866770029067993, -0.0007650256156921387, -0.000743374228477478, -0.0007217228412628174, -0.0007000714540481567, -0.0006784200668334961, -0.0006567686796188354, -0.0006351172924041748, -0.0006134659051895142, -0.0005918145179748535, -0.0005701631307601929, -0.0005485117435455322, -0.0005268603563308716, -0.0005052089691162109, -0.0004835575819015503, -0.00046190619468688965, -0.000440254807472229, -0.00041860342025756836, -0.0003969520330429077, -0.00037530064582824707, -0.0003536492586135864, -0.0003319978713989258, -0.00031034648418426514, -0.0002886950969696045, -0.00026704370975494385, -0.0002453923225402832, -0.00022374093532562256, -0.00020208954811096191, -0.00018043816089630127, -0.00015878677368164062, -0.00013713538646697998, -0.00011548399925231934, -9.383261203765869e-05, -7.218122482299805e-05, -5.05298376083374e-05, -2.8878450393676758e-05, -7.227063179016113e-06, 1.4424324035644531e-05, 3.6075711250305176e-05, 5.772709846496582e-05, 7.937848567962646e-05, 0.00010102987289428711, 0.00012268126010894775, 0.0001443326473236084, 0.00016598403453826904, 0.0001876354217529297, 0.00020928680896759033, 0.00023093819618225098, 0.0002525895833969116, 0.00027424097061157227, 0.0002958923578262329, 0.00031754374504089355, 0.0003391951322555542, 0.00036084651947021484, 0.0003824979066848755, 0.00040414929389953613, 0.0004258006811141968, 0.0004474520683288574, 0.00046910345554351807, 0.0004907548427581787, 0.0005124062299728394, 0.0005340576171875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 17.0, 15.0, 41.0, 49.0, 60.0, 118.0, 183.0, 260.0, 422.0, 642.0, 1109.0, 1792.0, 2863.0, 4844.0, 8157.0, 15065.0, 28404.0, 56785.0, 121650.0, 258212.0, 279562.0, 135664.0, 63087.0, 30994.0, 16365.0, 8930.0, 5111.0, 3013.0, 1946.0, 1179.0, 729.0, 459.0, 289.0, 182.0, 123.0, 67.0, 58.0, 28.0, 27.0, 10.0, 11.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.296875, -15.7548828125, -15.212890625, -14.6708984375, -14.12890625, -13.5869140625, -13.044921875, -12.5029296875, -11.9609375, -11.4189453125, -10.876953125, -10.3349609375, -9.79296875, -9.2509765625, -8.708984375, -8.1669921875, -7.625, -7.0830078125, -6.541015625, -5.9990234375, -5.45703125, -4.9150390625, -4.373046875, -3.8310546875, -3.2890625, -2.7470703125, -2.205078125, -1.6630859375, -1.12109375, -0.5791015625, -0.037109375, 0.5048828125, 1.046875, 1.5888671875, 2.130859375, 2.6728515625, 3.21484375, 3.7568359375, 4.298828125, 4.8408203125, 5.3828125, 5.9248046875, 6.466796875, 7.0087890625, 7.55078125, 8.0927734375, 8.634765625, 9.1767578125, 9.71875, 10.2607421875, 10.802734375, 11.3447265625, 11.88671875, 12.4287109375, 12.970703125, 13.5126953125, 14.0546875, 14.5966796875, 15.138671875, 15.6806640625, 16.22265625, 16.7646484375, 17.306640625, 17.8486328125, 18.390625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 7.0, 7.0, 8.0, 13.0, 10.0, 24.0, 16.0, 18.0, 31.0, 26.0, 47.0, 42.0, 45.0, 50.0, 52.0, 59.0, 55.0, 53.0, 47.0, 51.0, 61.0, 48.0, 32.0, 30.0, 25.0, 20.0, 30.0, 13.0, 21.0, 5.0, 10.0, 5.0, 5.0, 7.0, 3.0, 2.0, 2.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.14453125, -6.93157958984375, -6.7186279296875, -6.50567626953125, -6.292724609375, -6.07977294921875, -5.8668212890625, -5.65386962890625, -5.44091796875, -5.22796630859375, -5.0150146484375, -4.80206298828125, -4.589111328125, -4.37615966796875, -4.1632080078125, -3.95025634765625, -3.7373046875, -3.52435302734375, -3.3114013671875, -3.09844970703125, -2.885498046875, -2.67254638671875, -2.4595947265625, -2.24664306640625, -2.03369140625, -1.82073974609375, -1.6077880859375, -1.39483642578125, -1.181884765625, -0.96893310546875, -0.7559814453125, -0.54302978515625, -0.330078125, -0.11712646484375, 0.0958251953125, 0.30877685546875, 0.521728515625, 0.73468017578125, 0.9476318359375, 1.16058349609375, 1.37353515625, 1.58648681640625, 1.7994384765625, 2.01239013671875, 2.225341796875, 2.43829345703125, 2.6512451171875, 2.86419677734375, 3.0771484375, 3.29010009765625, 3.5030517578125, 3.71600341796875, 3.928955078125, 4.14190673828125, 4.3548583984375, 4.56781005859375, 4.78076171875, 4.99371337890625, 5.2066650390625, 5.41961669921875, 5.632568359375, 5.84552001953125, 6.0584716796875, 6.27142333984375, 6.484375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 3.0, 8.0, 15.0, 15.0, 21.0, 23.0, 20.0, 23.0, 36.0, 26.0, 44.0, 47.0, 40.0, 35.0, 43.0, 40.0, 38.0, 46.0, 54.0, 47.0, 38.0, 34.0, 36.0, 39.0, 34.0, 28.0, 35.0, 16.0, 16.0, 13.0, 9.0, 15.0, 16.0, 5.0, 6.0, 3.0, 5.0, 7.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.151737213134766, -18.430511474609375, -17.709285736083984, -16.988059997558594, -16.266834259033203, -15.545609474182129, -14.824384689331055, -14.103158950805664, -13.381933212280273, -12.660707473754883, -11.939481735229492, -11.218256950378418, -10.497031211853027, -9.775805473327637, -9.054580688476562, -8.333354949951172, -7.612129211425781, -6.890903472900391, -6.169678211212158, -5.448452949523926, -4.727227210998535, -4.0060014724731445, -3.284776210784912, -2.5635509490966797, -1.842325210571289, -1.1210997104644775, -0.399874210357666, 0.3213512897491455, 1.042576789855957, 1.7638022899627686, 2.48502779006958, 3.2062530517578125, 3.927480697631836, 4.648706436157227, 5.369931697845459, 6.091156959533691, 6.812382698059082, 7.533608436584473, 8.254833221435547, 8.976058959960938, 9.697284698486328, 10.418510437011719, 11.13973617553711, 11.860960960388184, 12.582186698913574, 13.303412437438965, 14.024637222290039, 14.74586296081543, 15.46708869934082, 16.18831443786621, 16.9095401763916, 17.630765914916992, 18.35198974609375, 19.07321548461914, 19.79444122314453, 20.515666961669922, 21.236892700195312, 21.958118438720703, 22.679344177246094, 23.400569915771484, 24.121795654296875, 24.843019485473633, 25.564245223999023, 26.285470962524414, 27.006696701049805]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 10.0, 9.0, 19.0, 18.0, 23.0, 32.0, 22.0, 25.0, 29.0, 31.0, 38.0, 55.0, 45.0, 44.0, 31.0, 45.0, 52.0, 45.0, 50.0, 51.0, 50.0, 33.0, 34.0, 24.0, 22.0, 32.0, 20.0, 20.0, 15.0, 13.0, 14.0, 12.0, 9.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.02465057373047, -32.98223876953125, -31.939828872680664, -30.897417068481445, -29.85500717163086, -28.81259536743164, -27.770183563232422, -26.727773666381836, -25.68536376953125, -24.64295196533203, -23.600542068481445, -22.558130264282227, -21.51572036743164, -20.473308563232422, -19.430896759033203, -18.388486862182617, -17.3460750579834, -16.30366325378418, -15.261253356933594, -14.218841552734375, -13.176431655883789, -12.13401985168457, -11.091609001159668, -10.049198150634766, -9.006787300109863, -7.964376449584961, -6.921965599060059, -5.879554271697998, -4.837143421173096, -3.7947325706481934, -2.752321243286133, -1.7099103927612305, -0.6674995422363281, 0.37491142749786377, 1.4173223972320557, 2.459733486175537, 3.5021443367004395, 4.544555187225342, 5.586966514587402, 6.629377365112305, 7.671788215637207, 8.71419906616211, 9.756609916687012, 10.799020767211914, 11.841432571411133, 12.883842468261719, 13.926254272460938, 14.96866512298584, 16.011075973510742, 17.05348777770996, 18.095897674560547, 19.138309478759766, 20.18071937561035, 21.22313117980957, 22.265541076660156, 23.307952880859375, 24.350364685058594, 25.392776489257812, 26.4351863861084, 27.477598190307617, 28.520008087158203, 29.562419891357422, 30.60483169555664, 31.647241592407227, 32.68965148925781]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 5.0, 8.0, 15.0, 15.0, 35.0, 54.0, 92.0, 134.0, 223.0, 333.0, 528.0, 951.0, 1529.0, 2570.0, 4473.0, 7887.0, 14099.0, 25907.0, 48051.0, 88175.0, 150150.0, 203934.0, 195050.0, 134964.0, 76667.0, 41572.0, 22199.0, 12384.0, 6723.0, 4013.0, 2296.0, 1355.0, 801.0, 488.0, 345.0, 201.0, 114.0, 76.0, 56.0, 31.0, 21.0, 11.0, 11.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.21875, -35.180419921875, -34.14208984375, -33.103759765625, -32.0654296875, -31.027099609375, -29.98876953125, -28.950439453125, -27.912109375, -26.873779296875, -25.83544921875, -24.797119140625, -23.7587890625, -22.720458984375, -21.68212890625, -20.643798828125, -19.60546875, -18.567138671875, -17.52880859375, -16.490478515625, -15.4521484375, -14.413818359375, -13.37548828125, -12.337158203125, -11.298828125, -10.260498046875, -9.22216796875, -8.183837890625, -7.1455078125, -6.107177734375, -5.06884765625, -4.030517578125, -2.9921875, -1.953857421875, -0.91552734375, 0.122802734375, 1.1611328125, 2.199462890625, 3.23779296875, 4.276123046875, 5.314453125, 6.352783203125, 7.39111328125, 8.429443359375, 9.4677734375, 10.506103515625, 11.54443359375, 12.582763671875, 13.62109375, 14.659423828125, 15.69775390625, 16.736083984375, 17.7744140625, 18.812744140625, 19.85107421875, 20.889404296875, 21.927734375, 22.966064453125, 24.00439453125, 25.042724609375, 26.0810546875, 27.119384765625, 28.15771484375, 29.196044921875, 30.234375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 8.0, 6.0, 12.0, 9.0, 14.0, 15.0, 27.0, 22.0, 33.0, 23.0, 29.0, 25.0, 42.0, 49.0, 41.0, 40.0, 41.0, 54.0, 31.0, 45.0, 48.0, 52.0, 43.0, 45.0, 31.0, 33.0, 25.0, 27.0, 21.0, 25.0, 20.0, 8.0, 8.0, 10.0, 15.0, 7.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.375, -30.400390625, -29.42578125, -28.451171875, -27.4765625, -26.501953125, -25.52734375, -24.552734375, -23.578125, -22.603515625, -21.62890625, -20.654296875, -19.6796875, -18.705078125, -17.73046875, -16.755859375, -15.78125, -14.806640625, -13.83203125, -12.857421875, -11.8828125, -10.908203125, -9.93359375, -8.958984375, -7.984375, -7.009765625, -6.03515625, -5.060546875, -4.0859375, -3.111328125, -2.13671875, -1.162109375, -0.1875, 0.787109375, 1.76171875, 2.736328125, 3.7109375, 4.685546875, 5.66015625, 6.634765625, 7.609375, 8.583984375, 9.55859375, 10.533203125, 11.5078125, 12.482421875, 13.45703125, 14.431640625, 15.40625, 16.380859375, 17.35546875, 18.330078125, 19.3046875, 20.279296875, 21.25390625, 22.228515625, 23.203125, 24.177734375, 25.15234375, 26.126953125, 27.1015625, 28.076171875, 29.05078125, 30.025390625, 31.0]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 8.0, 11.0, 21.0, 28.0, 45.0, 68.0, 107.0, 150.0, 216.0, 323.0, 486.0, 755.0, 1178.0, 1887.0, 2922.0, 4522.0, 7038.0, 11329.0, 17952.0, 29253.0, 50134.0, 88193.0, 153919.0, 217588.0, 187596.0, 112872.0, 63796.0, 36623.0, 21969.0, 13663.0, 8611.0, 5437.0, 3542.0, 2260.0, 1395.0, 874.0, 629.0, 385.0, 280.0, 149.0, 126.0, 71.0, 53.0, 45.0, 17.0, 10.0, 6.0, 6.0, 1.0, 8.0, 2.0, 1.0, 1.0, 1.0], "bins": [-44.28125, -42.9677734375, -41.654296875, -40.3408203125, -39.02734375, -37.7138671875, -36.400390625, -35.0869140625, -33.7734375, -32.4599609375, -31.146484375, -29.8330078125, -28.51953125, -27.2060546875, -25.892578125, -24.5791015625, -23.265625, -21.9521484375, -20.638671875, -19.3251953125, -18.01171875, -16.6982421875, -15.384765625, -14.0712890625, -12.7578125, -11.4443359375, -10.130859375, -8.8173828125, -7.50390625, -6.1904296875, -4.876953125, -3.5634765625, -2.25, -0.9365234375, 0.376953125, 1.6904296875, 3.00390625, 4.3173828125, 5.630859375, 6.9443359375, 8.2578125, 9.5712890625, 10.884765625, 12.1982421875, 13.51171875, 14.8251953125, 16.138671875, 17.4521484375, 18.765625, 20.0791015625, 21.392578125, 22.7060546875, 24.01953125, 25.3330078125, 26.646484375, 27.9599609375, 29.2734375, 30.5869140625, 31.900390625, 33.2138671875, 34.52734375, 35.8408203125, 37.154296875, 38.4677734375, 39.78125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 14.0, 11.0, 13.0, 15.0, 15.0, 15.0, 22.0, 32.0, 28.0, 32.0, 29.0, 38.0, 38.0, 40.0, 40.0, 45.0, 43.0, 34.0, 42.0, 40.0, 54.0, 39.0, 37.0, 37.0, 33.0, 26.0, 20.0, 14.0, 24.0, 23.0, 15.0, 12.0, 13.0, 18.0, 13.0, 9.0, 5.0, 6.0, 3.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.577392578125, -16.95166015625, -16.325927734375, -15.7001953125, -15.074462890625, -14.44873046875, -13.822998046875, -13.197265625, -12.571533203125, -11.94580078125, -11.320068359375, -10.6943359375, -10.068603515625, -9.44287109375, -8.817138671875, -8.19140625, -7.565673828125, -6.93994140625, -6.314208984375, -5.6884765625, -5.062744140625, -4.43701171875, -3.811279296875, -3.185546875, -2.559814453125, -1.93408203125, -1.308349609375, -0.6826171875, -0.056884765625, 0.56884765625, 1.194580078125, 1.8203125, 2.446044921875, 3.07177734375, 3.697509765625, 4.3232421875, 4.948974609375, 5.57470703125, 6.200439453125, 6.826171875, 7.451904296875, 8.07763671875, 8.703369140625, 9.3291015625, 9.954833984375, 10.58056640625, 11.206298828125, 11.83203125, 12.457763671875, 13.08349609375, 13.709228515625, 14.3349609375, 14.960693359375, 15.58642578125, 16.212158203125, 16.837890625, 17.463623046875, 18.08935546875, 18.715087890625, 19.3408203125, 19.966552734375, 20.59228515625, 21.218017578125, 21.84375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 8.0, 8.0, 14.0, 10.0, 21.0, 27.0, 54.0, 63.0, 87.0, 121.0, 201.0, 255.0, 370.0, 530.0, 764.0, 1099.0, 1683.0, 2540.0, 3788.0, 6347.0, 11139.0, 21320.0, 45954.0, 105259.0, 223538.0, 287738.0, 179001.0, 79714.0, 35002.0, 17162.0, 9170.0, 5458.0, 3325.0, 2136.0, 1357.0, 1029.0, 690.0, 469.0, 361.0, 238.0, 157.0, 112.0, 81.0, 59.0, 33.0, 20.0, 15.0, 15.0, 13.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.84375, -16.26953125, -15.6953125, -15.12109375, -14.546875, -13.97265625, -13.3984375, -12.82421875, -12.25, -11.67578125, -11.1015625, -10.52734375, -9.953125, -9.37890625, -8.8046875, -8.23046875, -7.65625, -7.08203125, -6.5078125, -5.93359375, -5.359375, -4.78515625, -4.2109375, -3.63671875, -3.0625, -2.48828125, -1.9140625, -1.33984375, -0.765625, -0.19140625, 0.3828125, 0.95703125, 1.53125, 2.10546875, 2.6796875, 3.25390625, 3.828125, 4.40234375, 4.9765625, 5.55078125, 6.125, 6.69921875, 7.2734375, 7.84765625, 8.421875, 8.99609375, 9.5703125, 10.14453125, 10.71875, 11.29296875, 11.8671875, 12.44140625, 13.015625, 13.58984375, 14.1640625, 14.73828125, 15.3125, 15.88671875, 16.4609375, 17.03515625, 17.609375, 18.18359375, 18.7578125, 19.33203125, 19.90625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 1.0, 3.0, 6.0, 4.0, 2.0, 14.0, 10.0, 10.0, 10.0, 6.0, 20.0, 24.0, 29.0, 36.0, 36.0, 41.0, 53.0, 58.0, 64.0, 70.0, 72.0, 38.0, 56.0, 50.0, 43.0, 47.0, 30.0, 38.0, 26.0, 14.0, 16.0, 18.0, 7.0, 14.0, 9.0, 11.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0013675689697265625, -0.0013276934623718262, -0.0012878179550170898, -0.0012479424476623535, -0.0012080669403076172, -0.0011681914329528809, -0.0011283159255981445, -0.0010884404182434082, -0.0010485649108886719, -0.0010086894035339355, -0.0009688138961791992, -0.0009289383888244629, -0.0008890628814697266, -0.0008491873741149902, -0.0008093118667602539, -0.0007694363594055176, -0.0007295608520507812, -0.0006896853446960449, -0.0006498098373413086, -0.0006099343299865723, -0.0005700588226318359, -0.0005301833152770996, -0.0004903078079223633, -0.00045043230056762695, -0.0004105567932128906, -0.0003706812858581543, -0.00033080577850341797, -0.00029093027114868164, -0.0002510547637939453, -0.00021117925643920898, -0.00017130374908447266, -0.00013142824172973633, -9.1552734375e-05, -5.167722702026367e-05, -1.1801719665527344e-05, 2.8073787689208984e-05, 6.794929504394531e-05, 0.00010782480239868164, 0.00014770030975341797, 0.0001875758171081543, 0.00022745132446289062, 0.00026732683181762695, 0.0003072023391723633, 0.0003470778465270996, 0.00038695335388183594, 0.00042682886123657227, 0.0004667043685913086, 0.0005065798759460449, 0.0005464553833007812, 0.0005863308906555176, 0.0006262063980102539, 0.0006660819053649902, 0.0007059574127197266, 0.0007458329200744629, 0.0007857084274291992, 0.0008255839347839355, 0.0008654594421386719, 0.0009053349494934082, 0.0009452104568481445, 0.0009850859642028809, 0.0010249614715576172, 0.0010648369789123535, 0.0011047124862670898, 0.0011445879936218262, 0.0011844635009765625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 12.0, 15.0, 36.0, 41.0, 41.0, 97.0, 152.0, 219.0, 276.0, 412.0, 549.0, 858.0, 1178.0, 1721.0, 2476.0, 3582.0, 5353.0, 8088.0, 13661.0, 24310.0, 52440.0, 161629.0, 395555.0, 232041.0, 69883.0, 29629.0, 15876.0, 9456.0, 6075.0, 3993.0, 2724.0, 1871.0, 1278.0, 896.0, 665.0, 455.0, 301.0, 221.0, 163.0, 131.0, 69.0, 46.0, 35.0, 18.0, 12.0, 7.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.875, -33.77294921875, -32.6708984375, -31.56884765625, -30.466796875, -29.36474609375, -28.2626953125, -27.16064453125, -26.05859375, -24.95654296875, -23.8544921875, -22.75244140625, -21.650390625, -20.54833984375, -19.4462890625, -18.34423828125, -17.2421875, -16.14013671875, -15.0380859375, -13.93603515625, -12.833984375, -11.73193359375, -10.6298828125, -9.52783203125, -8.42578125, -7.32373046875, -6.2216796875, -5.11962890625, -4.017578125, -2.91552734375, -1.8134765625, -0.71142578125, 0.390625, 1.49267578125, 2.5947265625, 3.69677734375, 4.798828125, 5.90087890625, 7.0029296875, 8.10498046875, 9.20703125, 10.30908203125, 11.4111328125, 12.51318359375, 13.615234375, 14.71728515625, 15.8193359375, 16.92138671875, 18.0234375, 19.12548828125, 20.2275390625, 21.32958984375, 22.431640625, 23.53369140625, 24.6357421875, 25.73779296875, 26.83984375, 27.94189453125, 29.0439453125, 30.14599609375, 31.248046875, 32.35009765625, 33.4521484375, 34.55419921875, 35.65625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 6.0, 4.0, 7.0, 2.0, 6.0, 9.0, 5.0, 3.0, 7.0, 15.0, 19.0, 22.0, 24.0, 50.0, 67.0, 106.0, 127.0, 124.0, 94.0, 80.0, 46.0, 33.0, 24.0, 15.0, 11.0, 7.0, 12.0, 4.0, 6.0, 8.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.796875, -12.37451171875, -11.9521484375, -11.52978515625, -11.107421875, -10.68505859375, -10.2626953125, -9.84033203125, -9.41796875, -8.99560546875, -8.5732421875, -8.15087890625, -7.728515625, -7.30615234375, -6.8837890625, -6.46142578125, -6.0390625, -5.61669921875, -5.1943359375, -4.77197265625, -4.349609375, -3.92724609375, -3.5048828125, -3.08251953125, -2.66015625, -2.23779296875, -1.8154296875, -1.39306640625, -0.970703125, -0.54833984375, -0.1259765625, 0.29638671875, 0.71875, 1.14111328125, 1.5634765625, 1.98583984375, 2.408203125, 2.83056640625, 3.2529296875, 3.67529296875, 4.09765625, 4.52001953125, 4.9423828125, 5.36474609375, 5.787109375, 6.20947265625, 6.6318359375, 7.05419921875, 7.4765625, 7.89892578125, 8.3212890625, 8.74365234375, 9.166015625, 9.58837890625, 10.0107421875, 10.43310546875, 10.85546875, 11.27783203125, 11.7001953125, 12.12255859375, 12.544921875, 12.96728515625, 13.3896484375, 13.81201171875, 14.234375]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 4.0, 9.0, 19.0, 10.0, 18.0, 15.0, 21.0, 30.0, 28.0, 27.0, 25.0, 42.0, 62.0, 69.0, 39.0, 61.0, 61.0, 49.0, 60.0, 44.0, 39.0, 43.0, 42.0, 23.0, 31.0, 25.0, 16.0, 17.0, 19.0, 13.0, 9.0, 4.0, 5.0, 3.0, 8.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.97028350830078, -27.944339752197266, -26.91839599609375, -25.892452239990234, -24.86651039123535, -23.840566635131836, -22.81462287902832, -21.788679122924805, -20.762737274169922, -19.736793518066406, -18.71084976196289, -17.684906005859375, -16.658964157104492, -15.633020401000977, -14.607076644897461, -13.581132888793945, -12.55518913269043, -11.529245376586914, -10.503302574157715, -9.4773588180542, -8.451416015625, -7.425472259521484, -6.399528503417969, -5.373585224151611, -4.347641944885254, -3.3216986656188965, -2.29575514793396, -1.2698116302490234, -0.24386835098266602, 0.7820749282836914, 1.808018684387207, 2.8339619636535645, 3.859905242919922, 4.885848522186279, 5.911791801452637, 6.937735557556152, 7.96367883682251, 8.989622116088867, 10.015565872192383, 11.041509628295898, 12.067452430725098, 13.093396186828613, 14.119338989257812, 15.145282745361328, 16.171226501464844, 17.19717025756836, 18.223114013671875, 19.249055862426758, 20.274999618530273, 21.30094337463379, 22.326887130737305, 23.352828979492188, 24.378772735595703, 25.40471649169922, 26.430660247802734, 27.45660400390625, 28.482547760009766, 29.50849151611328, 30.534435272216797, 31.560379028320312, 32.58632278442383, 33.612266540527344, 34.638206481933594, 35.66415023803711, 36.690093994140625]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 5.0, 8.0, 7.0, 16.0, 11.0, 22.0, 19.0, 14.0, 28.0, 27.0, 35.0, 47.0, 27.0, 44.0, 67.0, 45.0, 54.0, 62.0, 62.0, 49.0, 43.0, 49.0, 45.0, 44.0, 42.0, 25.0, 24.0, 19.0, 16.0, 15.0, 5.0, 9.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.63909149169922, -52.07381820678711, -50.508548736572266, -48.943275451660156, -47.37800598144531, -45.8127326965332, -44.247459411621094, -42.68218994140625, -41.116920471191406, -39.5516471862793, -37.98637771606445, -36.421104431152344, -34.8558349609375, -33.29056167602539, -31.725290298461914, -30.160018920898438, -28.594745635986328, -27.02947425842285, -25.464202880859375, -23.898929595947266, -22.333660125732422, -20.768386840820312, -19.203115463256836, -17.63784408569336, -16.072572708129883, -14.507301330566406, -12.94202995300293, -11.376757621765137, -9.81148624420166, -8.246214866638184, -6.680942535400391, -5.115671157836914, -3.550395965576172, -1.9851243495941162, -0.41985273361206055, 1.1454191207885742, 2.710690498352051, 4.275961875915527, 5.84123420715332, 7.406505584716797, 8.971776962280273, 10.53704833984375, 12.102319717407227, 13.66759204864502, 15.232863426208496, 16.798133850097656, 18.363407135009766, 19.928678512573242, 21.49394989013672, 23.059221267700195, 24.624492645263672, 26.18976593017578, 27.755035400390625, 29.320308685302734, 30.88558006286621, 32.45085144042969, 34.01612091064453, 35.58139419555664, 37.146663665771484, 38.711936950683594, 40.27720642089844, 41.84247970581055, 43.407752990722656, 44.9730224609375, 46.53829574584961]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 3.0, 9.0, 9.0, 23.0, 23.0, 45.0, 46.0, 77.0, 92.0, 128.0, 165.0, 213.0, 298.0, 464.0, 590.0, 813.0, 966.0, 1284.0, 1744.0, 2245.0, 2739.0, 3749.0, 4803.0, 6117.0, 468011.0, 6985.0, 5186.0, 3965.0, 3162.0, 2423.0, 1949.0, 1456.0, 1163.0, 832.0, 670.0, 499.0, 360.0, 289.0, 189.0, 139.0, 93.0, 81.0, 50.0, 35.0, 35.0, 16.0, 12.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0], "bins": [-190.5108642578125, -185.01910400390625, -179.52732849121094, -174.03555297851562, -168.54379272460938, -163.05203247070312, -157.5602569580078, -152.0684814453125, -146.57672119140625, -141.0849609375, -135.5931854248047, -130.10140991210938, -124.60964965820312, -119.11788177490234, -113.62611389160156, -108.13434600830078, -102.642578125, -97.15081024169922, -91.65904235839844, -86.16727447509766, -80.67550659179688, -75.1837387084961, -69.69197082519531, -64.20020294189453, -58.70843505859375, -53.21666717529297, -47.72489929199219, -42.233131408691406, -36.741363525390625, -31.249595642089844, -25.757827758789062, -20.26605987548828, -14.7742919921875, -9.282524108886719, -3.7907562255859375, 1.7010116577148438, 7.192779541015625, 12.684547424316406, 18.176315307617188, 23.66808319091797, 29.15985107421875, 34.65161895751953, 40.14338684082031, 45.635154724121094, 51.126922607421875, 56.618690490722656, 62.11045837402344, 67.60222625732422, 73.093994140625, 78.58576202392578, 84.07752990722656, 89.56929779052734, 95.06106567382812, 100.5528335571289, 106.04460144042969, 111.53636932373047, 117.02813720703125, 122.51990509033203, 128.0116729736328, 133.50344848632812, 138.99520874023438, 144.48696899414062, 149.97874450683594, 155.47052001953125, 160.9622802734375]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 8.0, 18.0, 10.0, 17.0, 20.0, 18.0, 28.0, 29.0, 31.0, 44.0, 33.0, 41.0, 65.0, 45.0, 56.0, 1085.0, 68.0, 50.0, 37.0, 51.0, 47.0, 43.0, 39.0, 31.0, 23.0, 19.0, 16.0, 14.0, 7.0, 7.0, 9.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1631.448974609375, -1583.848876953125, -1536.248779296875, -1488.6488037109375, -1441.0487060546875, -1393.4486083984375, -1345.8486328125, -1298.24853515625, -1250.6484375, -1203.04833984375, -1155.4482421875, -1107.8482666015625, -1060.2481689453125, -1012.6480712890625, -965.0480346679688, -917.447998046875, -869.847900390625, -822.247802734375, -774.6477661132812, -727.0477294921875, -679.4476318359375, -631.8475341796875, -584.2474975585938, -536.6474609375, -489.04736328125, -441.4472961425781, -393.84722900390625, -346.2471618652344, -298.6470947265625, -251.04702758789062, -203.44696044921875, -155.84689331054688, -108.246826171875, -60.646759033203125, -13.04669189453125, 34.553375244140625, 82.1534423828125, 129.75350952148438, 177.35357666015625, 224.95364379882812, 272.5537109375, 320.1537780761719, 367.75384521484375, 415.3539123535156, 462.9539794921875, 510.5540466308594, 558.1541137695312, 605.754150390625, 653.354248046875, 700.954345703125, 748.5543823242188, 796.1544189453125, 843.7545166015625, 891.3546142578125, 938.9546508789062, 986.5546875, 1034.15478515625, 1081.7548828125, 1129.35498046875, 1176.9549560546875, 1224.5550537109375, 1272.1551513671875, 1319.755126953125, 1367.355224609375, 1414.955322265625]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 10.0, 36.0, 123.0, 119.0, 133.0, 95.0, 126.0, 155.0, 226.0, 331.0, 460.0, 796.0, 1513.0, 3289.0, 8274.0, 20169.0, 43075.0, 119878.0, 30919748.0, 94273.0, 27267.0, 7984.0, 3015.0, 1389.0, 721.0, 446.0, 242.0, 132.0, 98.0, 59.0, 33.0, 37.0, 29.0, 24.0, 20.0, 22.0, 17.0, 23.0, 11.0, 23.0, 11.0, 17.0, 15.0, 9.0, 4.0, 10.0, 6.0, 7.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0], "bins": [-292.59295654296875, -281.84930419921875, -271.1056823730469, -260.3620300292969, -249.61839294433594, -238.874755859375, -228.13111877441406, -217.38748168945312, -206.64382934570312, -195.9001922607422, -185.15655517578125, -174.41290283203125, -163.6692657470703, -152.92562866210938, -142.18199157714844, -131.4383544921875, -120.69471740722656, -109.95108032226562, -99.20743560791016, -88.46379852294922, -77.72015380859375, -66.97651672363281, -56.232879638671875, -45.489234924316406, -34.74559783935547, -24.001956939697266, -13.258317947387695, -2.514678955078125, 8.228961944580078, 18.97260284423828, 29.71623992919922, 40.45988464355469, 51.203521728515625, 61.94716262817383, 72.69080352783203, 83.43444061279297, 94.17808532714844, 104.92172241210938, 115.66535949707031, 126.40900421142578, 137.15264892578125, 147.8962860107422, 158.63992309570312, 169.38357543945312, 180.12721252441406, 190.870849609375, 201.61448669433594, 212.35812377929688, 223.1017608642578, 233.84539794921875, 244.5890350341797, 255.33267211914062, 266.0763244628906, 276.8199462890625, 287.5635986328125, 298.3072509765625, 309.0508728027344, 319.7945251464844, 330.53814697265625, 341.28179931640625, 352.0254211425781, 362.7690734863281, 373.5126953125, 384.25634765625, 395.0]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 8.0, 7.0, 12.0, 13.0, 22.0, 51.0, 49.0, 76.0, 128.0, 211.0, 304.0, 461.0, 605.0, 942.0, 1370.0, 2051.0, 2988.0, 4441.0, 7045.0, 11313.0, 18797.0, 31634.0, 54737.0, 99938.0, 192966.0, 402929.0, 1092998.0, 2849584.0, 810156.0, 332869.0, 163784.0, 86879.0, 48404.0, 27818.0, 16769.0, 10135.0, 6354.0, 4048.0, 2729.0, 1890.0, 1318.0, 891.0, 584.0, 370.0, 259.0, 164.0, 107.0, 75.0, 43.0, 46.0, 29.0, 11.0, 10.0, 11.0, 4.0, 2.0, 3.0, 2.0, 2.0], "bins": [-8.1328125, -7.88165283203125, -7.6304931640625, -7.37933349609375, -7.128173828125, -6.87701416015625, -6.6258544921875, -6.37469482421875, -6.12353515625, -5.87237548828125, -5.6212158203125, -5.37005615234375, -5.118896484375, -4.86773681640625, -4.6165771484375, -4.36541748046875, -4.1142578125, -3.86309814453125, -3.6119384765625, -3.36077880859375, -3.109619140625, -2.85845947265625, -2.6072998046875, -2.35614013671875, -2.10498046875, -1.85382080078125, -1.6026611328125, -1.35150146484375, -1.100341796875, -0.84918212890625, -0.5980224609375, -0.34686279296875, -0.095703125, 0.15545654296875, 0.4066162109375, 0.65777587890625, 0.908935546875, 1.16009521484375, 1.4112548828125, 1.66241455078125, 1.91357421875, 2.16473388671875, 2.4158935546875, 2.66705322265625, 2.918212890625, 3.16937255859375, 3.4205322265625, 3.67169189453125, 3.9228515625, 4.17401123046875, 4.4251708984375, 4.67633056640625, 4.927490234375, 5.17864990234375, 5.4298095703125, 5.68096923828125, 5.93212890625, 6.18328857421875, 6.4344482421875, 6.68560791015625, 6.936767578125, 7.18792724609375, 7.4390869140625, 7.69024658203125, 7.94140625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 10.0, 7.0, 8.0, 9.0, 9.0, 13.0, 4.0, 12.0, 18.0, 19.0, 31.0, 31.0, 44.0, 53.0, 65.0, 102.0, 147.0, 184.0, 311.0, 359.0, 145.0, 60.0, 48.0, 39.0, 41.0, 47.0, 36.0, 37.0, 22.0, 20.0, 11.0, 19.0, 14.0, 13.0, 8.0, 8.0, 6.0, 6.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.9140625, -11.5501708984375, -11.186279296875, -10.8223876953125, -10.45849609375, -10.0946044921875, -9.730712890625, -9.3668212890625, -9.0029296875, -8.6390380859375, -8.275146484375, -7.9112548828125, -7.54736328125, -7.1834716796875, -6.819580078125, -6.4556884765625, -6.091796875, -5.7279052734375, -5.364013671875, -5.0001220703125, -4.63623046875, -4.2723388671875, -3.908447265625, -3.5445556640625, -3.1806640625, -2.8167724609375, -2.452880859375, -2.0889892578125, -1.72509765625, -1.3612060546875, -0.997314453125, -0.6334228515625, -0.26953125, 0.0943603515625, 0.458251953125, 0.8221435546875, 1.18603515625, 1.5499267578125, 1.913818359375, 2.2777099609375, 2.6416015625, 3.0054931640625, 3.369384765625, 3.7332763671875, 4.09716796875, 4.4610595703125, 4.824951171875, 5.1888427734375, 5.552734375, 5.9166259765625, 6.280517578125, 6.6444091796875, 7.00830078125, 7.3721923828125, 7.736083984375, 8.0999755859375, 8.4638671875, 8.8277587890625, 9.191650390625, 9.5555419921875, 9.91943359375, 10.2833251953125, 10.647216796875, 11.0111083984375, 11.375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 9.0, 11.0, 22.0, 32.0, 30.0, 40.0, 69.0, 95.0, 136.0, 251.0, 332.0, 596.0, 977.0, 1493.0, 2401.0, 4294.0, 7734.0, 14280.0, 29462.0, 66652.0, 181559.0, 670650.0, 4290709.0, 699300.0, 186690.0, 69279.0, 30308.0, 14766.0, 7968.0, 4435.0, 2593.0, 1608.0, 980.0, 590.0, 405.0, 229.0, 167.0, 84.0, 69.0, 30.0, 31.0, 18.0, 17.0, 6.0, 6.0, 2.0, 7.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0], "bins": [-14.5, -14.0540771484375, -13.608154296875, -13.1622314453125, -12.71630859375, -12.2703857421875, -11.824462890625, -11.3785400390625, -10.9326171875, -10.4866943359375, -10.040771484375, -9.5948486328125, -9.14892578125, -8.7030029296875, -8.257080078125, -7.8111572265625, -7.365234375, -6.9193115234375, -6.473388671875, -6.0274658203125, -5.58154296875, -5.1356201171875, -4.689697265625, -4.2437744140625, -3.7978515625, -3.3519287109375, -2.906005859375, -2.4600830078125, -2.01416015625, -1.5682373046875, -1.122314453125, -0.6763916015625, -0.23046875, 0.2154541015625, 0.661376953125, 1.1072998046875, 1.55322265625, 1.9991455078125, 2.445068359375, 2.8909912109375, 3.3369140625, 3.7828369140625, 4.228759765625, 4.6746826171875, 5.12060546875, 5.5665283203125, 6.012451171875, 6.4583740234375, 6.904296875, 7.3502197265625, 7.796142578125, 8.2420654296875, 8.68798828125, 9.1339111328125, 9.579833984375, 10.0257568359375, 10.4716796875, 10.9176025390625, 11.363525390625, 11.8094482421875, 12.25537109375, 12.7012939453125, 13.147216796875, 13.5931396484375, 14.0390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 9.0, 12.0, 10.0, 17.0, 17.0, 25.0, 35.0, 44.0, 57.0, 85.0, 103.0, 162.0, 273.0, 541.0, 187.0, 66.0, 64.0, 51.0, 46.0, 40.0, 28.0, 26.0, 19.0, 18.0, 17.0, 14.0, 11.0, 6.0, 4.0, 8.0, 7.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0, -14.480712890625, -13.96142578125, -13.442138671875, -12.9228515625, -12.403564453125, -11.88427734375, -11.364990234375, -10.845703125, -10.326416015625, -9.80712890625, -9.287841796875, -8.7685546875, -8.249267578125, -7.72998046875, -7.210693359375, -6.69140625, -6.172119140625, -5.65283203125, -5.133544921875, -4.6142578125, -4.094970703125, -3.57568359375, -3.056396484375, -2.537109375, -2.017822265625, -1.49853515625, -0.979248046875, -0.4599609375, 0.059326171875, 0.57861328125, 1.097900390625, 1.6171875, 2.136474609375, 2.65576171875, 3.175048828125, 3.6943359375, 4.213623046875, 4.73291015625, 5.252197265625, 5.771484375, 6.290771484375, 6.81005859375, 7.329345703125, 7.8486328125, 8.367919921875, 8.88720703125, 9.406494140625, 9.92578125, 10.445068359375, 10.96435546875, 11.483642578125, 12.0029296875, 12.522216796875, 13.04150390625, 13.560791015625, 14.080078125, 14.599365234375, 15.11865234375, 15.637939453125, 16.1572265625, 16.676513671875, 17.19580078125, 17.715087890625, 18.234375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [7.0, 7.0, 4.0, 5.0, 1.0, 7.0, 11.0, 11.0, 21.0, 14.0, 46.0, 29.0, 30.0, 53.0, 51.0, 71.0, 78.0, 130.0, 156.0, 183.0, 280.0, 418.0, 506.0, 710.0, 1113.0, 1948.0, 3048.0, 5937.0, 12667.0, 35320.0, 249754.0, 5890655.0, 53879.0, 16608.0, 7317.0, 3738.0, 2162.0, 1361.0, 840.0, 537.0, 448.0, 297.0, 223.0, 152.0, 141.0, 94.0, 94.0, 46.0, 38.0, 56.0, 23.0, 29.0, 14.0, 29.0, 11.0, 10.0, 6.0, 14.0, 8.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-79.625, -77.0693359375, -74.513671875, -71.9580078125, -69.40234375, -66.8466796875, -64.291015625, -61.7353515625, -59.1796875, -56.6240234375, -54.068359375, -51.5126953125, -48.95703125, -46.4013671875, -43.845703125, -41.2900390625, -38.734375, -36.1787109375, -33.623046875, -31.0673828125, -28.51171875, -25.9560546875, -23.400390625, -20.8447265625, -18.2890625, -15.7333984375, -13.177734375, -10.6220703125, -8.06640625, -5.5107421875, -2.955078125, -0.3994140625, 2.15625, 4.7119140625, 7.267578125, 9.8232421875, 12.37890625, 14.9345703125, 17.490234375, 20.0458984375, 22.6015625, 25.1572265625, 27.712890625, 30.2685546875, 32.82421875, 35.3798828125, 37.935546875, 40.4912109375, 43.046875, 45.6025390625, 48.158203125, 50.7138671875, 53.26953125, 55.8251953125, 58.380859375, 60.9365234375, 63.4921875, 66.0478515625, 68.603515625, 71.1591796875, 73.71484375, 76.2705078125, 78.826171875, 81.3818359375, 83.9375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0, 7.0, 5.0, 4.0, 11.0, 10.0, 8.0, 17.0, 22.0, 31.0, 28.0, 30.0, 52.0, 61.0, 111.0, 232.0, 474.0, 447.0, 88.0, 68.0, 60.0, 55.0, 38.0, 24.0, 24.0, 14.0, 17.0, 15.0, 14.0, 5.0, 9.0, 4.0, 6.0, 4.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.859375, -26.907470703125, -25.95556640625, -25.003662109375, -24.0517578125, -23.099853515625, -22.14794921875, -21.196044921875, -20.244140625, -19.292236328125, -18.34033203125, -17.388427734375, -16.4365234375, -15.484619140625, -14.53271484375, -13.580810546875, -12.62890625, -11.677001953125, -10.72509765625, -9.773193359375, -8.8212890625, -7.869384765625, -6.91748046875, -5.965576171875, -5.013671875, -4.061767578125, -3.10986328125, -2.157958984375, -1.2060546875, -0.254150390625, 0.69775390625, 1.649658203125, 2.6015625, 3.553466796875, 4.50537109375, 5.457275390625, 6.4091796875, 7.361083984375, 8.31298828125, 9.264892578125, 10.216796875, 11.168701171875, 12.12060546875, 13.072509765625, 14.0244140625, 14.976318359375, 15.92822265625, 16.880126953125, 17.83203125, 18.783935546875, 19.73583984375, 20.687744140625, 21.6396484375, 22.591552734375, 23.54345703125, 24.495361328125, 25.447265625, 26.399169921875, 27.35107421875, 28.302978515625, 29.2548828125, 30.206787109375, 31.15869140625, 32.110595703125, 33.0625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 11.0, 9.0, 19.0, 28.0, 66.0, 138.0, 622.0, 71.0, 22.0, 12.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-453.1336669921875, -439.1584167480469, -425.18316650390625, -411.2079162597656, -397.232666015625, -383.2574157714844, -369.28216552734375, -355.3069152832031, -341.3316650390625, -327.3564147949219, -313.38116455078125, -299.4059143066406, -285.4306640625, -271.4554138183594, -257.48016357421875, -243.50491333007812, -229.52964782714844, -215.5543975830078, -201.5791473388672, -187.60389709472656, -173.62864685058594, -159.65338134765625, -145.67813110351562, -131.702880859375, -117.7276382446289, -103.75238800048828, -89.77713775634766, -75.8018798828125, -61.82663345336914, -47.85137939453125, -33.876129150390625, -19.90087890625, -5.925628662109375, 8.049622535705566, 22.024873733520508, 36.000125885009766, 49.97537612915039, 63.95063018798828, 77.9258804321289, 91.90113067626953, 105.87638092041016, 119.85163116455078, 133.82688903808594, 147.80213928222656, 161.7773895263672, 175.7526397705078, 189.72789001464844, 203.70314025878906, 217.6783905029297, 231.6536407470703, 245.62889099121094, 259.6041564941406, 273.57940673828125, 287.5546569824219, 301.5299072265625, 315.5051574707031, 329.48040771484375, 343.4556579589844, 357.430908203125, 371.4061584472656, 385.38140869140625, 399.3566589355469, 413.3319091796875, 427.3071594238281, 441.28240966796875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 5.0, 15.0, 22.0, 36.0, 42.0, 76.0, 84.0, 363.0, 126.0, 52.0, 46.0, 27.0, 31.0, 14.0, 17.0, 10.0, 7.0, 9.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.07293701171875, -256.2252197265625, -245.37750244140625, -234.52978515625, -223.68206787109375, -212.8343505859375, -201.9866180419922, -191.13890075683594, -180.2911834716797, -169.44346618652344, -158.5957489013672, -147.74801635742188, -136.90029907226562, -126.0525894165039, -115.20486450195312, -104.35714721679688, -93.50942993164062, -82.66171264648438, -71.81399536132812, -60.966270446777344, -50.118553161621094, -39.270835876464844, -28.423110961914062, -17.575393676757812, -6.7276763916015625, 4.12004280090332, 14.967761993408203, 25.81548309326172, 36.66320037841797, 47.51091766357422, 58.358642578125, 69.20635986328125, 80.05404663085938, 90.90176391601562, 101.74948120117188, 112.59720611572266, 123.4449234008789, 134.29263305664062, 145.14036560058594, 155.9880828857422, 166.83580017089844, 177.6835174560547, 188.53123474121094, 199.37896728515625, 210.2266845703125, 221.07440185546875, 231.922119140625, 242.76983642578125, 253.6175537109375, 264.46527099609375, 275.31298828125, 286.16070556640625, 297.0084228515625, 307.85614013671875, 318.703857421875, 329.55157470703125, 340.3992919921875, 351.24700927734375, 362.0947265625, 372.94244384765625, 383.7901611328125, 394.63787841796875, 405.485595703125, 416.33331298828125, 427.1810607910156]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 9.0, 6.0, 13.0, 14.0, 13.0, 27.0, 25.0, 34.0, 48.0, 65.0, 81.0, 111.0, 165.0, 207.0, 356.0, 499.0, 779.0, 1242.0, 1943.0, 3406.0, 6460.0, 14719.0, 53520.0, 3417719.0, 623767.0, 45184.0, 13405.0, 5255.0, 2432.0, 1261.0, 638.0, 398.0, 211.0, 109.0, 69.0, 37.0, 26.0, 16.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0], "bins": [-1.935546875, -1.8914337158203125, -1.847320556640625, -1.8032073974609375, -1.75909423828125, -1.7149810791015625, -1.670867919921875, -1.6267547607421875, -1.5826416015625, -1.5385284423828125, -1.494415283203125, -1.4503021240234375, -1.40618896484375, -1.3620758056640625, -1.317962646484375, -1.2738494873046875, -1.229736328125, -1.1856231689453125, -1.141510009765625, -1.0973968505859375, -1.05328369140625, -1.0091705322265625, -0.965057373046875, -0.9209442138671875, -0.8768310546875, -0.8327178955078125, -0.788604736328125, -0.7444915771484375, -0.70037841796875, -0.6562652587890625, -0.612152099609375, -0.5680389404296875, -0.52392578125, -0.4798126220703125, -0.435699462890625, -0.3915863037109375, -0.34747314453125, -0.3033599853515625, -0.259246826171875, -0.2151336669921875, -0.1710205078125, -0.1269073486328125, -0.082794189453125, -0.0386810302734375, 0.00543212890625, 0.0495452880859375, 0.093658447265625, 0.1377716064453125, 0.181884765625, 0.2259979248046875, 0.270111083984375, 0.3142242431640625, 0.35833740234375, 0.4024505615234375, 0.446563720703125, 0.4906768798828125, 0.5347900390625, 0.5789031982421875, 0.623016357421875, 0.6671295166015625, 0.71124267578125, 0.7553558349609375, 0.799468994140625, 0.8435821533203125, 0.8876953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 10.0, 4.0, 7.0, 15.0, 52.0, 153.0, 296.0, 223.0, 117.0, 49.0, 23.0, 7.0, 14.0, 6.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.1705322265625, -0.16646385192871094, -0.16239547729492188, -0.1583271026611328, -0.15425872802734375, -0.1501903533935547, -0.14612197875976562, -0.14205360412597656, -0.1379852294921875, -0.13391685485839844, -0.12984848022460938, -0.1257801055908203, -0.12171173095703125, -0.11764335632324219, -0.11357498168945312, -0.10950660705566406, -0.105438232421875, -0.10136985778808594, -0.09730148315429688, -0.09323310852050781, -0.08916473388671875, -0.08509635925292969, -0.08102798461914062, -0.07695960998535156, -0.0728912353515625, -0.06882286071777344, -0.06475448608398438, -0.06068611145019531, -0.05661773681640625, -0.05254936218261719, -0.048480987548828125, -0.04441261291503906, -0.04034423828125, -0.03627586364746094, -0.032207489013671875, -0.028139114379882812, -0.02407073974609375, -0.020002365112304688, -0.015933990478515625, -0.011865615844726562, -0.0077972412109375, -0.0037288665771484375, 0.000339508056640625, 0.0044078826904296875, 0.00847625732421875, 0.012544631958007812, 0.016613006591796875, 0.020681381225585938, 0.024749755859375, 0.028818130493164062, 0.032886505126953125, 0.03695487976074219, 0.04102325439453125, 0.04509162902832031, 0.049160003662109375, 0.05322837829589844, 0.0572967529296875, 0.06136512756347656, 0.06543350219726562, 0.06950187683105469, 0.07357025146484375, 0.07763862609863281, 0.08170700073242188, 0.08577537536621094, 0.08984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 3.0, 5.0, 6.0, 7.0, 14.0, 10.0, 29.0, 19.0, 33.0, 37.0, 58.0, 71.0, 134.0, 182.0, 237.0, 348.0, 516.0, 955.0, 1615.0, 3128.0, 6662.0, 16203.0, 50347.0, 247407.0, 3235471.0, 525492.0, 70401.0, 19741.0, 7413.0, 3331.0, 1784.0, 980.0, 571.0, 339.0, 222.0, 148.0, 99.0, 79.0, 49.0, 50.0, 26.0, 20.0, 14.0, 14.0, 6.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3271484375, -1.289947509765625, -1.25274658203125, -1.215545654296875, -1.1783447265625, -1.141143798828125, -1.10394287109375, -1.066741943359375, -1.029541015625, -0.992340087890625, -0.95513916015625, -0.917938232421875, -0.8807373046875, -0.843536376953125, -0.80633544921875, -0.769134521484375, -0.73193359375, -0.694732666015625, -0.65753173828125, -0.620330810546875, -0.5831298828125, -0.545928955078125, -0.50872802734375, -0.471527099609375, -0.434326171875, -0.397125244140625, -0.35992431640625, -0.322723388671875, -0.2855224609375, -0.248321533203125, -0.21112060546875, -0.173919677734375, -0.13671875, -0.099517822265625, -0.06231689453125, -0.025115966796875, 0.0120849609375, 0.049285888671875, 0.08648681640625, 0.123687744140625, 0.160888671875, 0.198089599609375, 0.23529052734375, 0.272491455078125, 0.3096923828125, 0.346893310546875, 0.38409423828125, 0.421295166015625, 0.45849609375, 0.495697021484375, 0.53289794921875, 0.570098876953125, 0.6072998046875, 0.644500732421875, 0.68170166015625, 0.718902587890625, 0.756103515625, 0.793304443359375, 0.83050537109375, 0.867706298828125, 0.9049072265625, 0.942108154296875, 0.97930908203125, 1.016510009765625, 1.0537109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 11.0, 8.0, 10.0, 7.0, 18.0, 9.0, 18.0, 16.0, 19.0, 31.0, 43.0, 52.0, 53.0, 69.0, 76.0, 96.0, 121.0, 143.0, 180.0, 280.0, 352.0, 541.0, 665.0, 390.0, 248.0, 164.0, 119.0, 80.0, 62.0, 39.0, 23.0, 22.0, 19.0, 19.0, 10.0, 11.0, 13.0, 7.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.23876953125, -0.23219680786132812, -0.22562408447265625, -0.21905136108398438, -0.2124786376953125, -0.20590591430664062, -0.19933319091796875, -0.19276046752929688, -0.186187744140625, -0.17961502075195312, -0.17304229736328125, -0.16646957397460938, -0.1598968505859375, -0.15332412719726562, -0.14675140380859375, -0.14017868041992188, -0.13360595703125, -0.12703323364257812, -0.12046051025390625, -0.11388778686523438, -0.1073150634765625, -0.10074234008789062, -0.09416961669921875, -0.08759689331054688, -0.081024169921875, -0.07445144653320312, -0.06787872314453125, -0.061305999755859375, -0.0547332763671875, -0.048160552978515625, -0.04158782958984375, -0.035015106201171875, -0.0284423828125, -0.021869659423828125, -0.01529693603515625, -0.008724212646484375, -0.0021514892578125, 0.004421234130859375, 0.01099395751953125, 0.017566680908203125, 0.024139404296875, 0.030712127685546875, 0.03728485107421875, 0.043857574462890625, 0.0504302978515625, 0.057003021240234375, 0.06357574462890625, 0.07014846801757812, 0.07672119140625, 0.08329391479492188, 0.08986663818359375, 0.09643936157226562, 0.1030120849609375, 0.10958480834960938, 0.11615753173828125, 0.12273025512695312, 0.129302978515625, 0.13587570190429688, 0.14244842529296875, 0.14902114868164062, 0.1555938720703125, 0.16216659545898438, 0.16873931884765625, 0.17531204223632812, 0.181884765625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 12.0, 15.0, 31.0, 51.0, 73.0, 108.0, 217.0, 274.0, 122.0, 45.0, 16.0, 20.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.03487491607666, -9.827827453613281, -9.620779037475586, -9.413731575012207, -9.206684112548828, -8.99963665008545, -8.79258918762207, -8.585540771484375, -8.378493309020996, -8.171445846557617, -7.96439790725708, -7.757349967956543, -7.550302505493164, -7.343255043029785, -7.136207103729248, -6.929159164428711, -6.722111701965332, -6.515064239501953, -6.308016300201416, -6.100968360900879, -5.8939208984375, -5.686873435974121, -5.479825496673584, -5.272777557373047, -5.065730094909668, -4.858682632446289, -4.651634693145752, -4.444586753845215, -4.237539291381836, -4.030491828918457, -3.82344388961792, -3.616396188735962, -3.409348487854004, -3.202300786972046, -2.995253086090088, -2.78820538520813, -2.581157684326172, -2.374109983444214, -2.167062282562256, -1.9600145816802979, -1.7529668807983398, -1.5459191799163818, -1.3388714790344238, -1.1318237781524658, -0.9247760772705078, -0.7177283763885498, -0.5106806755065918, -0.3036329746246338, -0.09658527374267578, 0.11046242713928223, 0.31751012802124023, 0.5245578289031982, 0.7316055297851562, 0.9386532306671143, 1.1457009315490723, 1.3527486324310303, 1.5597963333129883, 1.7668440341949463, 1.9738917350769043, 2.1809394359588623, 2.3879871368408203, 2.5950348377227783, 2.8020825386047363, 3.0091302394866943, 3.2161779403686523]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 9.0, 9.0, 11.0, 12.0, 21.0, 26.0, 34.0, 57.0, 43.0, 58.0, 60.0, 80.0, 71.0, 72.0, 61.0, 79.0, 57.0, 69.0, 33.0, 34.0, 30.0, 18.0, 16.0, 7.0, 11.0, 6.0, 8.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.526061534881592, -4.3907151222229, -4.255369186401367, -4.120022773742676, -3.9846765995025635, -3.849330425262451, -3.7139840126037598, -3.5786378383636475, -3.443291664123535, -3.307945489883423, -3.1725993156433105, -3.037252902984619, -2.901906728744507, -2.7665605545043945, -2.631214141845703, -2.495867967605591, -2.3605217933654785, -2.225175619125366, -2.089829444885254, -1.9544830322265625, -1.8191368579864502, -1.683790683746338, -1.548444390296936, -1.4130980968475342, -1.2777519226074219, -1.1424057483673096, -1.0070594549179077, -0.8717132210731506, -0.7363669872283936, -0.6010207533836365, -0.4656745195388794, -0.3303282856941223, -0.19498157501220703, -0.05963534116744995, 0.07571089267730713, 0.2110571265220642, 0.3464033603668213, 0.48174959421157837, 0.6170958280563354, 0.7524420619010925, 0.8877882957458496, 1.023134469985962, 1.1584807634353638, 1.2938270568847656, 1.429173231124878, 1.5645194053649902, 1.699865698814392, 1.835211992263794, 1.9705581665039062, 2.1059043407440186, 2.241250514984131, 2.3765969276428223, 2.5119431018829346, 2.647289276123047, 2.7826356887817383, 2.9179818630218506, 3.053328037261963, 3.188674211502075, 3.3240203857421875, 3.459366798400879, 3.594712972640991, 3.7300591468811035, 3.865405559539795, 4.000751495361328, 4.1360979080200195]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 12.0, 10.0, 12.0, 13.0, 23.0, 19.0, 25.0, 42.0, 62.0, 75.0, 100.0, 153.0, 217.0, 388.0, 570.0, 1062.0, 1873.0, 4215.0, 11987.0, 60573.0, 679873.0, 244958.0, 28309.0, 7269.0, 2911.0, 1477.0, 840.0, 466.0, 322.0, 179.0, 148.0, 100.0, 65.0, 38.0, 38.0, 28.0, 21.0, 10.0, 18.0, 11.0, 13.0, 3.0, 4.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.59375, -1.5451507568359375, -1.496551513671875, -1.4479522705078125, -1.39935302734375, -1.3507537841796875, -1.302154541015625, -1.2535552978515625, -1.2049560546875, -1.1563568115234375, -1.107757568359375, -1.0591583251953125, -1.01055908203125, -0.9619598388671875, -0.913360595703125, -0.8647613525390625, -0.816162109375, -0.7675628662109375, -0.718963623046875, -0.6703643798828125, -0.62176513671875, -0.5731658935546875, -0.524566650390625, -0.4759674072265625, -0.4273681640625, -0.3787689208984375, -0.330169677734375, -0.2815704345703125, -0.23297119140625, -0.1843719482421875, -0.135772705078125, -0.0871734619140625, -0.03857421875, 0.0100250244140625, 0.058624267578125, 0.1072235107421875, 0.15582275390625, 0.2044219970703125, 0.253021240234375, 0.3016204833984375, 0.3502197265625, 0.3988189697265625, 0.447418212890625, 0.4960174560546875, 0.54461669921875, 0.5932159423828125, 0.641815185546875, 0.6904144287109375, 0.739013671875, 0.7876129150390625, 0.836212158203125, 0.8848114013671875, 0.93341064453125, 0.9820098876953125, 1.030609130859375, 1.0792083740234375, 1.1278076171875, 1.1764068603515625, 1.225006103515625, 1.2736053466796875, 1.32220458984375, 1.3708038330078125, 1.419403076171875, 1.4680023193359375, 1.5166015625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 3.0, 4.0, 12.0, 17.0, 48.0, 92.0, 125.0, 163.0, 157.0, 156.0, 102.0, 53.0, 22.0, 16.0, 5.0, 8.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2666015625, -0.26081085205078125, -0.2550201416015625, -0.24922943115234375, -0.243438720703125, -0.23764801025390625, -0.2318572998046875, -0.22606658935546875, -0.22027587890625, -0.21448516845703125, -0.2086944580078125, -0.20290374755859375, -0.197113037109375, -0.19132232666015625, -0.1855316162109375, -0.17974090576171875, -0.1739501953125, -0.16815948486328125, -0.1623687744140625, -0.15657806396484375, -0.150787353515625, -0.14499664306640625, -0.1392059326171875, -0.13341522216796875, -0.12762451171875, -0.12183380126953125, -0.1160430908203125, -0.11025238037109375, -0.104461669921875, -0.09867095947265625, -0.0928802490234375, -0.08708953857421875, -0.081298828125, -0.07550811767578125, -0.0697174072265625, -0.06392669677734375, -0.058135986328125, -0.05234527587890625, -0.0465545654296875, -0.04076385498046875, -0.03497314453125, -0.02918243408203125, -0.0233917236328125, -0.01760101318359375, -0.011810302734375, -0.00601959228515625, -0.0002288818359375, 0.00556182861328125, 0.0113525390625, 0.01714324951171875, 0.0229339599609375, 0.02872467041015625, 0.034515380859375, 0.04030609130859375, 0.0460968017578125, 0.05188751220703125, 0.05767822265625, 0.06346893310546875, 0.0692596435546875, 0.07505035400390625, 0.080841064453125, 0.08663177490234375, 0.0924224853515625, 0.09821319580078125, 0.10400390625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 16.0, 10.0, 19.0, 36.0, 51.0, 93.0, 131.0, 277.0, 725.0, 2212.0, 11418.0, 414325.0, 602605.0, 12862.0, 2271.0, 773.0, 332.0, 158.0, 93.0, 55.0, 31.0, 16.0, 15.0, 14.0, 2.0, 9.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.4815673828125, -4.349853515625, -4.2181396484375, -4.08642578125, -3.9547119140625, -3.822998046875, -3.6912841796875, -3.5595703125, -3.4278564453125, -3.296142578125, -3.1644287109375, -3.03271484375, -2.9010009765625, -2.769287109375, -2.6375732421875, -2.505859375, -2.3741455078125, -2.242431640625, -2.1107177734375, -1.97900390625, -1.8472900390625, -1.715576171875, -1.5838623046875, -1.4521484375, -1.3204345703125, -1.188720703125, -1.0570068359375, -0.92529296875, -0.7935791015625, -0.661865234375, -0.5301513671875, -0.3984375, -0.2667236328125, -0.135009765625, -0.0032958984375, 0.12841796875, 0.2601318359375, 0.391845703125, 0.5235595703125, 0.6552734375, 0.7869873046875, 0.918701171875, 1.0504150390625, 1.18212890625, 1.3138427734375, 1.445556640625, 1.5772705078125, 1.708984375, 1.8406982421875, 1.972412109375, 2.1041259765625, 2.23583984375, 2.3675537109375, 2.499267578125, 2.6309814453125, 2.7626953125, 2.8944091796875, 3.026123046875, 3.1578369140625, 3.28955078125, 3.4212646484375, 3.552978515625, 3.6846923828125, 3.81640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 10.0, 16.0, 11.0, 21.0, 22.0, 26.0, 18.0, 25.0, 40.0, 41.0, 40.0, 44.0, 44.0, 43.0, 56.0, 51.0, 50.0, 43.0, 54.0, 50.0, 39.0, 36.0, 34.0, 30.0, 28.0, 22.0, 29.0, 14.0, 13.0, 10.0, 12.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60302734375, -0.579620361328125, -0.55621337890625, -0.532806396484375, -0.5093994140625, -0.485992431640625, -0.46258544921875, -0.439178466796875, -0.415771484375, -0.392364501953125, -0.36895751953125, -0.345550537109375, -0.3221435546875, -0.298736572265625, -0.27532958984375, -0.251922607421875, -0.228515625, -0.205108642578125, -0.18170166015625, -0.158294677734375, -0.1348876953125, -0.111480712890625, -0.08807373046875, -0.064666748046875, -0.041259765625, -0.017852783203125, 0.00555419921875, 0.028961181640625, 0.0523681640625, 0.075775146484375, 0.09918212890625, 0.122589111328125, 0.14599609375, 0.169403076171875, 0.19281005859375, 0.216217041015625, 0.2396240234375, 0.263031005859375, 0.28643798828125, 0.309844970703125, 0.333251953125, 0.356658935546875, 0.38006591796875, 0.403472900390625, 0.4268798828125, 0.450286865234375, 0.47369384765625, 0.497100830078125, 0.5205078125, 0.543914794921875, 0.56732177734375, 0.590728759765625, 0.6141357421875, 0.637542724609375, 0.66094970703125, 0.684356689453125, 0.707763671875, 0.731170654296875, 0.75457763671875, 0.777984619140625, 0.8013916015625, 0.824798583984375, 0.84820556640625, 0.871612548828125, 0.89501953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 2.0, 13.0, 8.0, 22.0, 24.0, 50.0, 51.0, 90.0, 127.0, 211.0, 435.0, 942.0, 2500.0, 12811.0, 945732.0, 77121.0, 5398.0, 1550.0, 622.0, 305.0, 188.0, 107.0, 73.0, 48.0, 28.0, 17.0, 21.0, 11.0, 10.0, 9.0, 2.0, 7.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.57421875, -6.37957763671875, -6.1849365234375, -5.99029541015625, -5.795654296875, -5.60101318359375, -5.4063720703125, -5.21173095703125, -5.01708984375, -4.82244873046875, -4.6278076171875, -4.43316650390625, -4.238525390625, -4.04388427734375, -3.8492431640625, -3.65460205078125, -3.4599609375, -3.26531982421875, -3.0706787109375, -2.87603759765625, -2.681396484375, -2.48675537109375, -2.2921142578125, -2.09747314453125, -1.90283203125, -1.70819091796875, -1.5135498046875, -1.31890869140625, -1.124267578125, -0.92962646484375, -0.7349853515625, -0.54034423828125, -0.345703125, -0.15106201171875, 0.0435791015625, 0.23822021484375, 0.432861328125, 0.62750244140625, 0.8221435546875, 1.01678466796875, 1.21142578125, 1.40606689453125, 1.6007080078125, 1.79534912109375, 1.989990234375, 2.18463134765625, 2.3792724609375, 2.57391357421875, 2.7685546875, 2.96319580078125, 3.1578369140625, 3.35247802734375, 3.547119140625, 3.74176025390625, 3.9364013671875, 4.13104248046875, 4.32568359375, 4.52032470703125, 4.7149658203125, 4.90960693359375, 5.104248046875, 5.29888916015625, 5.4935302734375, 5.68817138671875, 5.8828125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 3.0, 6.0, 4.0, 14.0, 14.0, 16.0, 9.0, 18.0, 29.0, 35.0, 56.0, 81.0, 108.0, 166.0, 135.0, 65.0, 54.0, 35.0, 24.0, 22.0, 17.0, 16.0, 13.0, 12.0, 8.0, 11.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016660690307617188, -0.001609697937965393, -0.0015533268451690674, -0.0014969557523727417, -0.001440584659576416, -0.0013842135667800903, -0.0013278424739837646, -0.001271471381187439, -0.0012151002883911133, -0.0011587291955947876, -0.001102358102798462, -0.0010459870100021362, -0.0009896159172058105, -0.0009332448244094849, -0.0008768737316131592, -0.0008205026388168335, -0.0007641315460205078, -0.0007077604532241821, -0.0006513893604278564, -0.0005950182676315308, -0.0005386471748352051, -0.0004822760820388794, -0.0004259049892425537, -0.00036953389644622803, -0.00031316280364990234, -0.00025679171085357666, -0.00020042061805725098, -0.0001440495252609253, -8.767843246459961e-05, -3.1307339668273926e-05, 2.5063753128051758e-05, 8.143484592437744e-05, 0.00013780593872070312, 0.0001941770315170288, 0.0002505481243133545, 0.0003069192171096802, 0.00036329030990600586, 0.00041966140270233154, 0.0004760324954986572, 0.0005324035882949829, 0.0005887746810913086, 0.0006451457738876343, 0.00070151686668396, 0.0007578879594802856, 0.0008142590522766113, 0.000870630145072937, 0.0009270012378692627, 0.0009833723306655884, 0.001039743423461914, 0.0010961145162582397, 0.0011524856090545654, 0.0012088567018508911, 0.0012652277946472168, 0.0013215988874435425, 0.0013779699802398682, 0.0014343410730361938, 0.0014907121658325195, 0.0015470832586288452, 0.001603454351425171, 0.0016598254442214966, 0.0017161965370178223, 0.001772567629814148, 0.0018289387226104736, 0.0018853098154067993, 0.001941680908203125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 11.0, 5.0, 5.0, 7.0, 17.0, 16.0, 30.0, 37.0, 47.0, 88.0, 107.0, 161.0, 283.0, 495.0, 820.0, 1571.0, 3368.0, 9173.0, 41900.0, 842137.0, 123163.0, 15286.0, 4940.0, 2189.0, 1115.0, 608.0, 307.0, 210.0, 150.0, 67.0, 67.0, 50.0, 33.0, 30.0, 6.0, 9.0, 11.0, 12.0, 6.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.7890625, -3.6695556640625, -3.550048828125, -3.4305419921875, -3.31103515625, -3.1915283203125, -3.072021484375, -2.9525146484375, -2.8330078125, -2.7135009765625, -2.593994140625, -2.4744873046875, -2.35498046875, -2.2354736328125, -2.115966796875, -1.9964599609375, -1.876953125, -1.7574462890625, -1.637939453125, -1.5184326171875, -1.39892578125, -1.2794189453125, -1.159912109375, -1.0404052734375, -0.9208984375, -0.8013916015625, -0.681884765625, -0.5623779296875, -0.44287109375, -0.3233642578125, -0.203857421875, -0.0843505859375, 0.03515625, 0.1546630859375, 0.274169921875, 0.3936767578125, 0.51318359375, 0.6326904296875, 0.752197265625, 0.8717041015625, 0.9912109375, 1.1107177734375, 1.230224609375, 1.3497314453125, 1.46923828125, 1.5887451171875, 1.708251953125, 1.8277587890625, 1.947265625, 2.0667724609375, 2.186279296875, 2.3057861328125, 2.42529296875, 2.5447998046875, 2.664306640625, 2.7838134765625, 2.9033203125, 3.0228271484375, 3.142333984375, 3.2618408203125, 3.38134765625, 3.5008544921875, 3.620361328125, 3.7398681640625, 3.859375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 3.0, 7.0, 11.0, 5.0, 16.0, 20.0, 19.0, 50.0, 94.0, 149.0, 180.0, 172.0, 115.0, 56.0, 32.0, 18.0, 4.0, 11.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.154296875, -2.088165283203125, -2.02203369140625, -1.955902099609375, -1.8897705078125, -1.823638916015625, -1.75750732421875, -1.691375732421875, -1.625244140625, -1.559112548828125, -1.49298095703125, -1.426849365234375, -1.3607177734375, -1.294586181640625, -1.22845458984375, -1.162322998046875, -1.09619140625, -1.030059814453125, -0.96392822265625, -0.897796630859375, -0.8316650390625, -0.765533447265625, -0.69940185546875, -0.633270263671875, -0.567138671875, -0.501007080078125, -0.43487548828125, -0.368743896484375, -0.3026123046875, -0.236480712890625, -0.17034912109375, -0.104217529296875, -0.0380859375, 0.028045654296875, 0.09417724609375, 0.160308837890625, 0.2264404296875, 0.292572021484375, 0.35870361328125, 0.424835205078125, 0.490966796875, 0.557098388671875, 0.62322998046875, 0.689361572265625, 0.7554931640625, 0.821624755859375, 0.88775634765625, 0.953887939453125, 1.02001953125, 1.086151123046875, 1.15228271484375, 1.218414306640625, 1.2845458984375, 1.350677490234375, 1.41680908203125, 1.482940673828125, 1.549072265625, 1.615203857421875, 1.68133544921875, 1.747467041015625, 1.8135986328125, 1.879730224609375, 1.94586181640625, 2.011993408203125, 2.078125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 8.0, 12.0, 22.0, 59.0, 200.0, 486.0, 153.0, 43.0, 18.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0], "bins": [-49.44446563720703, -48.53675079345703, -47.62903594970703, -46.72132110595703, -45.81360626220703, -44.90589141845703, -43.99817657470703, -43.09046173095703, -42.18274688720703, -41.27503204345703, -40.36731719970703, -39.45960235595703, -38.55188751220703, -37.64417266845703, -36.73645782470703, -35.82874298095703, -34.92102813720703, -34.01331329345703, -33.10559844970703, -32.19788360595703, -31.29016876220703, -30.38245391845703, -29.47473907470703, -28.56702423095703, -27.659313201904297, -26.751598358154297, -25.843883514404297, -24.936168670654297, -24.028453826904297, -23.120738983154297, -22.213024139404297, -21.305309295654297, -20.39759635925293, -19.48988151550293, -18.58216667175293, -17.67445182800293, -16.76673698425293, -15.85902214050293, -14.951308250427246, -14.043593406677246, -13.135878562927246, -12.228163719177246, -11.320448875427246, -10.412734985351562, -9.505020141601562, -8.597305297851562, -7.6895904541015625, -6.7818756103515625, -5.8741607666015625, -4.9664459228515625, -4.0587310791015625, -3.1510167121887207, -2.2433018684387207, -1.3355870246887207, -0.4278726577758789, 0.4798421859741211, 1.387557029724121, 2.295271873474121, 3.202986478805542, 4.110701084136963, 5.018415927886963, 5.926130771636963, 6.833845138549805, 7.741559982299805, 8.649274826049805]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 4.0, 5.0, 8.0, 12.0, 16.0, 25.0, 28.0, 37.0, 66.0, 76.0, 92.0, 119.0, 107.0, 100.0, 80.0, 61.0, 54.0, 41.0, 18.0, 18.0, 7.0, 8.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.741109371185303, -7.388061046600342, -7.035012722015381, -6.68196439743042, -6.328916072845459, -5.975867748260498, -5.622819423675537, -5.269771099090576, -4.916722774505615, -4.563674449920654, -4.210626125335693, -3.8575778007507324, -3.5045294761657715, -3.1514811515808105, -2.7984328269958496, -2.4453845024108887, -2.0923361778259277, -1.7392878532409668, -1.3862395286560059, -1.033191204071045, -0.680142879486084, -0.32709455490112305, 0.02595376968383789, 0.37900209426879883, 0.7320504188537598, 1.0850987434387207, 1.4381470680236816, 1.7911953926086426, 2.1442437171936035, 2.4972920417785645, 2.8503403663635254, 3.2033886909484863, 3.556436538696289, 3.90948486328125, 4.262533187866211, 4.615581512451172, 4.968629837036133, 5.321678161621094, 5.674726486206055, 6.027774810791016, 6.380823135375977, 6.7338714599609375, 7.086919784545898, 7.439968109130859, 7.79301643371582, 8.146064758300781, 8.499113082885742, 8.852161407470703, 9.205209732055664, 9.558258056640625, 9.911306381225586, 10.264354705810547, 10.617403030395508, 10.970451354980469, 11.32349967956543, 11.67654800415039, 12.029596328735352, 12.382644653320312, 12.735692977905273, 13.088741302490234, 13.441789627075195, 13.794837951660156, 14.147886276245117, 14.500934600830078, 14.853982925415039]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 2.0, 7.0, 5.0, 18.0, 19.0, 32.0, 63.0, 226.0, 1722.0, 4180317.0, 11577.0, 166.0, 51.0, 23.0, 16.0, 10.0, 9.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-63.28125, -61.865966796875, -60.45068359375, -59.035400390625, -57.6201171875, -56.204833984375, -54.78955078125, -53.374267578125, -51.958984375, -50.543701171875, -49.12841796875, -47.713134765625, -46.2978515625, -44.882568359375, -43.46728515625, -42.052001953125, -40.63671875, -39.221435546875, -37.80615234375, -36.390869140625, -34.9755859375, -33.560302734375, -32.14501953125, -30.729736328125, -29.314453125, -27.899169921875, -26.48388671875, -25.068603515625, -23.6533203125, -22.238037109375, -20.82275390625, -19.407470703125, -17.9921875, -16.576904296875, -15.16162109375, -13.746337890625, -12.3310546875, -10.915771484375, -9.50048828125, -8.085205078125, -6.669921875, -5.254638671875, -3.83935546875, -2.424072265625, -1.0087890625, 0.406494140625, 1.82177734375, 3.237060546875, 4.65234375, 6.067626953125, 7.48291015625, 8.898193359375, 10.3134765625, 11.728759765625, 13.14404296875, 14.559326171875, 15.974609375, 17.389892578125, 18.80517578125, 20.220458984375, 21.6357421875, 23.051025390625, 24.46630859375, 25.881591796875, 27.296875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 8.0, 10.0, 9.0, 18.0, 22.0, 59.0, 77.0, 123.0, 135.0, 160.0, 110.0, 107.0, 63.0, 51.0, 27.0, 11.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2548828125, -0.24959754943847656, -0.24431228637695312, -0.2390270233154297, -0.23374176025390625, -0.2284564971923828, -0.22317123413085938, -0.21788597106933594, -0.2126007080078125, -0.20731544494628906, -0.20203018188476562, -0.1967449188232422, -0.19145965576171875, -0.1861743927001953, -0.18088912963867188, -0.17560386657714844, -0.170318603515625, -0.16503334045410156, -0.15974807739257812, -0.1544628143310547, -0.14917755126953125, -0.1438922882080078, -0.13860702514648438, -0.13332176208496094, -0.1280364990234375, -0.12275123596191406, -0.11746597290039062, -0.11218070983886719, -0.10689544677734375, -0.10161018371582031, -0.09632492065429688, -0.09103965759277344, -0.08575439453125, -0.08046913146972656, -0.07518386840820312, -0.06989860534667969, -0.06461334228515625, -0.05932807922363281, -0.054042816162109375, -0.04875755310058594, -0.0434722900390625, -0.03818702697753906, -0.032901763916015625, -0.027616500854492188, -0.02233123779296875, -0.017045974731445312, -0.011760711669921875, -0.0064754486083984375, -0.001190185546875, 0.0040950775146484375, 0.009380340576171875, 0.014665603637695312, 0.01995086669921875, 0.025236129760742188, 0.030521392822265625, 0.03580665588378906, 0.0410919189453125, 0.04637718200683594, 0.051662445068359375, 0.05694770812988281, 0.06223297119140625, 0.06751823425292969, 0.07280349731445312, 0.07808876037597656, 0.0833740234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 7.0, 9.0, 32.0, 109.0, 588.0, 27037.0, 4163243.0, 2360.0, 502.0, 192.0, 113.0, 51.0, 19.0, 15.0, 6.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.40234375, -5.71002197265625, -5.0177001953125, -4.32537841796875, -3.633056640625, -2.94073486328125, -2.2484130859375, -1.55609130859375, -0.86376953125, -0.17144775390625, 0.5208740234375, 1.21319580078125, 1.905517578125, 2.59783935546875, 3.2901611328125, 3.98248291015625, 4.6748046875, 5.36712646484375, 6.0594482421875, 6.75177001953125, 7.444091796875, 8.13641357421875, 8.8287353515625, 9.52105712890625, 10.21337890625, 10.90570068359375, 11.5980224609375, 12.29034423828125, 12.982666015625, 13.67498779296875, 14.3673095703125, 15.05963134765625, 15.751953125, 16.44427490234375, 17.1365966796875, 17.82891845703125, 18.521240234375, 19.21356201171875, 19.9058837890625, 20.59820556640625, 21.29052734375, 21.98284912109375, 22.6751708984375, 23.36749267578125, 24.059814453125, 24.75213623046875, 25.4444580078125, 26.13677978515625, 26.8291015625, 27.52142333984375, 28.2137451171875, 28.90606689453125, 29.598388671875, 30.29071044921875, 30.9830322265625, 31.67535400390625, 32.36767578125, 33.05999755859375, 33.7523193359375, 34.44464111328125, 35.136962890625, 35.82928466796875, 36.5216064453125, 37.21392822265625, 37.90625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 10.0, 15.0, 6.0, 15.0, 19.0, 39.0, 72.0, 129.0, 321.0, 1717.0, 1047.0, 394.0, 110.0, 78.0, 37.0, 20.0, 18.0, 11.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.371337890625, -0.3574409484863281, -0.34354400634765625, -0.3296470642089844, -0.3157501220703125, -0.3018531799316406, -0.28795623779296875, -0.2740592956542969, -0.260162353515625, -0.24626541137695312, -0.23236846923828125, -0.21847152709960938, -0.2045745849609375, -0.19067764282226562, -0.17678070068359375, -0.16288375854492188, -0.14898681640625, -0.13508987426757812, -0.12119293212890625, -0.10729598999023438, -0.0933990478515625, -0.07950210571289062, -0.06560516357421875, -0.051708221435546875, -0.037811279296875, -0.023914337158203125, -0.01001739501953125, 0.003879547119140625, 0.0177764892578125, 0.031673431396484375, 0.04557037353515625, 0.059467315673828125, 0.0733642578125, 0.08726119995117188, 0.10115814208984375, 0.11505508422851562, 0.1289520263671875, 0.14284896850585938, 0.15674591064453125, 0.17064285278320312, 0.184539794921875, 0.19843673706054688, 0.21233367919921875, 0.22623062133789062, 0.2401275634765625, 0.2540245056152344, 0.26792144775390625, 0.2818183898925781, 0.29571533203125, 0.3096122741699219, 0.32350921630859375, 0.3374061584472656, 0.3513031005859375, 0.3652000427246094, 0.37909698486328125, 0.3929939270019531, 0.406890869140625, 0.4207878112792969, 0.43468475341796875, 0.4485816955566406, 0.4624786376953125, 0.4763755798339844, 0.49027252197265625, 0.5041694641113281, 0.51806640625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 310.0, 682.0, 19.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.691525459289551, -2.347419261932373, -0.0033130645751953125, 2.3407931327819824, 4.68489933013916, 7.029006004333496, 9.373111724853516, 11.717217445373535, 14.061324119567871, 16.40542984008789, 18.749536514282227, 21.093643188476562, 23.437747955322266, 25.781856536865234, 28.125961303710938, 30.47006607055664, 32.81417465209961, 35.15827941894531, 37.50238800048828, 39.846492767333984, 42.19059753417969, 44.534706115722656, 46.87881088256836, 49.22291564941406, 51.56702423095703, 53.911128997802734, 56.2552375793457, 58.599342346191406, 60.943450927734375, 63.28755569458008, 65.63166046142578, 67.97576904296875, 70.31986999511719, 72.66397857666016, 75.0080795288086, 77.35218811035156, 79.69629669189453, 82.0404052734375, 84.38450622558594, 86.7286148071289, 89.07272338867188, 91.41683197021484, 93.76093292236328, 96.10504150390625, 98.44915008544922, 100.79325866699219, 103.13735961914062, 105.4814682006836, 107.82556915283203, 110.169677734375, 112.51377868652344, 114.8578872680664, 117.20199584960938, 119.54609680175781, 121.89020538330078, 124.23431396484375, 126.57841491699219, 128.92251586914062, 131.26663208007812, 133.61073303222656, 135.954833984375, 138.2989501953125, 140.64305114746094, 142.98715209960938, 145.33126831054688]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 15.0, 21.0, 24.0, 39.0, 57.0, 92.0, 139.0, 133.0, 124.0, 121.0, 101.0, 62.0, 41.0, 19.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4511938095092773, -3.2409725189208984, -3.0307512283325195, -2.8205299377441406, -2.6103086471557617, -2.400087356567383, -2.189866065979004, -1.9796446561813354, -1.7694233655929565, -1.5592020750045776, -1.3489807844161987, -1.1387593746185303, -0.9285381436347961, -0.7183167934417725, -0.5080955028533936, -0.29787421226501465, -0.08765292167663574, 0.12256838381290436, 0.33278968930244446, 0.5430110096931458, 0.7532323002815247, 0.9634536504745483, 1.1736749410629272, 1.3838962316513062, 1.594117522239685, 1.804338812828064, 2.0145602226257324, 2.2247815132141113, 2.4350028038024902, 2.645224094390869, 2.855445384979248, 3.065666675567627, 3.275887966156006, 3.4861092567443848, 3.6963305473327637, 3.9065518379211426, 4.1167731285095215, 4.3269944190979, 4.537215709686279, 4.747437000274658, 4.957658290863037, 5.167879581451416, 5.378100872039795, 5.588322162628174, 5.798543453216553, 6.008764743804932, 6.2189860343933105, 6.4292073249816895, 6.639429092407227, 6.8496503829956055, 7.059871673583984, 7.270092964172363, 7.480314254760742, 7.690535545349121, 7.9007568359375, 8.110978126525879, 8.321199417114258, 8.531420707702637, 8.741641998291016, 8.951863288879395, 9.162084579467773, 9.372305870056152, 9.582527160644531, 9.79274845123291, 10.002969741821289]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 8.0, 8.0, 10.0, 23.0, 26.0, 42.0, 43.0, 68.0, 100.0, 151.0, 220.0, 372.0, 657.0, 1097.0, 2136.0, 4234.0, 10252.0, 30325.0, 144521.0, 664557.0, 141013.0, 29453.0, 10052.0, 4263.0, 2079.0, 1092.0, 637.0, 378.0, 222.0, 158.0, 109.0, 70.0, 35.0, 33.0, 25.0, 26.0, 14.0, 8.0, 9.0, 5.0, 13.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9658203125, -1.9013519287109375, -1.836883544921875, -1.7724151611328125, -1.70794677734375, -1.6434783935546875, -1.579010009765625, -1.5145416259765625, -1.4500732421875, -1.3856048583984375, -1.321136474609375, -1.2566680908203125, -1.19219970703125, -1.1277313232421875, -1.063262939453125, -0.9987945556640625, -0.934326171875, -0.8698577880859375, -0.805389404296875, -0.7409210205078125, -0.67645263671875, -0.6119842529296875, -0.547515869140625, -0.4830474853515625, -0.4185791015625, -0.3541107177734375, -0.289642333984375, -0.2251739501953125, -0.16070556640625, -0.0962371826171875, -0.031768798828125, 0.0326995849609375, 0.09716796875, 0.1616363525390625, 0.226104736328125, 0.2905731201171875, 0.35504150390625, 0.4195098876953125, 0.483978271484375, 0.5484466552734375, 0.6129150390625, 0.6773834228515625, 0.741851806640625, 0.8063201904296875, 0.87078857421875, 0.9352569580078125, 0.999725341796875, 1.0641937255859375, 1.128662109375, 1.1931304931640625, 1.257598876953125, 1.3220672607421875, 1.38653564453125, 1.4510040283203125, 1.515472412109375, 1.5799407958984375, 1.6444091796875, 1.7088775634765625, 1.773345947265625, 1.8378143310546875, 1.90228271484375, 1.9667510986328125, 2.031219482421875, 2.0956878662109375, 2.16015625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 8.0, 3.0, 1.0, 3.0, 1.0, 2.0, 7.0, 6.0, 17.0, 8.0, 14.0, 19.0, 21.0, 28.0, 31.0, 42.0, 63.0, 62.0, 61.0, 67.0, 81.0, 70.0, 69.0, 51.0, 53.0, 53.0, 35.0, 39.0, 26.0, 18.0, 13.0, 7.0, 11.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08056640625, -0.07771587371826172, -0.07486534118652344, -0.07201480865478516, -0.06916427612304688, -0.0663137435913086, -0.06346321105957031, -0.06061267852783203, -0.05776214599609375, -0.05491161346435547, -0.05206108093261719, -0.049210548400878906, -0.046360015869140625, -0.043509483337402344, -0.04065895080566406, -0.03780841827392578, -0.0349578857421875, -0.03210735321044922, -0.029256820678710938, -0.026406288146972656, -0.023555755615234375, -0.020705223083496094, -0.017854690551757812, -0.015004158020019531, -0.01215362548828125, -0.009303092956542969, -0.0064525604248046875, -0.0036020278930664062, -0.000751495361328125, 0.0020990371704101562, 0.0049495697021484375, 0.007800102233886719, 0.010650634765625, 0.013501167297363281, 0.016351699829101562, 0.019202232360839844, 0.022052764892578125, 0.024903297424316406, 0.027753829956054688, 0.03060436248779297, 0.03345489501953125, 0.03630542755126953, 0.03915596008300781, 0.042006492614746094, 0.044857025146484375, 0.047707557678222656, 0.05055809020996094, 0.05340862274169922, 0.0562591552734375, 0.05910968780517578, 0.06196022033691406, 0.06481075286865234, 0.06766128540039062, 0.0705118179321289, 0.07336235046386719, 0.07621288299560547, 0.07906341552734375, 0.08191394805908203, 0.08476448059082031, 0.0876150131225586, 0.09046554565429688, 0.09331607818603516, 0.09616661071777344, 0.09901714324951172, 0.10186767578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 10.0, 5.0, 2.0, 8.0, 9.0, 16.0, 27.0, 67.0, 285.0, 3061.0, 729650.0, 312701.0, 2308.0, 221.0, 42.0, 20.0, 14.0, 14.0, 6.0, 8.0, 8.0, 10.0, 9.0, 6.0, 5.0, 6.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.99609375, -7.77362060546875, -7.5511474609375, -7.32867431640625, -7.106201171875, -6.88372802734375, -6.6612548828125, -6.43878173828125, -6.21630859375, -5.99383544921875, -5.7713623046875, -5.54888916015625, -5.326416015625, -5.10394287109375, -4.8814697265625, -4.65899658203125, -4.4365234375, -4.21405029296875, -3.9915771484375, -3.76910400390625, -3.546630859375, -3.32415771484375, -3.1016845703125, -2.87921142578125, -2.65673828125, -2.43426513671875, -2.2117919921875, -1.98931884765625, -1.766845703125, -1.54437255859375, -1.3218994140625, -1.09942626953125, -0.876953125, -0.65447998046875, -0.4320068359375, -0.20953369140625, 0.012939453125, 0.23541259765625, 0.4578857421875, 0.68035888671875, 0.90283203125, 1.12530517578125, 1.3477783203125, 1.57025146484375, 1.792724609375, 2.01519775390625, 2.2376708984375, 2.46014404296875, 2.6826171875, 2.90509033203125, 3.1275634765625, 3.35003662109375, 3.572509765625, 3.79498291015625, 4.0174560546875, 4.23992919921875, 4.46240234375, 4.68487548828125, 4.9073486328125, 5.12982177734375, 5.352294921875, 5.57476806640625, 5.7972412109375, 6.01971435546875, 6.2421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 10.0, 7.0, 8.0, 16.0, 13.0, 12.0, 17.0, 26.0, 28.0, 28.0, 30.0, 40.0, 40.0, 49.0, 42.0, 52.0, 40.0, 47.0, 47.0, 57.0, 41.0, 44.0, 45.0, 38.0, 36.0, 40.0, 28.0, 25.0, 21.0, 11.0, 10.0, 14.0, 7.0, 5.0, 10.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.490966796875, -0.4748954772949219, -0.45882415771484375, -0.4427528381347656, -0.4266815185546875, -0.4106101989746094, -0.39453887939453125, -0.3784675598144531, -0.362396240234375, -0.3463249206542969, -0.33025360107421875, -0.3141822814941406, -0.2981109619140625, -0.2820396423339844, -0.26596832275390625, -0.24989700317382812, -0.23382568359375, -0.21775436401367188, -0.20168304443359375, -0.18561172485351562, -0.1695404052734375, -0.15346908569335938, -0.13739776611328125, -0.12132644653320312, -0.105255126953125, -0.08918380737304688, -0.07311248779296875, -0.057041168212890625, -0.0409698486328125, -0.024898529052734375, -0.00882720947265625, 0.007244110107421875, 0.0233154296875, 0.039386749267578125, 0.05545806884765625, 0.07152938842773438, 0.0876007080078125, 0.10367202758789062, 0.11974334716796875, 0.13581466674804688, 0.151885986328125, 0.16795730590820312, 0.18402862548828125, 0.20009994506835938, 0.2161712646484375, 0.23224258422851562, 0.24831390380859375, 0.2643852233886719, 0.28045654296875, 0.2965278625488281, 0.31259918212890625, 0.3286705017089844, 0.3447418212890625, 0.3608131408691406, 0.37688446044921875, 0.3929557800292969, 0.409027099609375, 0.4250984191894531, 0.44116973876953125, 0.4572410583496094, 0.4733123779296875, 0.4893836975097656, 0.5054550170898438, 0.5215263366699219, 0.53759765625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 2.0, 6.0, 4.0, 7.0, 5.0, 8.0, 10.0, 8.0, 11.0, 16.0, 9.0, 25.0, 39.0, 109.0, 536.0, 4546.0, 445835.0, 591352.0, 5067.0, 597.0, 148.0, 63.0, 27.0, 18.0, 18.0, 10.0, 9.0, 8.0, 16.0, 4.0, 4.0, 4.0, 5.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.0078125, -6.7576904296875, -6.507568359375, -6.2574462890625, -6.00732421875, -5.7572021484375, -5.507080078125, -5.2569580078125, -5.0068359375, -4.7567138671875, -4.506591796875, -4.2564697265625, -4.00634765625, -3.7562255859375, -3.506103515625, -3.2559814453125, -3.005859375, -2.7557373046875, -2.505615234375, -2.2554931640625, -2.00537109375, -1.7552490234375, -1.505126953125, -1.2550048828125, -1.0048828125, -0.7547607421875, -0.504638671875, -0.2545166015625, -0.00439453125, 0.2457275390625, 0.495849609375, 0.7459716796875, 0.99609375, 1.2462158203125, 1.496337890625, 1.7464599609375, 1.99658203125, 2.2467041015625, 2.496826171875, 2.7469482421875, 2.9970703125, 3.2471923828125, 3.497314453125, 3.7474365234375, 3.99755859375, 4.2476806640625, 4.497802734375, 4.7479248046875, 4.998046875, 5.2481689453125, 5.498291015625, 5.7484130859375, 5.99853515625, 6.2486572265625, 6.498779296875, 6.7489013671875, 6.9990234375, 7.2491455078125, 7.499267578125, 7.7493896484375, 7.99951171875, 8.2496337890625, 8.499755859375, 8.7498779296875, 9.0]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 5.0, 5.0, 9.0, 10.0, 27.0, 39.0, 75.0, 189.0, 380.0, 119.0, 47.0, 25.0, 13.0, 8.0, 7.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0045318603515625, -0.00438690185546875, -0.004241943359375, -0.00409698486328125, -0.0039520263671875, -0.00380706787109375, -0.003662109375, -0.00351715087890625, -0.0033721923828125, -0.00322723388671875, -0.003082275390625, -0.00293731689453125, -0.0027923583984375, -0.00264739990234375, -0.00250244140625, -0.00235748291015625, -0.0022125244140625, -0.00206756591796875, -0.001922607421875, -0.00177764892578125, -0.0016326904296875, -0.00148773193359375, -0.0013427734375, -0.00119781494140625, -0.0010528564453125, -0.00090789794921875, -0.000762939453125, -0.00061798095703125, -0.0004730224609375, -0.00032806396484375, -0.00018310546875, -3.814697265625e-05, 0.0001068115234375, 0.00025177001953125, 0.000396728515625, 0.00054168701171875, 0.0006866455078125, 0.00083160400390625, 0.0009765625, 0.00112152099609375, 0.0012664794921875, 0.00141143798828125, 0.001556396484375, 0.00170135498046875, 0.0018463134765625, 0.00199127197265625, 0.00213623046875, 0.00228118896484375, 0.0024261474609375, 0.00257110595703125, 0.002716064453125, 0.00286102294921875, 0.0030059814453125, 0.00315093994140625, 0.0032958984375, 0.00344085693359375, 0.0035858154296875, 0.00373077392578125, 0.003875732421875, 0.00402069091796875, 0.0041656494140625, 0.00431060791015625, 0.00445556640625, 0.00460052490234375, 0.0047454833984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 10.0, 20.0, 38.0, 56.0, 111.0, 199.0, 435.0, 899.0, 2136.0, 5879.0, 26030.0, 539796.0, 439510.0, 24151.0, 5585.0, 1978.0, 878.0, 393.0, 188.0, 108.0, 64.0, 28.0, 18.0, 18.0, 8.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.671875, -4.52105712890625, -4.3702392578125, -4.21942138671875, -4.068603515625, -3.91778564453125, -3.7669677734375, -3.61614990234375, -3.46533203125, -3.31451416015625, -3.1636962890625, -3.01287841796875, -2.862060546875, -2.71124267578125, -2.5604248046875, -2.40960693359375, -2.2587890625, -2.10797119140625, -1.9571533203125, -1.80633544921875, -1.655517578125, -1.50469970703125, -1.3538818359375, -1.20306396484375, -1.05224609375, -0.90142822265625, -0.7506103515625, -0.59979248046875, -0.448974609375, -0.29815673828125, -0.1473388671875, 0.00347900390625, 0.154296875, 0.30511474609375, 0.4559326171875, 0.60675048828125, 0.757568359375, 0.90838623046875, 1.0592041015625, 1.21002197265625, 1.36083984375, 1.51165771484375, 1.6624755859375, 1.81329345703125, 1.964111328125, 2.11492919921875, 2.2657470703125, 2.41656494140625, 2.5673828125, 2.71820068359375, 2.8690185546875, 3.01983642578125, 3.170654296875, 3.32147216796875, 3.4722900390625, 3.62310791015625, 3.77392578125, 3.92474365234375, 4.0755615234375, 4.22637939453125, 4.377197265625, 4.52801513671875, 4.6788330078125, 4.82965087890625, 4.98046875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 7.0, 11.0, 4.0, 14.0, 20.0, 23.0, 33.0, 40.0, 74.0, 90.0, 109.0, 140.0, 102.0, 89.0, 56.0, 42.0, 27.0, 29.0, 22.0, 15.0, 9.0, 9.0, 3.0, 3.0, 8.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2919921875, -1.25323486328125, -1.2144775390625, -1.17572021484375, -1.136962890625, -1.09820556640625, -1.0594482421875, -1.02069091796875, -0.98193359375, -0.94317626953125, -0.9044189453125, -0.86566162109375, -0.826904296875, -0.78814697265625, -0.7493896484375, -0.71063232421875, -0.671875, -0.63311767578125, -0.5943603515625, -0.55560302734375, -0.516845703125, -0.47808837890625, -0.4393310546875, -0.40057373046875, -0.36181640625, -0.32305908203125, -0.2843017578125, -0.24554443359375, -0.206787109375, -0.16802978515625, -0.1292724609375, -0.09051513671875, -0.0517578125, -0.01300048828125, 0.0257568359375, 0.06451416015625, 0.103271484375, 0.14202880859375, 0.1807861328125, 0.21954345703125, 0.25830078125, 0.29705810546875, 0.3358154296875, 0.37457275390625, 0.413330078125, 0.45208740234375, 0.4908447265625, 0.52960205078125, 0.568359375, 0.60711669921875, 0.6458740234375, 0.68463134765625, 0.723388671875, 0.76214599609375, 0.8009033203125, 0.83966064453125, 0.87841796875, 0.91717529296875, 0.9559326171875, 0.99468994140625, 1.033447265625, 1.07220458984375, 1.1109619140625, 1.14971923828125, 1.1884765625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 18.0, 37.0, 65.0, 131.0, 253.0, 202.0, 134.0, 73.0, 35.0, 18.0, 11.0, 8.0, 3.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.209115982055664, -9.817031860351562, -9.424946784973145, -9.032862663269043, -8.640777587890625, -8.248693466186523, -7.856608867645264, -7.464524269104004, -7.072439670562744, -6.680355072021484, -6.288270473480225, -5.896185874938965, -5.504101753234863, -5.112016677856445, -4.719932556152344, -4.327847957611084, -3.935763359069824, -3.5436787605285645, -3.1515941619873047, -2.759509801864624, -2.3674252033233643, -1.9753406047821045, -1.5832562446594238, -1.191171646118164, -0.7990870475769043, -0.4070025086402893, -0.014917969703674316, 0.3771665096282959, 0.7692511081695557, 1.1613357067108154, 1.553420066833496, 1.9455046653747559, 2.337588310241699, 2.729672908782959, 3.1217575073242188, 3.5138418674468994, 3.905926465988159, 4.29801082611084, 4.6900954246521, 5.082180023193359, 5.474264621734619, 5.866349220275879, 6.258433818817139, 6.650518417358398, 7.0426025390625, 7.434687614440918, 7.8267717361450195, 8.218856811523438, 8.610940933227539, 9.00302505493164, 9.395110130310059, 9.78719425201416, 10.179279327392578, 10.57136344909668, 10.963447570800781, 11.3555326461792, 11.747617721557617, 12.139701843261719, 12.531786918640137, 12.923871040344238, 13.315956115722656, 13.708040237426758, 14.10012435913086, 14.492209434509277, 14.884293556213379]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 6.0, 12.0, 19.0, 25.0, 32.0, 37.0, 46.0, 68.0, 65.0, 74.0, 87.0, 81.0, 79.0, 84.0, 53.0, 44.0, 45.0, 35.0, 32.0, 19.0, 11.0, 11.0, 10.0, 6.0, 5.0, 0.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.988197326660156, -6.805105209350586, -6.622012615203857, -6.438920497894287, -6.255827903747559, -6.072735786437988, -5.889643669128418, -5.7065510749816895, -5.523458480834961, -5.340366363525391, -5.157273769378662, -4.974181652069092, -4.791089057922363, -4.607996940612793, -4.424904823303223, -4.241812229156494, -4.058720111846924, -3.8756277561187744, -3.692535400390625, -3.5094432830810547, -3.326350688934326, -3.143258571624756, -2.9601662158966064, -2.777073860168457, -2.5939815044403076, -2.410889148712158, -2.227796792984009, -2.0447044372558594, -1.8616122007369995, -1.67851984500885, -1.4954276084899902, -1.3123352527618408, -1.1292428970336914, -0.946150541305542, -0.7630582451820374, -0.5799659490585327, -0.3968735933303833, -0.2137812376022339, -0.030689001083374023, 0.1524033546447754, 0.3354957103729248, 0.5185880661010742, 0.7016803622245789, 0.8847726583480835, 1.067865014076233, 1.2509573698043823, 1.4340496063232422, 1.6171419620513916, 1.800234317779541, 1.9833266735076904, 2.16641902923584, 2.34951114654541, 2.5326037406921387, 2.715695858001709, 2.8987882137298584, 3.081880569458008, 3.2649729251861572, 3.4480652809143066, 3.631157636642456, 3.8142499923706055, 3.997342109680176, 4.180434703826904, 4.363526821136475, 4.546619415283203, 4.729711532592773]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 8.0, 6.0, 2.0, 7.0, 9.0, 12.0, 12.0, 14.0, 12.0, 18.0, 16.0, 14.0, 30.0, 26.0, 111.0, 733.0, 3645006.0, 547006.0, 870.0, 170.0, 48.0, 22.0, 24.0, 18.0, 12.0, 14.0, 8.0, 12.0, 6.0, 6.0, 4.0, 8.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 6.0, 0.0, 2.0, 0.0, 2.0], "bins": [-21.75, -21.0244140625, -20.298828125, -19.5732421875, -18.84765625, -18.1220703125, -17.396484375, -16.6708984375, -15.9453125, -15.2197265625, -14.494140625, -13.7685546875, -13.04296875, -12.3173828125, -11.591796875, -10.8662109375, -10.140625, -9.4150390625, -8.689453125, -7.9638671875, -7.23828125, -6.5126953125, -5.787109375, -5.0615234375, -4.3359375, -3.6103515625, -2.884765625, -2.1591796875, -1.43359375, -0.7080078125, 0.017578125, 0.7431640625, 1.46875, 2.1943359375, 2.919921875, 3.6455078125, 4.37109375, 5.0966796875, 5.822265625, 6.5478515625, 7.2734375, 7.9990234375, 8.724609375, 9.4501953125, 10.17578125, 10.9013671875, 11.626953125, 12.3525390625, 13.078125, 13.8037109375, 14.529296875, 15.2548828125, 15.98046875, 16.7060546875, 17.431640625, 18.1572265625, 18.8828125, 19.6083984375, 20.333984375, 21.0595703125, 21.78515625, 22.5107421875, 23.236328125, 23.9619140625, 24.6875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 7.0, 1.0, 6.0, 2.0, 4.0, 8.0, 10.0, 7.0, 15.0, 23.0, 28.0, 36.0, 51.0, 57.0, 52.0, 56.0, 56.0, 77.0, 64.0, 61.0, 57.0, 65.0, 51.0, 54.0, 35.0, 25.0, 20.0, 26.0, 19.0, 16.0, 6.0, 8.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07513427734375, -0.07190227508544922, -0.06867027282714844, -0.06543827056884766, -0.062206268310546875, -0.058974266052246094, -0.05574226379394531, -0.05251026153564453, -0.04927825927734375, -0.04604625701904297, -0.04281425476074219, -0.039582252502441406, -0.036350250244140625, -0.033118247985839844, -0.029886245727539062, -0.02665424346923828, -0.0234222412109375, -0.02019023895263672, -0.016958236694335938, -0.013726234436035156, -0.010494232177734375, -0.007262229919433594, -0.0040302276611328125, -0.0007982254028320312, 0.00243377685546875, 0.005665779113769531, 0.008897781372070312, 0.012129783630371094, 0.015361785888671875, 0.018593788146972656, 0.021825790405273438, 0.02505779266357422, 0.028289794921875, 0.03152179718017578, 0.03475379943847656, 0.037985801696777344, 0.041217803955078125, 0.044449806213378906, 0.04768180847167969, 0.05091381072998047, 0.05414581298828125, 0.05737781524658203, 0.06060981750488281, 0.0638418197631836, 0.06707382202148438, 0.07030582427978516, 0.07353782653808594, 0.07676982879638672, 0.0800018310546875, 0.08323383331298828, 0.08646583557128906, 0.08969783782958984, 0.09292984008789062, 0.0961618423461914, 0.09939384460449219, 0.10262584686279297, 0.10585784912109375, 0.10908985137939453, 0.11232185363769531, 0.1155538558959961, 0.11878585815429688, 0.12201786041259766, 0.12524986267089844, 0.12848186492919922, 0.1317138671875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 38.0, 161.0, 2400.0, 4190946.0, 690.0, 43.0, 10.0, 4.0], "bins": [-74.1875, -72.9381103515625, -71.688720703125, -70.4393310546875, -69.18994140625, -67.9405517578125, -66.691162109375, -65.4417724609375, -64.1923828125, -62.9429931640625, -61.693603515625, -60.4442138671875, -59.19482421875, -57.9454345703125, -56.696044921875, -55.4466552734375, -54.197265625, -52.9478759765625, -51.698486328125, -50.4490966796875, -49.19970703125, -47.9503173828125, -46.700927734375, -45.4515380859375, -44.2021484375, -42.9527587890625, -41.703369140625, -40.4539794921875, -39.20458984375, -37.9552001953125, -36.705810546875, -35.4564208984375, -34.20703125, -32.9576416015625, -31.708251953125, -30.4588623046875, -29.20947265625, -27.9600830078125, -26.710693359375, -25.4613037109375, -24.2119140625, -22.9625244140625, -21.713134765625, -20.4637451171875, -19.21435546875, -17.9649658203125, -16.715576171875, -15.4661865234375, -14.216796875, -12.9674072265625, -11.718017578125, -10.4686279296875, -9.21923828125, -7.9698486328125, -6.720458984375, -5.4710693359375, -4.2216796875, -2.9722900390625, -1.722900390625, -0.4735107421875, 0.77587890625, 2.0252685546875, 3.274658203125, 4.5240478515625, 5.7734375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 0.0, 3.0, 10.0, 9.0, 6.0, 23.0, 14.0, 33.0, 38.0, 46.0, 84.0, 129.0, 230.0, 533.0, 1737.0, 545.0, 258.0, 136.0, 79.0, 53.0, 35.0, 17.0, 15.0, 7.0, 11.0, 10.0, 2.0, 2.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.46533203125, -0.4541282653808594, -0.44292449951171875, -0.4317207336425781, -0.4205169677734375, -0.4093132019042969, -0.39810943603515625, -0.3869056701660156, -0.375701904296875, -0.3644981384277344, -0.35329437255859375, -0.3420906066894531, -0.3308868408203125, -0.3196830749511719, -0.30847930908203125, -0.2972755432128906, -0.28607177734375, -0.2748680114746094, -0.26366424560546875, -0.2524604797363281, -0.2412567138671875, -0.23005294799804688, -0.21884918212890625, -0.20764541625976562, -0.196441650390625, -0.18523788452148438, -0.17403411865234375, -0.16283035278320312, -0.1516265869140625, -0.14042282104492188, -0.12921905517578125, -0.11801528930664062, -0.1068115234375, -0.09560775756835938, -0.08440399169921875, -0.07320022583007812, -0.0619964599609375, -0.050792694091796875, -0.03958892822265625, -0.028385162353515625, -0.017181396484375, -0.005977630615234375, 0.00522613525390625, 0.016429901123046875, 0.0276336669921875, 0.038837432861328125, 0.05004119873046875, 0.061244964599609375, 0.07244873046875, 0.08365249633789062, 0.09485626220703125, 0.10606002807617188, 0.1172637939453125, 0.12846755981445312, 0.13967132568359375, 0.15087509155273438, 0.162078857421875, 0.17328262329101562, 0.18448638916015625, 0.19569015502929688, 0.2068939208984375, 0.21809768676757812, 0.22930145263671875, 0.24050521850585938, 0.251708984375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 439.0, 581.0, 1.0, 1.0], "bins": [-183.40098571777344, -180.39559936523438, -177.39022827148438, -174.38485717773438, -171.3794708251953, -168.37408447265625, -165.36871337890625, -162.36334228515625, -159.3579559326172, -156.35256958007812, -153.34719848632812, -150.34182739257812, -147.33644104003906, -144.3310546875, -141.32568359375, -138.3203125, -135.31492614746094, -132.30953979492188, -129.30416870117188, -126.29878997802734, -123.29341125488281, -120.28803253173828, -117.28265380859375, -114.27727508544922, -111.27189636230469, -108.26651763916016, -105.26113891601562, -102.2557601928711, -99.25038146972656, -96.24500274658203, -93.2396240234375, -90.23424530029297, -87.22887420654297, -84.22349548339844, -81.2181167602539, -78.21273803710938, -75.20735931396484, -72.20198059082031, -69.19660186767578, -66.19122314453125, -63.18584060668945, -60.18046188354492, -57.17508316040039, -54.16970443725586, -51.16432571411133, -48.1589469909668, -45.153568267822266, -42.148189544677734, -39.1428108215332, -36.13743209838867, -33.13205337524414, -30.12667465209961, -27.121295928955078, -24.115917205810547, -21.110538482666016, -18.105159759521484, -15.09978199005127, -12.094403266906738, -9.089024543762207, -6.083645820617676, -3.0782670974731445, -0.07288837432861328, 2.932490348815918, 5.937869071960449, 8.94324779510498]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 4.0, 8.0, 15.0, 23.0, 40.0, 57.0, 85.0, 96.0, 96.0, 111.0, 107.0, 101.0, 70.0, 67.0, 37.0, 41.0, 18.0, 15.0, 9.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4474754333496094, -2.3467395305633545, -2.2460038661956787, -2.145267963409424, -2.044532299041748, -1.9437963962554932, -1.8430606126785278, -1.7423248291015625, -1.6415890455245972, -1.5408532619476318, -1.4401174783706665, -1.3393816947937012, -1.2386457920074463, -1.1379101276397705, -1.0371742248535156, -0.9364384412765503, -0.835702657699585, -0.7349668741226196, -0.6342310905456543, -0.5334952473640442, -0.43275946378707886, -0.3320236802101135, -0.23128783702850342, -0.13055205345153809, -0.029816269874572754, 0.07091952860355377, 0.1716553270816803, 0.272391140460968, 0.37312692403793335, 0.4738627076148987, 0.5745985507965088, 0.6753343343734741, 0.7760698795318604, 0.8768056631088257, 0.977541446685791, 1.078277349472046, 1.1790130138397217, 1.2797489166259766, 1.380484700202942, 1.4812204837799072, 1.5819562673568726, 1.682692050933838, 1.7834278345108032, 1.8841636180877686, 1.9848995208740234, 2.085635185241699, 2.186371088027954, 2.287106990814209, 2.3878426551818848, 2.4885785579681396, 2.5893142223358154, 2.6900501251220703, 2.790785789489746, 2.891521692276001, 2.992257595062256, 3.0929932594299316, 3.1937289237976074, 3.2944648265838623, 3.395200490951538, 3.495936393737793, 3.5966720581054688, 3.6974079608917236, 3.7981438636779785, 3.8988795280456543, 3.999615430831909]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 5.0, 8.0, 6.0, 13.0, 13.0, 16.0, 16.0, 22.0, 22.0, 31.0, 34.0, 41.0, 54.0, 51.0, 54.0, 89.0, 43607.0, 1003791.0, 267.0, 48.0, 58.0, 42.0, 43.0, 36.0, 27.0, 31.0, 20.0, 29.0, 14.0, 8.0, 11.0, 8.0, 7.0, 9.0, 6.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.1875, -18.52978515625, -17.8720703125, -17.21435546875, -16.556640625, -15.89892578125, -15.2412109375, -14.58349609375, -13.92578125, -13.26806640625, -12.6103515625, -11.95263671875, -11.294921875, -10.63720703125, -9.9794921875, -9.32177734375, -8.6640625, -8.00634765625, -7.3486328125, -6.69091796875, -6.033203125, -5.37548828125, -4.7177734375, -4.06005859375, -3.40234375, -2.74462890625, -2.0869140625, -1.42919921875, -0.771484375, -0.11376953125, 0.5439453125, 1.20166015625, 1.859375, 2.51708984375, 3.1748046875, 3.83251953125, 4.490234375, 5.14794921875, 5.8056640625, 6.46337890625, 7.12109375, 7.77880859375, 8.4365234375, 9.09423828125, 9.751953125, 10.40966796875, 11.0673828125, 11.72509765625, 12.3828125, 13.04052734375, 13.6982421875, 14.35595703125, 15.013671875, 15.67138671875, 16.3291015625, 16.98681640625, 17.64453125, 18.30224609375, 18.9599609375, 19.61767578125, 20.275390625, 20.93310546875, 21.5908203125, 22.24853515625, 22.90625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 59.0, 338.0, 480.0, 128.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1932373046875, -0.1563129425048828, -0.11938858032226562, -0.08246421813964844, -0.04553985595703125, -0.008615493774414062, 0.028308868408203125, 0.06523323059082031, 0.1021575927734375, 0.1390819549560547, 0.17600631713867188, 0.21293067932128906, 0.24985504150390625, 0.28677940368652344, 0.3237037658691406, 0.3606281280517578, 0.397552490234375, 0.4344768524169922, 0.4714012145996094, 0.5083255767822266, 0.5452499389648438, 0.5821743011474609, 0.6190986633300781, 0.6560230255126953, 0.6929473876953125, 0.7298717498779297, 0.7667961120605469, 0.8037204742431641, 0.8406448364257812, 0.8775691986083984, 0.9144935607910156, 0.9514179229736328, 0.98834228515625, 1.0252666473388672, 1.0621910095214844, 1.0991153717041016, 1.1360397338867188, 1.172964096069336, 1.2098884582519531, 1.2468128204345703, 1.2837371826171875, 1.3206615447998047, 1.3575859069824219, 1.394510269165039, 1.4314346313476562, 1.4683589935302734, 1.5052833557128906, 1.5422077178955078, 1.579132080078125, 1.6160564422607422, 1.6529808044433594, 1.6899051666259766, 1.7268295288085938, 1.763753890991211, 1.8006782531738281, 1.8376026153564453, 1.8745269775390625, 1.9114513397216797, 1.9483757019042969, 1.985300064086914, 2.0222244262695312, 2.0591487884521484, 2.0960731506347656, 2.132997512817383, 2.169921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 2.0, 11.0, 7.0, 8.0, 16.0, 27.0, 31.0, 39.0, 62.0, 102.0, 159.0, 220.0, 356.0, 658.0, 1310.0, 2678.0, 6772.0, 19287.0, 73136.0, 419572.0, 419453.0, 73146.0, 19243.0, 6488.0, 2648.0, 1396.0, 671.0, 374.0, 221.0, 116.0, 102.0, 76.0, 51.0, 31.0, 22.0, 18.0, 11.0, 11.0, 8.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.5859375, -4.4510498046875, -4.316162109375, -4.1812744140625, -4.04638671875, -3.9114990234375, -3.776611328125, -3.6417236328125, -3.5068359375, -3.3719482421875, -3.237060546875, -3.1021728515625, -2.96728515625, -2.8323974609375, -2.697509765625, -2.5626220703125, -2.427734375, -2.2928466796875, -2.157958984375, -2.0230712890625, -1.88818359375, -1.7532958984375, -1.618408203125, -1.4835205078125, -1.3486328125, -1.2137451171875, -1.078857421875, -0.9439697265625, -0.80908203125, -0.6741943359375, -0.539306640625, -0.4044189453125, -0.26953125, -0.1346435546875, 0.000244140625, 0.1351318359375, 0.27001953125, 0.4049072265625, 0.539794921875, 0.6746826171875, 0.8095703125, 0.9444580078125, 1.079345703125, 1.2142333984375, 1.34912109375, 1.4840087890625, 1.618896484375, 1.7537841796875, 1.888671875, 2.0235595703125, 2.158447265625, 2.2933349609375, 2.42822265625, 2.5631103515625, 2.697998046875, 2.8328857421875, 2.9677734375, 3.1026611328125, 3.237548828125, 3.3724365234375, 3.50732421875, 3.6422119140625, 3.777099609375, 3.9119873046875, 4.046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 6.0, 9.0, 12.0, 14.0, 17.0, 24.0, 23.0, 18.0, 43.0, 40.0, 51.0, 48.0, 56.0, 55.0, 69.0, 70.0, 56.0, 64.0, 48.0, 47.0, 38.0, 34.0, 31.0, 28.0, 25.0, 16.0, 8.0, 7.0, 3.0, 11.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8681640625, -1.812957763671875, -1.75775146484375, -1.702545166015625, -1.6473388671875, -1.592132568359375, -1.53692626953125, -1.481719970703125, -1.426513671875, -1.371307373046875, -1.31610107421875, -1.260894775390625, -1.2056884765625, -1.150482177734375, -1.09527587890625, -1.040069580078125, -0.98486328125, -0.929656982421875, -0.87445068359375, -0.819244384765625, -0.7640380859375, -0.708831787109375, -0.65362548828125, -0.598419189453125, -0.543212890625, -0.488006591796875, -0.43280029296875, -0.377593994140625, -0.3223876953125, -0.267181396484375, -0.21197509765625, -0.156768798828125, -0.1015625, -0.046356201171875, 0.00885009765625, 0.064056396484375, 0.1192626953125, 0.174468994140625, 0.22967529296875, 0.284881591796875, 0.340087890625, 0.395294189453125, 0.45050048828125, 0.505706787109375, 0.5609130859375, 0.616119384765625, 0.67132568359375, 0.726531982421875, 0.78173828125, 0.836944580078125, 0.89215087890625, 0.947357177734375, 1.0025634765625, 1.057769775390625, 1.11297607421875, 1.168182373046875, 1.223388671875, 1.278594970703125, 1.33380126953125, 1.389007568359375, 1.4442138671875, 1.499420166015625, 1.55462646484375, 1.609832763671875, 1.6650390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 12.0, 11.0, 22.0, 37.0, 47.0, 115.0, 237.0, 603.0, 1494.0, 5158.0, 28800.0, 545762.0, 434341.0, 24811.0, 4693.0, 1458.0, 468.0, 245.0, 99.0, 49.0, 34.0, 19.0, 17.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.48046875, -7.2535400390625, -7.026611328125, -6.7996826171875, -6.57275390625, -6.3458251953125, -6.118896484375, -5.8919677734375, -5.6650390625, -5.4381103515625, -5.211181640625, -4.9842529296875, -4.75732421875, -4.5303955078125, -4.303466796875, -4.0765380859375, -3.849609375, -3.6226806640625, -3.395751953125, -3.1688232421875, -2.94189453125, -2.7149658203125, -2.488037109375, -2.2611083984375, -2.0341796875, -1.8072509765625, -1.580322265625, -1.3533935546875, -1.12646484375, -0.8995361328125, -0.672607421875, -0.4456787109375, -0.21875, 0.0081787109375, 0.235107421875, 0.4620361328125, 0.68896484375, 0.9158935546875, 1.142822265625, 1.3697509765625, 1.5966796875, 1.8236083984375, 2.050537109375, 2.2774658203125, 2.50439453125, 2.7313232421875, 2.958251953125, 3.1851806640625, 3.412109375, 3.6390380859375, 3.865966796875, 4.0928955078125, 4.31982421875, 4.5467529296875, 4.773681640625, 5.0006103515625, 5.2275390625, 5.4544677734375, 5.681396484375, 5.9083251953125, 6.13525390625, 6.3621826171875, 6.589111328125, 6.8160400390625, 7.04296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 9.0, 10.0, 13.0, 20.0, 23.0, 31.0, 33.0, 35.0, 56.0, 63.0, 94.0, 101.0, 94.0, 94.0, 72.0, 55.0, 37.0, 38.0, 25.0, 22.0, 16.0, 12.0, 8.0, 8.0, 8.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0012445449829101562, -0.0012093782424926758, -0.0011742115020751953, -0.0011390447616577148, -0.0011038780212402344, -0.001068711280822754, -0.0010335445404052734, -0.000998377799987793, -0.0009632110595703125, -0.000928044319152832, -0.0008928775787353516, -0.0008577108383178711, -0.0008225440979003906, -0.0007873773574829102, -0.0007522106170654297, -0.0007170438766479492, -0.0006818771362304688, -0.0006467103958129883, -0.0006115436553955078, -0.0005763769149780273, -0.0005412101745605469, -0.0005060434341430664, -0.00047087669372558594, -0.00043570995330810547, -0.000400543212890625, -0.00036537647247314453, -0.00033020973205566406, -0.0002950429916381836, -0.0002598762512207031, -0.00022470951080322266, -0.0001895427703857422, -0.00015437602996826172, -0.00011920928955078125, -8.404254913330078e-05, -4.887580871582031e-05, -1.3709068298339844e-05, 2.1457672119140625e-05, 5.6624412536621094e-05, 9.179115295410156e-05, 0.00012695789337158203, 0.0001621246337890625, 0.00019729137420654297, 0.00023245811462402344, 0.0002676248550415039, 0.0003027915954589844, 0.00033795833587646484, 0.0003731250762939453, 0.0004082918167114258, 0.00044345855712890625, 0.0004786252975463867, 0.0005137920379638672, 0.0005489587783813477, 0.0005841255187988281, 0.0006192922592163086, 0.0006544589996337891, 0.0006896257400512695, 0.00072479248046875, 0.0007599592208862305, 0.0007951259613037109, 0.0008302927017211914, 0.0008654594421386719, 0.0009006261825561523, 0.0009357929229736328, 0.0009709596633911133, 0.0010061264038085938]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 1.0, 3.0, 4.0, 8.0, 17.0, 20.0, 31.0, 45.0, 68.0, 117.0, 185.0, 383.0, 878.0, 2329.0, 8075.0, 41826.0, 642154.0, 318858.0, 24763.0, 5501.0, 1784.0, 728.0, 324.0, 164.0, 96.0, 77.0, 42.0, 26.0, 18.0, 5.0, 6.0, 1.0, 3.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71484375, -4.5252685546875, -4.335693359375, -4.1461181640625, -3.95654296875, -3.7669677734375, -3.577392578125, -3.3878173828125, -3.1982421875, -3.0086669921875, -2.819091796875, -2.6295166015625, -2.43994140625, -2.2503662109375, -2.060791015625, -1.8712158203125, -1.681640625, -1.4920654296875, -1.302490234375, -1.1129150390625, -0.92333984375, -0.7337646484375, -0.544189453125, -0.3546142578125, -0.1650390625, 0.0245361328125, 0.214111328125, 0.4036865234375, 0.59326171875, 0.7828369140625, 0.972412109375, 1.1619873046875, 1.3515625, 1.5411376953125, 1.730712890625, 1.9202880859375, 2.10986328125, 2.2994384765625, 2.489013671875, 2.6785888671875, 2.8681640625, 3.0577392578125, 3.247314453125, 3.4368896484375, 3.62646484375, 3.8160400390625, 4.005615234375, 4.1951904296875, 4.384765625, 4.5743408203125, 4.763916015625, 4.9534912109375, 5.14306640625, 5.3326416015625, 5.522216796875, 5.7117919921875, 5.9013671875, 6.0909423828125, 6.280517578125, 6.4700927734375, 6.65966796875, 6.8492431640625, 7.038818359375, 7.2283935546875, 7.41796875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 3.0, 3.0, 4.0, 12.0, 13.0, 12.0, 13.0, 14.0, 23.0, 34.0, 35.0, 64.0, 86.0, 87.0, 104.0, 107.0, 96.0, 69.0, 56.0, 40.0, 33.0, 33.0, 14.0, 11.0, 8.0, 12.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4013671875, -1.3451690673828125, -1.288970947265625, -1.2327728271484375, -1.17657470703125, -1.1203765869140625, -1.064178466796875, -1.0079803466796875, -0.9517822265625, -0.8955841064453125, -0.839385986328125, -0.7831878662109375, -0.72698974609375, -0.6707916259765625, -0.614593505859375, -0.5583953857421875, -0.502197265625, -0.4459991455078125, -0.389801025390625, -0.3336029052734375, -0.27740478515625, -0.2212066650390625, -0.165008544921875, -0.1088104248046875, -0.0526123046875, 0.0035858154296875, 0.059783935546875, 0.1159820556640625, 0.17218017578125, 0.2283782958984375, 0.284576416015625, 0.3407745361328125, 0.39697265625, 0.4531707763671875, 0.509368896484375, 0.5655670166015625, 0.62176513671875, 0.6779632568359375, 0.734161376953125, 0.7903594970703125, 0.8465576171875, 0.9027557373046875, 0.958953857421875, 1.0151519775390625, 1.07135009765625, 1.1275482177734375, 1.183746337890625, 1.2399444580078125, 1.296142578125, 1.3523406982421875, 1.408538818359375, 1.4647369384765625, 1.52093505859375, 1.5771331787109375, 1.633331298828125, 1.6895294189453125, 1.7457275390625, 1.8019256591796875, 1.858123779296875, 1.9143218994140625, 1.97052001953125, 2.0267181396484375, 2.082916259765625, 2.1391143798828125, 2.1953125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 13.0, 32.0, 199.0, 551.0, 163.0, 24.0, 10.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.590049743652344, -37.161651611328125, -34.733253479003906, -32.30485153198242, -29.876453399658203, -27.448055267333984, -25.019655227661133, -22.59125518798828, -20.162857055664062, -17.734458923339844, -15.306058883666992, -12.877659797668457, -10.449260711669922, -8.020861625671387, -5.592462539672852, -3.1640625, -0.7356643676757812, 1.692734718322754, 4.121133804321289, 6.549532890319824, 8.97793197631836, 11.406331062316895, 13.83473014831543, 16.26313018798828, 18.6915283203125, 21.11992645263672, 23.54832649230957, 25.976726531982422, 28.40512466430664, 30.83352279663086, 33.261924743652344, 35.69032287597656, 38.11872863769531, 40.54712677001953, 42.97552490234375, 45.403926849365234, 47.83232498168945, 50.26072311401367, 52.689125061035156, 55.117523193359375, 57.545921325683594, 59.97431945800781, 62.40271759033203, 64.83111572265625, 67.259521484375, 69.68791961669922, 72.11631774902344, 74.54471588134766, 76.97311401367188, 79.4015121459961, 81.82991027832031, 84.25830841064453, 86.68670654296875, 89.1151123046875, 91.54351043701172, 93.97190856933594, 96.40030670166016, 98.82870483398438, 101.2571029663086, 103.68550109863281, 106.11390686035156, 108.54230499267578, 110.970703125, 113.39910125732422, 115.82749938964844]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 7.0, 12.0, 14.0, 9.0, 17.0, 22.0, 23.0, 24.0, 34.0, 33.0, 41.0, 36.0, 50.0, 52.0, 45.0, 50.0, 56.0, 48.0, 59.0, 44.0, 34.0, 40.0, 48.0, 33.0, 25.0, 26.0, 22.0, 15.0, 9.0, 16.0, 13.0, 11.0, 5.0, 4.0, 5.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.888134002685547, -8.56002426147461, -8.231915473937988, -7.903806209564209, -7.57569694519043, -7.24758768081665, -6.919478416442871, -6.591369152069092, -6.2632598876953125, -5.935150623321533, -5.607041358947754, -5.278932094573975, -4.950822830200195, -4.622713565826416, -4.294604301452637, -3.9664950370788574, -3.638385772705078, -3.310276508331299, -2.9821672439575195, -2.6540579795837402, -2.325948715209961, -1.9978394508361816, -1.6697301864624023, -1.341620922088623, -1.0135116577148438, -0.6854023933410645, -0.35729312896728516, -0.02918386459350586, 0.29892539978027344, 0.6270346641540527, 0.955143928527832, 1.2832531929016113, 1.6113615036010742, 1.9394707679748535, 2.267580032348633, 2.595689296722412, 2.9237985610961914, 3.2519078254699707, 3.58001708984375, 3.9081263542175293, 4.236235618591309, 4.564344882965088, 4.892454147338867, 5.2205634117126465, 5.548672676086426, 5.876781940460205, 6.204891204833984, 6.533000469207764, 6.861109733581543, 7.189218997955322, 7.517328262329102, 7.845437526702881, 8.17354679107666, 8.501655578613281, 8.829765319824219, 9.157875061035156, 9.485983848571777, 9.814092636108398, 10.142202377319336, 10.470312118530273, 10.798420906066895, 11.126529693603516, 11.454639434814453, 11.78274917602539, 12.110857963562012]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 38.0, 415.0, 4167683.0, 25398.0, 326.0, 144.0, 88.0, 68.0, 56.0, 27.0, 19.0, 13.0, 7.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.375, -66.083984375, -63.79296875, -61.501953125, -59.2109375, -56.919921875, -54.62890625, -52.337890625, -50.046875, -47.755859375, -45.46484375, -43.173828125, -40.8828125, -38.591796875, -36.30078125, -34.009765625, -31.71875, -29.427734375, -27.13671875, -24.845703125, -22.5546875, -20.263671875, -17.97265625, -15.681640625, -13.390625, -11.099609375, -8.80859375, -6.517578125, -4.2265625, -1.935546875, 0.35546875, 2.646484375, 4.9375, 7.228515625, 9.51953125, 11.810546875, 14.1015625, 16.392578125, 18.68359375, 20.974609375, 23.265625, 25.556640625, 27.84765625, 30.138671875, 32.4296875, 34.720703125, 37.01171875, 39.302734375, 41.59375, 43.884765625, 46.17578125, 48.466796875, 50.7578125, 53.048828125, 55.33984375, 57.630859375, 59.921875, 62.212890625, 64.50390625, 66.794921875, 69.0859375, 71.376953125, 73.66796875, 75.958984375, 78.25]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 11.0, 43.0, 110.0, 223.0, 237.0, 214.0, 124.0, 31.0, 14.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.270751953125, -0.23487472534179688, -0.19899749755859375, -0.16312026977539062, -0.1272430419921875, -0.09136581420898438, -0.05548858642578125, -0.019611358642578125, 0.016265869140625, 0.052143096923828125, 0.08802032470703125, 0.12389755249023438, 0.1597747802734375, 0.19565200805664062, 0.23152923583984375, 0.2674064636230469, 0.30328369140625, 0.3391609191894531, 0.37503814697265625, 0.4109153747558594, 0.4467926025390625, 0.4826698303222656, 0.5185470581054688, 0.5544242858886719, 0.590301513671875, 0.6261787414550781, 0.6620559692382812, 0.6979331970214844, 0.7338104248046875, 0.7696876525878906, 0.8055648803710938, 0.8414421081542969, 0.8773193359375, 0.9131965637207031, 0.9490737915039062, 0.9849510192871094, 1.0208282470703125, 1.0567054748535156, 1.0925827026367188, 1.1284599304199219, 1.164337158203125, 1.2002143859863281, 1.2360916137695312, 1.2719688415527344, 1.3078460693359375, 1.3437232971191406, 1.3796005249023438, 1.4154777526855469, 1.45135498046875, 1.4872322082519531, 1.5231094360351562, 1.5589866638183594, 1.5948638916015625, 1.6307411193847656, 1.6666183471679688, 1.7024955749511719, 1.738372802734375, 1.7742500305175781, 1.8101272583007812, 1.8460044860839844, 1.8818817138671875, 1.9177589416503906, 1.9536361694335938, 1.9895133972167969, 2.025390625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 14.0, 14.0, 14.0, 25.0, 40.0, 51.0, 90.0, 106.0, 122.0, 161.0, 482.0, 82163.0, 4109432.0, 801.0, 192.0, 134.0, 125.0, 100.0, 70.0, 45.0, 32.0, 27.0, 17.0, 7.0, 7.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.5625, -97.08056640625, -94.5986328125, -92.11669921875, -89.634765625, -87.15283203125, -84.6708984375, -82.18896484375, -79.70703125, -77.22509765625, -74.7431640625, -72.26123046875, -69.779296875, -67.29736328125, -64.8154296875, -62.33349609375, -59.8515625, -57.36962890625, -54.8876953125, -52.40576171875, -49.923828125, -47.44189453125, -44.9599609375, -42.47802734375, -39.99609375, -37.51416015625, -35.0322265625, -32.55029296875, -30.068359375, -27.58642578125, -25.1044921875, -22.62255859375, -20.140625, -17.65869140625, -15.1767578125, -12.69482421875, -10.212890625, -7.73095703125, -5.2490234375, -2.76708984375, -0.28515625, 2.19677734375, 4.6787109375, 7.16064453125, 9.642578125, 12.12451171875, 14.6064453125, 17.08837890625, 19.5703125, 22.05224609375, 24.5341796875, 27.01611328125, 29.498046875, 31.97998046875, 34.4619140625, 36.94384765625, 39.42578125, 41.90771484375, 44.3896484375, 46.87158203125, 49.353515625, 51.83544921875, 54.3173828125, 56.79931640625, 59.28125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 7.0, 13.0, 24.0, 35.0, 80.0, 192.0, 2690.0, 892.0, 114.0, 25.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33984375, -2.20880126953125, -2.0777587890625, -1.94671630859375, -1.815673828125, -1.68463134765625, -1.5535888671875, -1.42254638671875, -1.29150390625, -1.16046142578125, -1.0294189453125, -0.89837646484375, -0.767333984375, -0.63629150390625, -0.5052490234375, -0.37420654296875, -0.2431640625, -0.11212158203125, 0.0189208984375, 0.14996337890625, 0.281005859375, 0.41204833984375, 0.5430908203125, 0.67413330078125, 0.80517578125, 0.93621826171875, 1.0672607421875, 1.19830322265625, 1.329345703125, 1.46038818359375, 1.5914306640625, 1.72247314453125, 1.853515625, 1.98455810546875, 2.1156005859375, 2.24664306640625, 2.377685546875, 2.50872802734375, 2.6397705078125, 2.77081298828125, 2.90185546875, 3.03289794921875, 3.1639404296875, 3.29498291015625, 3.426025390625, 3.55706787109375, 3.6881103515625, 3.81915283203125, 3.9501953125, 4.08123779296875, 4.2122802734375, 4.34332275390625, 4.474365234375, 4.60540771484375, 4.7364501953125, 4.86749267578125, 4.99853515625, 5.12957763671875, 5.2606201171875, 5.39166259765625, 5.522705078125, 5.65374755859375, 5.7847900390625, 5.91583251953125, 6.046875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 11.0, 16.0, 40.0, 148.0, 562.0, 180.0, 36.0, 9.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-134.80123901367188, -132.2401580810547, -129.67906188964844, -127.11798095703125, -124.55690002441406, -121.99581146240234, -119.43473052978516, -116.87364196777344, -114.31256103515625, -111.75147247314453, -109.19039154052734, -106.62930297851562, -104.06822204589844, -101.50713348388672, -98.94605255126953, -96.38496398925781, -93.82388305664062, -91.2627944946289, -88.70171356201172, -86.140625, -83.57954406738281, -81.0184555053711, -78.4573745727539, -75.89628601074219, -73.33519744873047, -70.77410888671875, -68.21302795410156, -65.65193939208984, -63.090858459472656, -60.5297737121582, -57.96868896484375, -55.40760040283203, -52.84651565551758, -50.285430908203125, -47.72434616088867, -45.16326141357422, -42.602176666259766, -40.04109191894531, -37.480003356933594, -34.918922424316406, -32.35783386230469, -29.796749114990234, -27.23566436767578, -24.674579620361328, -22.113494873046875, -19.552410125732422, -16.991323471069336, -14.430238723754883, -11.869155883789062, -9.30807113647461, -6.746985912322998, -4.185900688171387, -1.6248159408569336, 0.9362688064575195, 3.497354507446289, 6.058439254760742, 8.619524002075195, 11.180608749389648, 13.741693496704102, 16.302780151367188, 18.86386489868164, 21.424949645996094, 23.986034393310547, 26.547119140625, 29.108203887939453]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 18.0, 22.0, 34.0, 56.0, 53.0, 83.0, 96.0, 111.0, 92.0, 101.0, 88.0, 70.0, 52.0, 49.0, 24.0, 19.0, 15.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.984966278076172, -18.52027130126953, -18.055574417114258, -17.590879440307617, -17.126182556152344, -16.661487579345703, -16.19679069519043, -15.732095718383789, -15.267398834228516, -14.802702903747559, -14.338006973266602, -13.873311042785645, -13.408615112304688, -12.94391918182373, -12.479223251342773, -12.014528274536133, -11.549832344055176, -11.085136413574219, -10.620440483093262, -10.155744552612305, -9.691048622131348, -9.22635269165039, -8.76165771484375, -8.296960830688477, -7.832265377044678, -7.367569446563721, -6.902873516082764, -6.438178062438965, -5.973482131958008, -5.508786201477051, -5.044090270996094, -4.579394340515137, -4.11469841003418, -3.6500024795532227, -3.1853065490722656, -2.7206108570098877, -2.2559149265289307, -1.7912189960479736, -1.3265233039855957, -0.8618273735046387, -0.39713144302368164, 0.06756442785263062, 0.5322602987289429, 0.9969561100006104, 1.4616520404815674, 1.9263479709625244, 2.3910436630249023, 2.8557395935058594, 3.3204355239868164, 3.7851314544677734, 4.2498273849487305, 4.7145233154296875, 5.1792192459106445, 5.643915176391602, 6.1086106300354, 6.573306560516357, 7.0380024909973145, 7.5026984214782715, 7.9673943519592285, 8.432089805603027, 8.896785736083984, 9.361481666564941, 9.826177597045898, 10.290873527526855, 10.755569458007812]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 2.0, 2.0, 3.0, 6.0, 9.0, 7.0, 13.0, 12.0, 17.0, 18.0, 34.0, 37.0, 71.0, 116.0, 171.0, 299.0, 513.0, 1210.0, 4271.0, 26250.0, 487803.0, 494271.0, 26602.0, 4264.0, 1219.0, 534.0, 271.0, 170.0, 97.0, 61.0, 51.0, 31.0, 22.0, 25.0, 19.0, 11.0, 7.0, 7.0, 6.0, 6.0, 0.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.125, -16.55419921875, -15.9833984375, -15.41259765625, -14.841796875, -14.27099609375, -13.7001953125, -13.12939453125, -12.55859375, -11.98779296875, -11.4169921875, -10.84619140625, -10.275390625, -9.70458984375, -9.1337890625, -8.56298828125, -7.9921875, -7.42138671875, -6.8505859375, -6.27978515625, -5.708984375, -5.13818359375, -4.5673828125, -3.99658203125, -3.42578125, -2.85498046875, -2.2841796875, -1.71337890625, -1.142578125, -0.57177734375, -0.0009765625, 0.56982421875, 1.140625, 1.71142578125, 2.2822265625, 2.85302734375, 3.423828125, 3.99462890625, 4.5654296875, 5.13623046875, 5.70703125, 6.27783203125, 6.8486328125, 7.41943359375, 7.990234375, 8.56103515625, 9.1318359375, 9.70263671875, 10.2734375, 10.84423828125, 11.4150390625, 11.98583984375, 12.556640625, 13.12744140625, 13.6982421875, 14.26904296875, 14.83984375, 15.41064453125, 15.9814453125, 16.55224609375, 17.123046875, 17.69384765625, 18.2646484375, 18.83544921875, 19.40625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 27.0, 63.0, 89.0, 142.0, 210.0, 170.0, 137.0, 76.0, 49.0, 19.0, 7.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.744140625, -0.694305419921875, -0.64447021484375, -0.594635009765625, -0.5447998046875, -0.494964599609375, -0.44512939453125, -0.395294189453125, -0.345458984375, -0.295623779296875, -0.24578857421875, -0.195953369140625, -0.1461181640625, -0.096282958984375, -0.04644775390625, 0.003387451171875, 0.05322265625, 0.103057861328125, 0.15289306640625, 0.202728271484375, 0.2525634765625, 0.302398681640625, 0.35223388671875, 0.402069091796875, 0.451904296875, 0.501739501953125, 0.55157470703125, 0.601409912109375, 0.6512451171875, 0.701080322265625, 0.75091552734375, 0.800750732421875, 0.8505859375, 0.900421142578125, 0.95025634765625, 1.000091552734375, 1.0499267578125, 1.099761962890625, 1.14959716796875, 1.199432373046875, 1.249267578125, 1.299102783203125, 1.34893798828125, 1.398773193359375, 1.4486083984375, 1.498443603515625, 1.54827880859375, 1.598114013671875, 1.64794921875, 1.697784423828125, 1.74761962890625, 1.797454833984375, 1.8472900390625, 1.897125244140625, 1.94696044921875, 1.996795654296875, 2.046630859375, 2.096466064453125, 2.14630126953125, 2.196136474609375, 2.2459716796875, 2.295806884765625, 2.34564208984375, 2.395477294921875, 2.4453125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 7.0, 5.0, 8.0, 15.0, 21.0, 14.0, 24.0, 25.0, 51.0, 68.0, 96.0, 146.0, 208.0, 310.0, 437.0, 853.0, 1382.0, 2682.0, 6052.0, 15605.0, 51277.0, 219029.0, 507382.0, 175781.0, 42832.0, 13049.0, 5222.0, 2440.0, 1372.0, 723.0, 469.0, 310.0, 200.0, 149.0, 84.0, 54.0, 45.0, 37.0, 25.0, 11.0, 11.0, 6.0, 10.0, 8.0, 7.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.25390625, -5.08123779296875, -4.9085693359375, -4.73590087890625, -4.563232421875, -4.39056396484375, -4.2178955078125, -4.04522705078125, -3.87255859375, -3.69989013671875, -3.5272216796875, -3.35455322265625, -3.181884765625, -3.00921630859375, -2.8365478515625, -2.66387939453125, -2.4912109375, -2.31854248046875, -2.1458740234375, -1.97320556640625, -1.800537109375, -1.62786865234375, -1.4552001953125, -1.28253173828125, -1.10986328125, -0.93719482421875, -0.7645263671875, -0.59185791015625, -0.419189453125, -0.24652099609375, -0.0738525390625, 0.09881591796875, 0.271484375, 0.44415283203125, 0.6168212890625, 0.78948974609375, 0.962158203125, 1.13482666015625, 1.3074951171875, 1.48016357421875, 1.65283203125, 1.82550048828125, 1.9981689453125, 2.17083740234375, 2.343505859375, 2.51617431640625, 2.6888427734375, 2.86151123046875, 3.0341796875, 3.20684814453125, 3.3795166015625, 3.55218505859375, 3.724853515625, 3.89752197265625, 4.0701904296875, 4.24285888671875, 4.41552734375, 4.58819580078125, 4.7608642578125, 4.93353271484375, 5.106201171875, 5.27886962890625, 5.4515380859375, 5.62420654296875, 5.796875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 2.0, 5.0, 8.0, 8.0, 8.0, 11.0, 15.0, 25.0, 30.0, 32.0, 34.0, 43.0, 41.0, 48.0, 59.0, 62.0, 61.0, 55.0, 53.0, 59.0, 46.0, 32.0, 39.0, 42.0, 32.0, 35.0, 26.0, 15.0, 14.0, 17.0, 8.0, 7.0, 8.0, 2.0, 3.0, 6.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.47265625, -2.38543701171875, -2.2982177734375, -2.21099853515625, -2.123779296875, -2.03656005859375, -1.9493408203125, -1.86212158203125, -1.77490234375, -1.68768310546875, -1.6004638671875, -1.51324462890625, -1.426025390625, -1.33880615234375, -1.2515869140625, -1.16436767578125, -1.0771484375, -0.98992919921875, -0.9027099609375, -0.81549072265625, -0.728271484375, -0.64105224609375, -0.5538330078125, -0.46661376953125, -0.37939453125, -0.29217529296875, -0.2049560546875, -0.11773681640625, -0.030517578125, 0.05670166015625, 0.1439208984375, 0.23114013671875, 0.318359375, 0.40557861328125, 0.4927978515625, 0.58001708984375, 0.667236328125, 0.75445556640625, 0.8416748046875, 0.92889404296875, 1.01611328125, 1.10333251953125, 1.1905517578125, 1.27777099609375, 1.364990234375, 1.45220947265625, 1.5394287109375, 1.62664794921875, 1.7138671875, 1.80108642578125, 1.8883056640625, 1.97552490234375, 2.062744140625, 2.14996337890625, 2.2371826171875, 2.32440185546875, 2.41162109375, 2.49884033203125, 2.5860595703125, 2.67327880859375, 2.760498046875, 2.84771728515625, 2.9349365234375, 3.02215576171875, 3.109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 10.0, 9.0, 14.0, 18.0, 17.0, 33.0, 53.0, 80.0, 140.0, 193.0, 353.0, 644.0, 1213.0, 2703.0, 7790.0, 31785.0, 507107.0, 453374.0, 30148.0, 7535.0, 2590.0, 1187.0, 616.0, 335.0, 210.0, 113.0, 76.0, 45.0, 46.0, 24.0, 22.0, 13.0, 10.0, 8.0, 3.0, 4.0, 5.0, 6.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.7578125, -7.4805908203125, -7.203369140625, -6.9261474609375, -6.64892578125, -6.3717041015625, -6.094482421875, -5.8172607421875, -5.5400390625, -5.2628173828125, -4.985595703125, -4.7083740234375, -4.43115234375, -4.1539306640625, -3.876708984375, -3.5994873046875, -3.322265625, -3.0450439453125, -2.767822265625, -2.4906005859375, -2.21337890625, -1.9361572265625, -1.658935546875, -1.3817138671875, -1.1044921875, -0.8272705078125, -0.550048828125, -0.2728271484375, 0.00439453125, 0.2816162109375, 0.558837890625, 0.8360595703125, 1.11328125, 1.3905029296875, 1.667724609375, 1.9449462890625, 2.22216796875, 2.4993896484375, 2.776611328125, 3.0538330078125, 3.3310546875, 3.6082763671875, 3.885498046875, 4.1627197265625, 4.43994140625, 4.7171630859375, 4.994384765625, 5.2716064453125, 5.548828125, 5.8260498046875, 6.103271484375, 6.3804931640625, 6.65771484375, 6.9349365234375, 7.212158203125, 7.4893798828125, 7.7666015625, 8.0438232421875, 8.321044921875, 8.5982666015625, 8.87548828125, 9.1527099609375, 9.429931640625, 9.7071533203125, 9.984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 4.0, 12.0, 6.0, 15.0, 19.0, 28.0, 32.0, 39.0, 53.0, 55.0, 81.0, 90.0, 86.0, 102.0, 85.0, 57.0, 45.0, 44.0, 31.0, 17.0, 17.0, 16.0, 17.0, 11.0, 8.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.001194000244140625, -0.0011628344655036926, -0.0011316686868667603, -0.0011005029082298279, -0.0010693371295928955, -0.0010381713509559631, -0.0010070055723190308, -0.0009758397936820984, -0.000944674015045166, -0.0009135082364082336, -0.0008823424577713013, -0.0008511766791343689, -0.0008200109004974365, -0.0007888451218605042, -0.0007576793432235718, -0.0007265135645866394, -0.000695347785949707, -0.0006641820073127747, -0.0006330162286758423, -0.0006018504500389099, -0.0005706846714019775, -0.0005395188927650452, -0.0005083531141281128, -0.0004771873354911804, -0.00044602155685424805, -0.0004148557782173157, -0.0003836899995803833, -0.00035252422094345093, -0.00032135844230651855, -0.0002901926636695862, -0.0002590268850326538, -0.00022786110639572144, -0.00019669532775878906, -0.0001655295491218567, -0.00013436377048492432, -0.00010319799184799194, -7.203221321105957e-05, -4.08664345741272e-05, -9.700655937194824e-06, 2.146512269973755e-05, 5.263090133666992e-05, 8.37966799736023e-05, 0.00011496245861053467, 0.00014612823724746704, 0.00017729401588439941, 0.0002084597945213318, 0.00023962557315826416, 0.00027079135179519653, 0.0003019571304321289, 0.0003331229090690613, 0.00036428868770599365, 0.000395454466342926, 0.0004266202449798584, 0.00045778602361679077, 0.0004889518022537231, 0.0005201175808906555, 0.0005512833595275879, 0.0005824491381645203, 0.0006136149168014526, 0.000644780695438385, 0.0006759464740753174, 0.0007071122527122498, 0.0007382780313491821, 0.0007694438099861145, 0.0008006095886230469]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 7.0, 5.0, 14.0, 24.0, 34.0, 61.0, 116.0, 332.0, 837.0, 2889.0, 29802.0, 958823.0, 50107.0, 3853.0, 974.0, 360.0, 162.0, 67.0, 32.0, 27.0, 11.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-21.328125, -20.838623046875, -20.34912109375, -19.859619140625, -19.3701171875, -18.880615234375, -18.39111328125, -17.901611328125, -17.412109375, -16.922607421875, -16.43310546875, -15.943603515625, -15.4541015625, -14.964599609375, -14.47509765625, -13.985595703125, -13.49609375, -13.006591796875, -12.51708984375, -12.027587890625, -11.5380859375, -11.048583984375, -10.55908203125, -10.069580078125, -9.580078125, -9.090576171875, -8.60107421875, -8.111572265625, -7.6220703125, -7.132568359375, -6.64306640625, -6.153564453125, -5.6640625, -5.174560546875, -4.68505859375, -4.195556640625, -3.7060546875, -3.216552734375, -2.72705078125, -2.237548828125, -1.748046875, -1.258544921875, -0.76904296875, -0.279541015625, 0.2099609375, 0.699462890625, 1.18896484375, 1.678466796875, 2.16796875, 2.657470703125, 3.14697265625, 3.636474609375, 4.1259765625, 4.615478515625, 5.10498046875, 5.594482421875, 6.083984375, 6.573486328125, 7.06298828125, 7.552490234375, 8.0419921875, 8.531494140625, 9.02099609375, 9.510498046875, 10.0]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 11.0, 9.0, 19.0, 45.0, 75.0, 172.0, 251.0, 194.0, 103.0, 48.0, 32.0, 16.0, 11.0, 6.0, 8.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.59375, -7.41119384765625, -7.2286376953125, -7.04608154296875, -6.863525390625, -6.68096923828125, -6.4984130859375, -6.31585693359375, -6.13330078125, -5.95074462890625, -5.7681884765625, -5.58563232421875, -5.403076171875, -5.22052001953125, -5.0379638671875, -4.85540771484375, -4.6728515625, -4.49029541015625, -4.3077392578125, -4.12518310546875, -3.942626953125, -3.76007080078125, -3.5775146484375, -3.39495849609375, -3.21240234375, -3.02984619140625, -2.8472900390625, -2.66473388671875, -2.482177734375, -2.29962158203125, -2.1170654296875, -1.93450927734375, -1.751953125, -1.56939697265625, -1.3868408203125, -1.20428466796875, -1.021728515625, -0.83917236328125, -0.6566162109375, -0.47406005859375, -0.29150390625, -0.10894775390625, 0.0736083984375, 0.25616455078125, 0.438720703125, 0.62127685546875, 0.8038330078125, 0.98638916015625, 1.1689453125, 1.35150146484375, 1.5340576171875, 1.71661376953125, 1.899169921875, 2.08172607421875, 2.2642822265625, 2.44683837890625, 2.62939453125, 2.81195068359375, 2.9945068359375, 3.17706298828125, 3.359619140625, 3.54217529296875, 3.7247314453125, 3.90728759765625, 4.08984375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 9.0, 46.0, 302.0, 447.0, 150.0, 36.0, 11.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.36142349243164, -14.76602554321289, -11.170626640319824, -7.575227737426758, -3.979829788208008, -0.3844318389892578, 3.210968017578125, 6.806365966796875, 10.401763916015625, 13.997161865234375, 17.592559814453125, 21.187959671020508, 24.783357620239258, 28.378755569458008, 31.97415542602539, 35.56955337524414, 39.16495132446289, 42.76034927368164, 46.35574722290039, 49.951148986816406, 53.546546936035156, 57.141944885253906, 60.737342834472656, 64.3327407836914, 67.92813873291016, 71.5235366821289, 75.11893463134766, 78.7143325805664, 82.30973052978516, 85.9051284790039, 89.50053405761719, 93.09593200683594, 96.69132995605469, 100.28672790527344, 103.88212585449219, 107.47752380371094, 111.07292175292969, 114.66831970214844, 118.26371765136719, 121.85911560058594, 125.45451354980469, 129.04991149902344, 132.6453094482422, 136.24070739746094, 139.8361053466797, 143.43150329589844, 147.0269012451172, 150.62229919433594, 154.21771240234375, 157.8131103515625, 161.40850830078125, 165.00390625, 168.59930419921875, 172.1947021484375, 175.79010009765625, 179.385498046875, 182.98089599609375, 186.5762939453125, 190.17169189453125, 193.76708984375, 197.36248779296875, 200.9578857421875, 204.55328369140625, 208.148681640625, 211.74407958984375]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 4.0, 13.0, 18.0, 24.0, 32.0, 23.0, 32.0, 43.0, 46.0, 63.0, 60.0, 73.0, 68.0, 73.0, 78.0, 50.0, 52.0, 38.0, 52.0, 40.0, 29.0, 23.0, 17.0, 16.0, 13.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.94366455078125, -24.222599029541016, -23.50153350830078, -22.780467987060547, -22.05940055847168, -21.338335037231445, -20.61726951599121, -19.896203994750977, -19.17513656616211, -18.454071044921875, -17.73300552368164, -17.011940002441406, -16.29087257385254, -15.569807052612305, -14.84874153137207, -14.127676010131836, -13.406610488891602, -12.685544967651367, -11.964478492736816, -11.243412971496582, -10.522346496582031, -9.801280975341797, -9.080215454101562, -8.359149932861328, -7.638083457946777, -6.917017459869385, -6.195951461791992, -5.474885940551758, -4.753819942474365, -4.032753944396973, -3.3116884231567383, -2.5906224250793457, -1.8695564270019531, -1.14849054813385, -0.42742466926574707, 0.2936410903930664, 1.014707088470459, 1.7357730865478516, 2.456838607788086, 3.1779046058654785, 3.898970603942871, 4.620036602020264, 5.341102600097656, 6.062168121337891, 6.783234119415283, 7.504300117492676, 8.22536563873291, 8.946432113647461, 9.667497634887695, 10.38856315612793, 11.10962963104248, 11.830695152282715, 12.551761627197266, 13.2728271484375, 13.993892669677734, 14.714958190917969, 15.43602466583252, 16.15709114074707, 16.878156661987305, 17.59922218322754, 18.320287704467773, 19.04135513305664, 19.762420654296875, 20.48348617553711, 21.204551696777344]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 10.0, 19.0, 28.0, 67.0, 126.0, 350.0, 1155.0, 5982.0, 93883.0, 4062608.0, 25179.0, 3070.0, 857.0, 380.0, 185.0, 117.0, 69.0, 43.0, 42.0, 26.0, 18.0, 17.0, 16.0, 9.0, 6.0, 5.0, 5.0, 4.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.53125, -32.3876953125, -31.244140625, -30.1005859375, -28.95703125, -27.8134765625, -26.669921875, -25.5263671875, -24.3828125, -23.2392578125, -22.095703125, -20.9521484375, -19.80859375, -18.6650390625, -17.521484375, -16.3779296875, -15.234375, -14.0908203125, -12.947265625, -11.8037109375, -10.66015625, -9.5166015625, -8.373046875, -7.2294921875, -6.0859375, -4.9423828125, -3.798828125, -2.6552734375, -1.51171875, -0.3681640625, 0.775390625, 1.9189453125, 3.0625, 4.2060546875, 5.349609375, 6.4931640625, 7.63671875, 8.7802734375, 9.923828125, 11.0673828125, 12.2109375, 13.3544921875, 14.498046875, 15.6416015625, 16.78515625, 17.9287109375, 19.072265625, 20.2158203125, 21.359375, 22.5029296875, 23.646484375, 24.7900390625, 25.93359375, 27.0771484375, 28.220703125, 29.3642578125, 30.5078125, 31.6513671875, 32.794921875, 33.9384765625, 35.08203125, 36.2255859375, 37.369140625, 38.5126953125, 39.65625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 22.0, 28.0, 46.0, 76.0, 106.0, 138.0, 175.0, 135.0, 118.0, 71.0, 35.0, 28.0, 13.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83984375, -0.791656494140625, -0.74346923828125, -0.695281982421875, -0.6470947265625, -0.598907470703125, -0.55072021484375, -0.502532958984375, -0.454345703125, -0.406158447265625, -0.35797119140625, -0.309783935546875, -0.2615966796875, -0.213409423828125, -0.16522216796875, -0.117034912109375, -0.06884765625, -0.020660400390625, 0.02752685546875, 0.075714111328125, 0.1239013671875, 0.172088623046875, 0.22027587890625, 0.268463134765625, 0.316650390625, 0.364837646484375, 0.41302490234375, 0.461212158203125, 0.5093994140625, 0.557586669921875, 0.60577392578125, 0.653961181640625, 0.7021484375, 0.750335693359375, 0.79852294921875, 0.846710205078125, 0.8948974609375, 0.943084716796875, 0.99127197265625, 1.039459228515625, 1.087646484375, 1.135833740234375, 1.18402099609375, 1.232208251953125, 1.2803955078125, 1.328582763671875, 1.37677001953125, 1.424957275390625, 1.47314453125, 1.521331787109375, 1.56951904296875, 1.617706298828125, 1.6658935546875, 1.714080810546875, 1.76226806640625, 1.810455322265625, 1.858642578125, 1.906829833984375, 1.95501708984375, 2.003204345703125, 2.0513916015625, 2.099578857421875, 2.14776611328125, 2.195953369140625, 2.244140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 8.0, 7.0, 22.0, 32.0, 45.0, 51.0, 108.0, 199.0, 463.0, 1444.0, 10640.0, 4141200.0, 37036.0, 1961.0, 512.0, 211.0, 129.0, 80.0, 47.0, 24.0, 24.0, 14.0, 7.0, 6.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.5625, -64.58544921875, -62.6083984375, -60.63134765625, -58.654296875, -56.67724609375, -54.7001953125, -52.72314453125, -50.74609375, -48.76904296875, -46.7919921875, -44.81494140625, -42.837890625, -40.86083984375, -38.8837890625, -36.90673828125, -34.9296875, -32.95263671875, -30.9755859375, -28.99853515625, -27.021484375, -25.04443359375, -23.0673828125, -21.09033203125, -19.11328125, -17.13623046875, -15.1591796875, -13.18212890625, -11.205078125, -9.22802734375, -7.2509765625, -5.27392578125, -3.296875, -1.31982421875, 0.6572265625, 2.63427734375, 4.611328125, 6.58837890625, 8.5654296875, 10.54248046875, 12.51953125, 14.49658203125, 16.4736328125, 18.45068359375, 20.427734375, 22.40478515625, 24.3818359375, 26.35888671875, 28.3359375, 30.31298828125, 32.2900390625, 34.26708984375, 36.244140625, 38.22119140625, 40.1982421875, 42.17529296875, 44.15234375, 46.12939453125, 48.1064453125, 50.08349609375, 52.060546875, 54.03759765625, 56.0146484375, 57.99169921875, 59.96875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 10.0, 6.0, 20.0, 35.0, 83.0, 202.0, 875.0, 2432.0, 257.0, 71.0, 34.0, 28.0, 7.0, 2.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.62451171875, -5.4599609375, -5.29541015625, -5.130859375, -4.96630859375, -4.8017578125, -4.63720703125, -4.47265625, -4.30810546875, -4.1435546875, -3.97900390625, -3.814453125, -3.64990234375, -3.4853515625, -3.32080078125, -3.15625, -2.99169921875, -2.8271484375, -2.66259765625, -2.498046875, -2.33349609375, -2.1689453125, -2.00439453125, -1.83984375, -1.67529296875, -1.5107421875, -1.34619140625, -1.181640625, -1.01708984375, -0.8525390625, -0.68798828125, -0.5234375, -0.35888671875, -0.1943359375, -0.02978515625, 0.134765625, 0.29931640625, 0.4638671875, 0.62841796875, 0.79296875, 0.95751953125, 1.1220703125, 1.28662109375, 1.451171875, 1.61572265625, 1.7802734375, 1.94482421875, 2.109375, 2.27392578125, 2.4384765625, 2.60302734375, 2.767578125, 2.93212890625, 3.0966796875, 3.26123046875, 3.42578125, 3.59033203125, 3.7548828125, 3.91943359375, 4.083984375, 4.24853515625, 4.4130859375, 4.57763671875, 4.7421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 36.0, 167.0, 609.0, 156.0, 22.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.89335632324219, -74.8414306640625, -71.78951263427734, -68.73758697509766, -65.6856689453125, -62.63374328613281, -59.581817626953125, -56.5298957824707, -53.47797393798828, -50.42605209350586, -47.37413024902344, -44.32220458984375, -41.27028274536133, -38.218360900878906, -35.16643524169922, -32.1145133972168, -29.062591552734375, -26.010669708251953, -22.9587459564209, -19.906822204589844, -16.854900360107422, -13.802977561950684, -10.751054763793945, -7.699131011962891, -4.647209167480469, -1.5952863693237305, 1.4566364288330078, 4.508559226989746, 7.560482025146484, 10.612404823303223, 13.664327621459961, 16.716251373291016, 19.768165588378906, 22.820087432861328, 25.872011184692383, 28.923934936523438, 31.97585678100586, 35.02777862548828, 38.07970428466797, 41.13162612915039, 44.18354797363281, 47.235469818115234, 50.287391662597656, 53.339317321777344, 56.391239166259766, 59.44316101074219, 62.495086669921875, 65.54701232910156, 68.59893035888672, 71.6508560180664, 74.70277404785156, 77.75469970703125, 80.80662536621094, 83.8585433959961, 86.91046905517578, 89.96238708496094, 93.01431274414062, 96.06623840332031, 99.11815643310547, 102.17008209228516, 105.22200012207031, 108.27392578125, 111.32585144042969, 114.37777709960938, 117.42969512939453]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 8.0, 7.0, 8.0, 9.0, 11.0, 21.0, 26.0, 17.0, 35.0, 36.0, 44.0, 43.0, 49.0, 66.0, 73.0, 66.0, 60.0, 62.0, 52.0, 55.0, 46.0, 41.0, 44.0, 32.0, 33.0, 20.0, 13.0, 11.0, 8.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.119608879089355, -13.672750473022461, -13.225892066955566, -12.779033660888672, -12.332175254821777, -11.885316848754883, -11.438457489013672, -10.991600036621094, -10.544740676879883, -10.097882270812988, -9.651023864746094, -9.2041654586792, -8.757307052612305, -8.31044864654541, -7.863589763641357, -7.416731357574463, -6.969873428344727, -6.523015022277832, -6.0761566162109375, -5.629298210144043, -5.182439804077148, -4.735581398010254, -4.288722515106201, -3.8418641090393066, -3.395005702972412, -2.9481472969055176, -2.501288890838623, -2.0544302463531494, -1.6075718402862549, -1.1607134342193604, -0.7138547897338867, -0.2669963836669922, 0.17986106872558594, 0.6267195343971252, 1.0735780000686646, 1.5204365253448486, 1.9672949314117432, 2.4141533374786377, 2.8610119819641113, 3.307870388031006, 3.7547287940979004, 4.201587200164795, 4.6484456062316895, 5.095304489135742, 5.542162895202637, 5.989021301269531, 6.435879707336426, 6.88273811340332, 7.329596519470215, 7.776454925537109, 8.223313331604004, 8.670171737670898, 9.117030143737793, 9.563888549804688, 10.010747909545898, 10.457605361938477, 10.904464721679688, 11.351323127746582, 11.798181533813477, 12.245039939880371, 12.691898345947266, 13.13875675201416, 13.585615158081055, 14.032474517822266, 14.479331970214844]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 9.0, 5.0, 15.0, 13.0, 23.0, 38.0, 38.0, 58.0, 87.0, 154.0, 208.0, 422.0, 841.0, 2147.0, 7252.0, 42133.0, 524469.0, 425531.0, 34816.0, 6525.0, 1985.0, 784.0, 357.0, 213.0, 122.0, 92.0, 68.0, 42.0, 24.0, 20.0, 14.0, 15.0, 10.0, 5.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5, -14.999267578125, -14.49853515625, -13.997802734375, -13.4970703125, -12.996337890625, -12.49560546875, -11.994873046875, -11.494140625, -10.993408203125, -10.49267578125, -9.991943359375, -9.4912109375, -8.990478515625, -8.48974609375, -7.989013671875, -7.48828125, -6.987548828125, -6.48681640625, -5.986083984375, -5.4853515625, -4.984619140625, -4.48388671875, -3.983154296875, -3.482421875, -2.981689453125, -2.48095703125, -1.980224609375, -1.4794921875, -0.978759765625, -0.47802734375, 0.022705078125, 0.5234375, 1.024169921875, 1.52490234375, 2.025634765625, 2.5263671875, 3.027099609375, 3.52783203125, 4.028564453125, 4.529296875, 5.030029296875, 5.53076171875, 6.031494140625, 6.5322265625, 7.032958984375, 7.53369140625, 8.034423828125, 8.53515625, 9.035888671875, 9.53662109375, 10.037353515625, 10.5380859375, 11.038818359375, 11.53955078125, 12.040283203125, 12.541015625, 13.041748046875, 13.54248046875, 14.043212890625, 14.5439453125, 15.044677734375, 15.54541015625, 16.046142578125, 16.546875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 12.0, 22.0, 40.0, 58.0, 45.0, 91.0, 108.0, 119.0, 109.0, 115.0, 86.0, 73.0, 44.0, 30.0, 24.0, 16.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2016143798828125, -1.144439697265625, -1.0872650146484375, -1.03009033203125, -0.9729156494140625, -0.915740966796875, -0.8585662841796875, -0.8013916015625, -0.7442169189453125, -0.687042236328125, -0.6298675537109375, -0.57269287109375, -0.5155181884765625, -0.458343505859375, -0.4011688232421875, -0.343994140625, -0.2868194580078125, -0.229644775390625, -0.1724700927734375, -0.11529541015625, -0.0581207275390625, -0.000946044921875, 0.0562286376953125, 0.1134033203125, 0.1705780029296875, 0.227752685546875, 0.2849273681640625, 0.34210205078125, 0.3992767333984375, 0.456451416015625, 0.5136260986328125, 0.57080078125, 0.6279754638671875, 0.685150146484375, 0.7423248291015625, 0.79949951171875, 0.8566741943359375, 0.913848876953125, 0.9710235595703125, 1.0281982421875, 1.0853729248046875, 1.142547607421875, 1.1997222900390625, 1.25689697265625, 1.3140716552734375, 1.371246337890625, 1.4284210205078125, 1.485595703125, 1.5427703857421875, 1.599945068359375, 1.6571197509765625, 1.71429443359375, 1.7714691162109375, 1.828643798828125, 1.8858184814453125, 1.9429931640625, 2.0001678466796875, 2.057342529296875, 2.1145172119140625, 2.17169189453125, 2.2288665771484375, 2.286041259765625, 2.3432159423828125, 2.400390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 9.0, 20.0, 13.0, 21.0, 24.0, 48.0, 85.0, 132.0, 212.0, 325.0, 614.0, 1132.0, 2580.0, 6771.0, 22343.0, 128157.0, 649003.0, 193310.0, 29450.0, 8285.0, 3073.0, 1318.0, 676.0, 352.0, 197.0, 114.0, 84.0, 66.0, 45.0, 25.0, 23.0, 7.0, 14.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6875, -9.370849609375, -9.05419921875, -8.737548828125, -8.4208984375, -8.104248046875, -7.78759765625, -7.470947265625, -7.154296875, -6.837646484375, -6.52099609375, -6.204345703125, -5.8876953125, -5.571044921875, -5.25439453125, -4.937744140625, -4.62109375, -4.304443359375, -3.98779296875, -3.671142578125, -3.3544921875, -3.037841796875, -2.72119140625, -2.404541015625, -2.087890625, -1.771240234375, -1.45458984375, -1.137939453125, -0.8212890625, -0.504638671875, -0.18798828125, 0.128662109375, 0.4453125, 0.761962890625, 1.07861328125, 1.395263671875, 1.7119140625, 2.028564453125, 2.34521484375, 2.661865234375, 2.978515625, 3.295166015625, 3.61181640625, 3.928466796875, 4.2451171875, 4.561767578125, 4.87841796875, 5.195068359375, 5.51171875, 5.828369140625, 6.14501953125, 6.461669921875, 6.7783203125, 7.094970703125, 7.41162109375, 7.728271484375, 8.044921875, 8.361572265625, 8.67822265625, 8.994873046875, 9.3115234375, 9.628173828125, 9.94482421875, 10.261474609375, 10.578125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 12.0, 5.0, 6.0, 8.0, 8.0, 15.0, 16.0, 16.0, 30.0, 19.0, 25.0, 34.0, 35.0, 51.0, 47.0, 42.0, 38.0, 41.0, 41.0, 42.0, 33.0, 48.0, 41.0, 33.0, 45.0, 30.0, 37.0, 28.0, 27.0, 33.0, 15.0, 24.0, 12.0, 10.0, 9.0, 5.0, 7.0, 3.0, 5.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.23046875, -4.09881591796875, -3.9671630859375, -3.83551025390625, -3.703857421875, -3.57220458984375, -3.4405517578125, -3.30889892578125, -3.17724609375, -3.04559326171875, -2.9139404296875, -2.78228759765625, -2.650634765625, -2.51898193359375, -2.3873291015625, -2.25567626953125, -2.1240234375, -1.99237060546875, -1.8607177734375, -1.72906494140625, -1.597412109375, -1.46575927734375, -1.3341064453125, -1.20245361328125, -1.07080078125, -0.93914794921875, -0.8074951171875, -0.67584228515625, -0.544189453125, -0.41253662109375, -0.2808837890625, -0.14923095703125, -0.017578125, 0.11407470703125, 0.2457275390625, 0.37738037109375, 0.509033203125, 0.64068603515625, 0.7723388671875, 0.90399169921875, 1.03564453125, 1.16729736328125, 1.2989501953125, 1.43060302734375, 1.562255859375, 1.69390869140625, 1.8255615234375, 1.95721435546875, 2.0888671875, 2.22052001953125, 2.3521728515625, 2.48382568359375, 2.615478515625, 2.74713134765625, 2.8787841796875, 3.01043701171875, 3.14208984375, 3.27374267578125, 3.4053955078125, 3.53704833984375, 3.668701171875, 3.80035400390625, 3.9320068359375, 4.06365966796875, 4.1953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 5.0, 4.0, 10.0, 12.0, 19.0, 34.0, 31.0, 46.0, 75.0, 100.0, 148.0, 256.0, 515.0, 923.0, 1762.0, 3629.0, 8354.0, 22352.0, 88833.0, 550223.0, 294660.0, 49901.0, 14984.0, 5930.0, 2711.0, 1332.0, 705.0, 365.0, 232.0, 145.0, 77.0, 64.0, 41.0, 25.0, 6.0, 11.0, 11.0, 7.0, 8.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.59765625, -4.44342041015625, -4.2891845703125, -4.13494873046875, -3.980712890625, -3.82647705078125, -3.6722412109375, -3.51800537109375, -3.36376953125, -3.20953369140625, -3.0552978515625, -2.90106201171875, -2.746826171875, -2.59259033203125, -2.4383544921875, -2.28411865234375, -2.1298828125, -1.97564697265625, -1.8214111328125, -1.66717529296875, -1.512939453125, -1.35870361328125, -1.2044677734375, -1.05023193359375, -0.89599609375, -0.74176025390625, -0.5875244140625, -0.43328857421875, -0.279052734375, -0.12481689453125, 0.0294189453125, 0.18365478515625, 0.337890625, 0.49212646484375, 0.6463623046875, 0.80059814453125, 0.954833984375, 1.10906982421875, 1.2633056640625, 1.41754150390625, 1.57177734375, 1.72601318359375, 1.8802490234375, 2.03448486328125, 2.188720703125, 2.34295654296875, 2.4971923828125, 2.65142822265625, 2.8056640625, 2.95989990234375, 3.1141357421875, 3.26837158203125, 3.422607421875, 3.57684326171875, 3.7310791015625, 3.88531494140625, 4.03955078125, 4.19378662109375, 4.3480224609375, 4.50225830078125, 4.656494140625, 4.81072998046875, 4.9649658203125, 5.11920166015625, 5.2734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 8.0, 10.0, 9.0, 10.0, 28.0, 29.0, 60.0, 67.0, 121.0, 157.0, 137.0, 111.0, 67.0, 59.0, 26.0, 30.0, 16.0, 3.0, 7.0, 5.0, 5.0, 4.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0013446807861328125, -0.0013082623481750488, -0.0012718439102172852, -0.0012354254722595215, -0.0011990070343017578, -0.0011625885963439941, -0.0011261701583862305, -0.0010897517204284668, -0.0010533332824707031, -0.0010169148445129395, -0.0009804964065551758, -0.0009440779685974121, -0.0009076595306396484, -0.0008712410926818848, -0.0008348226547241211, -0.0007984042167663574, -0.0007619857788085938, -0.0007255673408508301, -0.0006891489028930664, -0.0006527304649353027, -0.0006163120269775391, -0.0005798935890197754, -0.0005434751510620117, -0.000507056713104248, -0.0004706382751464844, -0.0004342198371887207, -0.00039780139923095703, -0.00036138296127319336, -0.0003249645233154297, -0.000288546085357666, -0.00025212764739990234, -0.00021570920944213867, -0.000179290771484375, -0.00014287233352661133, -0.00010645389556884766, -7.003545761108398e-05, -3.361701965332031e-05, 2.8014183044433594e-06, 3.921985626220703e-05, 7.56382942199707e-05, 0.00011205673217773438, 0.00014847517013549805, 0.00018489360809326172, 0.0002213120460510254, 0.00025773048400878906, 0.00029414892196655273, 0.0003305673599243164, 0.0003669857978820801, 0.00040340423583984375, 0.0004398226737976074, 0.0004762411117553711, 0.0005126595497131348, 0.0005490779876708984, 0.0005854964256286621, 0.0006219148635864258, 0.0006583333015441895, 0.0006947517395019531, 0.0007311701774597168, 0.0007675886154174805, 0.0008040070533752441, 0.0008404254913330078, 0.0008768439292907715, 0.0009132623672485352, 0.0009496808052062988, 0.0009860992431640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 5.0, 9.0, 13.0, 18.0, 18.0, 31.0, 49.0, 59.0, 67.0, 111.0, 184.0, 315.0, 496.0, 832.0, 1653.0, 3123.0, 6393.0, 16547.0, 62268.0, 421354.0, 439612.0, 64656.0, 17206.0, 6500.0, 3118.0, 1599.0, 879.0, 510.0, 328.0, 167.0, 130.0, 79.0, 57.0, 35.0, 26.0, 33.0, 22.0, 7.0, 13.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.953125, -4.79840087890625, -4.6436767578125, -4.48895263671875, -4.334228515625, -4.17950439453125, -4.0247802734375, -3.87005615234375, -3.71533203125, -3.56060791015625, -3.4058837890625, -3.25115966796875, -3.096435546875, -2.94171142578125, -2.7869873046875, -2.63226318359375, -2.4775390625, -2.32281494140625, -2.1680908203125, -2.01336669921875, -1.858642578125, -1.70391845703125, -1.5491943359375, -1.39447021484375, -1.23974609375, -1.08502197265625, -0.9302978515625, -0.77557373046875, -0.620849609375, -0.46612548828125, -0.3114013671875, -0.15667724609375, -0.001953125, 0.15277099609375, 0.3074951171875, 0.46221923828125, 0.616943359375, 0.77166748046875, 0.9263916015625, 1.08111572265625, 1.23583984375, 1.39056396484375, 1.5452880859375, 1.70001220703125, 1.854736328125, 2.00946044921875, 2.1641845703125, 2.31890869140625, 2.4736328125, 2.62835693359375, 2.7830810546875, 2.93780517578125, 3.092529296875, 3.24725341796875, 3.4019775390625, 3.55670166015625, 3.71142578125, 3.86614990234375, 4.0208740234375, 4.17559814453125, 4.330322265625, 4.48504638671875, 4.6397705078125, 4.79449462890625, 4.94921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 15.0, 22.0, 32.0, 41.0, 49.0, 77.0, 119.0, 129.0, 103.0, 110.0, 96.0, 56.0, 34.0, 33.0, 23.0, 15.0, 8.0, 4.0, 6.0, 1.0, 4.0, 3.0, 0.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.935546875, -3.816864013671875, -3.69818115234375, -3.579498291015625, -3.4608154296875, -3.342132568359375, -3.22344970703125, -3.104766845703125, -2.986083984375, -2.867401123046875, -2.74871826171875, -2.630035400390625, -2.5113525390625, -2.392669677734375, -2.27398681640625, -2.155303955078125, -2.03662109375, -1.917938232421875, -1.79925537109375, -1.680572509765625, -1.5618896484375, -1.443206787109375, -1.32452392578125, -1.205841064453125, -1.087158203125, -0.968475341796875, -0.84979248046875, -0.731109619140625, -0.6124267578125, -0.493743896484375, -0.37506103515625, -0.256378173828125, -0.1376953125, -0.019012451171875, 0.09967041015625, 0.218353271484375, 0.3370361328125, 0.455718994140625, 0.57440185546875, 0.693084716796875, 0.811767578125, 0.930450439453125, 1.04913330078125, 1.167816162109375, 1.2864990234375, 1.405181884765625, 1.52386474609375, 1.642547607421875, 1.76123046875, 1.879913330078125, 1.99859619140625, 2.117279052734375, 2.2359619140625, 2.354644775390625, 2.47332763671875, 2.592010498046875, 2.710693359375, 2.829376220703125, 2.94805908203125, 3.066741943359375, 3.1854248046875, 3.304107666015625, 3.42279052734375, 3.541473388671875, 3.66015625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 29.0, 110.0, 296.0, 315.0, 186.0, 39.0, 11.0, 4.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.83102416992188, -61.24496078491211, -57.658897399902344, -54.072837829589844, -50.48677444458008, -46.90071105957031, -43.31464767456055, -39.72858428955078, -36.14252471923828, -32.556461334228516, -28.970399856567383, -25.384336471557617, -21.798274993896484, -18.21221160888672, -14.626148223876953, -11.04008674621582, -7.454021453857422, -3.8679587841033936, -0.28189611434936523, 3.304166793823242, 6.890229225158691, 10.47629165649414, 14.062355041503906, 17.64841651916504, 21.234479904174805, 24.82054328918457, 28.406604766845703, 31.99266815185547, 35.578731536865234, 39.164794921875, 42.7508544921875, 46.336917877197266, 49.92298126220703, 53.5090446472168, 57.09510803222656, 60.68116760253906, 64.2672348022461, 67.8532943725586, 71.43936157226562, 75.02542114257812, 78.61148071289062, 82.19754028320312, 85.78360748291016, 89.36966705322266, 92.95573425292969, 96.54179382324219, 100.12785339355469, 103.71392059326172, 107.29998779296875, 110.88604736328125, 114.47211456298828, 118.05817413330078, 121.64424133300781, 125.23030090332031, 128.8163604736328, 132.4024200439453, 135.9884796142578, 139.5745391845703, 143.1605987548828, 146.74667358398438, 150.33273315429688, 153.91879272460938, 157.50485229492188, 161.09091186523438, 164.67698669433594]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 6.0, 8.0, 11.0, 14.0, 23.0, 13.0, 16.0, 22.0, 37.0, 33.0, 47.0, 42.0, 47.0, 43.0, 62.0, 69.0, 62.0, 54.0, 52.0, 44.0, 53.0, 41.0, 41.0, 37.0, 31.0, 21.0, 14.0, 13.0, 7.0, 14.0, 7.0, 5.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.05695915222168, -26.024885177612305, -24.992813110351562, -23.960739135742188, -22.928665161132812, -21.89659309387207, -20.864519119262695, -19.832447052001953, -18.800373077392578, -17.768299102783203, -16.73622703552246, -15.704153060913086, -14.672080039978027, -13.640007019042969, -12.607933044433594, -11.575860023498535, -10.543787002563477, -9.511713981628418, -8.47964096069336, -7.447566986083984, -6.415493965148926, -5.383420944213867, -4.35134744644165, -3.3192739486694336, -2.287200927734375, -1.2551276683807373, -0.2230544090270996, 0.8090188503265381, 1.8410921096801758, 2.8731651306152344, 3.905238628387451, 4.937312126159668, 5.969383239746094, 7.001456260681152, 8.033529281616211, 9.065603256225586, 10.097676277160645, 11.129749298095703, 12.161823272705078, 13.193896293640137, 14.225969314575195, 15.258042335510254, 16.290115356445312, 17.322189331054688, 18.354263305664062, 19.386335372924805, 20.41840934753418, 21.450481414794922, 22.482555389404297, 23.514629364013672, 24.546701431274414, 25.57877540588379, 26.61084747314453, 27.642921447753906, 28.67499542236328, 29.707069396972656, 30.7391414642334, 31.771215438842773, 32.803287506103516, 33.83536148071289, 34.867435455322266, 35.899505615234375, 36.93157958984375, 37.963653564453125, 38.9957275390625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 9.0, 16.0, 21.0, 29.0, 60.0, 75.0, 124.0, 252.0, 506.0, 1043.0, 2885.0, 9684.0, 62918.0, 4028964.0, 72604.0, 9743.0, 2906.0, 1123.0, 511.0, 258.0, 159.0, 85.0, 75.0, 48.0, 41.0, 27.0, 25.0, 16.0, 19.0, 8.0, 11.0, 7.0, 4.0, 4.0, 8.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.078125, -22.269287109375, -21.46044921875, -20.651611328125, -19.8427734375, -19.033935546875, -18.22509765625, -17.416259765625, -16.607421875, -15.798583984375, -14.98974609375, -14.180908203125, -13.3720703125, -12.563232421875, -11.75439453125, -10.945556640625, -10.13671875, -9.327880859375, -8.51904296875, -7.710205078125, -6.9013671875, -6.092529296875, -5.28369140625, -4.474853515625, -3.666015625, -2.857177734375, -2.04833984375, -1.239501953125, -0.4306640625, 0.378173828125, 1.18701171875, 1.995849609375, 2.8046875, 3.613525390625, 4.42236328125, 5.231201171875, 6.0400390625, 6.848876953125, 7.65771484375, 8.466552734375, 9.275390625, 10.084228515625, 10.89306640625, 11.701904296875, 12.5107421875, 13.319580078125, 14.12841796875, 14.937255859375, 15.74609375, 16.554931640625, 17.36376953125, 18.172607421875, 18.9814453125, 19.790283203125, 20.59912109375, 21.407958984375, 22.216796875, 23.025634765625, 23.83447265625, 24.643310546875, 25.4521484375, 26.260986328125, 27.06982421875, 27.878662109375, 28.6875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 13.0, 23.0, 27.0, 51.0, 59.0, 70.0, 81.0, 95.0, 92.0, 111.0, 112.0, 77.0, 67.0, 38.0, 31.0, 18.0, 16.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0537109375, -0.9972381591796875, -0.940765380859375, -0.8842926025390625, -0.82781982421875, -0.7713470458984375, -0.714874267578125, -0.6584014892578125, -0.6019287109375, -0.5454559326171875, -0.488983154296875, -0.4325103759765625, -0.37603759765625, -0.3195648193359375, -0.263092041015625, -0.2066192626953125, -0.150146484375, -0.0936737060546875, -0.037200927734375, 0.0192718505859375, 0.07574462890625, 0.1322174072265625, 0.188690185546875, 0.2451629638671875, 0.3016357421875, 0.3581085205078125, 0.414581298828125, 0.4710540771484375, 0.52752685546875, 0.5839996337890625, 0.640472412109375, 0.6969451904296875, 0.75341796875, 0.8098907470703125, 0.866363525390625, 0.9228363037109375, 0.97930908203125, 1.0357818603515625, 1.092254638671875, 1.1487274169921875, 1.2052001953125, 1.2616729736328125, 1.318145751953125, 1.3746185302734375, 1.43109130859375, 1.4875640869140625, 1.544036865234375, 1.6005096435546875, 1.656982421875, 1.7134552001953125, 1.769927978515625, 1.8264007568359375, 1.88287353515625, 1.9393463134765625, 1.995819091796875, 2.0522918701171875, 2.1087646484375, 2.1652374267578125, 2.221710205078125, 2.2781829833984375, 2.33465576171875, 2.3911285400390625, 2.447601318359375, 2.5040740966796875, 2.560546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 5.0, 14.0, 11.0, 17.0, 33.0, 74.0, 141.0, 244.0, 625.0, 6000.0, 4175015.0, 10586.0, 782.0, 283.0, 149.0, 111.0, 97.0, 43.0, 20.0, 24.0, 7.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.125, -33.6435546875, -31.162109375, -28.6806640625, -26.19921875, -23.7177734375, -21.236328125, -18.7548828125, -16.2734375, -13.7919921875, -11.310546875, -8.8291015625, -6.34765625, -3.8662109375, -1.384765625, 1.0966796875, 3.578125, 6.0595703125, 8.541015625, 11.0224609375, 13.50390625, 15.9853515625, 18.466796875, 20.9482421875, 23.4296875, 25.9111328125, 28.392578125, 30.8740234375, 33.35546875, 35.8369140625, 38.318359375, 40.7998046875, 43.28125, 45.7626953125, 48.244140625, 50.7255859375, 53.20703125, 55.6884765625, 58.169921875, 60.6513671875, 63.1328125, 65.6142578125, 68.095703125, 70.5771484375, 73.05859375, 75.5400390625, 78.021484375, 80.5029296875, 82.984375, 85.4658203125, 87.947265625, 90.4287109375, 92.91015625, 95.3916015625, 97.873046875, 100.3544921875, 102.8359375, 105.3173828125, 107.798828125, 110.2802734375, 112.76171875, 115.2431640625, 117.724609375, 120.2060546875, 122.6875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 13.0, 63.0, 451.0, 3328.0, 178.0, 34.0, 11.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -4.86407470703125, -4.4351806640625, -4.00628662109375, -3.577392578125, -3.14849853515625, -2.7196044921875, -2.29071044921875, -1.86181640625, -1.43292236328125, -1.0040283203125, -0.57513427734375, -0.146240234375, 0.28265380859375, 0.7115478515625, 1.14044189453125, 1.5693359375, 1.99822998046875, 2.4271240234375, 2.85601806640625, 3.284912109375, 3.71380615234375, 4.1427001953125, 4.57159423828125, 5.00048828125, 5.42938232421875, 5.8582763671875, 6.28717041015625, 6.716064453125, 7.14495849609375, 7.5738525390625, 8.00274658203125, 8.431640625, 8.86053466796875, 9.2894287109375, 9.71832275390625, 10.147216796875, 10.57611083984375, 11.0050048828125, 11.43389892578125, 11.86279296875, 12.29168701171875, 12.7205810546875, 13.14947509765625, 13.578369140625, 14.00726318359375, 14.4361572265625, 14.86505126953125, 15.2939453125, 15.72283935546875, 16.1517333984375, 16.58062744140625, 17.009521484375, 17.43841552734375, 17.8673095703125, 18.29620361328125, 18.72509765625, 19.15399169921875, 19.5828857421875, 20.01177978515625, 20.440673828125, 20.86956787109375, 21.2984619140625, 21.72735595703125, 22.15625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 9.0, 49.0, 575.0, 341.0, 29.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.20199584960938, -137.88038635253906, -133.5587615966797, -129.23715209960938, -124.91552734375, -120.59391021728516, -116.27229309082031, -111.95068359375, -107.62905883789062, -103.30744171142578, -98.98582458496094, -94.6642074584961, -90.34259033203125, -86.0209732055664, -81.69935607910156, -77.37774658203125, -73.0561294555664, -68.73451232910156, -64.41289520263672, -60.091278076171875, -55.76966094970703, -51.44804382324219, -47.12643051147461, -42.804813385009766, -38.48319625854492, -34.16157913208008, -29.839962005615234, -25.518346786499023, -21.19672966003418, -16.875112533569336, -12.553497314453125, -8.231880187988281, -3.9102630615234375, 0.41135358810424805, 4.732970237731934, 9.054586410522461, 13.376203536987305, 17.69782066345215, 22.01943588256836, 26.341053009033203, 30.662670135498047, 34.98428726196289, 39.305904388427734, 43.62751770019531, 47.949134826660156, 52.270751953125, 56.592369079589844, 60.91398620605469, 65.23560333251953, 69.55722045898438, 73.87883758544922, 78.20045471191406, 82.5220718383789, 86.84368896484375, 91.16529846191406, 95.48692321777344, 99.80853271484375, 104.1301498413086, 108.45176696777344, 112.77338409423828, 117.09500122070312, 121.41661834716797, 125.73823547363281, 130.05984497070312, 134.3814697265625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 9.0, 22.0, 48.0, 82.0, 120.0, 169.0, 189.0, 141.0, 105.0, 70.0, 34.0, 7.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.97163772583008, -53.53211975097656, -52.09260559082031, -50.6530876159668, -49.21357345581055, -47.77405548095703, -46.33454132080078, -44.895023345947266, -43.45550537109375, -42.015987396240234, -40.576473236083984, -39.13695526123047, -37.69744110107422, -36.2579231262207, -34.81840515136719, -33.37889099121094, -31.939376831054688, -30.499860763549805, -29.060344696044922, -27.620826721191406, -26.181312561035156, -24.74179458618164, -23.302278518676758, -21.862762451171875, -20.423246383666992, -18.98373031616211, -17.544214248657227, -16.104698181152344, -14.665181159973145, -13.225665092468262, -11.786148071289062, -10.34663200378418, -8.907112121582031, -7.467596054077148, -6.028079509735107, -4.588562965393066, -3.1490468978881836, -1.7095308303833008, -0.27001380920410156, 1.1695022583007812, 2.609018325805664, 4.048534393310547, 5.488050937652588, 6.927567481994629, 8.367083549499512, 9.806599617004395, 11.246116638183594, 12.685632705688477, 14.12514877319336, 15.564664840698242, 17.004180908203125, 18.44369888305664, 19.88321304321289, 21.322731018066406, 22.76224708557129, 24.201763153076172, 25.641279220581055, 27.080795288085938, 28.52031135559082, 29.959827423095703, 31.39934539794922, 32.83885955810547, 34.278377532958984, 35.7178955078125, 37.15740966796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 7.0, 12.0, 11.0, 21.0, 41.0, 55.0, 100.0, 202.0, 498.0, 1213.0, 4465.0, 50044.0, 890494.0, 92657.0, 6272.0, 1384.0, 491.0, 288.0, 132.0, 72.0, 36.0, 16.0, 12.0, 11.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.203125, -25.346435546875, -24.48974609375, -23.633056640625, -22.7763671875, -21.919677734375, -21.06298828125, -20.206298828125, -19.349609375, -18.492919921875, -17.63623046875, -16.779541015625, -15.9228515625, -15.066162109375, -14.20947265625, -13.352783203125, -12.49609375, -11.639404296875, -10.78271484375, -9.926025390625, -9.0693359375, -8.212646484375, -7.35595703125, -6.499267578125, -5.642578125, -4.785888671875, -3.92919921875, -3.072509765625, -2.2158203125, -1.359130859375, -0.50244140625, 0.354248046875, 1.2109375, 2.067626953125, 2.92431640625, 3.781005859375, 4.6376953125, 5.494384765625, 6.35107421875, 7.207763671875, 8.064453125, 8.921142578125, 9.77783203125, 10.634521484375, 11.4912109375, 12.347900390625, 13.20458984375, 14.061279296875, 14.91796875, 15.774658203125, 16.63134765625, 17.488037109375, 18.3447265625, 19.201416015625, 20.05810546875, 20.914794921875, 21.771484375, 22.628173828125, 23.48486328125, 24.341552734375, 25.1982421875, 26.054931640625, 26.91162109375, 27.768310546875, 28.625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 10.0, 27.0, 45.0, 54.0, 84.0, 111.0, 151.0, 121.0, 133.0, 104.0, 62.0, 48.0, 28.0, 9.0, 7.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.181640625, -2.087371826171875, -1.99310302734375, -1.898834228515625, -1.8045654296875, -1.710296630859375, -1.61602783203125, -1.521759033203125, -1.427490234375, -1.333221435546875, -1.23895263671875, -1.144683837890625, -1.0504150390625, -0.956146240234375, -0.86187744140625, -0.767608642578125, -0.67333984375, -0.579071044921875, -0.48480224609375, -0.390533447265625, -0.2962646484375, -0.201995849609375, -0.10772705078125, -0.013458251953125, 0.080810546875, 0.175079345703125, 0.26934814453125, 0.363616943359375, 0.4578857421875, 0.552154541015625, 0.64642333984375, 0.740692138671875, 0.8349609375, 0.929229736328125, 1.02349853515625, 1.117767333984375, 1.2120361328125, 1.306304931640625, 1.40057373046875, 1.494842529296875, 1.589111328125, 1.683380126953125, 1.77764892578125, 1.871917724609375, 1.9661865234375, 2.060455322265625, 2.15472412109375, 2.248992919921875, 2.34326171875, 2.437530517578125, 2.53179931640625, 2.626068115234375, 2.7203369140625, 2.814605712890625, 2.90887451171875, 3.003143310546875, 3.097412109375, 3.191680908203125, 3.28594970703125, 3.380218505859375, 3.4744873046875, 3.568756103515625, 3.66302490234375, 3.757293701171875, 3.8515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 6.0, 14.0, 12.0, 20.0, 36.0, 40.0, 72.0, 79.0, 150.0, 227.0, 368.0, 571.0, 1042.0, 1863.0, 3983.0, 10738.0, 40364.0, 224348.0, 576283.0, 144683.0, 28354.0, 8059.0, 3221.0, 1615.0, 878.0, 531.0, 342.0, 228.0, 117.0, 87.0, 70.0, 47.0, 26.0, 18.0, 15.0, 5.0, 7.0, 1.0, 8.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.92578125, -7.63629150390625, -7.3468017578125, -7.05731201171875, -6.767822265625, -6.47833251953125, -6.1888427734375, -5.89935302734375, -5.60986328125, -5.32037353515625, -5.0308837890625, -4.74139404296875, -4.451904296875, -4.16241455078125, -3.8729248046875, -3.58343505859375, -3.2939453125, -3.00445556640625, -2.7149658203125, -2.42547607421875, -2.135986328125, -1.84649658203125, -1.5570068359375, -1.26751708984375, -0.97802734375, -0.68853759765625, -0.3990478515625, -0.10955810546875, 0.179931640625, 0.46942138671875, 0.7589111328125, 1.04840087890625, 1.337890625, 1.62738037109375, 1.9168701171875, 2.20635986328125, 2.495849609375, 2.78533935546875, 3.0748291015625, 3.36431884765625, 3.65380859375, 3.94329833984375, 4.2327880859375, 4.52227783203125, 4.811767578125, 5.10125732421875, 5.3907470703125, 5.68023681640625, 5.9697265625, 6.25921630859375, 6.5487060546875, 6.83819580078125, 7.127685546875, 7.41717529296875, 7.7066650390625, 7.99615478515625, 8.28564453125, 8.57513427734375, 8.8646240234375, 9.15411376953125, 9.443603515625, 9.73309326171875, 10.0225830078125, 10.31207275390625, 10.6015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 6.0, 5.0, 6.0, 7.0, 13.0, 16.0, 27.0, 18.0, 39.0, 29.0, 37.0, 35.0, 51.0, 58.0, 62.0, 65.0, 59.0, 53.0, 61.0, 37.0, 50.0, 38.0, 47.0, 46.0, 28.0, 19.0, 18.0, 17.0, 11.0, 15.0, 11.0, 6.0, 5.0, 1.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.85546875, -5.6419677734375, -5.428466796875, -5.2149658203125, -5.00146484375, -4.7879638671875, -4.574462890625, -4.3609619140625, -4.1474609375, -3.9339599609375, -3.720458984375, -3.5069580078125, -3.29345703125, -3.0799560546875, -2.866455078125, -2.6529541015625, -2.439453125, -2.2259521484375, -2.012451171875, -1.7989501953125, -1.58544921875, -1.3719482421875, -1.158447265625, -0.9449462890625, -0.7314453125, -0.5179443359375, -0.304443359375, -0.0909423828125, 0.12255859375, 0.3360595703125, 0.549560546875, 0.7630615234375, 0.9765625, 1.1900634765625, 1.403564453125, 1.6170654296875, 1.83056640625, 2.0440673828125, 2.257568359375, 2.4710693359375, 2.6845703125, 2.8980712890625, 3.111572265625, 3.3250732421875, 3.53857421875, 3.7520751953125, 3.965576171875, 4.1790771484375, 4.392578125, 4.6060791015625, 4.819580078125, 5.0330810546875, 5.24658203125, 5.4600830078125, 5.673583984375, 5.8870849609375, 6.1005859375, 6.3140869140625, 6.527587890625, 6.7410888671875, 6.95458984375, 7.1680908203125, 7.381591796875, 7.5950927734375, 7.80859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 8.0, 19.0, 33.0, 29.0, 32.0, 56.0, 118.0, 227.0, 389.0, 794.0, 1847.0, 5206.0, 22754.0, 380161.0, 596761.0, 29814.0, 6320.0, 2119.0, 920.0, 395.0, 205.0, 149.0, 70.0, 47.0, 25.0, 18.0, 10.0, 4.0, 7.0, 1.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.362548828125, -7.06884765625, -6.775146484375, -6.4814453125, -6.187744140625, -5.89404296875, -5.600341796875, -5.306640625, -5.012939453125, -4.71923828125, -4.425537109375, -4.1318359375, -3.838134765625, -3.54443359375, -3.250732421875, -2.95703125, -2.663330078125, -2.36962890625, -2.075927734375, -1.7822265625, -1.488525390625, -1.19482421875, -0.901123046875, -0.607421875, -0.313720703125, -0.02001953125, 0.273681640625, 0.5673828125, 0.861083984375, 1.15478515625, 1.448486328125, 1.7421875, 2.035888671875, 2.32958984375, 2.623291015625, 2.9169921875, 3.210693359375, 3.50439453125, 3.798095703125, 4.091796875, 4.385498046875, 4.67919921875, 4.972900390625, 5.2666015625, 5.560302734375, 5.85400390625, 6.147705078125, 6.44140625, 6.735107421875, 7.02880859375, 7.322509765625, 7.6162109375, 7.909912109375, 8.20361328125, 8.497314453125, 8.791015625, 9.084716796875, 9.37841796875, 9.672119140625, 9.9658203125, 10.259521484375, 10.55322265625, 10.846923828125, 11.140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 6.0, 13.0, 16.0, 15.0, 39.0, 64.0, 92.0, 156.0, 219.0, 144.0, 92.0, 38.0, 39.0, 18.0, 14.0, 13.0, 6.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012035369873046875, -0.0011522471904754639, -0.0011009573936462402, -0.0010496675968170166, -0.000998377799987793, -0.0009470880031585693, -0.0008957982063293457, -0.0008445084095001221, -0.0007932186126708984, -0.0007419288158416748, -0.0006906390190124512, -0.0006393492221832275, -0.0005880594253540039, -0.0005367696285247803, -0.00048547983169555664, -0.000434190034866333, -0.0003829002380371094, -0.00033161044120788574, -0.0002803206443786621, -0.00022903084754943848, -0.00017774105072021484, -0.0001264512538909912, -7.516145706176758e-05, -2.3871660232543945e-05, 2.7418136596679688e-05, 7.870793342590332e-05, 0.00012999773025512695, 0.00018128752708435059, 0.00023257732391357422, 0.00028386712074279785, 0.0003351569175720215, 0.0003864467144012451, 0.00043773651123046875, 0.0004890263080596924, 0.000540316104888916, 0.0005916059017181396, 0.0006428956985473633, 0.0006941854953765869, 0.0007454752922058105, 0.0007967650890350342, 0.0008480548858642578, 0.0008993446826934814, 0.0009506344795227051, 0.0010019242763519287, 0.0010532140731811523, 0.001104503870010376, 0.0011557936668395996, 0.0012070834636688232, 0.0012583732604980469, 0.0013096630573272705, 0.0013609528541564941, 0.0014122426509857178, 0.0014635324478149414, 0.001514822244644165, 0.0015661120414733887, 0.0016174018383026123, 0.001668691635131836, 0.0017199814319610596, 0.0017712712287902832, 0.0018225610256195068, 0.0018738508224487305, 0.001925140619277954, 0.0019764304161071777, 0.0020277202129364014, 0.002079010009765625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 3.0, 5.0, 2.0, 6.0, 7.0, 11.0, 18.0, 23.0, 25.0, 45.0, 49.0, 66.0, 115.0, 137.0, 249.0, 373.0, 602.0, 1036.0, 1856.0, 3890.0, 9472.0, 34512.0, 315800.0, 602258.0, 54688.0, 13044.0, 4806.0, 2257.0, 1237.0, 703.0, 439.0, 245.0, 159.0, 112.0, 72.0, 63.0, 36.0, 32.0, 27.0, 17.0, 17.0, 5.0, 8.0, 7.0, 5.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.80078125, -6.6015625, -6.40234375, -6.203125, -6.00390625, -5.8046875, -5.60546875, -5.40625, -5.20703125, -5.0078125, -4.80859375, -4.609375, -4.41015625, -4.2109375, -4.01171875, -3.8125, -3.61328125, -3.4140625, -3.21484375, -3.015625, -2.81640625, -2.6171875, -2.41796875, -2.21875, -2.01953125, -1.8203125, -1.62109375, -1.421875, -1.22265625, -1.0234375, -0.82421875, -0.625, -0.42578125, -0.2265625, -0.02734375, 0.171875, 0.37109375, 0.5703125, 0.76953125, 0.96875, 1.16796875, 1.3671875, 1.56640625, 1.765625, 1.96484375, 2.1640625, 2.36328125, 2.5625, 2.76171875, 2.9609375, 3.16015625, 3.359375, 3.55859375, 3.7578125, 3.95703125, 4.15625, 4.35546875, 4.5546875, 4.75390625, 4.953125, 5.15234375, 5.3515625, 5.55078125, 5.75, 5.94921875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 12.0, 22.0, 23.0, 35.0, 67.0, 95.0, 152.0, 156.0, 140.0, 120.0, 73.0, 30.0, 21.0, 18.0, 5.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.53515625, -5.374267578125, -5.21337890625, -5.052490234375, -4.8916015625, -4.730712890625, -4.56982421875, -4.408935546875, -4.248046875, -4.087158203125, -3.92626953125, -3.765380859375, -3.6044921875, -3.443603515625, -3.28271484375, -3.121826171875, -2.9609375, -2.800048828125, -2.63916015625, -2.478271484375, -2.3173828125, -2.156494140625, -1.99560546875, -1.834716796875, -1.673828125, -1.512939453125, -1.35205078125, -1.191162109375, -1.0302734375, -0.869384765625, -0.70849609375, -0.547607421875, -0.38671875, -0.225830078125, -0.06494140625, 0.095947265625, 0.2568359375, 0.417724609375, 0.57861328125, 0.739501953125, 0.900390625, 1.061279296875, 1.22216796875, 1.383056640625, 1.5439453125, 1.704833984375, 1.86572265625, 2.026611328125, 2.1875, 2.348388671875, 2.50927734375, 2.670166015625, 2.8310546875, 2.991943359375, 3.15283203125, 3.313720703125, 3.474609375, 3.635498046875, 3.79638671875, 3.957275390625, 4.1181640625, 4.279052734375, 4.43994140625, 4.600830078125, 4.76171875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 5.0, 9.0, 10.0, 25.0, 52.0, 67.0, 123.0, 159.0, 166.0, 145.0, 103.0, 50.0, 36.0, 19.0, 6.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.5450553894043, -53.64915084838867, -51.75324630737305, -49.85734558105469, -47.96144104003906, -46.06553649902344, -44.16963195800781, -42.27372741699219, -40.37782287597656, -38.48191833496094, -36.58601379394531, -34.69010925292969, -32.79420852661133, -30.898303985595703, -29.002399444580078, -27.106494903564453, -25.210594177246094, -23.31468963623047, -21.418787002563477, -19.52288246154785, -17.62697982788086, -15.731075286865234, -13.83517074584961, -11.9392671585083, -10.043363571166992, -8.147459983825684, -6.251555919647217, -4.35565185546875, -2.4597482681274414, -0.5638446807861328, 1.3320598602294922, 3.227963447570801, 5.123863220214844, 7.019766807556152, 8.915670394897461, 10.811574935913086, 12.707478523254395, 14.603382110595703, 16.499286651611328, 18.395191192626953, 20.291093826293945, 22.18699836730957, 24.082901000976562, 25.978805541992188, 27.874710083007812, 29.770612716674805, 31.66651725769043, 33.56241989135742, 35.45832443237305, 37.35422897338867, 39.2501335144043, 41.146034240722656, 43.04193878173828, 44.937843322753906, 46.83374786376953, 48.729652404785156, 50.62555694580078, 52.521461486816406, 54.41736602783203, 56.313270568847656, 58.209171295166016, 60.10507583618164, 62.000980377197266, 63.89688491821289, 65.79278564453125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 4.0, 8.0, 11.0, 13.0, 17.0, 23.0, 40.0, 39.0, 37.0, 47.0, 54.0, 68.0, 52.0, 72.0, 60.0, 49.0, 60.0, 54.0, 49.0, 40.0, 37.0, 34.0, 31.0, 25.0, 13.0, 16.0, 7.0, 4.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.98017501831055, -39.67043685913086, -38.36069869995117, -37.05095672607422, -35.74121856689453, -34.431480407714844, -33.121742248535156, -31.81200408935547, -30.50226402282715, -29.19252586364746, -27.88278579711914, -26.573047637939453, -25.263309478759766, -23.953569412231445, -22.643831253051758, -21.334091186523438, -20.02435302734375, -18.714614868164062, -17.404874801635742, -16.095136642456055, -14.78539752960205, -13.475658416748047, -12.16592025756836, -10.856181144714355, -9.546442031860352, -8.236702919006348, -6.926964282989502, -5.617225646972656, -4.307486534118652, -2.9977474212646484, -1.6880087852478027, -0.37827014923095703, 0.9314651489257812, 2.241204023361206, 3.550942897796631, 4.860681533813477, 6.1704206466674805, 7.480159759521484, 8.789897918701172, 10.099637031555176, 11.40937614440918, 12.719115257263184, 14.028854370117188, 15.338592529296875, 16.648330688476562, 17.958070755004883, 19.26780891418457, 20.57754898071289, 21.887287139892578, 23.197025299072266, 24.506765365600586, 25.816503524780273, 27.126243591308594, 28.43598175048828, 29.74571990966797, 31.055458068847656, 32.365196228027344, 33.67493438720703, 34.98467254638672, 36.29441452026367, 37.60415267944336, 38.91389083862305, 40.223628997802734, 41.53336715698242, 42.843109130859375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 1.0, 10.0, 15.0, 18.0, 32.0, 46.0, 87.0, 139.0, 177.0, 330.0, 587.0, 1269.0, 3329.0, 9838.0, 35318.0, 381830.0, 3676283.0, 62423.0, 14023.0, 4409.0, 1773.0, 813.0, 404.0, 290.0, 175.0, 125.0, 107.0, 85.0, 60.0, 58.0, 43.0, 40.0, 39.0, 29.0, 22.0, 12.0, 18.0, 9.0, 7.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.796875, -13.113525390625, -12.43017578125, -11.746826171875, -11.0634765625, -10.380126953125, -9.69677734375, -9.013427734375, -8.330078125, -7.646728515625, -6.96337890625, -6.280029296875, -5.5966796875, -4.913330078125, -4.22998046875, -3.546630859375, -2.86328125, -2.179931640625, -1.49658203125, -0.813232421875, -0.1298828125, 0.553466796875, 1.23681640625, 1.920166015625, 2.603515625, 3.286865234375, 3.97021484375, 4.653564453125, 5.3369140625, 6.020263671875, 6.70361328125, 7.386962890625, 8.0703125, 8.753662109375, 9.43701171875, 10.120361328125, 10.8037109375, 11.487060546875, 12.17041015625, 12.853759765625, 13.537109375, 14.220458984375, 14.90380859375, 15.587158203125, 16.2705078125, 16.953857421875, 17.63720703125, 18.320556640625, 19.00390625, 19.687255859375, 20.37060546875, 21.053955078125, 21.7373046875, 22.420654296875, 23.10400390625, 23.787353515625, 24.470703125, 25.154052734375, 25.83740234375, 26.520751953125, 27.2041015625, 27.887451171875, 28.57080078125, 29.254150390625, 29.9375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 14.0, 28.0, 43.0, 69.0, 81.0, 109.0, 136.0, 125.0, 122.0, 99.0, 62.0, 54.0, 30.0, 13.0, 5.0, 6.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.072265625, -1.9786376953125, -1.885009765625, -1.7913818359375, -1.69775390625, -1.6041259765625, -1.510498046875, -1.4168701171875, -1.3232421875, -1.2296142578125, -1.135986328125, -1.0423583984375, -0.94873046875, -0.8551025390625, -0.761474609375, -0.6678466796875, -0.57421875, -0.4805908203125, -0.386962890625, -0.2933349609375, -0.19970703125, -0.1060791015625, -0.012451171875, 0.0811767578125, 0.1748046875, 0.2684326171875, 0.362060546875, 0.4556884765625, 0.54931640625, 0.6429443359375, 0.736572265625, 0.8302001953125, 0.923828125, 1.0174560546875, 1.111083984375, 1.2047119140625, 1.29833984375, 1.3919677734375, 1.485595703125, 1.5792236328125, 1.6728515625, 1.7664794921875, 1.860107421875, 1.9537353515625, 2.04736328125, 2.1409912109375, 2.234619140625, 2.3282470703125, 2.421875, 2.5155029296875, 2.609130859375, 2.7027587890625, 2.79638671875, 2.8900146484375, 2.983642578125, 3.0772705078125, 3.1708984375, 3.2645263671875, 3.358154296875, 3.4517822265625, 3.54541015625, 3.6390380859375, 3.732666015625, 3.8262939453125, 3.919921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 9.0, 12.0, 14.0, 20.0, 17.0, 31.0, 41.0, 71.0, 83.0, 111.0, 147.0, 205.0, 359.0, 676.0, 1616.0, 7244.0, 3629365.0, 544132.0, 6728.0, 1718.0, 661.0, 362.0, 202.0, 121.0, 84.0, 66.0, 46.0, 32.0, 28.0, 19.0, 12.0, 8.0, 7.0, 4.0, 6.0, 4.0, 2.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-86.3125, -83.912109375, -81.51171875, -79.111328125, -76.7109375, -74.310546875, -71.91015625, -69.509765625, -67.109375, -64.708984375, -62.30859375, -59.908203125, -57.5078125, -55.107421875, -52.70703125, -50.306640625, -47.90625, -45.505859375, -43.10546875, -40.705078125, -38.3046875, -35.904296875, -33.50390625, -31.103515625, -28.703125, -26.302734375, -23.90234375, -21.501953125, -19.1015625, -16.701171875, -14.30078125, -11.900390625, -9.5, -7.099609375, -4.69921875, -2.298828125, 0.1015625, 2.501953125, 4.90234375, 7.302734375, 9.703125, 12.103515625, 14.50390625, 16.904296875, 19.3046875, 21.705078125, 24.10546875, 26.505859375, 28.90625, 31.306640625, 33.70703125, 36.107421875, 38.5078125, 40.908203125, 43.30859375, 45.708984375, 48.109375, 50.509765625, 52.91015625, 55.310546875, 57.7109375, 60.111328125, 62.51171875, 64.912109375, 67.3125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 11.0, 40.0, 221.0, 3382.0, 325.0, 56.0, 15.0, 10.0, 7.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.375, -30.5615234375, -29.748046875, -28.9345703125, -28.12109375, -27.3076171875, -26.494140625, -25.6806640625, -24.8671875, -24.0537109375, -23.240234375, -22.4267578125, -21.61328125, -20.7998046875, -19.986328125, -19.1728515625, -18.359375, -17.5458984375, -16.732421875, -15.9189453125, -15.10546875, -14.2919921875, -13.478515625, -12.6650390625, -11.8515625, -11.0380859375, -10.224609375, -9.4111328125, -8.59765625, -7.7841796875, -6.970703125, -6.1572265625, -5.34375, -4.5302734375, -3.716796875, -2.9033203125, -2.08984375, -1.2763671875, -0.462890625, 0.3505859375, 1.1640625, 1.9775390625, 2.791015625, 3.6044921875, 4.41796875, 5.2314453125, 6.044921875, 6.8583984375, 7.671875, 8.4853515625, 9.298828125, 10.1123046875, 10.92578125, 11.7392578125, 12.552734375, 13.3662109375, 14.1796875, 14.9931640625, 15.806640625, 16.6201171875, 17.43359375, 18.2470703125, 19.060546875, 19.8740234375, 20.6875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 12.0, 29.0, 68.0, 263.0, 421.0, 131.0, 39.0, 13.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.414794921875, -147.69207763671875, -142.9693603515625, -138.2466278076172, -133.52391052246094, -128.8011932373047, -124.0784683227539, -119.35574340820312, -114.63302612304688, -109.91030883789062, -105.18758392333984, -100.46485900878906, -95.74214172363281, -91.01942443847656, -86.29669952392578, -81.573974609375, -76.85125732421875, -72.1285400390625, -67.40581512451172, -62.6830940246582, -57.96037292480469, -53.23765182495117, -48.514930725097656, -43.79220962524414, -39.069488525390625, -34.34676742553711, -29.624046325683594, -24.901325225830078, -20.178604125976562, -15.455883026123047, -10.733161926269531, -6.010440826416016, -1.2877197265625, 3.4350013732910156, 8.157722473144531, 12.880443572998047, 17.603164672851562, 22.325885772705078, 27.048606872558594, 31.77132797241211, 36.494049072265625, 41.21677017211914, 45.939491271972656, 50.66221237182617, 55.38493347167969, 60.1076545715332, 64.83037567138672, 69.5531005859375, 74.27581787109375, 78.99853515625, 83.72126007080078, 88.44398498535156, 93.16670227050781, 97.88941955566406, 102.61214447021484, 107.33486938476562, 112.05758666992188, 116.78030395507812, 121.5030288696289, 126.22575378417969, 130.94847106933594, 135.6711883544922, 140.3939208984375, 145.11663818359375, 149.83935546875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 7.0, 6.0, 13.0, 20.0, 29.0, 55.0, 69.0, 88.0, 126.0, 130.0, 136.0, 88.0, 97.0, 52.0, 33.0, 20.0, 14.0, 4.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.312744140625, -69.96802520751953, -67.6233139038086, -65.27859497070312, -62.93388366699219, -60.58916473388672, -58.244449615478516, -55.89973449707031, -53.55501937866211, -51.210304260253906, -48.8655891418457, -46.5208740234375, -44.17615509033203, -41.831443786621094, -39.486724853515625, -37.14200973510742, -34.79729461669922, -32.452579498291016, -30.107864379882812, -27.763147354125977, -25.418432235717773, -23.07371711730957, -20.729000091552734, -18.38428497314453, -16.039569854736328, -13.694854736328125, -11.350138664245605, -9.005422592163086, -6.660707473754883, -4.31599235534668, -1.9712762832641602, 0.3734397888183594, 2.7181472778320312, 5.062862873077393, 7.407578468322754, 9.752294540405273, 12.097009658813477, 14.44172477722168, 16.786441802978516, 19.13115692138672, 21.475872039794922, 23.820587158203125, 26.165302276611328, 28.510019302368164, 30.854734420776367, 33.19944763183594, 35.544166564941406, 37.88888168334961, 40.23359680175781, 42.578311920166016, 44.92302703857422, 47.26774215698242, 49.612457275390625, 51.957176208496094, 54.3018913269043, 56.6466064453125, 58.9913215637207, 61.336036682128906, 63.68075180053711, 66.02546691894531, 68.37018585205078, 70.71489715576172, 73.05961608886719, 75.40432739257812, 77.7490463256836]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 8.0, 10.0, 12.0, 23.0, 25.0, 30.0, 51.0, 71.0, 100.0, 179.0, 282.0, 467.0, 902.0, 2013.0, 5022.0, 18777.0, 149620.0, 763548.0, 85962.0, 13691.0, 4150.0, 1677.0, 814.0, 431.0, 210.0, 163.0, 99.0, 75.0, 42.0, 28.0, 18.0, 11.0, 9.0, 9.0, 5.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.40625, -22.66064453125, -21.9150390625, -21.16943359375, -20.423828125, -19.67822265625, -18.9326171875, -18.18701171875, -17.44140625, -16.69580078125, -15.9501953125, -15.20458984375, -14.458984375, -13.71337890625, -12.9677734375, -12.22216796875, -11.4765625, -10.73095703125, -9.9853515625, -9.23974609375, -8.494140625, -7.74853515625, -7.0029296875, -6.25732421875, -5.51171875, -4.76611328125, -4.0205078125, -3.27490234375, -2.529296875, -1.78369140625, -1.0380859375, -0.29248046875, 0.453125, 1.19873046875, 1.9443359375, 2.68994140625, 3.435546875, 4.18115234375, 4.9267578125, 5.67236328125, 6.41796875, 7.16357421875, 7.9091796875, 8.65478515625, 9.400390625, 10.14599609375, 10.8916015625, 11.63720703125, 12.3828125, 13.12841796875, 13.8740234375, 14.61962890625, 15.365234375, 16.11083984375, 16.8564453125, 17.60205078125, 18.34765625, 19.09326171875, 19.8388671875, 20.58447265625, 21.330078125, 22.07568359375, 22.8212890625, 23.56689453125, 24.3125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 12.0, 12.0, 31.0, 37.0, 53.0, 80.0, 84.0, 106.0, 124.0, 102.0, 89.0, 87.0, 63.0, 36.0, 36.0, 18.0, 7.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62890625, -2.512939453125, -2.39697265625, -2.281005859375, -2.1650390625, -2.049072265625, -1.93310546875, -1.817138671875, -1.701171875, -1.585205078125, -1.46923828125, -1.353271484375, -1.2373046875, -1.121337890625, -1.00537109375, -0.889404296875, -0.7734375, -0.657470703125, -0.54150390625, -0.425537109375, -0.3095703125, -0.193603515625, -0.07763671875, 0.038330078125, 0.154296875, 0.270263671875, 0.38623046875, 0.502197265625, 0.6181640625, 0.734130859375, 0.85009765625, 0.966064453125, 1.08203125, 1.197998046875, 1.31396484375, 1.429931640625, 1.5458984375, 1.661865234375, 1.77783203125, 1.893798828125, 2.009765625, 2.125732421875, 2.24169921875, 2.357666015625, 2.4736328125, 2.589599609375, 2.70556640625, 2.821533203125, 2.9375, 3.053466796875, 3.16943359375, 3.285400390625, 3.4013671875, 3.517333984375, 3.63330078125, 3.749267578125, 3.865234375, 3.981201171875, 4.09716796875, 4.213134765625, 4.3291015625, 4.445068359375, 4.56103515625, 4.677001953125, 4.79296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 11.0, 11.0, 22.0, 33.0, 41.0, 60.0, 98.0, 162.0, 264.0, 456.0, 865.0, 1778.0, 4263.0, 12906.0, 50361.0, 266713.0, 548785.0, 122132.0, 26297.0, 7507.0, 2835.0, 1329.0, 627.0, 383.0, 206.0, 145.0, 71.0, 67.0, 41.0, 21.0, 23.0, 13.0, 9.0, 6.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.96875, -10.6663818359375, -10.364013671875, -10.0616455078125, -9.75927734375, -9.4569091796875, -9.154541015625, -8.8521728515625, -8.5498046875, -8.2474365234375, -7.945068359375, -7.6427001953125, -7.34033203125, -7.0379638671875, -6.735595703125, -6.4332275390625, -6.130859375, -5.8284912109375, -5.526123046875, -5.2237548828125, -4.92138671875, -4.6190185546875, -4.316650390625, -4.0142822265625, -3.7119140625, -3.4095458984375, -3.107177734375, -2.8048095703125, -2.50244140625, -2.2000732421875, -1.897705078125, -1.5953369140625, -1.29296875, -0.9906005859375, -0.688232421875, -0.3858642578125, -0.08349609375, 0.2188720703125, 0.521240234375, 0.8236083984375, 1.1259765625, 1.4283447265625, 1.730712890625, 2.0330810546875, 2.33544921875, 2.6378173828125, 2.940185546875, 3.2425537109375, 3.544921875, 3.8472900390625, 4.149658203125, 4.4520263671875, 4.75439453125, 5.0567626953125, 5.359130859375, 5.6614990234375, 5.9638671875, 6.2662353515625, 6.568603515625, 6.8709716796875, 7.17333984375, 7.4757080078125, 7.778076171875, 8.0804443359375, 8.3828125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 9.0, 3.0, 5.0, 3.0, 1.0, 14.0, 16.0, 17.0, 14.0, 13.0, 16.0, 29.0, 33.0, 33.0, 40.0, 36.0, 39.0, 50.0, 44.0, 47.0, 31.0, 52.0, 32.0, 41.0, 49.0, 34.0, 45.0, 31.0, 34.0, 30.0, 29.0, 20.0, 24.0, 17.0, 7.0, 17.0, 9.0, 8.0, 8.0, 9.0, 9.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.62109375, -6.43310546875, -6.2451171875, -6.05712890625, -5.869140625, -5.68115234375, -5.4931640625, -5.30517578125, -5.1171875, -4.92919921875, -4.7412109375, -4.55322265625, -4.365234375, -4.17724609375, -3.9892578125, -3.80126953125, -3.61328125, -3.42529296875, -3.2373046875, -3.04931640625, -2.861328125, -2.67333984375, -2.4853515625, -2.29736328125, -2.109375, -1.92138671875, -1.7333984375, -1.54541015625, -1.357421875, -1.16943359375, -0.9814453125, -0.79345703125, -0.60546875, -0.41748046875, -0.2294921875, -0.04150390625, 0.146484375, 0.33447265625, 0.5224609375, 0.71044921875, 0.8984375, 1.08642578125, 1.2744140625, 1.46240234375, 1.650390625, 1.83837890625, 2.0263671875, 2.21435546875, 2.40234375, 2.59033203125, 2.7783203125, 2.96630859375, 3.154296875, 3.34228515625, 3.5302734375, 3.71826171875, 3.90625, 4.09423828125, 4.2822265625, 4.47021484375, 4.658203125, 4.84619140625, 5.0341796875, 5.22216796875, 5.41015625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 15.0, 10.0, 6.0, 21.0, 23.0, 40.0, 39.0, 104.0, 182.0, 305.0, 736.0, 1557.0, 3960.0, 11483.0, 53627.0, 705720.0, 232382.0, 26221.0, 7281.0, 2660.0, 1079.0, 526.0, 255.0, 131.0, 60.0, 36.0, 29.0, 24.0, 12.0, 8.0, 5.0, 6.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.7578125, -10.396728515625, -10.03564453125, -9.674560546875, -9.3134765625, -8.952392578125, -8.59130859375, -8.230224609375, -7.869140625, -7.508056640625, -7.14697265625, -6.785888671875, -6.4248046875, -6.063720703125, -5.70263671875, -5.341552734375, -4.98046875, -4.619384765625, -4.25830078125, -3.897216796875, -3.5361328125, -3.175048828125, -2.81396484375, -2.452880859375, -2.091796875, -1.730712890625, -1.36962890625, -1.008544921875, -0.6474609375, -0.286376953125, 0.07470703125, 0.435791015625, 0.796875, 1.157958984375, 1.51904296875, 1.880126953125, 2.2412109375, 2.602294921875, 2.96337890625, 3.324462890625, 3.685546875, 4.046630859375, 4.40771484375, 4.768798828125, 5.1298828125, 5.490966796875, 5.85205078125, 6.213134765625, 6.57421875, 6.935302734375, 7.29638671875, 7.657470703125, 8.0185546875, 8.379638671875, 8.74072265625, 9.101806640625, 9.462890625, 9.823974609375, 10.18505859375, 10.546142578125, 10.9072265625, 11.268310546875, 11.62939453125, 11.990478515625, 12.3515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 8.0, 7.0, 4.0, 14.0, 9.0, 22.0, 21.0, 39.0, 82.0, 146.0, 275.0, 165.0, 85.0, 50.0, 20.0, 19.0, 13.0, 9.0, 7.0, 2.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014009475708007812, -0.0013498961925506592, -0.0012988448143005371, -0.001247793436050415, -0.001196742057800293, -0.001145690679550171, -0.0010946393013000488, -0.0010435879230499268, -0.0009925365447998047, -0.0009414851665496826, -0.0008904337882995605, -0.0008393824100494385, -0.0007883310317993164, -0.0007372796535491943, -0.0006862282752990723, -0.0006351768970489502, -0.0005841255187988281, -0.0005330741405487061, -0.000482022762298584, -0.0004309713840484619, -0.00037992000579833984, -0.0003288686275482178, -0.0002778172492980957, -0.00022676587104797363, -0.00017571449279785156, -0.0001246631145477295, -7.361173629760742e-05, -2.256035804748535e-05, 2.849102020263672e-05, 7.954239845275879e-05, 0.00013059377670288086, 0.00018164515495300293, 0.000232696533203125, 0.00028374791145324707, 0.00033479928970336914, 0.0003858506679534912, 0.0004369020462036133, 0.00048795342445373535, 0.0005390048027038574, 0.0005900561809539795, 0.0006411075592041016, 0.0006921589374542236, 0.0007432103157043457, 0.0007942616939544678, 0.0008453130722045898, 0.0008963644504547119, 0.000947415828704834, 0.000998467206954956, 0.0010495185852050781, 0.0011005699634552002, 0.0011516213417053223, 0.0012026727199554443, 0.0012537240982055664, 0.0013047754764556885, 0.0013558268547058105, 0.0014068782329559326, 0.0014579296112060547, 0.0015089809894561768, 0.0015600323677062988, 0.001611083745956421, 0.001662135124206543, 0.001713186502456665, 0.0017642378807067871, 0.0018152892589569092, 0.0018663406372070312]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 10.0, 16.0, 17.0, 21.0, 43.0, 45.0, 93.0, 115.0, 138.0, 247.0, 399.0, 655.0, 1125.0, 1875.0, 3469.0, 6921.0, 17405.0, 66033.0, 691496.0, 205334.0, 31509.0, 10831.0, 4743.0, 2463.0, 1388.0, 748.0, 474.0, 287.0, 194.0, 113.0, 103.0, 63.0, 42.0, 29.0, 19.0, 20.0, 21.0, 9.0, 9.0, 5.0, 8.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.359375, -9.0447998046875, -8.730224609375, -8.4156494140625, -8.10107421875, -7.7864990234375, -7.471923828125, -7.1573486328125, -6.8427734375, -6.5281982421875, -6.213623046875, -5.8990478515625, -5.58447265625, -5.2698974609375, -4.955322265625, -4.6407470703125, -4.326171875, -4.0115966796875, -3.697021484375, -3.3824462890625, -3.06787109375, -2.7532958984375, -2.438720703125, -2.1241455078125, -1.8095703125, -1.4949951171875, -1.180419921875, -0.8658447265625, -0.55126953125, -0.2366943359375, 0.077880859375, 0.3924560546875, 0.70703125, 1.0216064453125, 1.336181640625, 1.6507568359375, 1.96533203125, 2.2799072265625, 2.594482421875, 2.9090576171875, 3.2236328125, 3.5382080078125, 3.852783203125, 4.1673583984375, 4.48193359375, 4.7965087890625, 5.111083984375, 5.4256591796875, 5.740234375, 6.0548095703125, 6.369384765625, 6.6839599609375, 6.99853515625, 7.3131103515625, 7.627685546875, 7.9422607421875, 8.2568359375, 8.5714111328125, 8.885986328125, 9.2005615234375, 9.51513671875, 9.8297119140625, 10.144287109375, 10.4588623046875, 10.7734375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 8.0, 12.0, 8.0, 9.0, 17.0, 26.0, 32.0, 44.0, 71.0, 88.0, 155.0, 161.0, 108.0, 59.0, 38.0, 38.0, 27.0, 17.0, 11.0, 8.0, 4.0, 8.0, 6.0, 5.0, 5.0, 0.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1328125, -4.94976806640625, -4.7667236328125, -4.58367919921875, -4.400634765625, -4.21759033203125, -4.0345458984375, -3.85150146484375, -3.66845703125, -3.48541259765625, -3.3023681640625, -3.11932373046875, -2.936279296875, -2.75323486328125, -2.5701904296875, -2.38714599609375, -2.2041015625, -2.02105712890625, -1.8380126953125, -1.65496826171875, -1.471923828125, -1.28887939453125, -1.1058349609375, -0.92279052734375, -0.73974609375, -0.55670166015625, -0.3736572265625, -0.19061279296875, -0.007568359375, 0.17547607421875, 0.3585205078125, 0.54156494140625, 0.724609375, 0.90765380859375, 1.0906982421875, 1.27374267578125, 1.456787109375, 1.63983154296875, 1.8228759765625, 2.00592041015625, 2.18896484375, 2.37200927734375, 2.5550537109375, 2.73809814453125, 2.921142578125, 3.10418701171875, 3.2872314453125, 3.47027587890625, 3.6533203125, 3.83636474609375, 4.0194091796875, 4.20245361328125, 4.385498046875, 4.56854248046875, 4.7515869140625, 4.93463134765625, 5.11767578125, 5.30072021484375, 5.4837646484375, 5.66680908203125, 5.849853515625, 6.03289794921875, 6.2159423828125, 6.39898681640625, 6.58203125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 18.0, 32.0, 85.0, 146.0, 236.0, 248.0, 134.0, 60.0, 20.0, 8.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.59862518310547, -67.8323974609375, -64.06616973876953, -60.2999382019043, -56.53370666503906, -52.767478942871094, -49.001251220703125, -45.235023498535156, -41.46879196166992, -37.70256423950195, -33.93633270263672, -30.17010498046875, -26.40387535095215, -22.637645721435547, -18.871417999267578, -15.105188369750977, -11.338958740234375, -7.572729587554932, -3.8065004348754883, -0.040271759033203125, 3.7259578704833984, 7.4921875, 11.258415222167969, 15.02464485168457, 18.790874481201172, 22.557104110717773, 26.323333740234375, 30.089561462402344, 33.85578918457031, 37.62202072143555, 41.388248443603516, 45.15447998046875, 48.92070007324219, 52.686927795410156, 56.45315933227539, 60.21938705444336, 63.985618591308594, 67.75184631347656, 71.51807403564453, 75.2843017578125, 79.050537109375, 82.81676483154297, 86.58299255371094, 90.34922790527344, 94.1154556274414, 97.88168334960938, 101.64791107177734, 105.41413879394531, 109.18036651611328, 112.94659423828125, 116.71282196044922, 120.47904968261719, 124.24528503417969, 128.01150512695312, 131.77774047851562, 135.54397583007812, 139.31019592285156, 143.07643127441406, 146.8426513671875, 150.60888671875, 154.37510681152344, 158.14134216308594, 161.90756225585938, 165.67379760742188, 169.44003295898438]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 10.0, 6.0, 9.0, 7.0, 11.0, 12.0, 11.0, 10.0, 10.0, 26.0, 19.0, 31.0, 33.0, 31.0, 30.0, 28.0, 30.0, 31.0, 37.0, 48.0, 43.0, 57.0, 30.0, 47.0, 36.0, 33.0, 30.0, 40.0, 28.0, 34.0, 25.0, 26.0, 16.0, 23.0, 16.0, 14.0, 13.0, 11.0, 9.0, 10.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-35.5597038269043, -34.491065979003906, -33.422428131103516, -32.35379409790039, -31.28515625, -30.21651840209961, -29.14788055419922, -28.079242706298828, -27.01060676574707, -25.94196891784668, -24.873332977294922, -23.80469512939453, -22.73605728149414, -21.667421340942383, -20.598783493041992, -19.530147552490234, -18.461509704589844, -17.392871856689453, -16.324235916137695, -15.255598068237305, -14.18696117401123, -13.118324279785156, -12.049686431884766, -10.981049537658691, -9.912412643432617, -8.843775749206543, -7.7751383781433105, -6.706501007080078, -5.637864112854004, -4.56922721862793, -3.5005898475646973, -2.431952476501465, -1.3633193969726562, -0.29468226432800293, 0.7739548683166504, 1.8425920009613037, 2.911229133605957, 3.9798660278320312, 5.048503398895264, 6.117140769958496, 7.18577766418457, 8.254414558410645, 9.323051452636719, 10.39168930053711, 11.460326194763184, 12.528963088989258, 13.597600936889648, 14.666237831115723, 15.734874725341797, 16.803512573242188, 17.872148513793945, 18.940786361694336, 20.009422302246094, 21.078060150146484, 22.146697998046875, 23.215335845947266, 24.283971786499023, 25.352609634399414, 26.421245574951172, 27.489883422851562, 28.558521270751953, 29.62715721130371, 30.6957950592041, 31.76443099975586, 32.83306884765625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 9.0, 12.0, 9.0, 14.0, 35.0, 54.0, 100.0, 150.0, 342.0, 706.0, 1682.0, 4877.0, 23646.0, 4048870.0, 98935.0, 10037.0, 2602.0, 970.0, 485.0, 254.0, 155.0, 105.0, 77.0, 41.0, 30.0, 27.0, 13.0, 13.0, 9.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.875, -37.2392578125, -35.603515625, -33.9677734375, -32.33203125, -30.6962890625, -29.060546875, -27.4248046875, -25.7890625, -24.1533203125, -22.517578125, -20.8818359375, -19.24609375, -17.6103515625, -15.974609375, -14.3388671875, -12.703125, -11.0673828125, -9.431640625, -7.7958984375, -6.16015625, -4.5244140625, -2.888671875, -1.2529296875, 0.3828125, 2.0185546875, 3.654296875, 5.2900390625, 6.92578125, 8.5615234375, 10.197265625, 11.8330078125, 13.46875, 15.1044921875, 16.740234375, 18.3759765625, 20.01171875, 21.6474609375, 23.283203125, 24.9189453125, 26.5546875, 28.1904296875, 29.826171875, 31.4619140625, 33.09765625, 34.7333984375, 36.369140625, 38.0048828125, 39.640625, 41.2763671875, 42.912109375, 44.5478515625, 46.18359375, 47.8193359375, 49.455078125, 51.0908203125, 52.7265625, 54.3623046875, 55.998046875, 57.6337890625, 59.26953125, 60.9052734375, 62.541015625, 64.1767578125, 65.8125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 7.0, 19.0, 18.0, 36.0, 44.0, 45.0, 75.0, 92.0, 79.0, 84.0, 108.0, 81.0, 76.0, 68.0, 44.0, 34.0, 23.0, 23.0, 12.0, 5.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.471466064453125, -2.36285400390625, -2.254241943359375, -2.1456298828125, -2.037017822265625, -1.92840576171875, -1.819793701171875, -1.711181640625, -1.602569580078125, -1.49395751953125, -1.385345458984375, -1.2767333984375, -1.168121337890625, -1.05950927734375, -0.950897216796875, -0.84228515625, -0.733673095703125, -0.62506103515625, -0.516448974609375, -0.4078369140625, -0.299224853515625, -0.19061279296875, -0.082000732421875, 0.026611328125, 0.135223388671875, 0.24383544921875, 0.352447509765625, 0.4610595703125, 0.569671630859375, 0.67828369140625, 0.786895751953125, 0.8955078125, 1.004119873046875, 1.11273193359375, 1.221343994140625, 1.3299560546875, 1.438568115234375, 1.54718017578125, 1.655792236328125, 1.764404296875, 1.873016357421875, 1.98162841796875, 2.090240478515625, 2.1988525390625, 2.307464599609375, 2.41607666015625, 2.524688720703125, 2.63330078125, 2.741912841796875, 2.85052490234375, 2.959136962890625, 3.0677490234375, 3.176361083984375, 3.28497314453125, 3.393585205078125, 3.502197265625, 3.610809326171875, 3.71942138671875, 3.828033447265625, 3.9366455078125, 4.045257568359375, 4.15386962890625, 4.262481689453125, 4.37109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 12.0, 3.0, 12.0, 11.0, 10.0, 24.0, 24.0, 36.0, 54.0, 53.0, 66.0, 90.0, 102.0, 138.0, 313.0, 1110.0, 7117.0, 232341.0, 3938987.0, 11323.0, 1430.0, 357.0, 146.0, 107.0, 79.0, 81.0, 57.0, 48.0, 34.0, 19.0, 25.0, 14.0, 19.0, 13.0, 4.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.65625, -59.7939453125, -57.931640625, -56.0693359375, -54.20703125, -52.3447265625, -50.482421875, -48.6201171875, -46.7578125, -44.8955078125, -43.033203125, -41.1708984375, -39.30859375, -37.4462890625, -35.583984375, -33.7216796875, -31.859375, -29.9970703125, -28.134765625, -26.2724609375, -24.41015625, -22.5478515625, -20.685546875, -18.8232421875, -16.9609375, -15.0986328125, -13.236328125, -11.3740234375, -9.51171875, -7.6494140625, -5.787109375, -3.9248046875, -2.0625, -0.2001953125, 1.662109375, 3.5244140625, 5.38671875, 7.2490234375, 9.111328125, 10.9736328125, 12.8359375, 14.6982421875, 16.560546875, 18.4228515625, 20.28515625, 22.1474609375, 24.009765625, 25.8720703125, 27.734375, 29.5966796875, 31.458984375, 33.3212890625, 35.18359375, 37.0458984375, 38.908203125, 40.7705078125, 42.6328125, 44.4951171875, 46.357421875, 48.2197265625, 50.08203125, 51.9443359375, 53.806640625, 55.6689453125, 57.53125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 13.0, 14.0, 37.0, 125.0, 3266.0, 527.0, 61.0, 24.0, 13.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.375, -25.657958984375, -24.94091796875, -24.223876953125, -23.5068359375, -22.789794921875, -22.07275390625, -21.355712890625, -20.638671875, -19.921630859375, -19.20458984375, -18.487548828125, -17.7705078125, -17.053466796875, -16.33642578125, -15.619384765625, -14.90234375, -14.185302734375, -13.46826171875, -12.751220703125, -12.0341796875, -11.317138671875, -10.60009765625, -9.883056640625, -9.166015625, -8.448974609375, -7.73193359375, -7.014892578125, -6.2978515625, -5.580810546875, -4.86376953125, -4.146728515625, -3.4296875, -2.712646484375, -1.99560546875, -1.278564453125, -0.5615234375, 0.155517578125, 0.87255859375, 1.589599609375, 2.306640625, 3.023681640625, 3.74072265625, 4.457763671875, 5.1748046875, 5.891845703125, 6.60888671875, 7.325927734375, 8.04296875, 8.760009765625, 9.47705078125, 10.194091796875, 10.9111328125, 11.628173828125, 12.34521484375, 13.062255859375, 13.779296875, 14.496337890625, 15.21337890625, 15.930419921875, 16.6474609375, 17.364501953125, 18.08154296875, 18.798583984375, 19.515625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 9.0, 10.0, 40.0, 43.0, 112.0, 224.0, 325.0, 137.0, 55.0, 19.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.91889190673828, -76.21824645996094, -73.5176010131836, -70.81695556640625, -68.1163101196289, -65.41566467285156, -62.71501922607422, -60.014373779296875, -57.31372833251953, -54.61308288574219, -51.912437438964844, -49.2117919921875, -46.511146545410156, -43.81050109863281, -41.10985565185547, -38.409210205078125, -35.70856475830078, -33.00791931152344, -30.307273864746094, -27.60662841796875, -24.905982971191406, -22.205337524414062, -19.50469207763672, -16.804046630859375, -14.103401184082031, -11.402755737304688, -8.702110290527344, -6.00146484375, -3.3008193969726562, -0.6001739501953125, 2.1004714965820312, 4.801116943359375, 7.5017547607421875, 10.202400207519531, 12.903045654296875, 15.603691101074219, 18.304336547851562, 21.004981994628906, 23.70562744140625, 26.406272888183594, 29.106918334960938, 31.80756378173828, 34.508209228515625, 37.20885467529297, 39.90950012207031, 42.610145568847656, 45.310791015625, 48.011436462402344, 50.71208190917969, 53.41272735595703, 56.113372802734375, 58.81401824951172, 61.51466369628906, 64.2153091430664, 66.91595458984375, 69.6166000366211, 72.31724548339844, 75.01789093017578, 77.71853637695312, 80.41918182373047, 83.11982727050781, 85.82047271728516, 88.5211181640625, 91.22176361083984, 93.92240905761719]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 8.0, 19.0, 22.0, 33.0, 42.0, 54.0, 67.0, 71.0, 83.0, 72.0, 86.0, 87.0, 84.0, 60.0, 56.0, 42.0, 34.0, 20.0, 18.0, 3.0, 10.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.62874221801758, -37.190574645996094, -35.752403259277344, -34.31423568725586, -32.876068115234375, -31.437896728515625, -29.99972915649414, -28.561559677124023, -27.123390197753906, -25.68522071838379, -24.247051239013672, -22.808883666992188, -21.37071418762207, -19.932544708251953, -18.49437713623047, -17.05620765686035, -15.618038177490234, -14.179868698120117, -12.741700172424316, -11.303531646728516, -9.865362167358398, -8.427192687988281, -6.9890241622924805, -5.55085563659668, -4.1126861572265625, -2.6745171546936035, -1.2363481521606445, 0.20182085037231445, 1.6399898529052734, 3.0781588554382324, 4.516327857971191, 5.954496383666992, 7.392669677734375, 8.830839157104492, 10.269007682800293, 11.707176208496094, 13.145345687866211, 14.583515167236328, 16.021682739257812, 17.45985221862793, 18.898021697998047, 20.336191177368164, 21.77436065673828, 23.212528228759766, 24.650697708129883, 26.0888671875, 27.527034759521484, 28.9652042388916, 30.40337371826172, 31.841543197631836, 33.27971267700195, 34.71788024902344, 36.15605163574219, 37.59421920776367, 39.032386779785156, 40.470558166503906, 41.90872573852539, 43.346893310546875, 44.785064697265625, 46.22323226928711, 47.661399841308594, 49.099571228027344, 50.53773880004883, 51.97590637207031, 53.41407775878906]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 14.0, 17.0, 21.0, 26.0, 46.0, 58.0, 120.0, 177.0, 358.0, 690.0, 1555.0, 4025.0, 15537.0, 126943.0, 788970.0, 90816.0, 12903.0, 3539.0, 1293.0, 666.0, 314.0, 175.0, 103.0, 55.0, 33.0, 29.0, 19.0, 9.0, 8.0, 6.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71875, -23.6640625, -22.609375, -21.5546875, -20.5, -19.4453125, -18.390625, -17.3359375, -16.28125, -15.2265625, -14.171875, -13.1171875, -12.0625, -11.0078125, -9.953125, -8.8984375, -7.84375, -6.7890625, -5.734375, -4.6796875, -3.625, -2.5703125, -1.515625, -0.4609375, 0.59375, 1.6484375, 2.703125, 3.7578125, 4.8125, 5.8671875, 6.921875, 7.9765625, 9.03125, 10.0859375, 11.140625, 12.1953125, 13.25, 14.3046875, 15.359375, 16.4140625, 17.46875, 18.5234375, 19.578125, 20.6328125, 21.6875, 22.7421875, 23.796875, 24.8515625, 25.90625, 26.9609375, 28.015625, 29.0703125, 30.125, 31.1796875, 32.234375, 33.2890625, 34.34375, 35.3984375, 36.453125, 37.5078125, 38.5625, 39.6171875, 40.671875, 41.7265625, 42.78125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 3.0, 16.0, 10.0, 20.0, 29.0, 33.0, 44.0, 47.0, 47.0, 80.0, 75.0, 80.0, 91.0, 98.0, 68.0, 66.0, 49.0, 43.0, 29.0, 21.0, 14.0, 12.0, 8.0, 8.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.13671875, -3.010986328125, -2.88525390625, -2.759521484375, -2.6337890625, -2.508056640625, -2.38232421875, -2.256591796875, -2.130859375, -2.005126953125, -1.87939453125, -1.753662109375, -1.6279296875, -1.502197265625, -1.37646484375, -1.250732421875, -1.125, -0.999267578125, -0.87353515625, -0.747802734375, -0.6220703125, -0.496337890625, -0.37060546875, -0.244873046875, -0.119140625, 0.006591796875, 0.13232421875, 0.258056640625, 0.3837890625, 0.509521484375, 0.63525390625, 0.760986328125, 0.88671875, 1.012451171875, 1.13818359375, 1.263916015625, 1.3896484375, 1.515380859375, 1.64111328125, 1.766845703125, 1.892578125, 2.018310546875, 2.14404296875, 2.269775390625, 2.3955078125, 2.521240234375, 2.64697265625, 2.772705078125, 2.8984375, 3.024169921875, 3.14990234375, 3.275634765625, 3.4013671875, 3.527099609375, 3.65283203125, 3.778564453125, 3.904296875, 4.030029296875, 4.15576171875, 4.281494140625, 4.4072265625, 4.532958984375, 4.65869140625, 4.784423828125, 4.91015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 4.0, 6.0, 4.0, 4.0, 7.0, 9.0, 13.0, 16.0, 24.0, 22.0, 43.0, 59.0, 75.0, 101.0, 132.0, 202.0, 269.0, 474.0, 772.0, 1425.0, 2890.0, 6907.0, 18384.0, 64644.0, 364373.0, 467773.0, 82737.0, 22041.0, 7868.0, 3336.0, 1591.0, 843.0, 466.0, 307.0, 209.0, 146.0, 111.0, 76.0, 50.0, 35.0, 23.0, 25.0, 23.0, 11.0, 7.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.0703125, -12.6048583984375, -12.139404296875, -11.6739501953125, -11.20849609375, -10.7430419921875, -10.277587890625, -9.8121337890625, -9.3466796875, -8.8812255859375, -8.415771484375, -7.9503173828125, -7.48486328125, -7.0194091796875, -6.553955078125, -6.0885009765625, -5.623046875, -5.1575927734375, -4.692138671875, -4.2266845703125, -3.76123046875, -3.2957763671875, -2.830322265625, -2.3648681640625, -1.8994140625, -1.4339599609375, -0.968505859375, -0.5030517578125, -0.03759765625, 0.4278564453125, 0.893310546875, 1.3587646484375, 1.82421875, 2.2896728515625, 2.755126953125, 3.2205810546875, 3.68603515625, 4.1514892578125, 4.616943359375, 5.0823974609375, 5.5478515625, 6.0133056640625, 6.478759765625, 6.9442138671875, 7.40966796875, 7.8751220703125, 8.340576171875, 8.8060302734375, 9.271484375, 9.7369384765625, 10.202392578125, 10.6678466796875, 11.13330078125, 11.5987548828125, 12.064208984375, 12.5296630859375, 12.9951171875, 13.4605712890625, 13.926025390625, 14.3914794921875, 14.85693359375, 15.3223876953125, 15.787841796875, 16.2532958984375, 16.71875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 9.0, 6.0, 14.0, 11.0, 7.0, 13.0, 15.0, 26.0, 31.0, 29.0, 36.0, 43.0, 46.0, 50.0, 46.0, 44.0, 43.0, 50.0, 42.0, 42.0, 50.0, 39.0, 39.0, 46.0, 36.0, 31.0, 27.0, 22.0, 14.0, 25.0, 9.0, 13.0, 7.0, 6.0, 8.0, 4.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-12.0078125, -11.66015625, -11.3125, -10.96484375, -10.6171875, -10.26953125, -9.921875, -9.57421875, -9.2265625, -8.87890625, -8.53125, -8.18359375, -7.8359375, -7.48828125, -7.140625, -6.79296875, -6.4453125, -6.09765625, -5.75, -5.40234375, -5.0546875, -4.70703125, -4.359375, -4.01171875, -3.6640625, -3.31640625, -2.96875, -2.62109375, -2.2734375, -1.92578125, -1.578125, -1.23046875, -0.8828125, -0.53515625, -0.1875, 0.16015625, 0.5078125, 0.85546875, 1.203125, 1.55078125, 1.8984375, 2.24609375, 2.59375, 2.94140625, 3.2890625, 3.63671875, 3.984375, 4.33203125, 4.6796875, 5.02734375, 5.375, 5.72265625, 6.0703125, 6.41796875, 6.765625, 7.11328125, 7.4609375, 7.80859375, 8.15625, 8.50390625, 8.8515625, 9.19921875, 9.546875, 9.89453125, 10.2421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 12.0, 13.0, 20.0, 49.0, 84.0, 213.0, 608.0, 2035.0, 8509.0, 162557.0, 852730.0, 17145.0, 3037.0, 961.0, 315.0, 127.0, 62.0, 19.0, 14.0, 16.0, 11.0, 10.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.90625, -43.62939453125, -42.3525390625, -41.07568359375, -39.798828125, -38.52197265625, -37.2451171875, -35.96826171875, -34.69140625, -33.41455078125, -32.1376953125, -30.86083984375, -29.583984375, -28.30712890625, -27.0302734375, -25.75341796875, -24.4765625, -23.19970703125, -21.9228515625, -20.64599609375, -19.369140625, -18.09228515625, -16.8154296875, -15.53857421875, -14.26171875, -12.98486328125, -11.7080078125, -10.43115234375, -9.154296875, -7.87744140625, -6.6005859375, -5.32373046875, -4.046875, -2.77001953125, -1.4931640625, -0.21630859375, 1.060546875, 2.33740234375, 3.6142578125, 4.89111328125, 6.16796875, 7.44482421875, 8.7216796875, 9.99853515625, 11.275390625, 12.55224609375, 13.8291015625, 15.10595703125, 16.3828125, 17.65966796875, 18.9365234375, 20.21337890625, 21.490234375, 22.76708984375, 24.0439453125, 25.32080078125, 26.59765625, 27.87451171875, 29.1513671875, 30.42822265625, 31.705078125, 32.98193359375, 34.2587890625, 35.53564453125, 36.8125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 11.0, 9.0, 14.0, 26.0, 39.0, 77.0, 153.0, 253.0, 177.0, 105.0, 50.0, 29.0, 18.0, 13.0, 7.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002849578857421875, -0.0027566850185394287, -0.0026637911796569824, -0.002570897340774536, -0.00247800350189209, -0.0023851096630096436, -0.0022922158241271973, -0.002199321985244751, -0.0021064281463623047, -0.0020135343074798584, -0.0019206404685974121, -0.0018277466297149658, -0.0017348527908325195, -0.0016419589519500732, -0.001549065113067627, -0.0014561712741851807, -0.0013632774353027344, -0.001270383596420288, -0.0011774897575378418, -0.0010845959186553955, -0.0009917020797729492, -0.0008988082408905029, -0.0008059144020080566, -0.0007130205631256104, -0.0006201267242431641, -0.0005272328853607178, -0.0004343390464782715, -0.0003414452075958252, -0.0002485513687133789, -0.00015565752983093262, -6.276369094848633e-05, 3.013014793395996e-05, 0.00012302398681640625, 0.00021591782569885254, 0.00030881166458129883, 0.0004017055034637451, 0.0004945993423461914, 0.0005874931812286377, 0.000680387020111084, 0.0007732808589935303, 0.0008661746978759766, 0.0009590685367584229, 0.0010519623756408691, 0.0011448562145233154, 0.0012377500534057617, 0.001330643892288208, 0.0014235377311706543, 0.0015164315700531006, 0.0016093254089355469, 0.0017022192478179932, 0.0017951130867004395, 0.0018880069255828857, 0.001980900764465332, 0.0020737946033477783, 0.0021666884422302246, 0.002259582281112671, 0.002352476119995117, 0.0024453699588775635, 0.0025382637977600098, 0.002631157636642456, 0.0027240514755249023, 0.0028169453144073486, 0.002909839153289795, 0.003002732992172241, 0.0030956268310546875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 8.0, 2.0, 10.0, 8.0, 13.0, 18.0, 19.0, 34.0, 48.0, 55.0, 88.0, 133.0, 185.0, 298.0, 567.0, 939.0, 1853.0, 3763.0, 8796.0, 24662.0, 118028.0, 741013.0, 108190.0, 23248.0, 8754.0, 3772.0, 1749.0, 904.0, 530.0, 297.0, 191.0, 120.0, 82.0, 51.0, 34.0, 22.0, 24.0, 14.0, 11.0, 5.0, 7.0, 1.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.1484375, -13.6141357421875, -13.079833984375, -12.5455322265625, -12.01123046875, -11.4769287109375, -10.942626953125, -10.4083251953125, -9.8740234375, -9.3397216796875, -8.805419921875, -8.2711181640625, -7.73681640625, -7.2025146484375, -6.668212890625, -6.1339111328125, -5.599609375, -5.0653076171875, -4.531005859375, -3.9967041015625, -3.46240234375, -2.9281005859375, -2.393798828125, -1.8594970703125, -1.3251953125, -0.7908935546875, -0.256591796875, 0.2777099609375, 0.81201171875, 1.3463134765625, 1.880615234375, 2.4149169921875, 2.94921875, 3.4835205078125, 4.017822265625, 4.5521240234375, 5.08642578125, 5.6207275390625, 6.155029296875, 6.6893310546875, 7.2236328125, 7.7579345703125, 8.292236328125, 8.8265380859375, 9.36083984375, 9.8951416015625, 10.429443359375, 10.9637451171875, 11.498046875, 12.0323486328125, 12.566650390625, 13.1009521484375, 13.63525390625, 14.1695556640625, 14.703857421875, 15.2381591796875, 15.7724609375, 16.3067626953125, 16.841064453125, 17.3753662109375, 17.90966796875, 18.4439697265625, 18.978271484375, 19.5125732421875, 20.046875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 1.0, 7.0, 10.0, 8.0, 12.0, 16.0, 12.0, 20.0, 37.0, 33.0, 74.0, 102.0, 134.0, 129.0, 113.0, 81.0, 52.0, 39.0, 29.0, 19.0, 16.0, 6.0, 12.0, 5.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2421875, -9.851806640625, -9.46142578125, -9.071044921875, -8.6806640625, -8.290283203125, -7.89990234375, -7.509521484375, -7.119140625, -6.728759765625, -6.33837890625, -5.947998046875, -5.5576171875, -5.167236328125, -4.77685546875, -4.386474609375, -3.99609375, -3.605712890625, -3.21533203125, -2.824951171875, -2.4345703125, -2.044189453125, -1.65380859375, -1.263427734375, -0.873046875, -0.482666015625, -0.09228515625, 0.298095703125, 0.6884765625, 1.078857421875, 1.46923828125, 1.859619140625, 2.25, 2.640380859375, 3.03076171875, 3.421142578125, 3.8115234375, 4.201904296875, 4.59228515625, 4.982666015625, 5.373046875, 5.763427734375, 6.15380859375, 6.544189453125, 6.9345703125, 7.324951171875, 7.71533203125, 8.105712890625, 8.49609375, 8.886474609375, 9.27685546875, 9.667236328125, 10.0576171875, 10.447998046875, 10.83837890625, 11.228759765625, 11.619140625, 12.009521484375, 12.39990234375, 12.790283203125, 13.1806640625, 13.571044921875, 13.96142578125, 14.351806640625, 14.7421875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 11.0, 34.0, 56.0, 136.0, 247.0, 288.0, 143.0, 49.0, 15.0, 11.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-200.71292114257812, -192.77993774414062, -184.84695434570312, -176.91397094726562, -168.98098754882812, -161.04800415039062, -153.11502075195312, -145.18203735351562, -137.24905395507812, -129.31607055664062, -121.38308715820312, -113.45010375976562, -105.51712036132812, -97.58413696289062, -89.65115356445312, -81.71817016601562, -73.7851791381836, -65.8521957397461, -57.919212341308594, -49.986228942871094, -42.053245544433594, -34.12025833129883, -26.187274932861328, -18.254291534423828, -10.321308135986328, -2.38832426071167, 5.544659614562988, 13.477643966674805, 21.410627365112305, 29.343612670898438, 37.27659606933594, 45.20957946777344, 53.14256286621094, 61.07554626464844, 69.00852966308594, 76.94151306152344, 84.87449645996094, 92.80747985839844, 100.74046325683594, 108.67344665527344, 116.60643005371094, 124.53941345214844, 132.47239685058594, 140.40538024902344, 148.33836364746094, 156.27134704589844, 164.20433044433594, 172.13731384277344, 180.0703125, 188.0032958984375, 195.936279296875, 203.8692626953125, 211.80224609375, 219.7352294921875, 227.668212890625, 235.6011962890625, 243.5341796875, 251.4671630859375, 259.400146484375, 267.3331298828125, 275.26611328125, 283.1990966796875, 291.132080078125, 299.0650634765625, 306.998046875]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 7.0, 3.0, 5.0, 6.0, 10.0, 6.0, 9.0, 10.0, 12.0, 14.0, 16.0, 16.0, 26.0, 22.0, 29.0, 26.0, 30.0, 30.0, 26.0, 33.0, 37.0, 41.0, 32.0, 36.0, 41.0, 45.0, 38.0, 40.0, 38.0, 40.0, 36.0, 30.0, 30.0, 30.0, 16.0, 17.0, 25.0, 10.0, 17.0, 15.0, 7.0, 12.0, 11.0, 9.0, 7.0, 1.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-65.88626098632812, -63.836265563964844, -61.7862663269043, -59.736270904541016, -57.68627166748047, -55.63627624511719, -53.586280822753906, -51.53628158569336, -49.48628234863281, -47.43628692626953, -45.386287689208984, -43.3362922668457, -41.286293029785156, -39.236297607421875, -37.186302185058594, -35.13630294799805, -33.086307525634766, -31.03631019592285, -28.986312866210938, -26.936317443847656, -24.88631820678711, -22.836322784423828, -20.786325454711914, -18.736328125, -16.686330795288086, -14.636333465576172, -12.586336135864258, -10.53633975982666, -8.486342430114746, -6.436345100402832, -4.386348724365234, -2.3363513946533203, -0.28635406494140625, 1.7636430263519287, 3.8136401176452637, 5.8636369705200195, 7.913634300231934, 9.963631629943848, 12.013628005981445, 14.06362533569336, 16.113622665405273, 18.163619995117188, 20.2136173248291, 22.263614654541016, 24.313610076904297, 26.363609313964844, 28.413604736328125, 30.46360206604004, 32.51359939575195, 34.563594818115234, 36.61359405517578, 38.66358947753906, 40.71358871459961, 42.76358413696289, 44.81358337402344, 46.86357879638672, 48.91357421875, 50.96356964111328, 53.01356887817383, 55.06356430053711, 57.113563537597656, 59.16355895996094, 61.21355438232422, 63.263553619384766, 65.31355285644531]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 8.0, 11.0, 13.0, 28.0, 30.0, 70.0, 103.0, 158.0, 241.0, 393.0, 700.0, 1363.0, 2631.0, 5750.0, 14505.0, 60210.0, 3974611.0, 103043.0, 17971.0, 6386.0, 2747.0, 1267.0, 668.0, 390.0, 271.0, 200.0, 129.0, 93.0, 78.0, 44.0, 42.0, 35.0, 12.0, 13.0, 18.0, 10.0, 8.0, 8.0, 6.0, 2.0, 6.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.234375, -24.117919921875, -23.00146484375, -21.885009765625, -20.7685546875, -19.652099609375, -18.53564453125, -17.419189453125, -16.302734375, -15.186279296875, -14.06982421875, -12.953369140625, -11.8369140625, -10.720458984375, -9.60400390625, -8.487548828125, -7.37109375, -6.254638671875, -5.13818359375, -4.021728515625, -2.9052734375, -1.788818359375, -0.67236328125, 0.444091796875, 1.560546875, 2.677001953125, 3.79345703125, 4.909912109375, 6.0263671875, 7.142822265625, 8.25927734375, 9.375732421875, 10.4921875, 11.608642578125, 12.72509765625, 13.841552734375, 14.9580078125, 16.074462890625, 17.19091796875, 18.307373046875, 19.423828125, 20.540283203125, 21.65673828125, 22.773193359375, 23.8896484375, 25.006103515625, 26.12255859375, 27.239013671875, 28.35546875, 29.471923828125, 30.58837890625, 31.704833984375, 32.8212890625, 33.937744140625, 35.05419921875, 36.170654296875, 37.287109375, 38.403564453125, 39.52001953125, 40.636474609375, 41.7529296875, 42.869384765625, 43.98583984375, 45.102294921875, 46.21875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 10.0, 5.0, 12.0, 13.0, 20.0, 14.0, 36.0, 33.0, 40.0, 43.0, 63.0, 73.0, 71.0, 73.0, 69.0, 86.0, 71.0, 56.0, 47.0, 51.0, 30.0, 27.0, 17.0, 15.0, 6.0, 7.0, 3.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2890625, -3.1614990234375, -3.033935546875, -2.9063720703125, -2.77880859375, -2.6512451171875, -2.523681640625, -2.3961181640625, -2.2685546875, -2.1409912109375, -2.013427734375, -1.8858642578125, -1.75830078125, -1.6307373046875, -1.503173828125, -1.3756103515625, -1.248046875, -1.1204833984375, -0.992919921875, -0.8653564453125, -0.73779296875, -0.6102294921875, -0.482666015625, -0.3551025390625, -0.2275390625, -0.0999755859375, 0.027587890625, 0.1551513671875, 0.28271484375, 0.4102783203125, 0.537841796875, 0.6654052734375, 0.79296875, 0.9205322265625, 1.048095703125, 1.1756591796875, 1.30322265625, 1.4307861328125, 1.558349609375, 1.6859130859375, 1.8134765625, 1.9410400390625, 2.068603515625, 2.1961669921875, 2.32373046875, 2.4512939453125, 2.578857421875, 2.7064208984375, 2.833984375, 2.9615478515625, 3.089111328125, 3.2166748046875, 3.34423828125, 3.4718017578125, 3.599365234375, 3.7269287109375, 3.8544921875, 3.9820556640625, 4.109619140625, 4.2371826171875, 4.36474609375, 4.4923095703125, 4.619873046875, 4.7474365234375, 4.875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 9.0, 10.0, 12.0, 21.0, 30.0, 52.0, 85.0, 120.0, 200.0, 321.0, 561.0, 1116.0, 2164.0, 5162.0, 14100.0, 57759.0, 3579847.0, 478476.0, 35996.0, 10204.0, 4144.0, 1796.0, 904.0, 487.0, 259.0, 160.0, 115.0, 61.0, 34.0, 25.0, 12.0, 8.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.953125, -30.11328125, -29.2734375, -28.43359375, -27.59375, -26.75390625, -25.9140625, -25.07421875, -24.234375, -23.39453125, -22.5546875, -21.71484375, -20.875, -20.03515625, -19.1953125, -18.35546875, -17.515625, -16.67578125, -15.8359375, -14.99609375, -14.15625, -13.31640625, -12.4765625, -11.63671875, -10.796875, -9.95703125, -9.1171875, -8.27734375, -7.4375, -6.59765625, -5.7578125, -4.91796875, -4.078125, -3.23828125, -2.3984375, -1.55859375, -0.71875, 0.12109375, 0.9609375, 1.80078125, 2.640625, 3.48046875, 4.3203125, 5.16015625, 6.0, 6.83984375, 7.6796875, 8.51953125, 9.359375, 10.19921875, 11.0390625, 11.87890625, 12.71875, 13.55859375, 14.3984375, 15.23828125, 16.078125, 16.91796875, 17.7578125, 18.59765625, 19.4375, 20.27734375, 21.1171875, 21.95703125, 22.796875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 12.0, 8.0, 18.0, 27.0, 27.0, 66.0, 119.0, 317.0, 1975.0, 979.0, 206.0, 105.0, 45.0, 33.0, 31.0, 13.0, 18.0, 15.0, 14.0, 4.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.5625, -11.257080078125, -10.95166015625, -10.646240234375, -10.3408203125, -10.035400390625, -9.72998046875, -9.424560546875, -9.119140625, -8.813720703125, -8.50830078125, -8.202880859375, -7.8974609375, -7.592041015625, -7.28662109375, -6.981201171875, -6.67578125, -6.370361328125, -6.06494140625, -5.759521484375, -5.4541015625, -5.148681640625, -4.84326171875, -4.537841796875, -4.232421875, -3.927001953125, -3.62158203125, -3.316162109375, -3.0107421875, -2.705322265625, -2.39990234375, -2.094482421875, -1.7890625, -1.483642578125, -1.17822265625, -0.872802734375, -0.5673828125, -0.261962890625, 0.04345703125, 0.348876953125, 0.654296875, 0.959716796875, 1.26513671875, 1.570556640625, 1.8759765625, 2.181396484375, 2.48681640625, 2.792236328125, 3.09765625, 3.403076171875, 3.70849609375, 4.013916015625, 4.3193359375, 4.624755859375, 4.93017578125, 5.235595703125, 5.541015625, 5.846435546875, 6.15185546875, 6.457275390625, 6.7626953125, 7.068115234375, 7.37353515625, 7.678955078125, 7.984375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 9.0, 16.0, 17.0, 45.0, 56.0, 142.0, 232.0, 188.0, 138.0, 69.0, 41.0, 14.0, 10.0, 9.0, 9.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.938751220703125, -33.6800651550293, -31.421375274658203, -29.162689208984375, -26.90399932861328, -24.645313262939453, -22.386625289916992, -20.12793731689453, -17.86924934387207, -15.61056137084961, -13.351873397827148, -11.093186378479004, -8.834498405456543, -6.575810432434082, -4.3171234130859375, -2.0584354400634766, 0.20025253295898438, 2.458940267562866, 4.717628002166748, 6.976315498352051, 9.235003471374512, 11.493691444396973, 13.752378463745117, 16.011066436767578, 18.26975440979004, 20.5284423828125, 22.78713035583496, 25.045818328857422, 27.30450439453125, 29.563194274902344, 31.821880340576172, 34.08056640625, 36.339256286621094, 38.59794235229492, 40.856632232666016, 43.115318298339844, 45.37400817871094, 47.632694244384766, 49.891380310058594, 52.15007019042969, 54.40876007080078, 56.66744613647461, 58.9261360168457, 61.18482208251953, 63.443511962890625, 65.70220184326172, 67.96088409423828, 70.21957397460938, 72.47825622558594, 74.73694610595703, 76.9956283569336, 79.25431823730469, 81.51300811767578, 83.77169799804688, 86.03038024902344, 88.28907012939453, 90.54776000976562, 92.80644989013672, 95.06513214111328, 97.32382202148438, 99.58251190185547, 101.84120178222656, 104.09988403320312, 106.35857391357422, 108.61726379394531]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 9.0, 3.0, 5.0, 2.0, 8.0, 11.0, 12.0, 20.0, 27.0, 15.0, 31.0, 37.0, 35.0, 36.0, 39.0, 28.0, 38.0, 67.0, 54.0, 51.0, 48.0, 55.0, 43.0, 60.0, 43.0, 24.0, 32.0, 28.0, 37.0, 33.0, 21.0, 11.0, 11.0, 8.0, 4.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.967374801635742, -28.04303741455078, -27.118701934814453, -26.194364547729492, -25.27002716064453, -24.345691680908203, -23.421354293823242, -22.49701690673828, -21.57267951965332, -20.64834213256836, -19.72400665283203, -18.79966926574707, -17.87533187866211, -16.95099639892578, -16.02665901184082, -15.10232162475586, -14.177985191345215, -13.25364875793457, -12.32931137084961, -11.404974937438965, -10.480637550354004, -9.55630111694336, -8.631963729858398, -7.707627296447754, -6.783290386199951, -5.858953475952148, -4.934616565704346, -4.010279655456543, -3.0859429836273193, -2.1616063117980957, -1.237269401550293, -0.31293249130249023, 0.6114044189453125, 1.5357413291931152, 2.460078239440918, 3.3844149112701416, 4.308752059936523, 5.233088493347168, 6.157425403594971, 7.081762313842773, 8.006099700927734, 8.930436134338379, 9.85477352142334, 10.779109954833984, 11.703447341918945, 12.62778377532959, 13.552120208740234, 14.476457595825195, 15.40079402923584, 16.325130462646484, 17.249467849731445, 18.173805236816406, 19.098140716552734, 20.022478103637695, 20.946815490722656, 21.871150970458984, 22.795488357543945, 23.719825744628906, 24.644161224365234, 25.568498611450195, 26.492835998535156, 27.417171478271484, 28.341508865356445, 29.265846252441406, 30.190183639526367]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 9.0, 14.0, 14.0, 22.0, 33.0, 55.0, 67.0, 101.0, 169.0, 337.0, 575.0, 1218.0, 2681.0, 7970.0, 36414.0, 560364.0, 395837.0, 30591.0, 7141.0, 2539.0, 1065.0, 573.0, 295.0, 163.0, 102.0, 50.0, 50.0, 33.0, 20.0, 9.0, 10.0, 10.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.984375, -30.879638671875, -29.77490234375, -28.670166015625, -27.5654296875, -26.460693359375, -25.35595703125, -24.251220703125, -23.146484375, -22.041748046875, -20.93701171875, -19.832275390625, -18.7275390625, -17.622802734375, -16.51806640625, -15.413330078125, -14.30859375, -13.203857421875, -12.09912109375, -10.994384765625, -9.8896484375, -8.784912109375, -7.68017578125, -6.575439453125, -5.470703125, -4.365966796875, -3.26123046875, -2.156494140625, -1.0517578125, 0.052978515625, 1.15771484375, 2.262451171875, 3.3671875, 4.471923828125, 5.57666015625, 6.681396484375, 7.7861328125, 8.890869140625, 9.99560546875, 11.100341796875, 12.205078125, 13.309814453125, 14.41455078125, 15.519287109375, 16.6240234375, 17.728759765625, 18.83349609375, 19.938232421875, 21.04296875, 22.147705078125, 23.25244140625, 24.357177734375, 25.4619140625, 26.566650390625, 27.67138671875, 28.776123046875, 29.880859375, 30.985595703125, 32.09033203125, 33.195068359375, 34.2998046875, 35.404541015625, 36.50927734375, 37.614013671875, 38.71875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 1.0, 9.0, 18.0, 18.0, 21.0, 33.0, 31.0, 44.0, 52.0, 75.0, 83.0, 71.0, 81.0, 78.0, 70.0, 72.0, 61.0, 48.0, 38.0, 26.0, 17.0, 15.0, 9.0, 11.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.83203125, -3.6920166015625, -3.552001953125, -3.4119873046875, -3.27197265625, -3.1319580078125, -2.991943359375, -2.8519287109375, -2.7119140625, -2.5718994140625, -2.431884765625, -2.2918701171875, -2.15185546875, -2.0118408203125, -1.871826171875, -1.7318115234375, -1.591796875, -1.4517822265625, -1.311767578125, -1.1717529296875, -1.03173828125, -0.8917236328125, -0.751708984375, -0.6116943359375, -0.4716796875, -0.3316650390625, -0.191650390625, -0.0516357421875, 0.08837890625, 0.2283935546875, 0.368408203125, 0.5084228515625, 0.6484375, 0.7884521484375, 0.928466796875, 1.0684814453125, 1.20849609375, 1.3485107421875, 1.488525390625, 1.6285400390625, 1.7685546875, 1.9085693359375, 2.048583984375, 2.1885986328125, 2.32861328125, 2.4686279296875, 2.608642578125, 2.7486572265625, 2.888671875, 3.0286865234375, 3.168701171875, 3.3087158203125, 3.44873046875, 3.5887451171875, 3.728759765625, 3.8687744140625, 4.0087890625, 4.1488037109375, 4.288818359375, 4.4288330078125, 4.56884765625, 4.7088623046875, 4.848876953125, 4.9888916015625, 5.12890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 7.0, 16.0, 20.0, 20.0, 24.0, 31.0, 56.0, 93.0, 106.0, 133.0, 246.0, 398.0, 740.0, 1423.0, 3448.0, 9692.0, 37405.0, 439626.0, 498927.0, 39369.0, 9904.0, 3504.0, 1506.0, 735.0, 399.0, 249.0, 157.0, 87.0, 64.0, 44.0, 28.0, 21.0, 16.0, 20.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-30.1875, -29.349365234375, -28.51123046875, -27.673095703125, -26.8349609375, -25.996826171875, -25.15869140625, -24.320556640625, -23.482421875, -22.644287109375, -21.80615234375, -20.968017578125, -20.1298828125, -19.291748046875, -18.45361328125, -17.615478515625, -16.77734375, -15.939208984375, -15.10107421875, -14.262939453125, -13.4248046875, -12.586669921875, -11.74853515625, -10.910400390625, -10.072265625, -9.234130859375, -8.39599609375, -7.557861328125, -6.7197265625, -5.881591796875, -5.04345703125, -4.205322265625, -3.3671875, -2.529052734375, -1.69091796875, -0.852783203125, -0.0146484375, 0.823486328125, 1.66162109375, 2.499755859375, 3.337890625, 4.176025390625, 5.01416015625, 5.852294921875, 6.6904296875, 7.528564453125, 8.36669921875, 9.204833984375, 10.04296875, 10.881103515625, 11.71923828125, 12.557373046875, 13.3955078125, 14.233642578125, 15.07177734375, 15.909912109375, 16.748046875, 17.586181640625, 18.42431640625, 19.262451171875, 20.1005859375, 20.938720703125, 21.77685546875, 22.614990234375, 23.453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 7.0, 5.0, 8.0, 12.0, 10.0, 20.0, 20.0, 25.0, 34.0, 44.0, 60.0, 84.0, 77.0, 90.0, 69.0, 75.0, 84.0, 70.0, 54.0, 32.0, 34.0, 26.0, 19.0, 9.0, 6.0, 6.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.40625, -22.75927734375, -22.1123046875, -21.46533203125, -20.818359375, -20.17138671875, -19.5244140625, -18.87744140625, -18.23046875, -17.58349609375, -16.9365234375, -16.28955078125, -15.642578125, -14.99560546875, -14.3486328125, -13.70166015625, -13.0546875, -12.40771484375, -11.7607421875, -11.11376953125, -10.466796875, -9.81982421875, -9.1728515625, -8.52587890625, -7.87890625, -7.23193359375, -6.5849609375, -5.93798828125, -5.291015625, -4.64404296875, -3.9970703125, -3.35009765625, -2.703125, -2.05615234375, -1.4091796875, -0.76220703125, -0.115234375, 0.53173828125, 1.1787109375, 1.82568359375, 2.47265625, 3.11962890625, 3.7666015625, 4.41357421875, 5.060546875, 5.70751953125, 6.3544921875, 7.00146484375, 7.6484375, 8.29541015625, 8.9423828125, 9.58935546875, 10.236328125, 10.88330078125, 11.5302734375, 12.17724609375, 12.82421875, 13.47119140625, 14.1181640625, 14.76513671875, 15.412109375, 16.05908203125, 16.7060546875, 17.35302734375, 18.0]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 9.0, 19.0, 28.0, 35.0, 81.0, 138.0, 280.0, 960.0, 4798.0, 205989.0, 827807.0, 6603.0, 1099.0, 339.0, 178.0, 86.0, 40.0, 15.0, 16.0, 13.0, 4.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.0, -51.6435546875, -50.287109375, -48.9306640625, -47.57421875, -46.2177734375, -44.861328125, -43.5048828125, -42.1484375, -40.7919921875, -39.435546875, -38.0791015625, -36.72265625, -35.3662109375, -34.009765625, -32.6533203125, -31.296875, -29.9404296875, -28.583984375, -27.2275390625, -25.87109375, -24.5146484375, -23.158203125, -21.8017578125, -20.4453125, -19.0888671875, -17.732421875, -16.3759765625, -15.01953125, -13.6630859375, -12.306640625, -10.9501953125, -9.59375, -8.2373046875, -6.880859375, -5.5244140625, -4.16796875, -2.8115234375, -1.455078125, -0.0986328125, 1.2578125, 2.6142578125, 3.970703125, 5.3271484375, 6.68359375, 8.0400390625, 9.396484375, 10.7529296875, 12.109375, 13.4658203125, 14.822265625, 16.1787109375, 17.53515625, 18.8916015625, 20.248046875, 21.6044921875, 22.9609375, 24.3173828125, 25.673828125, 27.0302734375, 28.38671875, 29.7431640625, 31.099609375, 32.4560546875, 33.8125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 7.0, 5.0, 11.0, 14.0, 24.0, 39.0, 81.0, 289.0, 287.0, 91.0, 53.0, 27.0, 20.0, 13.0, 10.0, 11.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002002716064453125, -0.001931220293045044, -0.0018597245216369629, -0.0017882287502288818, -0.0017167329788208008, -0.0016452372074127197, -0.0015737414360046387, -0.0015022456645965576, -0.0014307498931884766, -0.0013592541217803955, -0.0012877583503723145, -0.0012162625789642334, -0.0011447668075561523, -0.0010732710361480713, -0.0010017752647399902, -0.0009302794933319092, -0.0008587837219238281, -0.0007872879505157471, -0.000715792179107666, -0.000644296407699585, -0.0005728006362915039, -0.0005013048648834229, -0.0004298090934753418, -0.00035831332206726074, -0.0002868175506591797, -0.00021532177925109863, -0.00014382600784301758, -7.233023643493652e-05, -8.344650268554688e-07, 7.066130638122559e-05, 0.00014215707778930664, 0.0002136528491973877, 0.00028514862060546875, 0.0003566443920135498, 0.00042814016342163086, 0.0004996359348297119, 0.000571131706237793, 0.000642627477645874, 0.0007141232490539551, 0.0007856190204620361, 0.0008571147918701172, 0.0009286105632781982, 0.0010001063346862793, 0.0010716021060943604, 0.0011430978775024414, 0.0012145936489105225, 0.0012860894203186035, 0.0013575851917266846, 0.0014290809631347656, 0.0015005767345428467, 0.0015720725059509277, 0.0016435682773590088, 0.0017150640487670898, 0.001786559820175171, 0.001858055591583252, 0.001929551362991333, 0.002001047134399414, 0.002072542905807495, 0.002144038677215576, 0.0022155344486236572, 0.0022870302200317383, 0.0023585259914398193, 0.0024300217628479004, 0.0025015175342559814, 0.0025730133056640625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 8.0, 10.0, 16.0, 16.0, 33.0, 61.0, 107.0, 181.0, 459.0, 1105.0, 4048.0, 32028.0, 980091.0, 25019.0, 3494.0, 1022.0, 409.0, 194.0, 84.0, 55.0, 31.0, 22.0, 13.0, 16.0, 7.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.28125, -37.231201171875, -36.18115234375, -35.131103515625, -34.0810546875, -33.031005859375, -31.98095703125, -30.930908203125, -29.880859375, -28.830810546875, -27.78076171875, -26.730712890625, -25.6806640625, -24.630615234375, -23.58056640625, -22.530517578125, -21.48046875, -20.430419921875, -19.38037109375, -18.330322265625, -17.2802734375, -16.230224609375, -15.18017578125, -14.130126953125, -13.080078125, -12.030029296875, -10.97998046875, -9.929931640625, -8.8798828125, -7.829833984375, -6.77978515625, -5.729736328125, -4.6796875, -3.629638671875, -2.57958984375, -1.529541015625, -0.4794921875, 0.570556640625, 1.62060546875, 2.670654296875, 3.720703125, 4.770751953125, 5.82080078125, 6.870849609375, 7.9208984375, 8.970947265625, 10.02099609375, 11.071044921875, 12.12109375, 13.171142578125, 14.22119140625, 15.271240234375, 16.3212890625, 17.371337890625, 18.42138671875, 19.471435546875, 20.521484375, 21.571533203125, 22.62158203125, 23.671630859375, 24.7216796875, 25.771728515625, 26.82177734375, 27.871826171875, 28.921875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 6.0, 5.0, 7.0, 14.0, 16.0, 30.0, 58.0, 216.0, 399.0, 125.0, 50.0, 22.0, 18.0, 8.0, 5.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.609375, -20.02587890625, -19.4423828125, -18.85888671875, -18.275390625, -17.69189453125, -17.1083984375, -16.52490234375, -15.94140625, -15.35791015625, -14.7744140625, -14.19091796875, -13.607421875, -13.02392578125, -12.4404296875, -11.85693359375, -11.2734375, -10.68994140625, -10.1064453125, -9.52294921875, -8.939453125, -8.35595703125, -7.7724609375, -7.18896484375, -6.60546875, -6.02197265625, -5.4384765625, -4.85498046875, -4.271484375, -3.68798828125, -3.1044921875, -2.52099609375, -1.9375, -1.35400390625, -0.7705078125, -0.18701171875, 0.396484375, 0.97998046875, 1.5634765625, 2.14697265625, 2.73046875, 3.31396484375, 3.8974609375, 4.48095703125, 5.064453125, 5.64794921875, 6.2314453125, 6.81494140625, 7.3984375, 7.98193359375, 8.5654296875, 9.14892578125, 9.732421875, 10.31591796875, 10.8994140625, 11.48291015625, 12.06640625, 12.64990234375, 13.2333984375, 13.81689453125, 14.400390625, 14.98388671875, 15.5673828125, 16.15087890625, 16.734375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 4.0, 2.0, 9.0, 11.0, 19.0, 26.0, 63.0, 123.0, 177.0, 206.0, 156.0, 98.0, 59.0, 24.0, 11.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-237.96585083007812, -231.61892700195312, -225.27198791503906, -218.92506408691406, -212.57814025878906, -206.231201171875, -199.88427734375, -193.537353515625, -187.1904296875, -180.843505859375, -174.49656677246094, -168.14964294433594, -161.80271911621094, -155.45578002929688, -149.10885620117188, -142.76193237304688, -136.4149932861328, -130.0680694580078, -123.72113800048828, -117.37420654296875, -111.02728271484375, -104.68035125732422, -98.33341979980469, -91.98649597167969, -85.63956451416016, -79.29263305664062, -72.94570922851562, -66.5987777709961, -60.25185012817383, -53.90492248535156, -47.55799102783203, -41.211063385009766, -34.8641357421875, -28.517208099365234, -22.170278549194336, -15.823348999023438, -9.476421356201172, -3.1294937133789062, 3.217437744140625, 9.56436538696289, 15.911293029785156, 22.258220672607422, 28.60515022277832, 34.95207977294922, 41.299007415771484, 47.64593505859375, 53.99286651611328, 60.33979415893555, 66.68672180175781, 73.03365325927734, 79.38057708740234, 85.72750854492188, 92.07443237304688, 98.4213638305664, 104.76829528808594, 111.11521911621094, 117.46215057373047, 123.80908203125, 130.156005859375, 136.5029296875, 142.84986877441406, 149.19679260253906, 155.54373168945312, 161.89065551757812, 168.23757934570312]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 7.0, 8.0, 15.0, 6.0, 21.0, 18.0, 19.0, 33.0, 31.0, 46.0, 56.0, 54.0, 51.0, 56.0, 46.0, 40.0, 66.0, 54.0, 47.0, 64.0, 50.0, 36.0, 25.0, 28.0, 20.0, 18.0, 15.0, 15.0, 11.0, 8.0, 12.0, 5.0, 3.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.39179992675781, -75.05036163330078, -71.70891571044922, -68.36747741699219, -65.02603912353516, -61.68459701538086, -58.34315490722656, -55.00171661376953, -51.6602783203125, -48.3188362121582, -44.97739791870117, -41.635955810546875, -38.294517517089844, -34.95307540893555, -31.611635208129883, -28.27019500732422, -24.928752899169922, -21.587312698364258, -18.245872497558594, -14.904431343078613, -11.56299114227295, -8.221549987792969, -4.880109786987305, -1.5386695861816406, 1.8027706146240234, 5.1442108154296875, 8.485651016235352, 11.827092170715332, 15.168532371520996, 18.509973526000977, 21.85141372680664, 25.192853927612305, 28.53429412841797, 31.875734329223633, 35.2171745300293, 38.558616638183594, 41.900054931640625, 45.24149703979492, 48.58293914794922, 51.92437744140625, 55.26581573486328, 58.60725784301758, 61.94869613647461, 65.2901382446289, 68.63157653808594, 71.9730224609375, 75.31446075439453, 78.65589904785156, 81.99734497070312, 85.33878326416016, 88.68022918701172, 92.02166748046875, 95.36310577392578, 98.70454406738281, 102.04598999023438, 105.3874282836914, 108.72886657714844, 112.07030487060547, 115.41175079345703, 118.75318908691406, 122.0946273803711, 125.43606567382812, 128.7775115966797, 132.11895751953125, 135.46038818359375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 8.0, 18.0, 25.0, 55.0, 87.0, 172.0, 273.0, 592.0, 1291.0, 3245.0, 11458.0, 115710.0, 4025196.0, 27022.0, 5518.0, 1781.0, 789.0, 386.0, 244.0, 126.0, 82.0, 65.0, 35.0, 22.0, 14.0, 13.0, 13.0, 3.0, 3.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.0625, -40.328125, -38.59375, -36.859375, -35.125, -33.390625, -31.65625, -29.921875, -28.1875, -26.453125, -24.71875, -22.984375, -21.25, -19.515625, -17.78125, -16.046875, -14.3125, -12.578125, -10.84375, -9.109375, -7.375, -5.640625, -3.90625, -2.171875, -0.4375, 1.296875, 3.03125, 4.765625, 6.5, 8.234375, 9.96875, 11.703125, 13.4375, 15.171875, 16.90625, 18.640625, 20.375, 22.109375, 23.84375, 25.578125, 27.3125, 29.046875, 30.78125, 32.515625, 34.25, 35.984375, 37.71875, 39.453125, 41.1875, 42.921875, 44.65625, 46.390625, 48.125, 49.859375, 51.59375, 53.328125, 55.0625, 56.796875, 58.53125, 60.265625, 62.0, 63.734375, 65.46875, 67.203125, 68.9375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 2.0, 6.0, 8.0, 13.0, 6.0, 18.0, 22.0, 25.0, 37.0, 45.0, 60.0, 52.0, 68.0, 70.0, 63.0, 70.0, 67.0, 67.0, 66.0, 50.0, 37.0, 36.0, 27.0, 23.0, 20.0, 11.0, 9.0, 8.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9765625, -3.834228515625, -3.69189453125, -3.549560546875, -3.4072265625, -3.264892578125, -3.12255859375, -2.980224609375, -2.837890625, -2.695556640625, -2.55322265625, -2.410888671875, -2.2685546875, -2.126220703125, -1.98388671875, -1.841552734375, -1.69921875, -1.556884765625, -1.41455078125, -1.272216796875, -1.1298828125, -0.987548828125, -0.84521484375, -0.702880859375, -0.560546875, -0.418212890625, -0.27587890625, -0.133544921875, 0.0087890625, 0.151123046875, 0.29345703125, 0.435791015625, 0.578125, 0.720458984375, 0.86279296875, 1.005126953125, 1.1474609375, 1.289794921875, 1.43212890625, 1.574462890625, 1.716796875, 1.859130859375, 2.00146484375, 2.143798828125, 2.2861328125, 2.428466796875, 2.57080078125, 2.713134765625, 2.85546875, 2.997802734375, 3.14013671875, 3.282470703125, 3.4248046875, 3.567138671875, 3.70947265625, 3.851806640625, 3.994140625, 4.136474609375, 4.27880859375, 4.421142578125, 4.5634765625, 4.705810546875, 4.84814453125, 4.990478515625, 5.1328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 6.0, 15.0, 12.0, 19.0, 24.0, 38.0, 48.0, 82.0, 96.0, 150.0, 227.0, 485.0, 864.0, 1960.0, 5610.0, 26658.0, 3044556.0, 1080031.0, 24074.0, 5427.0, 1877.0, 882.0, 395.0, 242.0, 135.0, 101.0, 66.0, 50.0, 34.0, 33.0, 17.0, 12.0, 10.0, 12.0, 8.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.5625, -42.31689453125, -41.0712890625, -39.82568359375, -38.580078125, -37.33447265625, -36.0888671875, -34.84326171875, -33.59765625, -32.35205078125, -31.1064453125, -29.86083984375, -28.615234375, -27.36962890625, -26.1240234375, -24.87841796875, -23.6328125, -22.38720703125, -21.1416015625, -19.89599609375, -18.650390625, -17.40478515625, -16.1591796875, -14.91357421875, -13.66796875, -12.42236328125, -11.1767578125, -9.93115234375, -8.685546875, -7.43994140625, -6.1943359375, -4.94873046875, -3.703125, -2.45751953125, -1.2119140625, 0.03369140625, 1.279296875, 2.52490234375, 3.7705078125, 5.01611328125, 6.26171875, 7.50732421875, 8.7529296875, 9.99853515625, 11.244140625, 12.48974609375, 13.7353515625, 14.98095703125, 16.2265625, 17.47216796875, 18.7177734375, 19.96337890625, 21.208984375, 22.45458984375, 23.7001953125, 24.94580078125, 26.19140625, 27.43701171875, 28.6826171875, 29.92822265625, 31.173828125, 32.41943359375, 33.6650390625, 34.91064453125, 36.15625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 8.0, 2.0, 3.0, 6.0, 11.0, 19.0, 38.0, 67.0, 192.0, 2656.0, 793.0, 147.0, 62.0, 27.0, 17.0, 20.0, 2.0, 7.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.3125, -19.802490234375, -19.29248046875, -18.782470703125, -18.2724609375, -17.762451171875, -17.25244140625, -16.742431640625, -16.232421875, -15.722412109375, -15.21240234375, -14.702392578125, -14.1923828125, -13.682373046875, -13.17236328125, -12.662353515625, -12.15234375, -11.642333984375, -11.13232421875, -10.622314453125, -10.1123046875, -9.602294921875, -9.09228515625, -8.582275390625, -8.072265625, -7.562255859375, -7.05224609375, -6.542236328125, -6.0322265625, -5.522216796875, -5.01220703125, -4.502197265625, -3.9921875, -3.482177734375, -2.97216796875, -2.462158203125, -1.9521484375, -1.442138671875, -0.93212890625, -0.422119140625, 0.087890625, 0.597900390625, 1.10791015625, 1.617919921875, 2.1279296875, 2.637939453125, 3.14794921875, 3.657958984375, 4.16796875, 4.677978515625, 5.18798828125, 5.697998046875, 6.2080078125, 6.718017578125, 7.22802734375, 7.738037109375, 8.248046875, 8.758056640625, 9.26806640625, 9.778076171875, 10.2880859375, 10.798095703125, 11.30810546875, 11.818115234375, 12.328125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 11.0, 13.0, 24.0, 73.0, 210.0, 346.0, 197.0, 74.0, 34.0, 13.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-166.60067749023438, -163.1521453857422, -159.70359802246094, -156.25506591796875, -152.80653381347656, -149.35800170898438, -145.90945434570312, -142.46092224121094, -139.01239013671875, -135.56385803222656, -132.1153106689453, -128.66677856445312, -125.21824645996094, -121.76970672607422, -118.3211669921875, -114.87263488769531, -111.42408752441406, -107.97554779052734, -104.52701568603516, -101.07847595214844, -97.62994384765625, -94.18140411376953, -90.73286437988281, -87.28433227539062, -83.8357925415039, -80.38725280761719, -76.938720703125, -73.49018096923828, -70.04164123535156, -66.59310913085938, -63.144569396972656, -59.6960334777832, -56.247501373291016, -52.79896545410156, -49.350425720214844, -45.90188980102539, -42.45335388183594, -39.004817962646484, -35.55628204345703, -32.10774230957031, -28.65920639038086, -25.210670471191406, -21.76213264465332, -18.313594818115234, -14.865058898925781, -11.416522979736328, -7.967985153198242, -4.519447326660156, -1.0709114074707031, 2.3776254653930664, 5.826162338256836, 9.274699211120605, 12.723236083984375, 16.171772003173828, 19.620309829711914, 23.06884765625, 26.517383575439453, 29.965919494628906, 33.414459228515625, 36.86299514770508, 40.31153106689453, 43.760066986083984, 47.20860290527344, 50.657142639160156, 54.10567855834961]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 7.0, 4.0, 9.0, 9.0, 10.0, 22.0, 39.0, 44.0, 54.0, 48.0, 70.0, 58.0, 67.0, 79.0, 65.0, 74.0, 61.0, 67.0, 37.0, 48.0, 40.0, 31.0, 18.0, 12.0, 12.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.10686492919922, -31.873485565185547, -30.640106201171875, -29.406726837158203, -28.17334747314453, -26.93996810913086, -25.706586837768555, -24.473207473754883, -23.23982810974121, -22.00644874572754, -20.773069381713867, -19.539690017700195, -18.30630874633789, -17.07292938232422, -15.839550018310547, -14.606170654296875, -13.372791290283203, -12.139411926269531, -10.90603256225586, -9.672652244567871, -8.4392728805542, -7.205893516540527, -5.972513675689697, -4.739133834838867, -3.5057544708251953, -2.2723748683929443, -1.0389952659606934, 0.19438433647155762, 1.4277639389038086, 2.6611433029174805, 3.8945231437683105, 5.127902984619141, 6.361278533935547, 7.594657897949219, 8.82803726196289, 10.061417579650879, 11.29479694366455, 12.528176307678223, 13.761556625366211, 14.994935989379883, 16.228315353393555, 17.461694717407227, 18.6950740814209, 19.92845344543457, 21.161834716796875, 22.395214080810547, 23.62859344482422, 24.86197280883789, 26.095352172851562, 27.328731536865234, 28.562110900878906, 29.795490264892578, 31.02886962890625, 32.26224899291992, 33.495628356933594, 34.72901153564453, 35.96238708496094, 37.19576644897461, 38.42914581298828, 39.66252517700195, 40.895904541015625, 42.1292839050293, 43.36266326904297, 44.596046447753906, 45.82942581176758]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 12.0, 16.0, 16.0, 35.0, 66.0, 97.0, 170.0, 365.0, 778.0, 1879.0, 7560.0, 65768.0, 876263.0, 83378.0, 8494.0, 2031.0, 778.0, 340.0, 194.0, 108.0, 66.0, 50.0, 19.0, 14.0, 15.0, 9.0, 8.0, 4.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-52.03125, -50.68115234375, -49.3310546875, -47.98095703125, -46.630859375, -45.28076171875, -43.9306640625, -42.58056640625, -41.23046875, -39.88037109375, -38.5302734375, -37.18017578125, -35.830078125, -34.47998046875, -33.1298828125, -31.77978515625, -30.4296875, -29.07958984375, -27.7294921875, -26.37939453125, -25.029296875, -23.67919921875, -22.3291015625, -20.97900390625, -19.62890625, -18.27880859375, -16.9287109375, -15.57861328125, -14.228515625, -12.87841796875, -11.5283203125, -10.17822265625, -8.828125, -7.47802734375, -6.1279296875, -4.77783203125, -3.427734375, -2.07763671875, -0.7275390625, 0.62255859375, 1.97265625, 3.32275390625, 4.6728515625, 6.02294921875, 7.373046875, 8.72314453125, 10.0732421875, 11.42333984375, 12.7734375, 14.12353515625, 15.4736328125, 16.82373046875, 18.173828125, 19.52392578125, 20.8740234375, 22.22412109375, 23.57421875, 24.92431640625, 26.2744140625, 27.62451171875, 28.974609375, 30.32470703125, 31.6748046875, 33.02490234375, 34.375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 5.0, 6.0, 8.0, 8.0, 15.0, 15.0, 31.0, 47.0, 36.0, 46.0, 61.0, 63.0, 72.0, 86.0, 82.0, 73.0, 62.0, 62.0, 42.0, 50.0, 31.0, 22.0, 25.0, 14.0, 14.0, 5.0, 4.0, 6.0, 2.0, 5.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.44293212890625, -4.2843017578125, -4.12567138671875, -3.967041015625, -3.80841064453125, -3.6497802734375, -3.49114990234375, -3.33251953125, -3.17388916015625, -3.0152587890625, -2.85662841796875, -2.697998046875, -2.53936767578125, -2.3807373046875, -2.22210693359375, -2.0634765625, -1.90484619140625, -1.7462158203125, -1.58758544921875, -1.428955078125, -1.27032470703125, -1.1116943359375, -0.95306396484375, -0.79443359375, -0.63580322265625, -0.4771728515625, -0.31854248046875, -0.159912109375, -0.00128173828125, 0.1573486328125, 0.31597900390625, 0.474609375, 0.63323974609375, 0.7918701171875, 0.95050048828125, 1.109130859375, 1.26776123046875, 1.4263916015625, 1.58502197265625, 1.74365234375, 1.90228271484375, 2.0609130859375, 2.21954345703125, 2.378173828125, 2.53680419921875, 2.6954345703125, 2.85406494140625, 3.0126953125, 3.17132568359375, 3.3299560546875, 3.48858642578125, 3.647216796875, 3.80584716796875, 3.9644775390625, 4.12310791015625, 4.28173828125, 4.44036865234375, 4.5989990234375, 4.75762939453125, 4.916259765625, 5.07489013671875, 5.2335205078125, 5.39215087890625, 5.55078125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 9.0, 11.0, 12.0, 9.0, 17.0, 22.0, 30.0, 50.0, 54.0, 104.0, 144.0, 289.0, 513.0, 1261.0, 3094.0, 9711.0, 41352.0, 575032.0, 370630.0, 33000.0, 8206.0, 2759.0, 1050.0, 456.0, 248.0, 149.0, 103.0, 56.0, 39.0, 31.0, 36.0, 19.0, 18.0, 4.0, 11.0, 10.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-26.90625, -26.135986328125, -25.36572265625, -24.595458984375, -23.8251953125, -23.054931640625, -22.28466796875, -21.514404296875, -20.744140625, -19.973876953125, -19.20361328125, -18.433349609375, -17.6630859375, -16.892822265625, -16.12255859375, -15.352294921875, -14.58203125, -13.811767578125, -13.04150390625, -12.271240234375, -11.5009765625, -10.730712890625, -9.96044921875, -9.190185546875, -8.419921875, -7.649658203125, -6.87939453125, -6.109130859375, -5.3388671875, -4.568603515625, -3.79833984375, -3.028076171875, -2.2578125, -1.487548828125, -0.71728515625, 0.052978515625, 0.8232421875, 1.593505859375, 2.36376953125, 3.134033203125, 3.904296875, 4.674560546875, 5.44482421875, 6.215087890625, 6.9853515625, 7.755615234375, 8.52587890625, 9.296142578125, 10.06640625, 10.836669921875, 11.60693359375, 12.377197265625, 13.1474609375, 13.917724609375, 14.68798828125, 15.458251953125, 16.228515625, 16.998779296875, 17.76904296875, 18.539306640625, 19.3095703125, 20.079833984375, 20.85009765625, 21.620361328125, 22.390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 6.0, 10.0, 2.0, 7.0, 8.0, 15.0, 18.0, 11.0, 9.0, 27.0, 30.0, 32.0, 34.0, 43.0, 45.0, 54.0, 56.0, 42.0, 38.0, 59.0, 67.0, 48.0, 44.0, 50.0, 39.0, 30.0, 32.0, 20.0, 15.0, 12.0, 16.0, 10.0, 10.0, 10.0, 8.0, 10.0, 6.0, 4.0, 3.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-16.390625, -15.9061279296875, -15.421630859375, -14.9371337890625, -14.45263671875, -13.9681396484375, -13.483642578125, -12.9991455078125, -12.5146484375, -12.0301513671875, -11.545654296875, -11.0611572265625, -10.57666015625, -10.0921630859375, -9.607666015625, -9.1231689453125, -8.638671875, -8.1541748046875, -7.669677734375, -7.1851806640625, -6.70068359375, -6.2161865234375, -5.731689453125, -5.2471923828125, -4.7626953125, -4.2781982421875, -3.793701171875, -3.3092041015625, -2.82470703125, -2.3402099609375, -1.855712890625, -1.3712158203125, -0.88671875, -0.4022216796875, 0.082275390625, 0.5667724609375, 1.05126953125, 1.5357666015625, 2.020263671875, 2.5047607421875, 2.9892578125, 3.4737548828125, 3.958251953125, 4.4427490234375, 4.92724609375, 5.4117431640625, 5.896240234375, 6.3807373046875, 6.865234375, 7.3497314453125, 7.834228515625, 8.3187255859375, 8.80322265625, 9.2877197265625, 9.772216796875, 10.2567138671875, 10.7412109375, 11.2257080078125, 11.710205078125, 12.1947021484375, 12.67919921875, 13.1636962890625, 13.648193359375, 14.1326904296875, 14.6171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 4.0, 11.0, 15.0, 19.0, 35.0, 76.0, 130.0, 271.0, 660.0, 2190.0, 9105.0, 116609.0, 892037.0, 21361.0, 4127.0, 1161.0, 365.0, 175.0, 90.0, 55.0, 40.0, 10.0, 5.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.78125, -27.107421875, -26.43359375, -25.759765625, -25.0859375, -24.412109375, -23.73828125, -23.064453125, -22.390625, -21.716796875, -21.04296875, -20.369140625, -19.6953125, -19.021484375, -18.34765625, -17.673828125, -17.0, -16.326171875, -15.65234375, -14.978515625, -14.3046875, -13.630859375, -12.95703125, -12.283203125, -11.609375, -10.935546875, -10.26171875, -9.587890625, -8.9140625, -8.240234375, -7.56640625, -6.892578125, -6.21875, -5.544921875, -4.87109375, -4.197265625, -3.5234375, -2.849609375, -2.17578125, -1.501953125, -0.828125, -0.154296875, 0.51953125, 1.193359375, 1.8671875, 2.541015625, 3.21484375, 3.888671875, 4.5625, 5.236328125, 5.91015625, 6.583984375, 7.2578125, 7.931640625, 8.60546875, 9.279296875, 9.953125, 10.626953125, 11.30078125, 11.974609375, 12.6484375, 13.322265625, 13.99609375, 14.669921875, 15.34375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 1.0, 3.0, 7.0, 7.0, 2.0, 5.0, 7.0, 7.0, 11.0, 18.0, 24.0, 38.0, 69.0, 223.0, 318.0, 108.0, 50.0, 24.0, 19.0, 19.0, 2.0, 3.0, 5.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0024318695068359375, -0.002369791269302368, -0.002307713031768799, -0.0022456347942352295, -0.00218355655670166, -0.002121478319168091, -0.0020594000816345215, -0.001997321844100952, -0.0019352436065673828, -0.0018731653690338135, -0.0018110871315002441, -0.0017490088939666748, -0.0016869306564331055, -0.0016248524188995361, -0.0015627741813659668, -0.0015006959438323975, -0.0014386177062988281, -0.0013765394687652588, -0.0013144612312316895, -0.0012523829936981201, -0.0011903047561645508, -0.0011282265186309814, -0.0010661482810974121, -0.0010040700435638428, -0.0009419918060302734, -0.0008799135684967041, -0.0008178353309631348, -0.0007557570934295654, -0.0006936788558959961, -0.0006316006183624268, -0.0005695223808288574, -0.0005074441432952881, -0.00044536590576171875, -0.0003832876682281494, -0.0003212094306945801, -0.00025913119316101074, -0.0001970529556274414, -0.00013497471809387207, -7.289648056030273e-05, -1.0818243026733398e-05, 5.125999450683594e-05, 0.00011333823204040527, 0.0001754164695739746, 0.00023749470710754395, 0.0002995729446411133, 0.0003616511821746826, 0.00042372941970825195, 0.0004858076572418213, 0.0005478858947753906, 0.00060996413230896, 0.0006720423698425293, 0.0007341206073760986, 0.000796198844909668, 0.0008582770824432373, 0.0009203553199768066, 0.000982433557510376, 0.0010445117950439453, 0.0011065900325775146, 0.001168668270111084, 0.0012307465076446533, 0.0012928247451782227, 0.001354902982711792, 0.0014169812202453613, 0.0014790594577789307, 0.0015411376953125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 11.0, 13.0, 29.0, 45.0, 73.0, 138.0, 222.0, 523.0, 1447.0, 6333.0, 106373.0, 915927.0, 13538.0, 2524.0, 720.0, 306.0, 142.0, 77.0, 48.0, 18.0, 14.0, 7.0, 7.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.859375, -20.031494140625, -19.20361328125, -18.375732421875, -17.5478515625, -16.719970703125, -15.89208984375, -15.064208984375, -14.236328125, -13.408447265625, -12.58056640625, -11.752685546875, -10.9248046875, -10.096923828125, -9.26904296875, -8.441162109375, -7.61328125, -6.785400390625, -5.95751953125, -5.129638671875, -4.3017578125, -3.473876953125, -2.64599609375, -1.818115234375, -0.990234375, -0.162353515625, 0.66552734375, 1.493408203125, 2.3212890625, 3.149169921875, 3.97705078125, 4.804931640625, 5.6328125, 6.460693359375, 7.28857421875, 8.116455078125, 8.9443359375, 9.772216796875, 10.60009765625, 11.427978515625, 12.255859375, 13.083740234375, 13.91162109375, 14.739501953125, 15.5673828125, 16.395263671875, 17.22314453125, 18.051025390625, 18.87890625, 19.706787109375, 20.53466796875, 21.362548828125, 22.1904296875, 23.018310546875, 23.84619140625, 24.674072265625, 25.501953125, 26.329833984375, 27.15771484375, 27.985595703125, 28.8134765625, 29.641357421875, 30.46923828125, 31.297119140625, 32.125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 4.0, 8.0, 12.0, 16.0, 33.0, 106.0, 397.0, 295.0, 78.0, 23.0, 12.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.765625, -10.086181640625, -9.40673828125, -8.727294921875, -8.0478515625, -7.368408203125, -6.68896484375, -6.009521484375, -5.330078125, -4.650634765625, -3.97119140625, -3.291748046875, -2.6123046875, -1.932861328125, -1.25341796875, -0.573974609375, 0.10546875, 0.784912109375, 1.46435546875, 2.143798828125, 2.8232421875, 3.502685546875, 4.18212890625, 4.861572265625, 5.541015625, 6.220458984375, 6.89990234375, 7.579345703125, 8.2587890625, 8.938232421875, 9.61767578125, 10.297119140625, 10.9765625, 11.656005859375, 12.33544921875, 13.014892578125, 13.6943359375, 14.373779296875, 15.05322265625, 15.732666015625, 16.412109375, 17.091552734375, 17.77099609375, 18.450439453125, 19.1298828125, 19.809326171875, 20.48876953125, 21.168212890625, 21.84765625, 22.527099609375, 23.20654296875, 23.885986328125, 24.5654296875, 25.244873046875, 25.92431640625, 26.603759765625, 27.283203125, 27.962646484375, 28.64208984375, 29.321533203125, 30.0009765625, 30.680419921875, 31.35986328125, 32.039306640625, 32.71875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 10.0, 37.0, 91.0, 198.0, 288.0, 195.0, 98.0, 42.0, 17.0, 16.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-299.1242370605469, -292.2449951171875, -285.36572265625, -278.4864807128906, -271.6072082519531, -264.72796630859375, -257.84869384765625, -250.96945190429688, -244.09019470214844, -237.2109375, -230.33168029785156, -223.45242309570312, -216.57318115234375, -209.6939239501953, -202.81466674804688, -195.93540954589844, -189.05615234375, -182.17689514160156, -175.29763793945312, -168.41839599609375, -161.5391387939453, -154.65988159179688, -147.78062438964844, -140.9013671875, -134.02212524414062, -127.14286804199219, -120.26361846923828, -113.38436126708984, -106.5051040649414, -99.6258544921875, -92.74659729003906, -85.86734008789062, -78.98808288574219, -72.10882568359375, -65.22957611083984, -58.350318908691406, -51.47106170654297, -44.5918083190918, -37.712554931640625, -30.833297729492188, -23.954044342041016, -17.07478904724121, -10.195534706115723, -3.3162803649902344, 3.5629749298095703, 10.442230224609375, 17.321483612060547, 24.200740814208984, 31.079994201660156, 37.95924758911133, 44.838504791259766, 51.71775817871094, 58.597015380859375, 65.47627258300781, 72.35552215576172, 79.23477935791016, 86.11402893066406, 92.9932861328125, 99.8725357055664, 106.75179290771484, 113.63105010986328, 120.51029968261719, 127.38955688476562, 134.26881408691406, 141.1480712890625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 4.0, 7.0, 7.0, 7.0, 8.0, 15.0, 14.0, 16.0, 24.0, 34.0, 23.0, 28.0, 32.0, 36.0, 42.0, 30.0, 44.0, 47.0, 40.0, 38.0, 41.0, 39.0, 36.0, 27.0, 32.0, 37.0, 32.0, 38.0, 32.0, 30.0, 26.0, 21.0, 21.0, 13.0, 9.0, 10.0, 11.0, 9.0, 7.0, 2.0, 7.0, 9.0, 5.0, 3.0, 1.0, 5.0, 1.0, 2.0], "bins": [-82.15996551513672, -79.87931823730469, -77.59866333007812, -75.31800842285156, -73.03736114501953, -70.7567138671875, -68.47605895996094, -66.19540405273438, -63.914756774902344, -61.63410568237305, -59.35345458984375, -57.07280349731445, -54.792152404785156, -52.51150131225586, -50.23085021972656, -47.950199127197266, -45.66954803466797, -43.38889694213867, -41.108245849609375, -38.82759475708008, -36.54694366455078, -34.266292572021484, -31.985641479492188, -29.70499038696289, -27.424339294433594, -25.143688201904297, -22.863037109375, -20.582386016845703, -18.301734924316406, -16.02108383178711, -13.740432739257812, -11.459781646728516, -9.179134368896484, -6.8984832763671875, -4.617832183837891, -2.3371810913085938, -0.056529998779296875, 2.22412109375, 4.504772186279297, 6.785423278808594, 9.06607437133789, 11.346725463867188, 13.627376556396484, 15.908027648925781, 18.188678741455078, 20.469329833984375, 22.749980926513672, 25.03063201904297, 27.311283111572266, 29.591934204101562, 31.87258529663086, 34.153236389160156, 36.43388748168945, 38.71453857421875, 40.99518966674805, 43.275840759277344, 45.55649185180664, 47.83714294433594, 50.117794036865234, 52.39844512939453, 54.67909622192383, 56.959747314453125, 59.24039840698242, 61.52104949951172, 63.801700592041016]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 11.0, 14.0, 20.0, 17.0, 45.0, 88.0, 172.0, 288.0, 574.0, 1370.0, 3476.0, 11559.0, 73979.0, 4039295.0, 49635.0, 8711.0, 2624.0, 1044.0, 553.0, 285.0, 172.0, 109.0, 74.0, 49.0, 27.0, 19.0, 16.0, 14.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.65625, -44.82080078125, -42.9853515625, -41.14990234375, -39.314453125, -37.47900390625, -35.6435546875, -33.80810546875, -31.97265625, -30.13720703125, -28.3017578125, -26.46630859375, -24.630859375, -22.79541015625, -20.9599609375, -19.12451171875, -17.2890625, -15.45361328125, -13.6181640625, -11.78271484375, -9.947265625, -8.11181640625, -6.2763671875, -4.44091796875, -2.60546875, -0.77001953125, 1.0654296875, 2.90087890625, 4.736328125, 6.57177734375, 8.4072265625, 10.24267578125, 12.078125, 13.91357421875, 15.7490234375, 17.58447265625, 19.419921875, 21.25537109375, 23.0908203125, 24.92626953125, 26.76171875, 28.59716796875, 30.4326171875, 32.26806640625, 34.103515625, 35.93896484375, 37.7744140625, 39.60986328125, 41.4453125, 43.28076171875, 45.1162109375, 46.95166015625, 48.787109375, 50.62255859375, 52.4580078125, 54.29345703125, 56.12890625, 57.96435546875, 59.7998046875, 61.63525390625, 63.470703125, 65.30615234375, 67.1416015625, 68.97705078125, 70.8125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 5.0, 7.0, 12.0, 15.0, 19.0, 24.0, 23.0, 47.0, 53.0, 49.0, 49.0, 72.0, 62.0, 79.0, 57.0, 53.0, 67.0, 44.0, 51.0, 54.0, 33.0, 35.0, 16.0, 18.0, 15.0, 9.0, 12.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.80078125, -4.64471435546875, -4.4886474609375, -4.33258056640625, -4.176513671875, -4.02044677734375, -3.8643798828125, -3.70831298828125, -3.55224609375, -3.39617919921875, -3.2401123046875, -3.08404541015625, -2.927978515625, -2.77191162109375, -2.6158447265625, -2.45977783203125, -2.3037109375, -2.14764404296875, -1.9915771484375, -1.83551025390625, -1.679443359375, -1.52337646484375, -1.3673095703125, -1.21124267578125, -1.05517578125, -0.89910888671875, -0.7430419921875, -0.58697509765625, -0.430908203125, -0.27484130859375, -0.1187744140625, 0.03729248046875, 0.193359375, 0.34942626953125, 0.5054931640625, 0.66156005859375, 0.817626953125, 0.97369384765625, 1.1297607421875, 1.28582763671875, 1.44189453125, 1.59796142578125, 1.7540283203125, 1.91009521484375, 2.066162109375, 2.22222900390625, 2.3782958984375, 2.53436279296875, 2.6904296875, 2.84649658203125, 3.0025634765625, 3.15863037109375, 3.314697265625, 3.47076416015625, 3.6268310546875, 3.78289794921875, 3.93896484375, 4.09503173828125, 4.2510986328125, 4.40716552734375, 4.563232421875, 4.71929931640625, 4.8753662109375, 5.03143310546875, 5.1875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 8.0, 11.0, 12.0, 11.0, 19.0, 20.0, 27.0, 29.0, 42.0, 81.0, 82.0, 122.0, 227.0, 357.0, 739.0, 1758.0, 5445.0, 24422.0, 3500964.0, 631243.0, 20801.0, 4706.0, 1513.0, 630.0, 339.0, 198.0, 124.0, 75.0, 69.0, 41.0, 43.0, 29.0, 27.0, 17.0, 17.0, 9.0, 5.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.0625, -60.287109375, -58.51171875, -56.736328125, -54.9609375, -53.185546875, -51.41015625, -49.634765625, -47.859375, -46.083984375, -44.30859375, -42.533203125, -40.7578125, -38.982421875, -37.20703125, -35.431640625, -33.65625, -31.880859375, -30.10546875, -28.330078125, -26.5546875, -24.779296875, -23.00390625, -21.228515625, -19.453125, -17.677734375, -15.90234375, -14.126953125, -12.3515625, -10.576171875, -8.80078125, -7.025390625, -5.25, -3.474609375, -1.69921875, 0.076171875, 1.8515625, 3.626953125, 5.40234375, 7.177734375, 8.953125, 10.728515625, 12.50390625, 14.279296875, 16.0546875, 17.830078125, 19.60546875, 21.380859375, 23.15625, 24.931640625, 26.70703125, 28.482421875, 30.2578125, 32.033203125, 33.80859375, 35.583984375, 37.359375, 39.134765625, 40.91015625, 42.685546875, 44.4609375, 46.236328125, 48.01171875, 49.787109375, 51.5625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 7.0, 16.0, 16.0, 19.0, 39.0, 70.0, 244.0, 3259.0, 249.0, 76.0, 29.0, 22.0, 13.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.046875, -27.319091796875, -26.59130859375, -25.863525390625, -25.1357421875, -24.407958984375, -23.68017578125, -22.952392578125, -22.224609375, -21.496826171875, -20.76904296875, -20.041259765625, -19.3134765625, -18.585693359375, -17.85791015625, -17.130126953125, -16.40234375, -15.674560546875, -14.94677734375, -14.218994140625, -13.4912109375, -12.763427734375, -12.03564453125, -11.307861328125, -10.580078125, -9.852294921875, -9.12451171875, -8.396728515625, -7.6689453125, -6.941162109375, -6.21337890625, -5.485595703125, -4.7578125, -4.030029296875, -3.30224609375, -2.574462890625, -1.8466796875, -1.118896484375, -0.39111328125, 0.336669921875, 1.064453125, 1.792236328125, 2.52001953125, 3.247802734375, 3.9755859375, 4.703369140625, 5.43115234375, 6.158935546875, 6.88671875, 7.614501953125, 8.34228515625, 9.070068359375, 9.7978515625, 10.525634765625, 11.25341796875, 11.981201171875, 12.708984375, 13.436767578125, 14.16455078125, 14.892333984375, 15.6201171875, 16.347900390625, 17.07568359375, 17.803466796875, 18.53125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 25.0, 68.0, 365.0, 420.0, 79.0, 25.0, 9.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.56797790527344, -198.1881103515625, -191.80825805664062, -185.4283905029297, -179.0485382080078, -172.66867065429688, -166.288818359375, -159.90895080566406, -153.52908325195312, -147.1492156982422, -140.7693634033203, -134.38949584960938, -128.0096435546875, -121.62977600097656, -115.24991607666016, -108.87005615234375, -102.49020385742188, -96.11034393310547, -89.73048400878906, -83.35061645507812, -76.97076416015625, -70.59089660644531, -64.2110366821289, -57.8311767578125, -51.451316833496094, -45.07145690917969, -38.69159698486328, -32.31173324584961, -25.931873321533203, -19.552013397216797, -13.172149658203125, -6.792289733886719, -0.412445068359375, 5.967415809631348, 12.34727668762207, 18.72713851928711, 25.106998443603516, 31.486858367919922, 37.866722106933594, 44.24658203125, 50.626441955566406, 57.00630187988281, 63.38616180419922, 69.76602172851562, 76.14588928222656, 82.52574157714844, 88.90560913085938, 95.28546905517578, 101.66532897949219, 108.0451889038086, 114.425048828125, 120.80491638183594, 127.18476867675781, 133.56463623046875, 139.94448852539062, 146.32435607910156, 152.7042236328125, 159.08409118652344, 165.4639434814453, 171.84381103515625, 178.22366333007812, 184.60353088378906, 190.9833984375, 197.36325073242188, 203.74310302734375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 5.0, 5.0, 9.0, 9.0, 15.0, 15.0, 18.0, 31.0, 37.0, 46.0, 39.0, 53.0, 60.0, 65.0, 55.0, 75.0, 87.0, 59.0, 63.0, 56.0, 49.0, 35.0, 30.0, 22.0, 20.0, 10.0, 6.0, 5.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-47.510223388671875, -46.08542251586914, -44.660621643066406, -43.23582077026367, -41.81101989746094, -40.3862190246582, -38.96141815185547, -37.536617279052734, -36.11181640625, -34.687015533447266, -33.26221466064453, -31.837413787841797, -30.412612915039062, -28.987812042236328, -27.563011169433594, -26.13821029663086, -24.713409423828125, -23.28860855102539, -21.863807678222656, -20.439006805419922, -19.014205932617188, -17.589405059814453, -16.16460418701172, -14.739803314208984, -13.31500244140625, -11.890201568603516, -10.465400695800781, -9.040599822998047, -7.6157989501953125, -6.190998077392578, -4.766197204589844, -3.3413963317871094, -1.9165916442871094, -0.491790771484375, 0.9330101013183594, 2.3578109741210938, 3.782611846923828, 5.2074127197265625, 6.632213592529297, 8.057014465332031, 9.481815338134766, 10.9066162109375, 12.331417083740234, 13.756217956542969, 15.181018829345703, 16.605819702148438, 18.030620574951172, 19.455421447753906, 20.88022232055664, 22.305023193359375, 23.72982406616211, 25.154624938964844, 26.579425811767578, 28.004226684570312, 29.429027557373047, 30.85382843017578, 32.278629302978516, 33.70343017578125, 35.128231048583984, 36.55303192138672, 37.97783279418945, 39.40263366699219, 40.82743453979492, 42.252235412597656, 43.67703628540039]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 4.0, 15.0, 9.0, 17.0, 35.0, 29.0, 42.0, 69.0, 123.0, 169.0, 298.0, 500.0, 776.0, 1584.0, 3351.0, 8362.0, 24519.0, 102841.0, 539595.0, 287017.0, 53432.0, 14929.0, 5515.0, 2369.0, 1208.0, 628.0, 406.0, 260.0, 135.0, 99.0, 69.0, 45.0, 22.0, 28.0, 11.0, 19.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.484375, -27.6884765625, -26.892578125, -26.0966796875, -25.30078125, -24.5048828125, -23.708984375, -22.9130859375, -22.1171875, -21.3212890625, -20.525390625, -19.7294921875, -18.93359375, -18.1376953125, -17.341796875, -16.5458984375, -15.75, -14.9541015625, -14.158203125, -13.3623046875, -12.56640625, -11.7705078125, -10.974609375, -10.1787109375, -9.3828125, -8.5869140625, -7.791015625, -6.9951171875, -6.19921875, -5.4033203125, -4.607421875, -3.8115234375, -3.015625, -2.2197265625, -1.423828125, -0.6279296875, 0.16796875, 0.9638671875, 1.759765625, 2.5556640625, 3.3515625, 4.1474609375, 4.943359375, 5.7392578125, 6.53515625, 7.3310546875, 8.126953125, 8.9228515625, 9.71875, 10.5146484375, 11.310546875, 12.1064453125, 12.90234375, 13.6982421875, 14.494140625, 15.2900390625, 16.0859375, 16.8818359375, 17.677734375, 18.4736328125, 19.26953125, 20.0654296875, 20.861328125, 21.6572265625, 22.453125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 8.0, 5.0, 8.0, 11.0, 12.0, 17.0, 24.0, 24.0, 47.0, 53.0, 60.0, 53.0, 70.0, 68.0, 74.0, 80.0, 56.0, 61.0, 59.0, 44.0, 47.0, 42.0, 23.0, 19.0, 9.0, 13.0, 5.0, 4.0, 1.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.578125, -5.39532470703125, -5.2125244140625, -5.02972412109375, -4.846923828125, -4.66412353515625, -4.4813232421875, -4.29852294921875, -4.11572265625, -3.93292236328125, -3.7501220703125, -3.56732177734375, -3.384521484375, -3.20172119140625, -3.0189208984375, -2.83612060546875, -2.6533203125, -2.47052001953125, -2.2877197265625, -2.10491943359375, -1.922119140625, -1.73931884765625, -1.5565185546875, -1.37371826171875, -1.19091796875, -1.00811767578125, -0.8253173828125, -0.64251708984375, -0.459716796875, -0.27691650390625, -0.0941162109375, 0.08868408203125, 0.271484375, 0.45428466796875, 0.6370849609375, 0.81988525390625, 1.002685546875, 1.18548583984375, 1.3682861328125, 1.55108642578125, 1.73388671875, 1.91668701171875, 2.0994873046875, 2.28228759765625, 2.465087890625, 2.64788818359375, 2.8306884765625, 3.01348876953125, 3.1962890625, 3.37908935546875, 3.5618896484375, 3.74468994140625, 3.927490234375, 4.11029052734375, 4.2930908203125, 4.47589111328125, 4.65869140625, 4.84149169921875, 5.0242919921875, 5.20709228515625, 5.389892578125, 5.57269287109375, 5.7554931640625, 5.93829345703125, 6.12109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 9.0, 10.0, 19.0, 26.0, 22.0, 29.0, 46.0, 69.0, 71.0, 116.0, 158.0, 211.0, 299.0, 418.0, 751.0, 1430.0, 3420.0, 9918.0, 36126.0, 201680.0, 638040.0, 118271.0, 24488.0, 7220.0, 2555.0, 1119.0, 650.0, 425.0, 251.0, 179.0, 135.0, 105.0, 64.0, 63.0, 42.0, 30.0, 22.0, 14.0, 13.0, 12.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-23.078125, -22.406494140625, -21.73486328125, -21.063232421875, -20.3916015625, -19.719970703125, -19.04833984375, -18.376708984375, -17.705078125, -17.033447265625, -16.36181640625, -15.690185546875, -15.0185546875, -14.346923828125, -13.67529296875, -13.003662109375, -12.33203125, -11.660400390625, -10.98876953125, -10.317138671875, -9.6455078125, -8.973876953125, -8.30224609375, -7.630615234375, -6.958984375, -6.287353515625, -5.61572265625, -4.944091796875, -4.2724609375, -3.600830078125, -2.92919921875, -2.257568359375, -1.5859375, -0.914306640625, -0.24267578125, 0.428955078125, 1.1005859375, 1.772216796875, 2.44384765625, 3.115478515625, 3.787109375, 4.458740234375, 5.13037109375, 5.802001953125, 6.4736328125, 7.145263671875, 7.81689453125, 8.488525390625, 9.16015625, 9.831787109375, 10.50341796875, 11.175048828125, 11.8466796875, 12.518310546875, 13.18994140625, 13.861572265625, 14.533203125, 15.204833984375, 15.87646484375, 16.548095703125, 17.2197265625, 17.891357421875, 18.56298828125, 19.234619140625, 19.90625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 6.0, 6.0, 4.0, 8.0, 7.0, 10.0, 8.0, 10.0, 20.0, 24.0, 16.0, 25.0, 33.0, 44.0, 41.0, 52.0, 48.0, 36.0, 56.0, 58.0, 39.0, 48.0, 51.0, 38.0, 43.0, 35.0, 45.0, 28.0, 30.0, 23.0, 21.0, 17.0, 16.0, 11.0, 13.0, 12.0, 3.0, 4.0, 7.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.671875, -19.078125, -18.484375, -17.890625, -17.296875, -16.703125, -16.109375, -15.515625, -14.921875, -14.328125, -13.734375, -13.140625, -12.546875, -11.953125, -11.359375, -10.765625, -10.171875, -9.578125, -8.984375, -8.390625, -7.796875, -7.203125, -6.609375, -6.015625, -5.421875, -4.828125, -4.234375, -3.640625, -3.046875, -2.453125, -1.859375, -1.265625, -0.671875, -0.078125, 0.515625, 1.109375, 1.703125, 2.296875, 2.890625, 3.484375, 4.078125, 4.671875, 5.265625, 5.859375, 6.453125, 7.046875, 7.640625, 8.234375, 8.828125, 9.421875, 10.015625, 10.609375, 11.203125, 11.796875, 12.390625, 12.984375, 13.578125, 14.171875, 14.765625, 15.359375, 15.953125, 16.546875, 17.140625, 17.734375, 18.328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 4.0, 8.0, 24.0, 30.0, 36.0, 66.0, 112.0, 174.0, 333.0, 639.0, 1405.0, 3380.0, 9357.0, 34522.0, 233494.0, 658514.0, 80127.0, 16774.0, 5356.0, 2194.0, 929.0, 465.0, 250.0, 118.0, 85.0, 46.0, 32.0, 16.0, 12.0, 13.0, 5.0, 7.0, 8.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6328125, -8.337646484375, -8.04248046875, -7.747314453125, -7.4521484375, -7.156982421875, -6.86181640625, -6.566650390625, -6.271484375, -5.976318359375, -5.68115234375, -5.385986328125, -5.0908203125, -4.795654296875, -4.50048828125, -4.205322265625, -3.91015625, -3.614990234375, -3.31982421875, -3.024658203125, -2.7294921875, -2.434326171875, -2.13916015625, -1.843994140625, -1.548828125, -1.253662109375, -0.95849609375, -0.663330078125, -0.3681640625, -0.072998046875, 0.22216796875, 0.517333984375, 0.8125, 1.107666015625, 1.40283203125, 1.697998046875, 1.9931640625, 2.288330078125, 2.58349609375, 2.878662109375, 3.173828125, 3.468994140625, 3.76416015625, 4.059326171875, 4.3544921875, 4.649658203125, 4.94482421875, 5.239990234375, 5.53515625, 5.830322265625, 6.12548828125, 6.420654296875, 6.7158203125, 7.010986328125, 7.30615234375, 7.601318359375, 7.896484375, 8.191650390625, 8.48681640625, 8.781982421875, 9.0771484375, 9.372314453125, 9.66748046875, 9.962646484375, 10.2578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 3.0, 8.0, 10.0, 11.0, 18.0, 27.0, 37.0, 76.0, 96.0, 219.0, 212.0, 88.0, 63.0, 42.0, 36.0, 15.0, 12.0, 8.0, 7.0, 5.0, 0.0, 2.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016050338745117188, -0.0015380531549453735, -0.0014710724353790283, -0.001404091715812683, -0.0013371109962463379, -0.0012701302766799927, -0.0012031495571136475, -0.0011361688375473022, -0.001069188117980957, -0.0010022073984146118, -0.0009352266788482666, -0.0008682459592819214, -0.0008012652397155762, -0.000734284520149231, -0.0006673038005828857, -0.0006003230810165405, -0.0005333423614501953, -0.0004663616418838501, -0.0003993809223175049, -0.00033240020275115967, -0.00026541948318481445, -0.00019843876361846924, -0.00013145804405212402, -6.447732448577881e-05, 2.5033950805664062e-06, 6.948411464691162e-05, 0.00013646483421325684, 0.00020344555377960205, 0.00027042627334594727, 0.0003374069929122925, 0.0004043877124786377, 0.0004713684320449829, 0.0005383491516113281, 0.0006053298711776733, 0.0006723105907440186, 0.0007392913103103638, 0.000806272029876709, 0.0008732527494430542, 0.0009402334690093994, 0.0010072141885757446, 0.0010741949081420898, 0.001141175627708435, 0.0012081563472747803, 0.0012751370668411255, 0.0013421177864074707, 0.001409098505973816, 0.0014760792255401611, 0.0015430599451065063, 0.0016100406646728516, 0.0016770213842391968, 0.001744002103805542, 0.0018109828233718872, 0.0018779635429382324, 0.0019449442625045776, 0.002011924982070923, 0.002078905701637268, 0.0021458864212036133, 0.0022128671407699585, 0.0022798478603363037, 0.002346828579902649, 0.002413809299468994, 0.0024807900190353394, 0.0025477707386016846, 0.00261475145816803, 0.002681732177734375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 12.0, 6.0, 8.0, 16.0, 18.0, 21.0, 31.0, 50.0, 76.0, 129.0, 188.0, 284.0, 511.0, 918.0, 1808.0, 4555.0, 14372.0, 69949.0, 594271.0, 304893.0, 40269.0, 9471.0, 3351.0, 1413.0, 743.0, 419.0, 228.0, 142.0, 112.0, 60.0, 54.0, 41.0, 32.0, 26.0, 18.0, 9.0, 9.0, 11.0, 5.0, 1.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.21875, -9.8978271484375, -9.576904296875, -9.2559814453125, -8.93505859375, -8.6141357421875, -8.293212890625, -7.9722900390625, -7.6513671875, -7.3304443359375, -7.009521484375, -6.6885986328125, -6.36767578125, -6.0467529296875, -5.725830078125, -5.4049072265625, -5.083984375, -4.7630615234375, -4.442138671875, -4.1212158203125, -3.80029296875, -3.4793701171875, -3.158447265625, -2.8375244140625, -2.5166015625, -2.1956787109375, -1.874755859375, -1.5538330078125, -1.23291015625, -0.9119873046875, -0.591064453125, -0.2701416015625, 0.05078125, 0.3717041015625, 0.692626953125, 1.0135498046875, 1.33447265625, 1.6553955078125, 1.976318359375, 2.2972412109375, 2.6181640625, 2.9390869140625, 3.260009765625, 3.5809326171875, 3.90185546875, 4.2227783203125, 4.543701171875, 4.8646240234375, 5.185546875, 5.5064697265625, 5.827392578125, 6.1483154296875, 6.46923828125, 6.7901611328125, 7.111083984375, 7.4320068359375, 7.7529296875, 8.0738525390625, 8.394775390625, 8.7156982421875, 9.03662109375, 9.3575439453125, 9.678466796875, 9.9993896484375, 10.3203125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 2.0, 11.0, 8.0, 11.0, 16.0, 20.0, 41.0, 49.0, 58.0, 73.0, 97.0, 104.0, 109.0, 87.0, 76.0, 54.0, 39.0, 27.0, 24.0, 20.0, 9.0, 13.0, 11.0, 8.0, 10.0, 11.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.87890625, -7.60870361328125, -7.3385009765625, -7.06829833984375, -6.798095703125, -6.52789306640625, -6.2576904296875, -5.98748779296875, -5.71728515625, -5.44708251953125, -5.1768798828125, -4.90667724609375, -4.636474609375, -4.36627197265625, -4.0960693359375, -3.82586669921875, -3.5556640625, -3.28546142578125, -3.0152587890625, -2.74505615234375, -2.474853515625, -2.20465087890625, -1.9344482421875, -1.66424560546875, -1.39404296875, -1.12384033203125, -0.8536376953125, -0.58343505859375, -0.313232421875, -0.04302978515625, 0.2271728515625, 0.49737548828125, 0.767578125, 1.03778076171875, 1.3079833984375, 1.57818603515625, 1.848388671875, 2.11859130859375, 2.3887939453125, 2.65899658203125, 2.92919921875, 3.19940185546875, 3.4696044921875, 3.73980712890625, 4.010009765625, 4.28021240234375, 4.5504150390625, 4.82061767578125, 5.0908203125, 5.36102294921875, 5.6312255859375, 5.90142822265625, 6.171630859375, 6.44183349609375, 6.7120361328125, 6.98223876953125, 7.25244140625, 7.52264404296875, 7.7928466796875, 8.06304931640625, 8.333251953125, 8.60345458984375, 8.8736572265625, 9.14385986328125, 9.4140625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 9.0, 11.0, 22.0, 39.0, 60.0, 124.0, 146.0, 170.0, 160.0, 96.0, 62.0, 40.0, 25.0, 13.0, 7.0, 3.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-195.258056640625, -190.41287231445312, -185.5676727294922, -180.7224884033203, -175.87730407714844, -171.0321044921875, -166.18692016601562, -161.34173583984375, -156.49655151367188, -151.6513671875, -146.80616760253906, -141.9609832763672, -137.1157989501953, -132.27059936523438, -127.4254150390625, -122.58023071289062, -117.73503112792969, -112.88983917236328, -108.0446548461914, -103.199462890625, -98.35427856445312, -93.50908660888672, -88.66389465332031, -83.81871032714844, -78.97351837158203, -74.12832641601562, -69.28314208984375, -64.43795013427734, -59.5927619934082, -54.74757385253906, -49.902381896972656, -45.057193756103516, -40.212005615234375, -35.366817474365234, -30.52162742614746, -25.676437377929688, -20.831249237060547, -15.986061096191406, -11.140871047973633, -6.295680999755859, -1.4504928588867188, 3.3946962356567383, 8.239885330200195, 13.085074424743652, 17.93026351928711, 22.77545166015625, 27.620641708374023, 32.4658317565918, 37.31101989746094, 42.15620803833008, 47.00139617919922, 51.846588134765625, 56.691776275634766, 61.536964416503906, 66.38215637207031, 71.22734069824219, 76.0725326538086, 80.917724609375, 85.76290893554688, 90.60810089111328, 95.45329284667969, 100.29847717285156, 105.14366912841797, 109.98886108398438, 114.83404541015625]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 9.0, 5.0, 10.0, 9.0, 17.0, 16.0, 12.0, 30.0, 31.0, 27.0, 26.0, 30.0, 35.0, 32.0, 39.0, 48.0, 50.0, 57.0, 40.0, 40.0, 41.0, 40.0, 43.0, 44.0, 42.0, 32.0, 26.0, 23.0, 27.0, 23.0, 18.0, 17.0, 13.0, 13.0, 8.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-97.74896240234375, -94.64547729492188, -91.54199981689453, -88.43851470947266, -85.33503723144531, -82.23155212402344, -79.12806701660156, -76.02458953857422, -72.92110443115234, -69.81761932373047, -66.71414184570312, -63.61065673828125, -60.50717544555664, -57.40369415283203, -54.30021286010742, -51.19673156738281, -48.0932502746582, -44.989768981933594, -41.886287689208984, -38.782806396484375, -35.6793212890625, -32.57583999633789, -29.47235870361328, -26.36887550354004, -23.26539421081543, -20.16191291809082, -17.058429718017578, -13.954948425292969, -10.851466178894043, -7.747983932495117, -4.644502639770508, -1.5410194396972656, 1.5624618530273438, 4.6659440994262695, 7.769425868988037, 10.872907638549805, 13.97638988494873, 17.079872131347656, 20.183353424072266, 23.286836624145508, 26.390317916870117, 29.493799209594727, 32.59728240966797, 35.70076370239258, 38.80424499511719, 41.90773010253906, 45.011207580566406, 48.11469268798828, 51.21817398071289, 54.3216552734375, 57.42513656616211, 60.52861785888672, 63.632102966308594, 66.73558044433594, 69.83906555175781, 72.94255065917969, 76.04602813720703, 79.1495132446289, 82.25299072265625, 85.35647583007812, 88.45995330810547, 91.56343841552734, 94.66691589355469, 97.77040100097656, 100.87388610839844]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 7.0, 10.0, 13.0, 25.0, 30.0, 38.0, 65.0, 96.0, 143.0, 255.0, 449.0, 855.0, 1675.0, 4149.0, 11980.0, 55914.0, 3980080.0, 112300.0, 16434.0, 5147.0, 2120.0, 977.0, 517.0, 340.0, 187.0, 131.0, 100.0, 59.0, 36.0, 31.0, 31.0, 27.0, 9.0, 14.0, 10.0, 9.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.59375, -39.06982421875, -37.5458984375, -36.02197265625, -34.498046875, -32.97412109375, -31.4501953125, -29.92626953125, -28.40234375, -26.87841796875, -25.3544921875, -23.83056640625, -22.306640625, -20.78271484375, -19.2587890625, -17.73486328125, -16.2109375, -14.68701171875, -13.1630859375, -11.63916015625, -10.115234375, -8.59130859375, -7.0673828125, -5.54345703125, -4.01953125, -2.49560546875, -0.9716796875, 0.55224609375, 2.076171875, 3.60009765625, 5.1240234375, 6.64794921875, 8.171875, 9.69580078125, 11.2197265625, 12.74365234375, 14.267578125, 15.79150390625, 17.3154296875, 18.83935546875, 20.36328125, 21.88720703125, 23.4111328125, 24.93505859375, 26.458984375, 27.98291015625, 29.5068359375, 31.03076171875, 32.5546875, 34.07861328125, 35.6025390625, 37.12646484375, 38.650390625, 40.17431640625, 41.6982421875, 43.22216796875, 44.74609375, 46.27001953125, 47.7939453125, 49.31787109375, 50.841796875, 52.36572265625, 53.8896484375, 55.41357421875, 56.9375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 12.0, 14.0, 15.0, 19.0, 29.0, 33.0, 42.0, 44.0, 48.0, 46.0, 75.0, 74.0, 62.0, 62.0, 56.0, 56.0, 57.0, 37.0, 48.0, 34.0, 31.0, 28.0, 23.0, 12.0, 8.0, 11.0, 2.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48046875, -5.3023681640625, -5.124267578125, -4.9461669921875, -4.76806640625, -4.5899658203125, -4.411865234375, -4.2337646484375, -4.0556640625, -3.8775634765625, -3.699462890625, -3.5213623046875, -3.34326171875, -3.1651611328125, -2.987060546875, -2.8089599609375, -2.630859375, -2.4527587890625, -2.274658203125, -2.0965576171875, -1.91845703125, -1.7403564453125, -1.562255859375, -1.3841552734375, -1.2060546875, -1.0279541015625, -0.849853515625, -0.6717529296875, -0.49365234375, -0.3155517578125, -0.137451171875, 0.0406494140625, 0.21875, 0.3968505859375, 0.574951171875, 0.7530517578125, 0.93115234375, 1.1092529296875, 1.287353515625, 1.4654541015625, 1.6435546875, 1.8216552734375, 1.999755859375, 2.1778564453125, 2.35595703125, 2.5340576171875, 2.712158203125, 2.8902587890625, 3.068359375, 3.2464599609375, 3.424560546875, 3.6026611328125, 3.78076171875, 3.9588623046875, 4.136962890625, 4.3150634765625, 4.4931640625, 4.6712646484375, 4.849365234375, 5.0274658203125, 5.20556640625, 5.3836669921875, 5.561767578125, 5.7398681640625, 5.91796875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 6.0, 10.0, 9.0, 14.0, 21.0, 25.0, 40.0, 69.0, 88.0, 116.0, 182.0, 250.0, 380.0, 584.0, 869.0, 1312.0, 2052.0, 3297.0, 5603.0, 10675.0, 24189.0, 75058.0, 976771.0, 2943802.0, 93323.0, 27753.0, 11964.0, 5967.0, 3524.0, 2161.0, 1351.0, 913.0, 611.0, 393.0, 298.0, 202.0, 116.0, 93.0, 56.0, 40.0, 28.0, 26.0, 18.0, 5.0, 8.0, 4.0, 3.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.671875, -16.098388671875, -15.52490234375, -14.951416015625, -14.3779296875, -13.804443359375, -13.23095703125, -12.657470703125, -12.083984375, -11.510498046875, -10.93701171875, -10.363525390625, -9.7900390625, -9.216552734375, -8.64306640625, -8.069580078125, -7.49609375, -6.922607421875, -6.34912109375, -5.775634765625, -5.2021484375, -4.628662109375, -4.05517578125, -3.481689453125, -2.908203125, -2.334716796875, -1.76123046875, -1.187744140625, -0.6142578125, -0.040771484375, 0.53271484375, 1.106201171875, 1.6796875, 2.253173828125, 2.82666015625, 3.400146484375, 3.9736328125, 4.547119140625, 5.12060546875, 5.694091796875, 6.267578125, 6.841064453125, 7.41455078125, 7.988037109375, 8.5615234375, 9.135009765625, 9.70849609375, 10.281982421875, 10.85546875, 11.428955078125, 12.00244140625, 12.575927734375, 13.1494140625, 13.722900390625, 14.29638671875, 14.869873046875, 15.443359375, 16.016845703125, 16.59033203125, 17.163818359375, 17.7373046875, 18.310791015625, 18.88427734375, 19.457763671875, 20.03125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 13.0, 11.0, 14.0, 14.0, 26.0, 26.0, 31.0, 47.0, 89.0, 147.0, 416.0, 2279.0, 524.0, 145.0, 86.0, 55.0, 34.0, 20.0, 10.0, 15.0, 16.0, 10.0, 7.0, 1.0, 7.0, 2.0, 3.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.65625, -9.3179931640625, -8.979736328125, -8.6414794921875, -8.30322265625, -7.9649658203125, -7.626708984375, -7.2884521484375, -6.9501953125, -6.6119384765625, -6.273681640625, -5.9354248046875, -5.59716796875, -5.2589111328125, -4.920654296875, -4.5823974609375, -4.244140625, -3.9058837890625, -3.567626953125, -3.2293701171875, -2.89111328125, -2.5528564453125, -2.214599609375, -1.8763427734375, -1.5380859375, -1.1998291015625, -0.861572265625, -0.5233154296875, -0.18505859375, 0.1531982421875, 0.491455078125, 0.8297119140625, 1.16796875, 1.5062255859375, 1.844482421875, 2.1827392578125, 2.52099609375, 2.8592529296875, 3.197509765625, 3.5357666015625, 3.8740234375, 4.2122802734375, 4.550537109375, 4.8887939453125, 5.22705078125, 5.5653076171875, 5.903564453125, 6.2418212890625, 6.580078125, 6.9183349609375, 7.256591796875, 7.5948486328125, 7.93310546875, 8.2713623046875, 8.609619140625, 8.9478759765625, 9.2861328125, 9.6243896484375, 9.962646484375, 10.3009033203125, 10.63916015625, 10.9774169921875, 11.315673828125, 11.6539306640625, 11.9921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 20.0, 39.0, 70.0, 246.0, 289.0, 212.0, 74.0, 27.0, 10.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-197.39710998535156, -193.25624084472656, -189.11537170410156, -184.97450256347656, -180.8336181640625, -176.6927490234375, -172.5518798828125, -168.4110107421875, -164.2701416015625, -160.1292724609375, -155.9884033203125, -151.8475341796875, -147.7066650390625, -143.56578063964844, -139.42491149902344, -135.28404235839844, -131.14317321777344, -127.00230407714844, -122.86143493652344, -118.7205581665039, -114.5796890258789, -110.4388198852539, -106.29794311523438, -102.15707397460938, -98.01620483398438, -93.87533569335938, -89.73446655273438, -85.59358978271484, -81.45272064208984, -77.31185150146484, -73.17097473144531, -69.03010559082031, -64.88924407958984, -60.748374938964844, -56.60750198364258, -52.46662902832031, -48.32575988769531, -44.18489074707031, -40.04401779174805, -35.90314483642578, -31.76227569580078, -27.62140464782715, -23.480533599853516, -19.339662551879883, -15.19879150390625, -11.057920455932617, -6.917049407958984, -2.7761783599853516, 1.3646926879882812, 5.505563735961914, 9.646434783935547, 13.78730583190918, 17.928176879882812, 22.069047927856445, 26.209918975830078, 30.35079002380371, 34.491661071777344, 38.632530212402344, 42.77340316772461, 46.914276123046875, 51.055145263671875, 55.196014404296875, 59.33688735961914, 63.477760314941406, 67.6186294555664]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 5.0, 14.0, 17.0, 13.0, 18.0, 21.0, 28.0, 24.0, 26.0, 29.0, 42.0, 42.0, 45.0, 46.0, 41.0, 52.0, 60.0, 53.0, 49.0, 39.0, 40.0, 24.0, 43.0, 29.0, 32.0, 21.0, 21.0, 27.0, 24.0, 16.0, 9.0, 9.0, 7.0, 8.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-40.072574615478516, -39.00344467163086, -37.93431854248047, -36.86518859863281, -35.796058654785156, -34.7269287109375, -33.65780258178711, -32.58867263793945, -31.51954460144043, -30.450416564941406, -29.38128662109375, -28.312158584594727, -27.243030548095703, -26.173900604248047, -25.104772567749023, -24.03564453125, -22.966514587402344, -21.89738655090332, -20.828256607055664, -19.75912857055664, -18.689998626708984, -17.62087059020996, -16.551742553710938, -15.482613563537598, -14.413484573364258, -13.344355583190918, -12.275226593017578, -11.206098556518555, -10.136969566345215, -9.067840576171875, -7.998712062835693, -6.929583549499512, -5.860450744628906, -4.791321754455566, -3.7221932411193848, -2.653064489364624, -1.5839357376098633, -0.5148067474365234, 0.5543217658996582, 1.6234502792358398, 2.6925792694091797, 3.7617080211639404, 4.830836772918701, 5.899965286254883, 6.969094276428223, 8.038223266601562, 9.107351303100586, 10.176480293273926, 11.245609283447266, 12.314738273620605, 13.383867263793945, 14.452995300292969, 15.522124290466309, 16.59125328063965, 17.660381317138672, 18.729511260986328, 19.79863929748535, 20.867767333984375, 21.93689727783203, 23.006025314331055, 24.075153350830078, 25.144283294677734, 26.213411331176758, 27.28253936767578, 28.351669311523438]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 11.0, 14.0, 10.0, 21.0, 25.0, 46.0, 52.0, 83.0, 117.0, 222.0, 308.0, 501.0, 840.0, 1651.0, 3271.0, 8454.0, 27861.0, 135063.0, 569304.0, 236115.0, 43762.0, 11892.0, 4397.0, 1992.0, 980.0, 529.0, 352.0, 200.0, 154.0, 84.0, 60.0, 52.0, 27.0, 29.0, 19.0, 14.0, 8.0, 12.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-24.40625, -23.610107421875, -22.81396484375, -22.017822265625, -21.2216796875, -20.425537109375, -19.62939453125, -18.833251953125, -18.037109375, -17.240966796875, -16.44482421875, -15.648681640625, -14.8525390625, -14.056396484375, -13.26025390625, -12.464111328125, -11.66796875, -10.871826171875, -10.07568359375, -9.279541015625, -8.4833984375, -7.687255859375, -6.89111328125, -6.094970703125, -5.298828125, -4.502685546875, -3.70654296875, -2.910400390625, -2.1142578125, -1.318115234375, -0.52197265625, 0.274169921875, 1.0703125, 1.866455078125, 2.66259765625, 3.458740234375, 4.2548828125, 5.051025390625, 5.84716796875, 6.643310546875, 7.439453125, 8.235595703125, 9.03173828125, 9.827880859375, 10.6240234375, 11.420166015625, 12.21630859375, 13.012451171875, 13.80859375, 14.604736328125, 15.40087890625, 16.197021484375, 16.9931640625, 17.789306640625, 18.58544921875, 19.381591796875, 20.177734375, 20.973876953125, 21.77001953125, 22.566162109375, 23.3623046875, 24.158447265625, 24.95458984375, 25.750732421875, 26.546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 10.0, 11.0, 13.0, 22.0, 19.0, 27.0, 33.0, 40.0, 45.0, 51.0, 70.0, 47.0, 58.0, 60.0, 67.0, 76.0, 53.0, 61.0, 46.0, 45.0, 24.0, 27.0, 25.0, 24.0, 13.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.91796875, -5.7415771484375, -5.565185546875, -5.3887939453125, -5.21240234375, -5.0360107421875, -4.859619140625, -4.6832275390625, -4.5068359375, -4.3304443359375, -4.154052734375, -3.9776611328125, -3.80126953125, -3.6248779296875, -3.448486328125, -3.2720947265625, -3.095703125, -2.9193115234375, -2.742919921875, -2.5665283203125, -2.39013671875, -2.2137451171875, -2.037353515625, -1.8609619140625, -1.6845703125, -1.5081787109375, -1.331787109375, -1.1553955078125, -0.97900390625, -0.8026123046875, -0.626220703125, -0.4498291015625, -0.2734375, -0.0970458984375, 0.079345703125, 0.2557373046875, 0.43212890625, 0.6085205078125, 0.784912109375, 0.9613037109375, 1.1376953125, 1.3140869140625, 1.490478515625, 1.6668701171875, 1.84326171875, 2.0196533203125, 2.196044921875, 2.3724365234375, 2.548828125, 2.7252197265625, 2.901611328125, 3.0780029296875, 3.25439453125, 3.4307861328125, 3.607177734375, 3.7835693359375, 3.9599609375, 4.1363525390625, 4.312744140625, 4.4891357421875, 4.66552734375, 4.8419189453125, 5.018310546875, 5.1947021484375, 5.37109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 4.0, 10.0, 7.0, 10.0, 14.0, 14.0, 21.0, 33.0, 46.0, 61.0, 96.0, 134.0, 225.0, 337.0, 562.0, 1018.0, 2174.0, 6814.0, 34763.0, 315350.0, 596067.0, 73126.0, 11456.0, 3078.0, 1327.0, 693.0, 392.0, 220.0, 142.0, 96.0, 77.0, 54.0, 34.0, 28.0, 21.0, 17.0, 10.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.8125, -26.998779296875, -26.18505859375, -25.371337890625, -24.5576171875, -23.743896484375, -22.93017578125, -22.116455078125, -21.302734375, -20.489013671875, -19.67529296875, -18.861572265625, -18.0478515625, -17.234130859375, -16.42041015625, -15.606689453125, -14.79296875, -13.979248046875, -13.16552734375, -12.351806640625, -11.5380859375, -10.724365234375, -9.91064453125, -9.096923828125, -8.283203125, -7.469482421875, -6.65576171875, -5.842041015625, -5.0283203125, -4.214599609375, -3.40087890625, -2.587158203125, -1.7734375, -0.959716796875, -0.14599609375, 0.667724609375, 1.4814453125, 2.295166015625, 3.10888671875, 3.922607421875, 4.736328125, 5.550048828125, 6.36376953125, 7.177490234375, 7.9912109375, 8.804931640625, 9.61865234375, 10.432373046875, 11.24609375, 12.059814453125, 12.87353515625, 13.687255859375, 14.5009765625, 15.314697265625, 16.12841796875, 16.942138671875, 17.755859375, 18.569580078125, 19.38330078125, 20.197021484375, 21.0107421875, 21.824462890625, 22.63818359375, 23.451904296875, 24.265625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 4.0, 4.0, 10.0, 3.0, 7.0, 11.0, 17.0, 17.0, 11.0, 15.0, 24.0, 17.0, 30.0, 29.0, 30.0, 32.0, 48.0, 29.0, 41.0, 46.0, 32.0, 46.0, 48.0, 38.0, 43.0, 46.0, 40.0, 41.0, 28.0, 21.0, 28.0, 25.0, 29.0, 17.0, 18.0, 13.0, 14.0, 11.0, 8.0, 13.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.375, -17.820068359375, -17.26513671875, -16.710205078125, -16.1552734375, -15.600341796875, -15.04541015625, -14.490478515625, -13.935546875, -13.380615234375, -12.82568359375, -12.270751953125, -11.7158203125, -11.160888671875, -10.60595703125, -10.051025390625, -9.49609375, -8.941162109375, -8.38623046875, -7.831298828125, -7.2763671875, -6.721435546875, -6.16650390625, -5.611572265625, -5.056640625, -4.501708984375, -3.94677734375, -3.391845703125, -2.8369140625, -2.281982421875, -1.72705078125, -1.172119140625, -0.6171875, -0.062255859375, 0.49267578125, 1.047607421875, 1.6025390625, 2.157470703125, 2.71240234375, 3.267333984375, 3.822265625, 4.377197265625, 4.93212890625, 5.487060546875, 6.0419921875, 6.596923828125, 7.15185546875, 7.706787109375, 8.26171875, 8.816650390625, 9.37158203125, 9.926513671875, 10.4814453125, 11.036376953125, 11.59130859375, 12.146240234375, 12.701171875, 13.256103515625, 13.81103515625, 14.365966796875, 14.9208984375, 15.475830078125, 16.03076171875, 16.585693359375, 17.140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 0.0, 4.0, 7.0, 5.0, 11.0, 21.0, 23.0, 35.0, 66.0, 88.0, 152.0, 280.0, 550.0, 1391.0, 3530.0, 10706.0, 46058.0, 350298.0, 541726.0, 71206.0, 14782.0, 4476.0, 1639.0, 694.0, 355.0, 160.0, 109.0, 75.0, 36.0, 28.0, 12.0, 9.0, 8.0, 2.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.03125, -8.6717529296875, -8.312255859375, -7.9527587890625, -7.59326171875, -7.2337646484375, -6.874267578125, -6.5147705078125, -6.1552734375, -5.7957763671875, -5.436279296875, -5.0767822265625, -4.71728515625, -4.3577880859375, -3.998291015625, -3.6387939453125, -3.279296875, -2.9197998046875, -2.560302734375, -2.2008056640625, -1.84130859375, -1.4818115234375, -1.122314453125, -0.7628173828125, -0.4033203125, -0.0438232421875, 0.315673828125, 0.6751708984375, 1.03466796875, 1.3941650390625, 1.753662109375, 2.1131591796875, 2.47265625, 2.8321533203125, 3.191650390625, 3.5511474609375, 3.91064453125, 4.2701416015625, 4.629638671875, 4.9891357421875, 5.3486328125, 5.7081298828125, 6.067626953125, 6.4271240234375, 6.78662109375, 7.1461181640625, 7.505615234375, 7.8651123046875, 8.224609375, 8.5841064453125, 8.943603515625, 9.3031005859375, 9.66259765625, 10.0220947265625, 10.381591796875, 10.7410888671875, 11.1005859375, 11.4600830078125, 11.819580078125, 12.1790771484375, 12.53857421875, 12.8980712890625, 13.257568359375, 13.6170654296875, 13.9765625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 5.0, 7.0, 10.0, 6.0, 10.0, 25.0, 33.0, 49.0, 61.0, 95.0, 114.0, 132.0, 103.0, 103.0, 71.0, 45.0, 40.0, 12.0, 19.0, 8.0, 19.0, 9.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014286041259765625, -0.0013805478811264038, -0.0013324916362762451, -0.0012844353914260864, -0.0012363791465759277, -0.001188322901725769, -0.0011402666568756104, -0.0010922104120254517, -0.001044154167175293, -0.0009960979223251343, -0.0009480416774749756, -0.0008999854326248169, -0.0008519291877746582, -0.0008038729429244995, -0.0007558166980743408, -0.0007077604532241821, -0.0006597042083740234, -0.0006116479635238647, -0.0005635917186737061, -0.0005155354738235474, -0.00046747922897338867, -0.00041942298412323, -0.0003713667392730713, -0.0003233104944229126, -0.0002752542495727539, -0.00022719800472259521, -0.00017914175987243652, -0.00013108551502227783, -8.302927017211914e-05, -3.497302532196045e-05, 1.3083219528198242e-05, 6.113946437835693e-05, 0.00010919570922851562, 0.00015725195407867432, 0.000205308198928833, 0.0002533644437789917, 0.0003014206886291504, 0.0003494769334793091, 0.0003975331783294678, 0.00044558942317962646, 0.0004936456680297852, 0.0005417019128799438, 0.0005897581577301025, 0.0006378144025802612, 0.0006858706474304199, 0.0007339268922805786, 0.0007819831371307373, 0.000830039381980896, 0.0008780956268310547, 0.0009261518716812134, 0.0009742081165313721, 0.0010222643613815308, 0.0010703206062316895, 0.0011183768510818481, 0.0011664330959320068, 0.0012144893407821655, 0.0012625455856323242, 0.001310601830482483, 0.0013586580753326416, 0.0014067143201828003, 0.001454770565032959, 0.0015028268098831177, 0.0015508830547332764, 0.001598939299583435, 0.0016469955444335938]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 5.0, 10.0, 11.0, 19.0, 17.0, 20.0, 36.0, 43.0, 51.0, 72.0, 142.0, 192.0, 339.0, 592.0, 1075.0, 2262.0, 4891.0, 13716.0, 48985.0, 273012.0, 554522.0, 108749.0, 24690.0, 8248.0, 3315.0, 1528.0, 812.0, 437.0, 237.0, 140.0, 109.0, 57.0, 40.0, 46.0, 30.0, 29.0, 18.0, 10.0, 8.0, 6.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.1796875, -9.87353515625, -9.5673828125, -9.26123046875, -8.955078125, -8.64892578125, -8.3427734375, -8.03662109375, -7.73046875, -7.42431640625, -7.1181640625, -6.81201171875, -6.505859375, -6.19970703125, -5.8935546875, -5.58740234375, -5.28125, -4.97509765625, -4.6689453125, -4.36279296875, -4.056640625, -3.75048828125, -3.4443359375, -3.13818359375, -2.83203125, -2.52587890625, -2.2197265625, -1.91357421875, -1.607421875, -1.30126953125, -0.9951171875, -0.68896484375, -0.3828125, -0.07666015625, 0.2294921875, 0.53564453125, 0.841796875, 1.14794921875, 1.4541015625, 1.76025390625, 2.06640625, 2.37255859375, 2.6787109375, 2.98486328125, 3.291015625, 3.59716796875, 3.9033203125, 4.20947265625, 4.515625, 4.82177734375, 5.1279296875, 5.43408203125, 5.740234375, 6.04638671875, 6.3525390625, 6.65869140625, 6.96484375, 7.27099609375, 7.5771484375, 7.88330078125, 8.189453125, 8.49560546875, 8.8017578125, 9.10791015625, 9.4140625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 1.0, 3.0, 5.0, 2.0, 4.0, 8.0, 7.0, 4.0, 9.0, 19.0, 15.0, 27.0, 24.0, 22.0, 46.0, 61.0, 68.0, 92.0, 95.0, 94.0, 74.0, 74.0, 56.0, 49.0, 42.0, 21.0, 19.0, 11.0, 8.0, 11.0, 6.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.3203125, -8.0498046875, -7.779296875, -7.5087890625, -7.23828125, -6.9677734375, -6.697265625, -6.4267578125, -6.15625, -5.8857421875, -5.615234375, -5.3447265625, -5.07421875, -4.8037109375, -4.533203125, -4.2626953125, -3.9921875, -3.7216796875, -3.451171875, -3.1806640625, -2.91015625, -2.6396484375, -2.369140625, -2.0986328125, -1.828125, -1.5576171875, -1.287109375, -1.0166015625, -0.74609375, -0.4755859375, -0.205078125, 0.0654296875, 0.3359375, 0.6064453125, 0.876953125, 1.1474609375, 1.41796875, 1.6884765625, 1.958984375, 2.2294921875, 2.5, 2.7705078125, 3.041015625, 3.3115234375, 3.58203125, 3.8525390625, 4.123046875, 4.3935546875, 4.6640625, 4.9345703125, 5.205078125, 5.4755859375, 5.74609375, 6.0166015625, 6.287109375, 6.5576171875, 6.828125, 7.0986328125, 7.369140625, 7.6396484375, 7.91015625, 8.1806640625, 8.451171875, 8.7216796875, 8.9921875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 11.0, 3.0, 10.0, 20.0, 31.0, 45.0, 66.0, 98.0, 114.0, 114.0, 108.0, 104.0, 87.0, 51.0, 50.0, 25.0, 24.0, 10.0, 8.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.4216079711914, -101.90574645996094, -98.389892578125, -94.87403106689453, -91.3581771850586, -87.84231567382812, -84.32646179199219, -80.81060028076172, -77.29473876953125, -73.77887725830078, -70.26302337646484, -66.74716186523438, -63.23130798339844, -59.71544647216797, -56.199588775634766, -52.68373107910156, -49.167877197265625, -45.65201950073242, -42.13616180419922, -38.62030029296875, -35.10444641113281, -31.588586807250977, -28.07272720336914, -24.556869506835938, -21.041011810302734, -17.52515411376953, -14.009295463562012, -10.493436813354492, -6.977579116821289, -3.461721420288086, 0.05413818359375, 3.569995880126953, 7.0858612060546875, 10.60171890258789, 14.11757755279541, 17.63343620300293, 21.149293899536133, 24.665151596069336, 28.181011199951172, 31.696868896484375, 35.21272659301758, 38.72858428955078, 42.244441986083984, 45.76029968261719, 49.276161193847656, 52.792015075683594, 56.30787658691406, 59.823734283447266, 63.33959197998047, 66.85545349121094, 70.37130737304688, 73.88716888427734, 77.40302276611328, 80.91888427734375, 84.43473815917969, 87.95059967041016, 91.46646118164062, 94.9823226928711, 98.49817657470703, 102.0140380859375, 105.52989196777344, 109.0457534790039, 112.56161499023438, 116.07746887207031, 119.59332275390625]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 8.0, 14.0, 8.0, 17.0, 29.0, 25.0, 27.0, 40.0, 30.0, 28.0, 46.0, 44.0, 42.0, 59.0, 54.0, 52.0, 56.0, 51.0, 55.0, 57.0, 36.0, 49.0, 29.0, 27.0, 25.0, 19.0, 18.0, 8.0, 10.0, 7.0, 4.0, 7.0, 7.0, 3.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.14005279541016, -84.6661376953125, -81.19221496582031, -77.71829986572266, -74.244384765625, -70.77046203613281, -67.29654693603516, -63.8226318359375, -60.34871292114258, -56.874794006347656, -53.40087890625, -49.92695999145508, -46.453041076660156, -42.9791259765625, -39.50520706176758, -36.031288146972656, -32.557373046875, -29.08345603942871, -25.609539031982422, -22.1356201171875, -18.66170310974121, -15.187786102294922, -11.7138671875, -8.239950180053711, -4.766033172607422, -1.2921156883239746, 2.1818017959594727, 5.655719757080078, 9.129636764526367, 12.603553771972656, 16.077472686767578, 19.551389694213867, 23.025299072265625, 26.499216079711914, 29.973133087158203, 33.447052001953125, 36.92096710205078, 40.3948860168457, 43.868804931640625, 47.34272003173828, 50.8166389465332, 54.290557861328125, 57.76447296142578, 61.2383918762207, 64.71231079101562, 68.18622589111328, 71.66014099121094, 75.13406372070312, 78.60797882080078, 82.08189392089844, 85.55581665039062, 89.02973175048828, 92.50364685058594, 95.97756958007812, 99.45148468017578, 102.92539978027344, 106.39932250976562, 109.87323760986328, 113.34716033935547, 116.82107543945312, 120.29499053955078, 123.76890563964844, 127.24282836914062, 130.7167510986328, 134.19065856933594]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 10.0, 7.0, 9.0, 13.0, 20.0, 24.0, 66.0, 94.0, 149.0, 278.0, 773.0, 2941.0, 3900596.0, 285213.0, 2674.0, 690.0, 292.0, 166.0, 89.0, 59.0, 37.0, 20.0, 14.0, 12.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.875, -87.7392578125, -84.603515625, -81.4677734375, -78.33203125, -75.1962890625, -72.060546875, -68.9248046875, -65.7890625, -62.6533203125, -59.517578125, -56.3818359375, -53.24609375, -50.1103515625, -46.974609375, -43.8388671875, -40.703125, -37.5673828125, -34.431640625, -31.2958984375, -28.16015625, -25.0244140625, -21.888671875, -18.7529296875, -15.6171875, -12.4814453125, -9.345703125, -6.2099609375, -3.07421875, 0.0615234375, 3.197265625, 6.3330078125, 9.46875, 12.6044921875, 15.740234375, 18.8759765625, 22.01171875, 25.1474609375, 28.283203125, 31.4189453125, 34.5546875, 37.6904296875, 40.826171875, 43.9619140625, 47.09765625, 50.2333984375, 53.369140625, 56.5048828125, 59.640625, 62.7763671875, 65.912109375, 69.0478515625, 72.18359375, 75.3193359375, 78.455078125, 81.5908203125, 84.7265625, 87.8623046875, 90.998046875, 94.1337890625, 97.26953125, 100.4052734375, 103.541015625, 106.6767578125, 109.8125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 7.0, 11.0, 10.0, 19.0, 23.0, 17.0, 38.0, 40.0, 46.0, 52.0, 59.0, 55.0, 64.0, 63.0, 52.0, 69.0, 62.0, 44.0, 50.0, 37.0, 39.0, 32.0, 26.0, 23.0, 11.0, 13.0, 13.0, 7.0, 5.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3515625, -6.15264892578125, -5.9537353515625, -5.75482177734375, -5.555908203125, -5.35699462890625, -5.1580810546875, -4.95916748046875, -4.76025390625, -4.56134033203125, -4.3624267578125, -4.16351318359375, -3.964599609375, -3.76568603515625, -3.5667724609375, -3.36785888671875, -3.1689453125, -2.97003173828125, -2.7711181640625, -2.57220458984375, -2.373291015625, -2.17437744140625, -1.9754638671875, -1.77655029296875, -1.57763671875, -1.37872314453125, -1.1798095703125, -0.98089599609375, -0.781982421875, -0.58306884765625, -0.3841552734375, -0.18524169921875, 0.013671875, 0.21258544921875, 0.4114990234375, 0.61041259765625, 0.809326171875, 1.00823974609375, 1.2071533203125, 1.40606689453125, 1.60498046875, 1.80389404296875, 2.0028076171875, 2.20172119140625, 2.400634765625, 2.59954833984375, 2.7984619140625, 2.99737548828125, 3.1962890625, 3.39520263671875, 3.5941162109375, 3.79302978515625, 3.991943359375, 4.19085693359375, 4.3897705078125, 4.58868408203125, 4.78759765625, 4.98651123046875, 5.1854248046875, 5.38433837890625, 5.583251953125, 5.78216552734375, 5.9810791015625, 6.17999267578125, 6.37890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 6.0, 7.0, 8.0, 12.0, 20.0, 32.0, 38.0, 49.0, 97.0, 124.0, 184.0, 308.0, 597.0, 1250.0, 4103.0, 392779.0, 3787251.0, 4687.0, 1207.0, 616.0, 333.0, 197.0, 128.0, 75.0, 40.0, 45.0, 30.0, 16.0, 11.0, 12.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.3125, -61.33544921875, -59.3583984375, -57.38134765625, -55.404296875, -53.42724609375, -51.4501953125, -49.47314453125, -47.49609375, -45.51904296875, -43.5419921875, -41.56494140625, -39.587890625, -37.61083984375, -35.6337890625, -33.65673828125, -31.6796875, -29.70263671875, -27.7255859375, -25.74853515625, -23.771484375, -21.79443359375, -19.8173828125, -17.84033203125, -15.86328125, -13.88623046875, -11.9091796875, -9.93212890625, -7.955078125, -5.97802734375, -4.0009765625, -2.02392578125, -0.046875, 1.93017578125, 3.9072265625, 5.88427734375, 7.861328125, 9.83837890625, 11.8154296875, 13.79248046875, 15.76953125, 17.74658203125, 19.7236328125, 21.70068359375, 23.677734375, 25.65478515625, 27.6318359375, 29.60888671875, 31.5859375, 33.56298828125, 35.5400390625, 37.51708984375, 39.494140625, 41.47119140625, 43.4482421875, 45.42529296875, 47.40234375, 49.37939453125, 51.3564453125, 53.33349609375, 55.310546875, 57.28759765625, 59.2646484375, 61.24169921875, 63.21875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 3.0, 15.0, 30.0, 120.0, 3629.0, 180.0, 44.0, 19.0, 10.0, 8.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5703125, -7.33807373046875, -7.1058349609375, -6.87359619140625, -6.641357421875, -6.40911865234375, -6.1768798828125, -5.94464111328125, -5.71240234375, -5.48016357421875, -5.2479248046875, -5.01568603515625, -4.783447265625, -4.55120849609375, -4.3189697265625, -4.08673095703125, -3.8544921875, -3.62225341796875, -3.3900146484375, -3.15777587890625, -2.925537109375, -2.69329833984375, -2.4610595703125, -2.22882080078125, -1.99658203125, -1.76434326171875, -1.5321044921875, -1.29986572265625, -1.067626953125, -0.83538818359375, -0.6031494140625, -0.37091064453125, -0.138671875, 0.09356689453125, 0.3258056640625, 0.55804443359375, 0.790283203125, 1.02252197265625, 1.2547607421875, 1.48699951171875, 1.71923828125, 1.95147705078125, 2.1837158203125, 2.41595458984375, 2.648193359375, 2.88043212890625, 3.1126708984375, 3.34490966796875, 3.5771484375, 3.80938720703125, 4.0416259765625, 4.27386474609375, 4.506103515625, 4.73834228515625, 4.9705810546875, 5.20281982421875, 5.43505859375, 5.66729736328125, 5.8995361328125, 6.13177490234375, 6.364013671875, 6.59625244140625, 6.8284912109375, 7.06072998046875, 7.29296875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 3.0, 7.0, 8.0, 8.0, 9.0, 10.0, 10.0, 20.0, 21.0, 30.0, 34.0, 39.0, 52.0, 76.0, 103.0, 106.0, 106.0, 103.0, 70.0, 40.0, 36.0, 30.0, 22.0, 13.0, 10.0, 10.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.97657585144043, -19.404468536376953, -18.83236312866211, -18.260255813598633, -17.688148498535156, -17.11604118347168, -16.543933868408203, -15.97182846069336, -15.399721145629883, -14.827613830566406, -14.255507469177246, -13.683401107788086, -13.11129379272461, -12.539186477661133, -11.967080116271973, -11.394973754882812, -10.822866439819336, -10.25075912475586, -9.6786527633667, -9.106546401977539, -8.534439086914062, -7.962332248687744, -7.390225410461426, -6.818118572235107, -6.246011734008789, -5.673904895782471, -5.101798057556152, -4.529691219329834, -3.9575843811035156, -3.3854775428771973, -2.813370704650879, -2.2412638664245605, -1.669158935546875, -1.0970520973205566, -0.5249452590942383, 0.04716157913208008, 0.6192684173583984, 1.1913752555847168, 1.7634820938110352, 2.3355889320373535, 2.907695770263672, 3.4798026084899902, 4.051909446716309, 4.624016284942627, 5.196123123168945, 5.768229961395264, 6.340336799621582, 6.9124436378479, 7.484550476074219, 8.056657791137695, 8.628764152526855, 9.200870513916016, 9.772977828979492, 10.345085144042969, 10.917191505432129, 11.489297866821289, 12.061405181884766, 12.633512496948242, 13.205618858337402, 13.777725219726562, 14.349832534790039, 14.921939849853516, 15.494046211242676, 16.066152572631836, 16.638259887695312]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 3.0, 10.0, 7.0, 11.0, 12.0, 7.0, 7.0, 9.0, 13.0, 18.0, 12.0, 19.0, 17.0, 20.0, 29.0, 29.0, 37.0, 40.0, 34.0, 33.0, 38.0, 43.0, 37.0, 40.0, 37.0, 34.0, 26.0, 23.0, 32.0, 35.0, 31.0, 25.0, 37.0, 22.0, 15.0, 26.0, 18.0, 17.0, 8.0, 22.0, 11.0, 7.0, 9.0, 6.0, 4.0, 6.0, 4.0, 6.0, 4.0, 1.0, 1.0, 5.0, 3.0, 0.0, 2.0], "bins": [-8.951093673706055, -8.668628692626953, -8.386163711547852, -8.103697776794434, -7.821232795715332, -7.5387678146362305, -7.256302833557129, -6.973837852478027, -6.691372394561768, -6.408907413482666, -6.126441955566406, -5.843976974487305, -5.561511993408203, -5.279046535491943, -4.996581554412842, -4.714116096496582, -4.4316511154174805, -4.149186134338379, -3.866720676422119, -3.5842556953430176, -3.301790475845337, -3.0193252563476562, -2.7368602752685547, -2.454395055770874, -2.1719298362731934, -1.8894646167755127, -1.6069995164871216, -1.3245344161987305, -1.0420691967010498, -0.7596039772033691, -0.477138876914978, -0.19467377662658691, 0.08779239654541016, 0.37025755643844604, 0.6527227163314819, 0.9351878762245178, 1.2176530361175537, 1.5001182556152344, 1.7825833559036255, 2.0650484561920166, 2.3475136756896973, 2.629978895187378, 2.9124441146850586, 3.19490909576416, 3.477374315261841, 3.7598395347595215, 4.042304515838623, 4.324769973754883, 4.607234954833984, 4.889699935913086, 5.172165393829346, 5.454630374908447, 5.737095832824707, 6.019560813903809, 6.30202579498291, 6.584490776062012, 6.8669562339782715, 7.149421215057373, 7.431886672973633, 7.714351654052734, 7.996816635131836, 8.279281616210938, 8.561747550964355, 8.844212532043457, 9.126677513122559]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 11.0, 10.0, 10.0, 15.0, 16.0, 40.0, 51.0, 72.0, 89.0, 119.0, 199.0, 295.0, 427.0, 716.0, 1104.0, 1974.0, 3727.0, 7294.0, 16379.0, 40521.0, 112877.0, 302150.0, 338226.0, 136931.0, 48071.0, 19087.0, 8600.0, 4042.0, 2204.0, 1155.0, 718.0, 432.0, 296.0, 239.0, 133.0, 82.0, 66.0, 41.0, 25.0, 38.0, 17.0, 16.0, 8.0, 8.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-16.28125, -15.7891845703125, -15.297119140625, -14.8050537109375, -14.31298828125, -13.8209228515625, -13.328857421875, -12.8367919921875, -12.3447265625, -11.8526611328125, -11.360595703125, -10.8685302734375, -10.37646484375, -9.8843994140625, -9.392333984375, -8.9002685546875, -8.408203125, -7.9161376953125, -7.424072265625, -6.9320068359375, -6.43994140625, -5.9478759765625, -5.455810546875, -4.9637451171875, -4.4716796875, -3.9796142578125, -3.487548828125, -2.9954833984375, -2.50341796875, -2.0113525390625, -1.519287109375, -1.0272216796875, -0.53515625, -0.0430908203125, 0.448974609375, 0.9410400390625, 1.43310546875, 1.9251708984375, 2.417236328125, 2.9093017578125, 3.4013671875, 3.8934326171875, 4.385498046875, 4.8775634765625, 5.36962890625, 5.8616943359375, 6.353759765625, 6.8458251953125, 7.337890625, 7.8299560546875, 8.322021484375, 8.8140869140625, 9.30615234375, 9.7982177734375, 10.290283203125, 10.7823486328125, 11.2744140625, 11.7664794921875, 12.258544921875, 12.7506103515625, 13.24267578125, 13.7347412109375, 14.226806640625, 14.7188720703125, 15.2109375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 8.0, 6.0, 8.0, 14.0, 18.0, 14.0, 30.0, 26.0, 33.0, 33.0, 45.0, 46.0, 55.0, 60.0, 46.0, 66.0, 54.0, 61.0, 48.0, 57.0, 35.0, 48.0, 33.0, 37.0, 28.0, 17.0, 21.0, 10.0, 12.0, 7.0, 5.0, 8.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.69140625, -6.49493408203125, -6.2984619140625, -6.10198974609375, -5.905517578125, -5.70904541015625, -5.5125732421875, -5.31610107421875, -5.11962890625, -4.92315673828125, -4.7266845703125, -4.53021240234375, -4.333740234375, -4.13726806640625, -3.9407958984375, -3.74432373046875, -3.5478515625, -3.35137939453125, -3.1549072265625, -2.95843505859375, -2.761962890625, -2.56549072265625, -2.3690185546875, -2.17254638671875, -1.97607421875, -1.77960205078125, -1.5831298828125, -1.38665771484375, -1.190185546875, -0.99371337890625, -0.7972412109375, -0.60076904296875, -0.404296875, -0.20782470703125, -0.0113525390625, 0.18511962890625, 0.381591796875, 0.57806396484375, 0.7745361328125, 0.97100830078125, 1.16748046875, 1.36395263671875, 1.5604248046875, 1.75689697265625, 1.953369140625, 2.14984130859375, 2.3463134765625, 2.54278564453125, 2.7392578125, 2.93572998046875, 3.1322021484375, 3.32867431640625, 3.525146484375, 3.72161865234375, 3.9180908203125, 4.11456298828125, 4.31103515625, 4.50750732421875, 4.7039794921875, 4.90045166015625, 5.096923828125, 5.29339599609375, 5.4898681640625, 5.68634033203125, 5.8828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 7.0, 4.0, 3.0, 8.0, 19.0, 24.0, 31.0, 41.0, 73.0, 66.0, 129.0, 211.0, 296.0, 492.0, 976.0, 2574.0, 13747.0, 224069.0, 754342.0, 43304.0, 4898.0, 1432.0, 684.0, 383.0, 257.0, 154.0, 104.0, 81.0, 49.0, 30.0, 20.0, 19.0, 10.0, 8.0, 7.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.8125, -45.5205078125, -44.228515625, -42.9365234375, -41.64453125, -40.3525390625, -39.060546875, -37.7685546875, -36.4765625, -35.1845703125, -33.892578125, -32.6005859375, -31.30859375, -30.0166015625, -28.724609375, -27.4326171875, -26.140625, -24.8486328125, -23.556640625, -22.2646484375, -20.97265625, -19.6806640625, -18.388671875, -17.0966796875, -15.8046875, -14.5126953125, -13.220703125, -11.9287109375, -10.63671875, -9.3447265625, -8.052734375, -6.7607421875, -5.46875, -4.1767578125, -2.884765625, -1.5927734375, -0.30078125, 0.9912109375, 2.283203125, 3.5751953125, 4.8671875, 6.1591796875, 7.451171875, 8.7431640625, 10.03515625, 11.3271484375, 12.619140625, 13.9111328125, 15.203125, 16.4951171875, 17.787109375, 19.0791015625, 20.37109375, 21.6630859375, 22.955078125, 24.2470703125, 25.5390625, 26.8310546875, 28.123046875, 29.4150390625, 30.70703125, 31.9990234375, 33.291015625, 34.5830078125, 35.875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 7.0, 3.0, 10.0, 11.0, 17.0, 17.0, 26.0, 28.0, 30.0, 42.0, 37.0, 42.0, 45.0, 64.0, 60.0, 68.0, 57.0, 74.0, 62.0, 44.0, 50.0, 33.0, 28.0, 34.0, 31.0, 20.0, 21.0, 10.0, 9.0, 11.0, 10.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.890625, -29.889404296875, -28.88818359375, -27.886962890625, -26.8857421875, -25.884521484375, -24.88330078125, -23.882080078125, -22.880859375, -21.879638671875, -20.87841796875, -19.877197265625, -18.8759765625, -17.874755859375, -16.87353515625, -15.872314453125, -14.87109375, -13.869873046875, -12.86865234375, -11.867431640625, -10.8662109375, -9.864990234375, -8.86376953125, -7.862548828125, -6.861328125, -5.860107421875, -4.85888671875, -3.857666015625, -2.8564453125, -1.855224609375, -0.85400390625, 0.147216796875, 1.1484375, 2.149658203125, 3.15087890625, 4.152099609375, 5.1533203125, 6.154541015625, 7.15576171875, 8.156982421875, 9.158203125, 10.159423828125, 11.16064453125, 12.161865234375, 13.1630859375, 14.164306640625, 15.16552734375, 16.166748046875, 17.16796875, 18.169189453125, 19.17041015625, 20.171630859375, 21.1728515625, 22.174072265625, 23.17529296875, 24.176513671875, 25.177734375, 26.178955078125, 27.18017578125, 28.181396484375, 29.1826171875, 30.183837890625, 31.18505859375, 32.186279296875, 33.1875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 6.0, 6.0, 5.0, 24.0, 25.0, 33.0, 41.0, 82.0, 109.0, 164.0, 222.0, 367.0, 595.0, 1029.0, 1844.0, 3833.0, 8881.0, 26577.0, 127178.0, 677802.0, 151619.0, 29237.0, 9874.0, 4177.0, 2010.0, 1076.0, 566.0, 422.0, 250.0, 155.0, 100.0, 78.0, 57.0, 31.0, 18.0, 19.0, 13.0, 13.0, 6.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.140625, -15.62890625, -15.1171875, -14.60546875, -14.09375, -13.58203125, -13.0703125, -12.55859375, -12.046875, -11.53515625, -11.0234375, -10.51171875, -10.0, -9.48828125, -8.9765625, -8.46484375, -7.953125, -7.44140625, -6.9296875, -6.41796875, -5.90625, -5.39453125, -4.8828125, -4.37109375, -3.859375, -3.34765625, -2.8359375, -2.32421875, -1.8125, -1.30078125, -0.7890625, -0.27734375, 0.234375, 0.74609375, 1.2578125, 1.76953125, 2.28125, 2.79296875, 3.3046875, 3.81640625, 4.328125, 4.83984375, 5.3515625, 5.86328125, 6.375, 6.88671875, 7.3984375, 7.91015625, 8.421875, 8.93359375, 9.4453125, 9.95703125, 10.46875, 10.98046875, 11.4921875, 12.00390625, 12.515625, 13.02734375, 13.5390625, 14.05078125, 14.5625, 15.07421875, 15.5859375, 16.09765625, 16.609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 2.0, 7.0, 6.0, 8.0, 9.0, 13.0, 16.0, 24.0, 27.0, 46.0, 63.0, 95.0, 135.0, 140.0, 124.0, 84.0, 51.0, 36.0, 15.0, 20.0, 14.0, 16.0, 8.0, 8.0, 2.0, 4.0, 6.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.003265380859375, -0.0031801462173461914, -0.003094911575317383, -0.0030096769332885742, -0.0029244422912597656, -0.002839207649230957, -0.0027539730072021484, -0.00266873836517334, -0.0025835037231445312, -0.0024982690811157227, -0.002413034439086914, -0.0023277997970581055, -0.002242565155029297, -0.0021573305130004883, -0.0020720958709716797, -0.001986861228942871, -0.0019016265869140625, -0.001816391944885254, -0.0017311573028564453, -0.0016459226608276367, -0.0015606880187988281, -0.0014754533767700195, -0.001390218734741211, -0.0013049840927124023, -0.0012197494506835938, -0.0011345148086547852, -0.0010492801666259766, -0.000964045524597168, -0.0008788108825683594, -0.0007935762405395508, -0.0007083415985107422, -0.0006231069564819336, -0.000537872314453125, -0.0004526376724243164, -0.0003674030303955078, -0.0002821683883666992, -0.00019693374633789062, -0.00011169910430908203, -2.6464462280273438e-05, 5.8770179748535156e-05, 0.00014400482177734375, 0.00022923946380615234, 0.00031447410583496094, 0.00039970874786376953, 0.0004849433898925781, 0.0005701780319213867, 0.0006554126739501953, 0.0007406473159790039, 0.0008258819580078125, 0.0009111166000366211, 0.0009963512420654297, 0.0010815858840942383, 0.0011668205261230469, 0.0012520551681518555, 0.001337289810180664, 0.0014225244522094727, 0.0015077590942382812, 0.0015929937362670898, 0.0016782283782958984, 0.001763463020324707, 0.0018486976623535156, 0.0019339323043823242, 0.002019166946411133, 0.0021044015884399414, 0.00218963623046875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 4.0, 12.0, 12.0, 15.0, 26.0, 27.0, 28.0, 60.0, 120.0, 164.0, 273.0, 455.0, 827.0, 1573.0, 3716.0, 10682.0, 42660.0, 368633.0, 542984.0, 54961.0, 12867.0, 4441.0, 1838.0, 881.0, 495.0, 267.0, 161.0, 119.0, 82.0, 50.0, 34.0, 17.0, 12.0, 10.0, 10.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.71875, -17.109375, -16.5, -15.890625, -15.28125, -14.671875, -14.0625, -13.453125, -12.84375, -12.234375, -11.625, -11.015625, -10.40625, -9.796875, -9.1875, -8.578125, -7.96875, -7.359375, -6.75, -6.140625, -5.53125, -4.921875, -4.3125, -3.703125, -3.09375, -2.484375, -1.875, -1.265625, -0.65625, -0.046875, 0.5625, 1.171875, 1.78125, 2.390625, 3.0, 3.609375, 4.21875, 4.828125, 5.4375, 6.046875, 6.65625, 7.265625, 7.875, 8.484375, 9.09375, 9.703125, 10.3125, 10.921875, 11.53125, 12.140625, 12.75, 13.359375, 13.96875, 14.578125, 15.1875, 15.796875, 16.40625, 17.015625, 17.625, 18.234375, 18.84375, 19.453125, 20.0625, 20.671875, 21.28125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 11.0, 6.0, 13.0, 15.0, 41.0, 60.0, 75.0, 81.0, 96.0, 101.0, 98.0, 96.0, 84.0, 62.0, 32.0, 45.0, 28.0, 13.0, 12.0, 4.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.171875, -15.631103515625, -15.09033203125, -14.549560546875, -14.0087890625, -13.468017578125, -12.92724609375, -12.386474609375, -11.845703125, -11.304931640625, -10.76416015625, -10.223388671875, -9.6826171875, -9.141845703125, -8.60107421875, -8.060302734375, -7.51953125, -6.978759765625, -6.43798828125, -5.897216796875, -5.3564453125, -4.815673828125, -4.27490234375, -3.734130859375, -3.193359375, -2.652587890625, -2.11181640625, -1.571044921875, -1.0302734375, -0.489501953125, 0.05126953125, 0.592041015625, 1.1328125, 1.673583984375, 2.21435546875, 2.755126953125, 3.2958984375, 3.836669921875, 4.37744140625, 4.918212890625, 5.458984375, 5.999755859375, 6.54052734375, 7.081298828125, 7.6220703125, 8.162841796875, 8.70361328125, 9.244384765625, 9.78515625, 10.325927734375, 10.86669921875, 11.407470703125, 11.9482421875, 12.489013671875, 13.02978515625, 13.570556640625, 14.111328125, 14.652099609375, 15.19287109375, 15.733642578125, 16.2744140625, 16.815185546875, 17.35595703125, 17.896728515625, 18.4375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 1.0, 7.0, 18.0, 25.0, 41.0, 58.0, 78.0, 115.0, 137.0, 127.0, 114.0, 110.0, 59.0, 33.0, 21.0, 18.0, 10.0, 10.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-220.7029571533203, -214.5623321533203, -208.4217071533203, -202.28109741210938, -196.14047241210938, -189.99984741210938, -183.85922241210938, -177.71859741210938, -171.57797241210938, -165.43734741210938, -159.29672241210938, -153.15609741210938, -147.01548767089844, -140.87486267089844, -134.73423767089844, -128.59361267089844, -122.4530029296875, -116.3123779296875, -110.17176055908203, -104.03113555908203, -97.89051818847656, -91.74989318847656, -85.60926818847656, -79.46864318847656, -73.3280258178711, -67.1874008178711, -61.046783447265625, -54.906158447265625, -48.76553726196289, -42.624916076660156, -36.484291076660156, -30.343669891357422, -24.20306396484375, -18.062442779541016, -11.921819686889648, -5.781196594238281, 0.3594245910644531, 6.5000457763671875, 12.640670776367188, 18.781291961669922, 24.921913146972656, 31.06253433227539, 37.203155517578125, 43.343780517578125, 49.48440170288086, 55.625022888183594, 61.765647888183594, 67.90626525878906, 74.04689025878906, 80.18751525878906, 86.32813262939453, 92.46875762939453, 98.609375, 104.75, 110.890625, 117.03125, 123.17186737060547, 129.31248474121094, 135.45310974121094, 141.59373474121094, 147.73435974121094, 153.87496948242188, 160.01559448242188, 166.15621948242188, 172.29684448242188]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 10.0, 4.0, 12.0, 8.0, 10.0, 18.0, 12.0, 11.0, 13.0, 22.0, 26.0, 25.0, 24.0, 23.0, 35.0, 31.0, 37.0, 51.0, 44.0, 39.0, 60.0, 41.0, 28.0, 37.0, 51.0, 33.0, 36.0, 46.0, 29.0, 27.0, 18.0, 23.0, 14.0, 8.0, 11.0, 14.0, 15.0, 14.0, 11.0, 7.0, 5.0, 8.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-112.93780517578125, -109.39639282226562, -105.85498809814453, -102.31358337402344, -98.77217102050781, -95.23075866699219, -91.6893539428711, -88.14794921875, -84.60653686523438, -81.06512451171875, -77.52371978759766, -73.98231506347656, -70.44090270996094, -66.89949035644531, -63.35808563232422, -59.81667709350586, -56.2752685546875, -52.73386001586914, -49.19245147705078, -45.65104293823242, -42.10963439941406, -38.5682258605957, -35.026817321777344, -31.485408782958984, -27.944000244140625, -24.402591705322266, -20.861183166503906, -17.319774627685547, -13.778366088867188, -10.236957550048828, -6.695549011230469, -3.1541404724121094, 0.38726806640625, 3.9286766052246094, 7.470085144042969, 11.011493682861328, 14.552902221679688, 18.094310760498047, 21.635719299316406, 25.177127838134766, 28.718536376953125, 32.259944915771484, 35.801353454589844, 39.3427619934082, 42.88417053222656, 46.42557907104492, 49.96698760986328, 53.50839614868164, 57.0498046875, 60.59121322631836, 64.13262176513672, 67.67402648925781, 71.21543884277344, 74.75685119628906, 78.29825592041016, 81.83966064453125, 85.38107299804688, 88.9224853515625, 92.4638900756836, 96.00529479980469, 99.54670715332031, 103.08811950683594, 106.62952423095703, 110.17092895507812, 113.71234130859375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 15.0, 15.0, 30.0, 34.0, 45.0, 82.0, 132.0, 209.0, 444.0, 1003.0, 2845.0, 16068.0, 4144563.0, 23059.0, 3518.0, 1051.0, 450.0, 261.0, 158.0, 91.0, 55.0, 37.0, 24.0, 18.0, 16.0, 11.0, 8.0, 3.0, 2.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.25, -46.56103515625, -44.8720703125, -43.18310546875, -41.494140625, -39.80517578125, -38.1162109375, -36.42724609375, -34.73828125, -33.04931640625, -31.3603515625, -29.67138671875, -27.982421875, -26.29345703125, -24.6044921875, -22.91552734375, -21.2265625, -19.53759765625, -17.8486328125, -16.15966796875, -14.470703125, -12.78173828125, -11.0927734375, -9.40380859375, -7.71484375, -6.02587890625, -4.3369140625, -2.64794921875, -0.958984375, 0.72998046875, 2.4189453125, 4.10791015625, 5.796875, 7.48583984375, 9.1748046875, 10.86376953125, 12.552734375, 14.24169921875, 15.9306640625, 17.61962890625, 19.30859375, 20.99755859375, 22.6865234375, 24.37548828125, 26.064453125, 27.75341796875, 29.4423828125, 31.13134765625, 32.8203125, 34.50927734375, 36.1982421875, 37.88720703125, 39.576171875, 41.26513671875, 42.9541015625, 44.64306640625, 46.33203125, 48.02099609375, 49.7099609375, 51.39892578125, 53.087890625, 54.77685546875, 56.4658203125, 58.15478515625, 59.84375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 6.0, 7.0, 12.0, 15.0, 11.0, 21.0, 26.0, 25.0, 28.0, 38.0, 33.0, 53.0, 57.0, 57.0, 53.0, 56.0, 50.0, 70.0, 46.0, 42.0, 57.0, 36.0, 30.0, 34.0, 26.0, 26.0, 19.0, 13.0, 9.0, 11.0, 5.0, 6.0, 9.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.86328125, -6.6676025390625, -6.471923828125, -6.2762451171875, -6.08056640625, -5.8848876953125, -5.689208984375, -5.4935302734375, -5.2978515625, -5.1021728515625, -4.906494140625, -4.7108154296875, -4.51513671875, -4.3194580078125, -4.123779296875, -3.9281005859375, -3.732421875, -3.5367431640625, -3.341064453125, -3.1453857421875, -2.94970703125, -2.7540283203125, -2.558349609375, -2.3626708984375, -2.1669921875, -1.9713134765625, -1.775634765625, -1.5799560546875, -1.38427734375, -1.1885986328125, -0.992919921875, -0.7972412109375, -0.6015625, -0.4058837890625, -0.210205078125, -0.0145263671875, 0.18115234375, 0.3768310546875, 0.572509765625, 0.7681884765625, 0.9638671875, 1.1595458984375, 1.355224609375, 1.5509033203125, 1.74658203125, 1.9422607421875, 2.137939453125, 2.3336181640625, 2.529296875, 2.7249755859375, 2.920654296875, 3.1163330078125, 3.31201171875, 3.5076904296875, 3.703369140625, 3.8990478515625, 4.0947265625, 4.2904052734375, 4.486083984375, 4.6817626953125, 4.87744140625, 5.0731201171875, 5.268798828125, 5.4644775390625, 5.66015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 11.0, 18.0, 24.0, 26.0, 39.0, 62.0, 67.0, 90.0, 87.0, 147.0, 213.0, 268.0, 387.0, 497.0, 720.0, 1101.0, 1776.0, 3098.0, 6910.0, 25954.0, 4087355.0, 47353.0, 8405.0, 3628.0, 2000.0, 1189.0, 811.0, 542.0, 377.0, 279.0, 211.0, 153.0, 113.0, 89.0, 75.0, 46.0, 35.0, 40.0, 23.0, 19.0, 8.0, 11.0, 4.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.875, -35.70849609375, -34.5419921875, -33.37548828125, -32.208984375, -31.04248046875, -29.8759765625, -28.70947265625, -27.54296875, -26.37646484375, -25.2099609375, -24.04345703125, -22.876953125, -21.71044921875, -20.5439453125, -19.37744140625, -18.2109375, -17.04443359375, -15.8779296875, -14.71142578125, -13.544921875, -12.37841796875, -11.2119140625, -10.04541015625, -8.87890625, -7.71240234375, -6.5458984375, -5.37939453125, -4.212890625, -3.04638671875, -1.8798828125, -0.71337890625, 0.453125, 1.61962890625, 2.7861328125, 3.95263671875, 5.119140625, 6.28564453125, 7.4521484375, 8.61865234375, 9.78515625, 10.95166015625, 12.1181640625, 13.28466796875, 14.451171875, 15.61767578125, 16.7841796875, 17.95068359375, 19.1171875, 20.28369140625, 21.4501953125, 22.61669921875, 23.783203125, 24.94970703125, 26.1162109375, 27.28271484375, 28.44921875, 29.61572265625, 30.7822265625, 31.94873046875, 33.115234375, 34.28173828125, 35.4482421875, 36.61474609375, 37.78125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 11.0, 8.0, 19.0, 52.0, 850.0, 2969.0, 79.0, 31.0, 13.0, 8.0, 6.0, 4.0, 1.0, 0.0, 2.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.6015625, -8.3153076171875, -8.029052734375, -7.7427978515625, -7.45654296875, -7.1702880859375, -6.884033203125, -6.5977783203125, -6.3115234375, -6.0252685546875, -5.739013671875, -5.4527587890625, -5.16650390625, -4.8802490234375, -4.593994140625, -4.3077392578125, -4.021484375, -3.7352294921875, -3.448974609375, -3.1627197265625, -2.87646484375, -2.5902099609375, -2.303955078125, -2.0177001953125, -1.7314453125, -1.4451904296875, -1.158935546875, -0.8726806640625, -0.58642578125, -0.3001708984375, -0.013916015625, 0.2723388671875, 0.55859375, 0.8448486328125, 1.131103515625, 1.4173583984375, 1.70361328125, 1.9898681640625, 2.276123046875, 2.5623779296875, 2.8486328125, 3.1348876953125, 3.421142578125, 3.7073974609375, 3.99365234375, 4.2799072265625, 4.566162109375, 4.8524169921875, 5.138671875, 5.4249267578125, 5.711181640625, 5.9974365234375, 6.28369140625, 6.5699462890625, 6.856201171875, 7.1424560546875, 7.4287109375, 7.7149658203125, 8.001220703125, 8.2874755859375, 8.57373046875, 8.8599853515625, 9.146240234375, 9.4324951171875, 9.71875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 8.0, 17.0, 22.0, 80.0, 144.0, 224.0, 215.0, 136.0, 60.0, 39.0, 30.0, 14.0, 13.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.588838577270508, -14.684802055358887, -12.780765533447266, -10.876729965209961, -8.97269344329834, -7.068656921386719, -5.164621353149414, -3.260584831237793, -1.3565483093261719, 0.5474879741668701, 2.451524257659912, 4.355560302734375, 6.259596824645996, 8.163633346557617, 10.067668914794922, 11.971705436706543, 13.875741958618164, 15.779778480529785, 17.683815002441406, 19.58785057067871, 21.491886138916016, 23.395923614501953, 25.299959182739258, 27.203994750976562, 29.1080322265625, 31.012067794799805, 32.91610336303711, 34.82014083862305, 36.724178314208984, 38.628211975097656, 40.532249450683594, 42.43628692626953, 44.34032440185547, 46.244361877441406, 48.14839553833008, 50.052433013916016, 51.95647048950195, 53.860504150390625, 55.76454162597656, 57.6685791015625, 59.57261657714844, 61.476654052734375, 63.38068771362305, 65.28472900390625, 67.18875885009766, 69.0927963256836, 70.99683380126953, 72.90087127685547, 74.80490112304688, 76.70893859863281, 78.61297607421875, 80.51701354980469, 82.4210433959961, 84.32508087158203, 86.22911834716797, 88.1331558227539, 90.03719329833984, 91.94123077392578, 93.84526824951172, 95.74929809570312, 97.65333557128906, 99.557373046875, 101.46141052246094, 103.36544799804688, 105.26948547363281]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 10.0, 10.0, 11.0, 17.0, 15.0, 19.0, 23.0, 23.0, 21.0, 44.0, 34.0, 33.0, 65.0, 35.0, 43.0, 54.0, 40.0, 55.0, 39.0, 36.0, 38.0, 34.0, 39.0, 36.0, 30.0, 24.0, 28.0, 22.0, 12.0, 15.0, 24.0, 10.0, 14.0, 7.0, 11.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.721115112304688, -18.14789581298828, -17.574676513671875, -17.00145721435547, -16.428237915039062, -15.855018615722656, -15.28179931640625, -14.708580017089844, -14.135360717773438, -13.562141418457031, -12.988922119140625, -12.415702819824219, -11.842483520507812, -11.269264221191406, -10.696044921875, -10.122825622558594, -9.549606323242188, -8.976387023925781, -8.403167724609375, -7.829948425292969, -7.2567291259765625, -6.683509826660156, -6.11029052734375, -5.537071228027344, -4.9638519287109375, -4.390632629394531, -3.817413330078125, -3.2441940307617188, -2.6709747314453125, -2.0977554321289062, -1.5245361328125, -0.9513168334960938, -0.3780994415283203, 0.19511985778808594, 0.7683391571044922, 1.3415584564208984, 1.9147777557373047, 2.487997055053711, 3.061216354370117, 3.6344356536865234, 4.20765495300293, 4.780874252319336, 5.354093551635742, 5.927312850952148, 6.500532150268555, 7.073751449584961, 7.646970748901367, 8.220190048217773, 8.79340934753418, 9.366628646850586, 9.939847946166992, 10.513067245483398, 11.086286544799805, 11.659505844116211, 12.232725143432617, 12.805944442749023, 13.37916374206543, 13.952383041381836, 14.525602340698242, 15.098821640014648, 15.672040939331055, 16.24526023864746, 16.818479537963867, 17.391698837280273, 17.96491813659668]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 4.0, 7.0, 10.0, 16.0, 8.0, 19.0, 32.0, 46.0, 68.0, 96.0, 136.0, 229.0, 355.0, 548.0, 951.0, 1593.0, 2943.0, 5637.0, 11874.0, 26371.0, 66612.0, 194317.0, 399560.0, 210639.0, 72461.0, 28065.0, 12571.0, 6028.0, 3082.0, 1722.0, 949.0, 561.0, 338.0, 239.0, 156.0, 103.0, 59.0, 44.0, 29.0, 26.0, 17.0, 13.0, 4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-16.09375, -15.6138916015625, -15.134033203125, -14.6541748046875, -14.17431640625, -13.6944580078125, -13.214599609375, -12.7347412109375, -12.2548828125, -11.7750244140625, -11.295166015625, -10.8153076171875, -10.33544921875, -9.8555908203125, -9.375732421875, -8.8958740234375, -8.416015625, -7.9361572265625, -7.456298828125, -6.9764404296875, -6.49658203125, -6.0167236328125, -5.536865234375, -5.0570068359375, -4.5771484375, -4.0972900390625, -3.617431640625, -3.1375732421875, -2.65771484375, -2.1778564453125, -1.697998046875, -1.2181396484375, -0.73828125, -0.2584228515625, 0.221435546875, 0.7012939453125, 1.18115234375, 1.6610107421875, 2.140869140625, 2.6207275390625, 3.1005859375, 3.5804443359375, 4.060302734375, 4.5401611328125, 5.02001953125, 5.4998779296875, 5.979736328125, 6.4595947265625, 6.939453125, 7.4193115234375, 7.899169921875, 8.3790283203125, 8.85888671875, 9.3387451171875, 9.818603515625, 10.2984619140625, 10.7783203125, 11.2581787109375, 11.738037109375, 12.2178955078125, 12.69775390625, 13.1776123046875, 13.657470703125, 14.1373291015625, 14.6171875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 7.0, 8.0, 7.0, 19.0, 8.0, 23.0, 17.0, 26.0, 17.0, 29.0, 31.0, 30.0, 43.0, 28.0, 53.0, 66.0, 50.0, 42.0, 59.0, 45.0, 52.0, 49.0, 42.0, 58.0, 28.0, 28.0, 26.0, 14.0, 19.0, 18.0, 17.0, 11.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-6.8046875, -6.6085205078125, -6.412353515625, -6.2161865234375, -6.02001953125, -5.8238525390625, -5.627685546875, -5.4315185546875, -5.2353515625, -5.0391845703125, -4.843017578125, -4.6468505859375, -4.45068359375, -4.2545166015625, -4.058349609375, -3.8621826171875, -3.666015625, -3.4698486328125, -3.273681640625, -3.0775146484375, -2.88134765625, -2.6851806640625, -2.489013671875, -2.2928466796875, -2.0966796875, -1.9005126953125, -1.704345703125, -1.5081787109375, -1.31201171875, -1.1158447265625, -0.919677734375, -0.7235107421875, -0.52734375, -0.3311767578125, -0.135009765625, 0.0611572265625, 0.25732421875, 0.4534912109375, 0.649658203125, 0.8458251953125, 1.0419921875, 1.2381591796875, 1.434326171875, 1.6304931640625, 1.82666015625, 2.0228271484375, 2.218994140625, 2.4151611328125, 2.611328125, 2.8074951171875, 3.003662109375, 3.1998291015625, 3.39599609375, 3.5921630859375, 3.788330078125, 3.9844970703125, 4.1806640625, 4.3768310546875, 4.572998046875, 4.7691650390625, 4.96533203125, 5.1614990234375, 5.357666015625, 5.5538330078125, 5.75]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 9.0, 9.0, 13.0, 17.0, 17.0, 34.0, 42.0, 58.0, 94.0, 131.0, 169.0, 288.0, 528.0, 949.0, 2511.0, 11755.0, 203357.0, 784325.0, 36460.0, 4613.0, 1393.0, 660.0, 400.0, 247.0, 151.0, 106.0, 63.0, 37.0, 33.0, 24.0, 18.0, 14.0, 7.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.59375, -52.07275390625, -50.5517578125, -49.03076171875, -47.509765625, -45.98876953125, -44.4677734375, -42.94677734375, -41.42578125, -39.90478515625, -38.3837890625, -36.86279296875, -35.341796875, -33.82080078125, -32.2998046875, -30.77880859375, -29.2578125, -27.73681640625, -26.2158203125, -24.69482421875, -23.173828125, -21.65283203125, -20.1318359375, -18.61083984375, -17.08984375, -15.56884765625, -14.0478515625, -12.52685546875, -11.005859375, -9.48486328125, -7.9638671875, -6.44287109375, -4.921875, -3.40087890625, -1.8798828125, -0.35888671875, 1.162109375, 2.68310546875, 4.2041015625, 5.72509765625, 7.24609375, 8.76708984375, 10.2880859375, 11.80908203125, 13.330078125, 14.85107421875, 16.3720703125, 17.89306640625, 19.4140625, 20.93505859375, 22.4560546875, 23.97705078125, 25.498046875, 27.01904296875, 28.5400390625, 30.06103515625, 31.58203125, 33.10302734375, 34.6240234375, 36.14501953125, 37.666015625, 39.18701171875, 40.7080078125, 42.22900390625, 43.75]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 9.0, 10.0, 14.0, 15.0, 13.0, 15.0, 14.0, 28.0, 27.0, 41.0, 40.0, 34.0, 33.0, 44.0, 39.0, 50.0, 36.0, 44.0, 54.0, 45.0, 51.0, 39.0, 23.0, 50.0, 34.0, 23.0, 35.0, 24.0, 20.0, 20.0, 15.0, 10.0, 13.0, 4.0, 6.0, 5.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-33.8125, -32.892333984375, -31.97216796875, -31.052001953125, -30.1318359375, -29.211669921875, -28.29150390625, -27.371337890625, -26.451171875, -25.531005859375, -24.61083984375, -23.690673828125, -22.7705078125, -21.850341796875, -20.93017578125, -20.010009765625, -19.08984375, -18.169677734375, -17.24951171875, -16.329345703125, -15.4091796875, -14.489013671875, -13.56884765625, -12.648681640625, -11.728515625, -10.808349609375, -9.88818359375, -8.968017578125, -8.0478515625, -7.127685546875, -6.20751953125, -5.287353515625, -4.3671875, -3.447021484375, -2.52685546875, -1.606689453125, -0.6865234375, 0.233642578125, 1.15380859375, 2.073974609375, 2.994140625, 3.914306640625, 4.83447265625, 5.754638671875, 6.6748046875, 7.594970703125, 8.51513671875, 9.435302734375, 10.35546875, 11.275634765625, 12.19580078125, 13.115966796875, 14.0361328125, 14.956298828125, 15.87646484375, 16.796630859375, 17.716796875, 18.636962890625, 19.55712890625, 20.477294921875, 21.3974609375, 22.317626953125, 23.23779296875, 24.157958984375, 25.078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 11.0, 6.0, 11.0, 13.0, 20.0, 24.0, 36.0, 58.0, 68.0, 143.0, 238.0, 440.0, 844.0, 1819.0, 4749.0, 16914.0, 126652.0, 785719.0, 89389.0, 13788.0, 4116.0, 1668.0, 800.0, 412.0, 209.0, 135.0, 69.0, 49.0, 31.0, 23.0, 17.0, 20.0, 11.0, 9.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-16.1875, -15.6181640625, -15.048828125, -14.4794921875, -13.91015625, -13.3408203125, -12.771484375, -12.2021484375, -11.6328125, -11.0634765625, -10.494140625, -9.9248046875, -9.35546875, -8.7861328125, -8.216796875, -7.6474609375, -7.078125, -6.5087890625, -5.939453125, -5.3701171875, -4.80078125, -4.2314453125, -3.662109375, -3.0927734375, -2.5234375, -1.9541015625, -1.384765625, -0.8154296875, -0.24609375, 0.3232421875, 0.892578125, 1.4619140625, 2.03125, 2.6005859375, 3.169921875, 3.7392578125, 4.30859375, 4.8779296875, 5.447265625, 6.0166015625, 6.5859375, 7.1552734375, 7.724609375, 8.2939453125, 8.86328125, 9.4326171875, 10.001953125, 10.5712890625, 11.140625, 11.7099609375, 12.279296875, 12.8486328125, 13.41796875, 13.9873046875, 14.556640625, 15.1259765625, 15.6953125, 16.2646484375, 16.833984375, 17.4033203125, 17.97265625, 18.5419921875, 19.111328125, 19.6806640625, 20.25]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 8.0, 5.0, 9.0, 18.0, 27.0, 45.0, 71.0, 140.0, 224.0, 188.0, 119.0, 59.0, 27.0, 10.0, 9.0, 8.0, 8.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003749847412109375, -0.00359189510345459, -0.0034339427947998047, -0.0032759904861450195, -0.0031180381774902344, -0.0029600858688354492, -0.002802133560180664, -0.002644181251525879, -0.0024862289428710938, -0.0023282766342163086, -0.0021703243255615234, -0.0020123720169067383, -0.0018544197082519531, -0.001696467399597168, -0.0015385150909423828, -0.0013805627822875977, -0.0012226104736328125, -0.0010646581649780273, -0.0009067058563232422, -0.000748753547668457, -0.0005908012390136719, -0.0004328489303588867, -0.00027489662170410156, -0.0001169443130493164, 4.100799560546875e-05, 0.0001989603042602539, 0.00035691261291503906, 0.0005148649215698242, 0.0006728172302246094, 0.0008307695388793945, 0.0009887218475341797, 0.0011466741561889648, 0.00130462646484375, 0.0014625787734985352, 0.0016205310821533203, 0.0017784833908081055, 0.0019364356994628906, 0.0020943880081176758, 0.002252340316772461, 0.002410292625427246, 0.0025682449340820312, 0.0027261972427368164, 0.0028841495513916016, 0.0030421018600463867, 0.003200054168701172, 0.003358006477355957, 0.003515958786010742, 0.0036739110946655273, 0.0038318634033203125, 0.003989815711975098, 0.004147768020629883, 0.004305720329284668, 0.004463672637939453, 0.004621624946594238, 0.0047795772552490234, 0.004937529563903809, 0.005095481872558594, 0.005253434181213379, 0.005411386489868164, 0.005569338798522949, 0.005727291107177734, 0.0058852434158325195, 0.006043195724487305, 0.00620114803314209, 0.006359100341796875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 16.0, 23.0, 23.0, 49.0, 83.0, 120.0, 253.0, 498.0, 1147.0, 3397.0, 13727.0, 146178.0, 824703.0, 47058.0, 7439.0, 2188.0, 800.0, 360.0, 195.0, 111.0, 52.0, 42.0, 26.0, 21.0, 12.0, 8.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.21875, -23.392333984375, -22.56591796875, -21.739501953125, -20.9130859375, -20.086669921875, -19.26025390625, -18.433837890625, -17.607421875, -16.781005859375, -15.95458984375, -15.128173828125, -14.3017578125, -13.475341796875, -12.64892578125, -11.822509765625, -10.99609375, -10.169677734375, -9.34326171875, -8.516845703125, -7.6904296875, -6.864013671875, -6.03759765625, -5.211181640625, -4.384765625, -3.558349609375, -2.73193359375, -1.905517578125, -1.0791015625, -0.252685546875, 0.57373046875, 1.400146484375, 2.2265625, 3.052978515625, 3.87939453125, 4.705810546875, 5.5322265625, 6.358642578125, 7.18505859375, 8.011474609375, 8.837890625, 9.664306640625, 10.49072265625, 11.317138671875, 12.1435546875, 12.969970703125, 13.79638671875, 14.622802734375, 15.44921875, 16.275634765625, 17.10205078125, 17.928466796875, 18.7548828125, 19.581298828125, 20.40771484375, 21.234130859375, 22.060546875, 22.886962890625, 23.71337890625, 24.539794921875, 25.3662109375, 26.192626953125, 27.01904296875, 27.845458984375, 28.671875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 8.0, 11.0, 19.0, 28.0, 44.0, 68.0, 107.0, 136.0, 142.0, 142.0, 103.0, 62.0, 40.0, 31.0, 13.0, 11.0, 13.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.046875, -15.4638671875, -14.880859375, -14.2978515625, -13.71484375, -13.1318359375, -12.548828125, -11.9658203125, -11.3828125, -10.7998046875, -10.216796875, -9.6337890625, -9.05078125, -8.4677734375, -7.884765625, -7.3017578125, -6.71875, -6.1357421875, -5.552734375, -4.9697265625, -4.38671875, -3.8037109375, -3.220703125, -2.6376953125, -2.0546875, -1.4716796875, -0.888671875, -0.3056640625, 0.27734375, 0.8603515625, 1.443359375, 2.0263671875, 2.609375, 3.1923828125, 3.775390625, 4.3583984375, 4.94140625, 5.5244140625, 6.107421875, 6.6904296875, 7.2734375, 7.8564453125, 8.439453125, 9.0224609375, 9.60546875, 10.1884765625, 10.771484375, 11.3544921875, 11.9375, 12.5205078125, 13.103515625, 13.6865234375, 14.26953125, 14.8525390625, 15.435546875, 16.0185546875, 16.6015625, 17.1845703125, 17.767578125, 18.3505859375, 18.93359375, 19.5166015625, 20.099609375, 20.6826171875, 21.265625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 13.0, 19.0, 40.0, 79.0, 103.0, 166.0, 165.0, 149.0, 97.0, 70.0, 43.0, 29.0, 9.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-217.9344482421875, -210.02053833007812, -202.1066131591797, -194.1927032470703, -186.27879333496094, -178.3648681640625, -170.45095825195312, -162.53704833984375, -154.62313842773438, -146.709228515625, -138.79530334472656, -130.8813934326172, -122.96748352050781, -115.0535659790039, -107.1396484375, -99.22573852539062, -91.31182098388672, -83.39790344238281, -75.48399353027344, -67.57007598876953, -59.656166076660156, -51.74224853515625, -43.82833480834961, -35.91442108154297, -28.000507354736328, -20.086593627929688, -12.17267894744873, -4.258764266967773, 3.655149459838867, 11.56906509399414, 19.48297882080078, 27.396892547607422, 35.31080627441406, 43.2247200012207, 51.138633728027344, 59.05255126953125, 66.96646118164062, 74.88037872314453, 82.79429626464844, 90.70820617675781, 98.62211608886719, 106.5360336303711, 114.44994354248047, 122.36386108398438, 130.27777099609375, 138.19168090820312, 146.10560607910156, 154.01951599121094, 161.93344116210938, 169.84735107421875, 177.7612762451172, 185.67518615722656, 193.58909606933594, 201.50302124023438, 209.41693115234375, 217.33084106445312, 225.2447509765625, 233.15866088867188, 241.0725860595703, 248.9864959716797, 256.9004211425781, 264.8143310546875, 272.7282409667969, 280.64215087890625, 288.5560607910156]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 0.0, 5.0, 7.0, 8.0, 7.0, 10.0, 9.0, 22.0, 14.0, 16.0, 18.0, 31.0, 32.0, 25.0, 34.0, 39.0, 49.0, 46.0, 43.0, 39.0, 68.0, 57.0, 49.0, 37.0, 42.0, 42.0, 33.0, 35.0, 28.0, 24.0, 19.0, 13.0, 13.0, 15.0, 12.0, 14.0, 13.0, 5.0, 6.0, 5.0, 8.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-142.135009765625, -137.78236389160156, -133.42971801757812, -129.0770721435547, -124.72441864013672, -120.37177276611328, -116.01912689208984, -111.6664810180664, -107.31382751464844, -102.961181640625, -98.60853576660156, -94.25588989257812, -89.90323638916016, -85.55059051513672, -81.19794464111328, -76.84529876708984, -72.4926528930664, -68.14000701904297, -63.787357330322266, -59.43471145629883, -55.082061767578125, -50.72941589355469, -46.37677001953125, -42.02412414550781, -37.67147445678711, -33.31882858276367, -28.96617889404297, -24.61353302001953, -20.26088523864746, -15.90823745727539, -11.555591583251953, -7.202943801879883, -2.8502960205078125, 1.5023512840270996, 5.854998588562012, 10.207645416259766, 14.560293197631836, 18.912940979003906, 23.265586853027344, 27.618234634399414, 31.970882415771484, 36.32352828979492, 40.676177978515625, 45.02882385253906, 49.3814697265625, 53.7341194152832, 58.08676528930664, 62.439414978027344, 66.79206085205078, 71.14470672607422, 75.49735260009766, 79.85000610351562, 84.20265197753906, 88.5552978515625, 92.90794372558594, 97.26058959960938, 101.61323547363281, 105.96588134765625, 110.31852722167969, 114.67117309570312, 119.0238265991211, 123.37647247314453, 127.72911834716797, 132.08177185058594, 136.43441772460938]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 8.0, 8.0, 8.0, 11.0, 18.0, 14.0, 28.0, 38.0, 58.0, 88.0, 168.0, 244.0, 463.0, 903.0, 2892.0, 4077737.0, 107182.0, 2439.0, 880.0, 423.0, 228.0, 136.0, 84.0, 70.0, 41.0, 31.0, 25.0, 20.0, 6.0, 8.0, 6.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.6875, -64.4609375, -62.234375, -60.0078125, -57.78125, -55.5546875, -53.328125, -51.1015625, -48.875, -46.6484375, -44.421875, -42.1953125, -39.96875, -37.7421875, -35.515625, -33.2890625, -31.0625, -28.8359375, -26.609375, -24.3828125, -22.15625, -19.9296875, -17.703125, -15.4765625, -13.25, -11.0234375, -8.796875, -6.5703125, -4.34375, -2.1171875, 0.109375, 2.3359375, 4.5625, 6.7890625, 9.015625, 11.2421875, 13.46875, 15.6953125, 17.921875, 20.1484375, 22.375, 24.6015625, 26.828125, 29.0546875, 31.28125, 33.5078125, 35.734375, 37.9609375, 40.1875, 42.4140625, 44.640625, 46.8671875, 49.09375, 51.3203125, 53.546875, 55.7734375, 58.0, 60.2265625, 62.453125, 64.6796875, 66.90625, 69.1328125, 71.359375, 73.5859375, 75.8125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 3.0, 8.0, 4.0, 6.0, 6.0, 10.0, 9.0, 15.0, 26.0, 25.0, 33.0, 34.0, 41.0, 47.0, 44.0, 68.0, 61.0, 67.0, 72.0, 68.0, 62.0, 54.0, 48.0, 33.0, 32.0, 25.0, 17.0, 21.0, 10.0, 16.0, 10.0, 11.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.6796875, -8.42230224609375, -8.1649169921875, -7.90753173828125, -7.650146484375, -7.39276123046875, -7.1353759765625, -6.87799072265625, -6.62060546875, -6.36322021484375, -6.1058349609375, -5.84844970703125, -5.591064453125, -5.33367919921875, -5.0762939453125, -4.81890869140625, -4.5615234375, -4.30413818359375, -4.0467529296875, -3.78936767578125, -3.531982421875, -3.27459716796875, -3.0172119140625, -2.75982666015625, -2.50244140625, -2.24505615234375, -1.9876708984375, -1.73028564453125, -1.472900390625, -1.21551513671875, -0.9581298828125, -0.70074462890625, -0.443359375, -0.18597412109375, 0.0714111328125, 0.32879638671875, 0.586181640625, 0.84356689453125, 1.1009521484375, 1.35833740234375, 1.61572265625, 1.87310791015625, 2.1304931640625, 2.38787841796875, 2.645263671875, 2.90264892578125, 3.1600341796875, 3.41741943359375, 3.6748046875, 3.93218994140625, 4.1895751953125, 4.44696044921875, 4.704345703125, 4.96173095703125, 5.2191162109375, 5.47650146484375, 5.73388671875, 5.99127197265625, 6.2486572265625, 6.50604248046875, 6.763427734375, 7.02081298828125, 7.2781982421875, 7.53558349609375, 7.79296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 8.0, 10.0, 12.0, 10.0, 17.0, 19.0, 26.0, 39.0, 54.0, 72.0, 108.0, 128.0, 223.0, 316.0, 507.0, 969.0, 2068.0, 6032.0, 101289.0, 4067609.0, 9089.0, 2736.0, 1151.0, 597.0, 417.0, 215.0, 157.0, 107.0, 58.0, 68.0, 49.0, 38.0, 22.0, 19.0, 13.0, 14.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.625, -24.6806640625, -23.736328125, -22.7919921875, -21.84765625, -20.9033203125, -19.958984375, -19.0146484375, -18.0703125, -17.1259765625, -16.181640625, -15.2373046875, -14.29296875, -13.3486328125, -12.404296875, -11.4599609375, -10.515625, -9.5712890625, -8.626953125, -7.6826171875, -6.73828125, -5.7939453125, -4.849609375, -3.9052734375, -2.9609375, -2.0166015625, -1.072265625, -0.1279296875, 0.81640625, 1.7607421875, 2.705078125, 3.6494140625, 4.59375, 5.5380859375, 6.482421875, 7.4267578125, 8.37109375, 9.3154296875, 10.259765625, 11.2041015625, 12.1484375, 13.0927734375, 14.037109375, 14.9814453125, 15.92578125, 16.8701171875, 17.814453125, 18.7587890625, 19.703125, 20.6474609375, 21.591796875, 22.5361328125, 23.48046875, 24.4248046875, 25.369140625, 26.3134765625, 27.2578125, 28.2021484375, 29.146484375, 30.0908203125, 31.03515625, 31.9794921875, 32.923828125, 33.8681640625, 34.8125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 4.0, 15.0, 44.0, 3582.0, 366.0, 37.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.90625, -11.6220703125, -11.337890625, -11.0537109375, -10.76953125, -10.4853515625, -10.201171875, -9.9169921875, -9.6328125, -9.3486328125, -9.064453125, -8.7802734375, -8.49609375, -8.2119140625, -7.927734375, -7.6435546875, -7.359375, -7.0751953125, -6.791015625, -6.5068359375, -6.22265625, -5.9384765625, -5.654296875, -5.3701171875, -5.0859375, -4.8017578125, -4.517578125, -4.2333984375, -3.94921875, -3.6650390625, -3.380859375, -3.0966796875, -2.8125, -2.5283203125, -2.244140625, -1.9599609375, -1.67578125, -1.3916015625, -1.107421875, -0.8232421875, -0.5390625, -0.2548828125, 0.029296875, 0.3134765625, 0.59765625, 0.8818359375, 1.166015625, 1.4501953125, 1.734375, 2.0185546875, 2.302734375, 2.5869140625, 2.87109375, 3.1552734375, 3.439453125, 3.7236328125, 4.0078125, 4.2919921875, 4.576171875, 4.8603515625, 5.14453125, 5.4287109375, 5.712890625, 5.9970703125, 6.28125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 18.0, 45.0, 170.0, 354.0, 268.0, 96.0, 33.0, 15.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.422706604003906, -35.1540641784668, -33.88542556762695, -32.616783142089844, -31.348140716552734, -30.079500198364258, -28.81085968017578, -27.542217254638672, -26.273576736450195, -25.00493621826172, -23.73629379272461, -22.467653274536133, -21.199012756347656, -19.930370330810547, -18.66172981262207, -17.393089294433594, -16.124446868896484, -14.855805397033691, -13.587163925170898, -12.318523406982422, -11.049881935119629, -9.781240463256836, -8.51259994506836, -7.243958473205566, -5.975317001342773, -4.7066755294799805, -3.4380345344543457, -2.169393301010132, -0.900752067565918, 0.367889404296875, 1.6365303993225098, 2.9051713943481445, 4.173809051513672, 5.442450523376465, 6.7110915184021, 7.979732513427734, 9.248373985290527, 10.51701545715332, 11.785655975341797, 13.05429744720459, 14.322938919067383, 15.591580390930176, 16.86022186279297, 18.128862380981445, 19.397502899169922, 20.66614532470703, 21.934785842895508, 23.203426361083984, 24.472068786621094, 25.74070930480957, 27.00935173034668, 28.277992248535156, 29.546634674072266, 30.815275192260742, 32.08391571044922, 33.35255813598633, 34.62120056152344, 35.88984298706055, 37.15848159790039, 38.4271240234375, 39.69576644897461, 40.96440887451172, 42.23304748535156, 43.50168991088867, 44.770328521728516]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 16.0, 10.0, 16.0, 10.0, 13.0, 25.0, 38.0, 33.0, 30.0, 34.0, 50.0, 55.0, 61.0, 61.0, 58.0, 52.0, 50.0, 64.0, 46.0, 48.0, 40.0, 37.0, 34.0, 24.0, 24.0, 19.0, 9.0, 9.0, 7.0, 4.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.129558563232422, -9.797567367553711, -9.465575218200684, -9.133584022521973, -8.801592826843262, -8.469600677490234, -8.137609481811523, -7.805617809295654, -7.473626136779785, -7.141634464263916, -6.809643268585205, -6.477651596069336, -6.145659923553467, -5.813668251037598, -5.481677055358887, -5.149685382843018, -4.817694187164307, -4.4857025146484375, -4.153711318969727, -3.8217196464538574, -3.4897279739379883, -3.1577365398406982, -2.825745105743408, -2.493753433227539, -2.161761999130249, -1.8297704458236694, -1.4977788925170898, -1.1657874584197998, -0.8337959051132202, -0.5018043518066406, -0.16981291770935059, 0.16217875480651855, 0.4941701889038086, 0.8261617422103882, 1.1581532955169678, 1.4901447296142578, 1.8221362829208374, 2.154127836227417, 2.486119270324707, 2.818110942840576, 3.150102376937866, 3.4820938110351562, 3.8140854835510254, 4.1460771560668945, 4.4780683517456055, 4.810060024261475, 5.142051696777344, 5.474042892456055, 5.806034564971924, 6.138026237487793, 6.470017433166504, 6.802009105682373, 7.134000778198242, 7.465991973876953, 7.797983646392822, 8.129975318908691, 8.461966514587402, 8.793957710266113, 9.12594985961914, 9.457941055297852, 9.789932250976562, 10.12192440032959, 10.4539155960083, 10.785907745361328, 11.117898941040039]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 11.0, 14.0, 28.0, 33.0, 55.0, 82.0, 132.0, 206.0, 306.0, 585.0, 967.0, 1939.0, 4115.0, 9706.0, 28467.0, 108041.0, 461387.0, 326391.0, 71197.0, 20522.0, 7539.0, 3144.0, 1568.0, 848.0, 478.0, 278.0, 156.0, 98.0, 71.0, 52.0, 37.0, 22.0, 24.0, 10.0, 7.0, 7.0, 3.0, 4.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-25.84375, -25.102294921875, -24.36083984375, -23.619384765625, -22.8779296875, -22.136474609375, -21.39501953125, -20.653564453125, -19.912109375, -19.170654296875, -18.42919921875, -17.687744140625, -16.9462890625, -16.204833984375, -15.46337890625, -14.721923828125, -13.98046875, -13.239013671875, -12.49755859375, -11.756103515625, -11.0146484375, -10.273193359375, -9.53173828125, -8.790283203125, -8.048828125, -7.307373046875, -6.56591796875, -5.824462890625, -5.0830078125, -4.341552734375, -3.60009765625, -2.858642578125, -2.1171875, -1.375732421875, -0.63427734375, 0.107177734375, 0.8486328125, 1.590087890625, 2.33154296875, 3.072998046875, 3.814453125, 4.555908203125, 5.29736328125, 6.038818359375, 6.7802734375, 7.521728515625, 8.26318359375, 9.004638671875, 9.74609375, 10.487548828125, 11.22900390625, 11.970458984375, 12.7119140625, 13.453369140625, 14.19482421875, 14.936279296875, 15.677734375, 16.419189453125, 17.16064453125, 17.902099609375, 18.6435546875, 19.385009765625, 20.12646484375, 20.867919921875, 21.609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 4.0, 7.0, 0.0, 9.0, 6.0, 8.0, 15.0, 24.0, 25.0, 32.0, 29.0, 40.0, 43.0, 48.0, 47.0, 67.0, 64.0, 65.0, 65.0, 65.0, 60.0, 43.0, 60.0, 29.0, 28.0, 24.0, 20.0, 16.0, 16.0, 11.0, 6.0, 2.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8515625, -8.593017578125, -8.33447265625, -8.075927734375, -7.8173828125, -7.558837890625, -7.30029296875, -7.041748046875, -6.783203125, -6.524658203125, -6.26611328125, -6.007568359375, -5.7490234375, -5.490478515625, -5.23193359375, -4.973388671875, -4.71484375, -4.456298828125, -4.19775390625, -3.939208984375, -3.6806640625, -3.422119140625, -3.16357421875, -2.905029296875, -2.646484375, -2.387939453125, -2.12939453125, -1.870849609375, -1.6123046875, -1.353759765625, -1.09521484375, -0.836669921875, -0.578125, -0.319580078125, -0.06103515625, 0.197509765625, 0.4560546875, 0.714599609375, 0.97314453125, 1.231689453125, 1.490234375, 1.748779296875, 2.00732421875, 2.265869140625, 2.5244140625, 2.782958984375, 3.04150390625, 3.300048828125, 3.55859375, 3.817138671875, 4.07568359375, 4.334228515625, 4.5927734375, 4.851318359375, 5.10986328125, 5.368408203125, 5.626953125, 5.885498046875, 6.14404296875, 6.402587890625, 6.6611328125, 6.919677734375, 7.17822265625, 7.436767578125, 7.6953125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 6.0, 6.0, 13.0, 14.0, 12.0, 24.0, 33.0, 47.0, 72.0, 77.0, 132.0, 196.0, 324.0, 469.0, 735.0, 1367.0, 2994.0, 8408.0, 34630.0, 250409.0, 629928.0, 91747.0, 17042.0, 5005.0, 2006.0, 1051.0, 621.0, 356.0, 245.0, 176.0, 110.0, 76.0, 50.0, 41.0, 29.0, 37.0, 14.0, 14.0, 10.0, 11.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.265625, -23.489501953125, -22.71337890625, -21.937255859375, -21.1611328125, -20.385009765625, -19.60888671875, -18.832763671875, -18.056640625, -17.280517578125, -16.50439453125, -15.728271484375, -14.9521484375, -14.176025390625, -13.39990234375, -12.623779296875, -11.84765625, -11.071533203125, -10.29541015625, -9.519287109375, -8.7431640625, -7.967041015625, -7.19091796875, -6.414794921875, -5.638671875, -4.862548828125, -4.08642578125, -3.310302734375, -2.5341796875, -1.758056640625, -0.98193359375, -0.205810546875, 0.5703125, 1.346435546875, 2.12255859375, 2.898681640625, 3.6748046875, 4.450927734375, 5.22705078125, 6.003173828125, 6.779296875, 7.555419921875, 8.33154296875, 9.107666015625, 9.8837890625, 10.659912109375, 11.43603515625, 12.212158203125, 12.98828125, 13.764404296875, 14.54052734375, 15.316650390625, 16.0927734375, 16.868896484375, 17.64501953125, 18.421142578125, 19.197265625, 19.973388671875, 20.74951171875, 21.525634765625, 22.3017578125, 23.077880859375, 23.85400390625, 24.630126953125, 25.40625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 7.0, 2.0, 9.0, 6.0, 8.0, 17.0, 20.0, 17.0, 19.0, 26.0, 17.0, 24.0, 35.0, 30.0, 37.0, 36.0, 55.0, 38.0, 40.0, 42.0, 42.0, 46.0, 43.0, 33.0, 45.0, 31.0, 37.0, 30.0, 21.0, 27.0, 30.0, 22.0, 24.0, 19.0, 9.0, 8.0, 12.0, 12.0, 8.0, 2.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.140625, -22.28662109375, -21.4326171875, -20.57861328125, -19.724609375, -18.87060546875, -18.0166015625, -17.16259765625, -16.30859375, -15.45458984375, -14.6005859375, -13.74658203125, -12.892578125, -12.03857421875, -11.1845703125, -10.33056640625, -9.4765625, -8.62255859375, -7.7685546875, -6.91455078125, -6.060546875, -5.20654296875, -4.3525390625, -3.49853515625, -2.64453125, -1.79052734375, -0.9365234375, -0.08251953125, 0.771484375, 1.62548828125, 2.4794921875, 3.33349609375, 4.1875, 5.04150390625, 5.8955078125, 6.74951171875, 7.603515625, 8.45751953125, 9.3115234375, 10.16552734375, 11.01953125, 11.87353515625, 12.7275390625, 13.58154296875, 14.435546875, 15.28955078125, 16.1435546875, 16.99755859375, 17.8515625, 18.70556640625, 19.5595703125, 20.41357421875, 21.267578125, 22.12158203125, 22.9755859375, 23.82958984375, 24.68359375, 25.53759765625, 26.3916015625, 27.24560546875, 28.099609375, 28.95361328125, 29.8076171875, 30.66162109375, 31.515625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 5.0, 8.0, 8.0, 11.0, 16.0, 22.0, 21.0, 35.0, 58.0, 76.0, 127.0, 207.0, 433.0, 987.0, 3712.0, 23671.0, 785634.0, 218416.0, 11310.0, 2284.0, 708.0, 296.0, 182.0, 93.0, 59.0, 49.0, 30.0, 16.0, 23.0, 10.0, 14.0, 11.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.59375, -24.7060546875, -23.818359375, -22.9306640625, -22.04296875, -21.1552734375, -20.267578125, -19.3798828125, -18.4921875, -17.6044921875, -16.716796875, -15.8291015625, -14.94140625, -14.0537109375, -13.166015625, -12.2783203125, -11.390625, -10.5029296875, -9.615234375, -8.7275390625, -7.83984375, -6.9521484375, -6.064453125, -5.1767578125, -4.2890625, -3.4013671875, -2.513671875, -1.6259765625, -0.73828125, 0.1494140625, 1.037109375, 1.9248046875, 2.8125, 3.7001953125, 4.587890625, 5.4755859375, 6.36328125, 7.2509765625, 8.138671875, 9.0263671875, 9.9140625, 10.8017578125, 11.689453125, 12.5771484375, 13.46484375, 14.3525390625, 15.240234375, 16.1279296875, 17.015625, 17.9033203125, 18.791015625, 19.6787109375, 20.56640625, 21.4541015625, 22.341796875, 23.2294921875, 24.1171875, 25.0048828125, 25.892578125, 26.7802734375, 27.66796875, 28.5556640625, 29.443359375, 30.3310546875, 31.21875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 7.0, 11.0, 6.0, 10.0, 4.0, 13.0, 21.0, 21.0, 37.0, 52.0, 70.0, 74.0, 109.0, 126.0, 105.0, 92.0, 70.0, 52.0, 37.0, 16.0, 19.0, 16.0, 6.0, 11.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0018062591552734375, -0.001742720603942871, -0.0016791820526123047, -0.0016156435012817383, -0.0015521049499511719, -0.0014885663986206055, -0.001425027847290039, -0.0013614892959594727, -0.0012979507446289062, -0.0012344121932983398, -0.0011708736419677734, -0.001107335090637207, -0.0010437965393066406, -0.0009802579879760742, -0.0009167194366455078, -0.0008531808853149414, -0.000789642333984375, -0.0007261037826538086, -0.0006625652313232422, -0.0005990266799926758, -0.0005354881286621094, -0.00047194957733154297, -0.00040841102600097656, -0.00034487247467041016, -0.00028133392333984375, -0.00021779537200927734, -0.00015425682067871094, -9.071826934814453e-05, -2.7179718017578125e-05, 3.635883331298828e-05, 9.989738464355469e-05, 0.0001634359359741211, 0.0002269744873046875, 0.0002905130386352539, 0.0003540515899658203, 0.0004175901412963867, 0.0004811286926269531, 0.0005446672439575195, 0.0006082057952880859, 0.0006717443466186523, 0.0007352828979492188, 0.0007988214492797852, 0.0008623600006103516, 0.000925898551940918, 0.0009894371032714844, 0.0010529756546020508, 0.0011165142059326172, 0.0011800527572631836, 0.00124359130859375, 0.0013071298599243164, 0.0013706684112548828, 0.0014342069625854492, 0.0014977455139160156, 0.001561284065246582, 0.0016248226165771484, 0.0016883611679077148, 0.0017518997192382812, 0.0018154382705688477, 0.001878976821899414, 0.0019425153732299805, 0.002006053924560547, 0.0020695924758911133, 0.0021331310272216797, 0.002196669578552246, 0.0022602081298828125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 11.0, 6.0, 16.0, 21.0, 36.0, 64.0, 97.0, 197.0, 339.0, 746.0, 2199.0, 8924.0, 102399.0, 884701.0, 40430.0, 5533.0, 1574.0, 626.0, 291.0, 144.0, 72.0, 54.0, 27.0, 19.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.40625, -31.37255859375, -30.3388671875, -29.30517578125, -28.271484375, -27.23779296875, -26.2041015625, -25.17041015625, -24.13671875, -23.10302734375, -22.0693359375, -21.03564453125, -20.001953125, -18.96826171875, -17.9345703125, -16.90087890625, -15.8671875, -14.83349609375, -13.7998046875, -12.76611328125, -11.732421875, -10.69873046875, -9.6650390625, -8.63134765625, -7.59765625, -6.56396484375, -5.5302734375, -4.49658203125, -3.462890625, -2.42919921875, -1.3955078125, -0.36181640625, 0.671875, 1.70556640625, 2.7392578125, 3.77294921875, 4.806640625, 5.84033203125, 6.8740234375, 7.90771484375, 8.94140625, 9.97509765625, 11.0087890625, 12.04248046875, 13.076171875, 14.10986328125, 15.1435546875, 16.17724609375, 17.2109375, 18.24462890625, 19.2783203125, 20.31201171875, 21.345703125, 22.37939453125, 23.4130859375, 24.44677734375, 25.48046875, 26.51416015625, 27.5478515625, 28.58154296875, 29.615234375, 30.64892578125, 31.6826171875, 32.71630859375, 33.75]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 19.0, 16.0, 34.0, 64.0, 116.0, 166.0, 212.0, 158.0, 105.0, 43.0, 21.0, 10.0, 10.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.96875, -31.08984375, -30.2109375, -29.33203125, -28.453125, -27.57421875, -26.6953125, -25.81640625, -24.9375, -24.05859375, -23.1796875, -22.30078125, -21.421875, -20.54296875, -19.6640625, -18.78515625, -17.90625, -17.02734375, -16.1484375, -15.26953125, -14.390625, -13.51171875, -12.6328125, -11.75390625, -10.875, -9.99609375, -9.1171875, -8.23828125, -7.359375, -6.48046875, -5.6015625, -4.72265625, -3.84375, -2.96484375, -2.0859375, -1.20703125, -0.328125, 0.55078125, 1.4296875, 2.30859375, 3.1875, 4.06640625, 4.9453125, 5.82421875, 6.703125, 7.58203125, 8.4609375, 9.33984375, 10.21875, 11.09765625, 11.9765625, 12.85546875, 13.734375, 14.61328125, 15.4921875, 16.37109375, 17.25, 18.12890625, 19.0078125, 19.88671875, 20.765625, 21.64453125, 22.5234375, 23.40234375, 24.28125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 8.0, 16.0, 10.0, 45.0, 96.0, 178.0, 231.0, 172.0, 119.0, 71.0, 29.0, 16.0, 9.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-353.6455078125, -343.4924621582031, -333.33941650390625, -323.18634033203125, -313.0332946777344, -302.8802490234375, -292.7271728515625, -282.5741271972656, -272.42108154296875, -262.2680358886719, -252.11497497558594, -241.9619140625, -231.80886840820312, -221.65582275390625, -211.5027618408203, -201.34970092773438, -191.1966552734375, -181.04360961914062, -170.8905487060547, -160.73748779296875, -150.58444213867188, -140.431396484375, -130.27833557128906, -120.12528228759766, -109.97222900390625, -99.81917572021484, -89.66612243652344, -79.51306915283203, -69.36001586914062, -59.20696258544922, -49.05390930175781, -38.900856018066406, -28.747802734375, -18.594749450683594, -8.441696166992188, 1.7113571166992188, 11.864410400390625, 22.01746368408203, 32.17051696777344, 42.323570251464844, 52.47662353515625, 62.629676818847656, 72.78273010253906, 82.93578338623047, 93.08883666992188, 103.24188995361328, 113.39494323730469, 123.5479965209961, 133.7010498046875, 143.85409545898438, 154.0071563720703, 164.16021728515625, 174.31326293945312, 184.46630859375, 194.61936950683594, 204.77243041992188, 214.92547607421875, 225.07852172851562, 235.23158264160156, 245.3846435546875, 255.53768920898438, 265.69073486328125, 275.84381103515625, 285.9968566894531, 296.14990234375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 3.0, 3.0, 10.0, 9.0, 20.0, 17.0, 25.0, 30.0, 26.0, 33.0, 39.0, 33.0, 42.0, 52.0, 52.0, 59.0, 50.0, 74.0, 53.0, 44.0, 44.0, 45.0, 41.0, 30.0, 24.0, 20.0, 29.0, 17.0, 16.0, 15.0, 10.0, 8.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.3406982421875, -132.1693878173828, -126.9980697631836, -121.82675170898438, -116.65544128417969, -111.48412322998047, -106.31280517578125, -101.14149475097656, -95.97018432617188, -90.79886627197266, -85.62755584716797, -80.45623779296875, -75.28492736816406, -70.11360931396484, -64.94229125976562, -59.77098083496094, -54.59966278076172, -49.428348541259766, -44.25703430175781, -39.085716247558594, -33.914405822753906, -28.74308967590332, -23.571773529052734, -18.40045928955078, -13.229145050048828, -8.057830810546875, -2.8865156173706055, 2.284799575805664, 7.456113815307617, 12.62742805480957, 17.798744201660156, 22.97005844116211, 28.141372680664062, 33.312686920166016, 38.48400115966797, 43.65531921386719, 48.826629638671875, 53.997947692871094, 59.16926193237305, 64.340576171875, 69.51188659667969, 74.6832046508789, 79.8545150756836, 85.02583312988281, 90.1971435546875, 95.36846160888672, 100.53977966308594, 105.71109008789062, 110.88240814208984, 116.05372619628906, 121.22503662109375, 126.39635467529297, 131.5676727294922, 136.73898315429688, 141.91029357910156, 147.08160400390625, 152.2529296875, 157.4242401123047, 162.59556579589844, 167.76687622070312, 172.9381866455078, 178.1094970703125, 183.28082275390625, 188.45213317871094, 193.62344360351562]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 5.0, 9.0, 11.0, 12.0, 11.0, 23.0, 27.0, 31.0, 47.0, 78.0, 197.0, 435.0, 1715.0, 10707.0, 4158429.0, 19201.0, 2251.0, 564.0, 214.0, 111.0, 54.0, 35.0, 32.0, 19.0, 15.0, 12.0, 8.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.375, -80.4599609375, -77.544921875, -74.6298828125, -71.71484375, -68.7998046875, -65.884765625, -62.9697265625, -60.0546875, -57.1396484375, -54.224609375, -51.3095703125, -48.39453125, -45.4794921875, -42.564453125, -39.6494140625, -36.734375, -33.8193359375, -30.904296875, -27.9892578125, -25.07421875, -22.1591796875, -19.244140625, -16.3291015625, -13.4140625, -10.4990234375, -7.583984375, -4.6689453125, -1.75390625, 1.1611328125, 4.076171875, 6.9912109375, 9.90625, 12.8212890625, 15.736328125, 18.6513671875, 21.56640625, 24.4814453125, 27.396484375, 30.3115234375, 33.2265625, 36.1416015625, 39.056640625, 41.9716796875, 44.88671875, 47.8017578125, 50.716796875, 53.6318359375, 56.546875, 59.4619140625, 62.376953125, 65.2919921875, 68.20703125, 71.1220703125, 74.037109375, 76.9521484375, 79.8671875, 82.7822265625, 85.697265625, 88.6123046875, 91.52734375, 94.4423828125, 97.357421875, 100.2724609375, 103.1875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 16.0, 17.0, 27.0, 35.0, 42.0, 61.0, 71.0, 80.0, 93.0, 102.0, 90.0, 85.0, 82.0, 46.0, 34.0, 39.0, 22.0, 13.0, 8.0, 8.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.921875, -12.5452880859375, -12.168701171875, -11.7921142578125, -11.41552734375, -11.0389404296875, -10.662353515625, -10.2857666015625, -9.9091796875, -9.5325927734375, -9.156005859375, -8.7794189453125, -8.40283203125, -8.0262451171875, -7.649658203125, -7.2730712890625, -6.896484375, -6.5198974609375, -6.143310546875, -5.7667236328125, -5.39013671875, -5.0135498046875, -4.636962890625, -4.2603759765625, -3.8837890625, -3.5072021484375, -3.130615234375, -2.7540283203125, -2.37744140625, -2.0008544921875, -1.624267578125, -1.2476806640625, -0.87109375, -0.4945068359375, -0.117919921875, 0.2586669921875, 0.63525390625, 1.0118408203125, 1.388427734375, 1.7650146484375, 2.1416015625, 2.5181884765625, 2.894775390625, 3.2713623046875, 3.64794921875, 4.0245361328125, 4.401123046875, 4.7777099609375, 5.154296875, 5.5308837890625, 5.907470703125, 6.2840576171875, 6.66064453125, 7.0372314453125, 7.413818359375, 7.7904052734375, 8.1669921875, 8.5435791015625, 8.920166015625, 9.2967529296875, 9.67333984375, 10.0499267578125, 10.426513671875, 10.8031005859375, 11.1796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 7.0, 10.0, 14.0, 10.0, 26.0, 38.0, 42.0, 53.0, 55.0, 78.0, 75.0, 133.0, 214.0, 283.0, 416.0, 689.0, 1233.0, 2376.0, 5052.0, 13633.0, 102942.0, 4014828.0, 35106.0, 8633.0, 3708.0, 1777.0, 986.0, 525.0, 368.0, 242.0, 157.0, 128.0, 91.0, 71.0, 64.0, 49.0, 42.0, 28.0, 25.0, 10.0, 10.0, 17.0, 6.0, 9.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-30.703125, -29.833251953125, -28.96337890625, -28.093505859375, -27.2236328125, -26.353759765625, -25.48388671875, -24.614013671875, -23.744140625, -22.874267578125, -22.00439453125, -21.134521484375, -20.2646484375, -19.394775390625, -18.52490234375, -17.655029296875, -16.78515625, -15.915283203125, -15.04541015625, -14.175537109375, -13.3056640625, -12.435791015625, -11.56591796875, -10.696044921875, -9.826171875, -8.956298828125, -8.08642578125, -7.216552734375, -6.3466796875, -5.476806640625, -4.60693359375, -3.737060546875, -2.8671875, -1.997314453125, -1.12744140625, -0.257568359375, 0.6123046875, 1.482177734375, 2.35205078125, 3.221923828125, 4.091796875, 4.961669921875, 5.83154296875, 6.701416015625, 7.5712890625, 8.441162109375, 9.31103515625, 10.180908203125, 11.05078125, 11.920654296875, 12.79052734375, 13.660400390625, 14.5302734375, 15.400146484375, 16.27001953125, 17.139892578125, 18.009765625, 18.879638671875, 19.74951171875, 20.619384765625, 21.4892578125, 22.359130859375, 23.22900390625, 24.098876953125, 24.96875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 9.0, 19.0, 30.0, 57.0, 362.0, 3419.0, 89.0, 37.0, 11.0, 8.0, 9.0, 1.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.84375, -8.298583984375, -7.75341796875, -7.208251953125, -6.6630859375, -6.117919921875, -5.57275390625, -5.027587890625, -4.482421875, -3.937255859375, -3.39208984375, -2.846923828125, -2.3017578125, -1.756591796875, -1.21142578125, -0.666259765625, -0.12109375, 0.424072265625, 0.96923828125, 1.514404296875, 2.0595703125, 2.604736328125, 3.14990234375, 3.695068359375, 4.240234375, 4.785400390625, 5.33056640625, 5.875732421875, 6.4208984375, 6.966064453125, 7.51123046875, 8.056396484375, 8.6015625, 9.146728515625, 9.69189453125, 10.237060546875, 10.7822265625, 11.327392578125, 11.87255859375, 12.417724609375, 12.962890625, 13.508056640625, 14.05322265625, 14.598388671875, 15.1435546875, 15.688720703125, 16.23388671875, 16.779052734375, 17.32421875, 17.869384765625, 18.41455078125, 18.959716796875, 19.5048828125, 20.050048828125, 20.59521484375, 21.140380859375, 21.685546875, 22.230712890625, 22.77587890625, 23.321044921875, 23.8662109375, 24.411376953125, 24.95654296875, 25.501708984375, 26.046875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 11.0, 20.0, 29.0, 77.0, 119.0, 224.0, 227.0, 165.0, 72.0, 34.0, 13.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.01180648803711, -58.49818801879883, -55.98456573486328, -53.470947265625, -50.95732879638672, -48.44371032714844, -45.930091857910156, -43.41646957397461, -40.90285110473633, -38.38923263549805, -35.8756103515625, -33.36199188232422, -30.848373413085938, -28.334754943847656, -25.821134567260742, -23.307514190673828, -20.793895721435547, -18.280277252197266, -15.766656875610352, -13.253037452697754, -10.739418029785156, -8.225798606872559, -5.712179183959961, -3.198558807373047, -0.6849403381347656, 1.828679084777832, 4.34229850769043, 6.855917930603027, 9.369537353515625, 11.883156776428223, 14.39677619934082, 16.910396575927734, 19.42401123046875, 21.93762969970703, 24.451250076293945, 26.96487045288086, 29.47848892211914, 31.992107391357422, 34.50572967529297, 37.01934814453125, 39.53296661376953, 42.04658508300781, 44.560203552246094, 47.07382583618164, 49.58744430541992, 52.1010627746582, 54.61468505859375, 57.12830352783203, 59.64192199707031, 62.155540466308594, 64.66915893554688, 67.18277740478516, 69.69639587402344, 72.21002197265625, 74.72364044189453, 77.23725891113281, 79.7508773803711, 82.26449584960938, 84.77811431884766, 87.29173278808594, 89.80535888671875, 92.31897735595703, 94.83259582519531, 97.3462142944336, 99.85983276367188]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 2.0, 9.0, 12.0, 7.0, 15.0, 14.0, 16.0, 27.0, 27.0, 51.0, 52.0, 45.0, 70.0, 69.0, 71.0, 76.0, 83.0, 58.0, 60.0, 51.0, 43.0, 27.0, 30.0, 23.0, 22.0, 13.0, 9.0, 6.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.988483428955078, -30.519575119018555, -29.050668716430664, -27.58176040649414, -26.11285400390625, -24.643945693969727, -23.175037384033203, -21.706130981445312, -20.23722267150879, -18.768314361572266, -17.299407958984375, -15.830499649047852, -14.361592292785645, -12.892684936523438, -11.423776626586914, -9.954869270324707, -8.4859619140625, -7.017054557800293, -5.548146724700928, -4.0792388916015625, -2.6103315353393555, -1.1414241790771484, 0.327484130859375, 1.796391487121582, 3.265298843383789, 4.734206199645996, 6.203114032745361, 7.672021865844727, 9.140929222106934, 10.60983657836914, 12.078744888305664, 13.547652244567871, 15.016559600830078, 16.4854679107666, 17.954374313354492, 19.423282623291016, 20.892189025878906, 22.36109733581543, 23.830005645751953, 25.298912048339844, 26.767820358276367, 28.23672866821289, 29.70563507080078, 31.174543380737305, 32.64345169067383, 34.11235809326172, 35.581268310546875, 37.050174713134766, 38.519081115722656, 39.98798751831055, 41.4568977355957, 42.925804138183594, 44.394710540771484, 45.863616943359375, 47.33252716064453, 48.80143356323242, 50.27033996582031, 51.7392463684082, 53.20815658569336, 54.67706298828125, 56.14596939086914, 57.61487579345703, 59.08378601074219, 60.55269241333008, 62.021602630615234]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 8.0, 13.0, 23.0, 21.0, 35.0, 46.0, 99.0, 158.0, 227.0, 411.0, 681.0, 1373.0, 2854.0, 6246.0, 17036.0, 56312.0, 242590.0, 516102.0, 145913.0, 36956.0, 12019.0, 4653.0, 2109.0, 1143.0, 573.0, 352.0, 231.0, 133.0, 72.0, 47.0, 31.0, 25.0, 18.0, 12.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.4375, -21.764404296875, -21.09130859375, -20.418212890625, -19.7451171875, -19.072021484375, -18.39892578125, -17.725830078125, -17.052734375, -16.379638671875, -15.70654296875, -15.033447265625, -14.3603515625, -13.687255859375, -13.01416015625, -12.341064453125, -11.66796875, -10.994873046875, -10.32177734375, -9.648681640625, -8.9755859375, -8.302490234375, -7.62939453125, -6.956298828125, -6.283203125, -5.610107421875, -4.93701171875, -4.263916015625, -3.5908203125, -2.917724609375, -2.24462890625, -1.571533203125, -0.8984375, -0.225341796875, 0.44775390625, 1.120849609375, 1.7939453125, 2.467041015625, 3.14013671875, 3.813232421875, 4.486328125, 5.159423828125, 5.83251953125, 6.505615234375, 7.1787109375, 7.851806640625, 8.52490234375, 9.197998046875, 9.87109375, 10.544189453125, 11.21728515625, 11.890380859375, 12.5634765625, 13.236572265625, 13.90966796875, 14.582763671875, 15.255859375, 15.928955078125, 16.60205078125, 17.275146484375, 17.9482421875, 18.621337890625, 19.29443359375, 19.967529296875, 20.640625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 4.0, 11.0, 9.0, 16.0, 19.0, 16.0, 26.0, 19.0, 39.0, 52.0, 52.0, 59.0, 57.0, 59.0, 63.0, 72.0, 74.0, 54.0, 61.0, 51.0, 30.0, 26.0, 29.0, 30.0, 19.0, 11.0, 14.0, 2.0, 10.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.0390625, -9.74951171875, -9.4599609375, -9.17041015625, -8.880859375, -8.59130859375, -8.3017578125, -8.01220703125, -7.72265625, -7.43310546875, -7.1435546875, -6.85400390625, -6.564453125, -6.27490234375, -5.9853515625, -5.69580078125, -5.40625, -5.11669921875, -4.8271484375, -4.53759765625, -4.248046875, -3.95849609375, -3.6689453125, -3.37939453125, -3.08984375, -2.80029296875, -2.5107421875, -2.22119140625, -1.931640625, -1.64208984375, -1.3525390625, -1.06298828125, -0.7734375, -0.48388671875, -0.1943359375, 0.09521484375, 0.384765625, 0.67431640625, 0.9638671875, 1.25341796875, 1.54296875, 1.83251953125, 2.1220703125, 2.41162109375, 2.701171875, 2.99072265625, 3.2802734375, 3.56982421875, 3.859375, 4.14892578125, 4.4384765625, 4.72802734375, 5.017578125, 5.30712890625, 5.5966796875, 5.88623046875, 6.17578125, 6.46533203125, 6.7548828125, 7.04443359375, 7.333984375, 7.62353515625, 7.9130859375, 8.20263671875, 8.4921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 11.0, 6.0, 14.0, 13.0, 27.0, 46.0, 54.0, 76.0, 94.0, 139.0, 239.0, 327.0, 588.0, 1067.0, 2149.0, 5204.0, 18666.0, 117573.0, 711708.0, 156842.0, 22634.0, 6015.0, 2349.0, 1084.0, 576.0, 343.0, 220.0, 153.0, 91.0, 63.0, 47.0, 32.0, 25.0, 17.0, 10.0, 8.0, 10.0, 7.0, 7.0, 8.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-28.734375, -27.823974609375, -26.91357421875, -26.003173828125, -25.0927734375, -24.182373046875, -23.27197265625, -22.361572265625, -21.451171875, -20.540771484375, -19.63037109375, -18.719970703125, -17.8095703125, -16.899169921875, -15.98876953125, -15.078369140625, -14.16796875, -13.257568359375, -12.34716796875, -11.436767578125, -10.5263671875, -9.615966796875, -8.70556640625, -7.795166015625, -6.884765625, -5.974365234375, -5.06396484375, -4.153564453125, -3.2431640625, -2.332763671875, -1.42236328125, -0.511962890625, 0.3984375, 1.308837890625, 2.21923828125, 3.129638671875, 4.0400390625, 4.950439453125, 5.86083984375, 6.771240234375, 7.681640625, 8.592041015625, 9.50244140625, 10.412841796875, 11.3232421875, 12.233642578125, 13.14404296875, 14.054443359375, 14.96484375, 15.875244140625, 16.78564453125, 17.696044921875, 18.6064453125, 19.516845703125, 20.42724609375, 21.337646484375, 22.248046875, 23.158447265625, 24.06884765625, 24.979248046875, 25.8896484375, 26.800048828125, 27.71044921875, 28.620849609375, 29.53125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 6.0, 4.0, 5.0, 7.0, 12.0, 13.0, 11.0, 13.0, 16.0, 14.0, 23.0, 30.0, 29.0, 41.0, 41.0, 34.0, 44.0, 39.0, 46.0, 54.0, 66.0, 47.0, 51.0, 49.0, 42.0, 36.0, 45.0, 36.0, 31.0, 33.0, 16.0, 16.0, 12.0, 5.0, 15.0, 5.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.875, -31.79638671875, -30.7177734375, -29.63916015625, -28.560546875, -27.48193359375, -26.4033203125, -25.32470703125, -24.24609375, -23.16748046875, -22.0888671875, -21.01025390625, -19.931640625, -18.85302734375, -17.7744140625, -16.69580078125, -15.6171875, -14.53857421875, -13.4599609375, -12.38134765625, -11.302734375, -10.22412109375, -9.1455078125, -8.06689453125, -6.98828125, -5.90966796875, -4.8310546875, -3.75244140625, -2.673828125, -1.59521484375, -0.5166015625, 0.56201171875, 1.640625, 2.71923828125, 3.7978515625, 4.87646484375, 5.955078125, 7.03369140625, 8.1123046875, 9.19091796875, 10.26953125, 11.34814453125, 12.4267578125, 13.50537109375, 14.583984375, 15.66259765625, 16.7412109375, 17.81982421875, 18.8984375, 19.97705078125, 21.0556640625, 22.13427734375, 23.212890625, 24.29150390625, 25.3701171875, 26.44873046875, 27.52734375, 28.60595703125, 29.6845703125, 30.76318359375, 31.841796875, 32.92041015625, 33.9990234375, 35.07763671875, 36.15625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 6.0, 11.0, 14.0, 16.0, 19.0, 26.0, 43.0, 79.0, 122.0, 234.0, 443.0, 1001.0, 2907.0, 13957.0, 220001.0, 762878.0, 38627.0, 5322.0, 1577.0, 591.0, 267.0, 167.0, 85.0, 56.0, 42.0, 22.0, 16.0, 13.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.796875, -9.335205078125, -8.87353515625, -8.411865234375, -7.9501953125, -7.488525390625, -7.02685546875, -6.565185546875, -6.103515625, -5.641845703125, -5.18017578125, -4.718505859375, -4.2568359375, -3.795166015625, -3.33349609375, -2.871826171875, -2.41015625, -1.948486328125, -1.48681640625, -1.025146484375, -0.5634765625, -0.101806640625, 0.35986328125, 0.821533203125, 1.283203125, 1.744873046875, 2.20654296875, 2.668212890625, 3.1298828125, 3.591552734375, 4.05322265625, 4.514892578125, 4.9765625, 5.438232421875, 5.89990234375, 6.361572265625, 6.8232421875, 7.284912109375, 7.74658203125, 8.208251953125, 8.669921875, 9.131591796875, 9.59326171875, 10.054931640625, 10.5166015625, 10.978271484375, 11.43994140625, 11.901611328125, 12.36328125, 12.824951171875, 13.28662109375, 13.748291015625, 14.2099609375, 14.671630859375, 15.13330078125, 15.594970703125, 16.056640625, 16.518310546875, 16.97998046875, 17.441650390625, 17.9033203125, 18.364990234375, 18.82666015625, 19.288330078125, 19.75]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 7.0, 4.0, 4.0, 6.0, 12.0, 10.0, 16.0, 19.0, 25.0, 32.0, 65.0, 80.0, 142.0, 161.0, 127.0, 82.0, 61.0, 42.0, 30.0, 26.0, 13.0, 9.0, 9.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024814605712890625, -0.0024049580097198486, -0.0023284554481506348, -0.002251952886581421, -0.002175450325012207, -0.002098947763442993, -0.0020224452018737793, -0.0019459426403045654, -0.0018694400787353516, -0.0017929375171661377, -0.0017164349555969238, -0.00163993239402771, -0.001563429832458496, -0.0014869272708892822, -0.0014104247093200684, -0.0013339221477508545, -0.0012574195861816406, -0.0011809170246124268, -0.0011044144630432129, -0.001027911901473999, -0.0009514093399047852, -0.0008749067783355713, -0.0007984042167663574, -0.0007219016551971436, -0.0006453990936279297, -0.0005688965320587158, -0.000492393970489502, -0.0004158914089202881, -0.0003393888473510742, -0.00026288628578186035, -0.00018638372421264648, -0.00010988116264343262, -3.337860107421875e-05, 4.312396049499512e-05, 0.00011962652206420898, 0.00019612908363342285, 0.0002726316452026367, 0.0003491342067718506, 0.00042563676834106445, 0.0005021393299102783, 0.0005786418914794922, 0.0006551444530487061, 0.0007316470146179199, 0.0008081495761871338, 0.0008846521377563477, 0.0009611546993255615, 0.0010376572608947754, 0.0011141598224639893, 0.0011906623840332031, 0.001267164945602417, 0.0013436675071716309, 0.0014201700687408447, 0.0014966726303100586, 0.0015731751918792725, 0.0016496777534484863, 0.0017261803150177002, 0.001802682876586914, 0.001879185438156128, 0.001955687999725342, 0.0020321905612945557, 0.0021086931228637695, 0.0021851956844329834, 0.0022616982460021973, 0.002338200807571411, 0.002414703369140625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 5.0, 7.0, 10.0, 15.0, 19.0, 33.0, 36.0, 79.0, 122.0, 221.0, 366.0, 736.0, 1410.0, 3480.0, 11253.0, 53132.0, 540789.0, 381097.0, 40472.0, 9324.0, 3094.0, 1348.0, 631.0, 359.0, 192.0, 118.0, 78.0, 41.0, 26.0, 18.0, 17.0, 8.0, 8.0, 3.0, 3.0, 3.0, 1.0, 4.0, 2.0], "bins": [-15.8046875, -15.427734375, -15.05078125, -14.673828125, -14.296875, -13.919921875, -13.54296875, -13.166015625, -12.7890625, -12.412109375, -12.03515625, -11.658203125, -11.28125, -10.904296875, -10.52734375, -10.150390625, -9.7734375, -9.396484375, -9.01953125, -8.642578125, -8.265625, -7.888671875, -7.51171875, -7.134765625, -6.7578125, -6.380859375, -6.00390625, -5.626953125, -5.25, -4.873046875, -4.49609375, -4.119140625, -3.7421875, -3.365234375, -2.98828125, -2.611328125, -2.234375, -1.857421875, -1.48046875, -1.103515625, -0.7265625, -0.349609375, 0.02734375, 0.404296875, 0.78125, 1.158203125, 1.53515625, 1.912109375, 2.2890625, 2.666015625, 3.04296875, 3.419921875, 3.796875, 4.173828125, 4.55078125, 4.927734375, 5.3046875, 5.681640625, 6.05859375, 6.435546875, 6.8125, 7.189453125, 7.56640625, 7.943359375, 8.3203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 2.0, 9.0, 13.0, 12.0, 14.0, 21.0, 24.0, 23.0, 36.0, 45.0, 53.0, 64.0, 80.0, 83.0, 93.0, 81.0, 81.0, 49.0, 43.0, 50.0, 32.0, 21.0, 19.0, 13.0, 10.0, 12.0, 8.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3359375, -11.021484375, -10.70703125, -10.392578125, -10.078125, -9.763671875, -9.44921875, -9.134765625, -8.8203125, -8.505859375, -8.19140625, -7.876953125, -7.5625, -7.248046875, -6.93359375, -6.619140625, -6.3046875, -5.990234375, -5.67578125, -5.361328125, -5.046875, -4.732421875, -4.41796875, -4.103515625, -3.7890625, -3.474609375, -3.16015625, -2.845703125, -2.53125, -2.216796875, -1.90234375, -1.587890625, -1.2734375, -0.958984375, -0.64453125, -0.330078125, -0.015625, 0.298828125, 0.61328125, 0.927734375, 1.2421875, 1.556640625, 1.87109375, 2.185546875, 2.5, 2.814453125, 3.12890625, 3.443359375, 3.7578125, 4.072265625, 4.38671875, 4.701171875, 5.015625, 5.330078125, 5.64453125, 5.958984375, 6.2734375, 6.587890625, 6.90234375, 7.216796875, 7.53125, 7.845703125, 8.16015625, 8.474609375, 8.7890625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 0.0, 5.0, 7.0, 10.0, 12.0, 33.0, 45.0, 70.0, 108.0, 152.0, 183.0, 129.0, 86.0, 68.0, 43.0, 20.0, 9.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.03890991210938, -170.4988250732422, -163.958740234375, -157.4186553955078, -150.87857055664062, -144.33848571777344, -137.79840087890625, -131.25831604003906, -124.71823120117188, -118.17814636230469, -111.6380615234375, -105.09797668457031, -98.55789184570312, -92.01780700683594, -85.47772216796875, -78.93763732910156, -72.39755249023438, -65.85746765136719, -59.3173828125, -52.77729797363281, -46.237213134765625, -39.69712829589844, -33.15704345703125, -26.616958618164062, -20.076873779296875, -13.536788940429688, -6.9967041015625, -0.4566192626953125, 6.083465576171875, 12.623550415039062, 19.16363525390625, 25.703720092773438, 32.243804931640625, 38.78388977050781, 45.323974609375, 51.86405944824219, 58.404144287109375, 64.94422912597656, 71.48431396484375, 78.02439880371094, 84.56448364257812, 91.10456848144531, 97.6446533203125, 104.18473815917969, 110.72482299804688, 117.26490783691406, 123.80499267578125, 130.34507751464844, 136.88516235351562, 143.4252471923828, 149.96533203125, 156.5054168701172, 163.04550170898438, 169.58558654785156, 176.12567138671875, 182.66575622558594, 189.20584106445312, 195.7459259033203, 202.2860107421875, 208.8260955810547, 215.36618041992188, 221.90626525878906, 228.44635009765625, 234.98643493652344, 241.52651977539062]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 4.0, 12.0, 12.0, 25.0, 23.0, 34.0, 42.0, 50.0, 50.0, 59.0, 67.0, 69.0, 71.0, 89.0, 79.0, 55.0, 46.0, 40.0, 37.0, 31.0, 21.0, 22.0, 14.0, 13.0, 10.0, 5.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.84893798828125, -127.39197540283203, -120.93501281738281, -114.47804260253906, -108.02108001708984, -101.56411743164062, -95.1071548461914, -88.65019226074219, -82.19322204589844, -75.73625946044922, -69.279296875, -62.822330474853516, -56.36536407470703, -49.90840148925781, -43.451438903808594, -36.99447250366211, -30.537513732910156, -24.080549240112305, -17.623584747314453, -11.166622161865234, -4.709657669067383, 1.7473068237304688, 8.204269409179688, 14.661235809326172, 21.11819839477539, 27.575162887573242, 34.032127380371094, 40.48908996582031, 46.94605255126953, 53.403018951416016, 59.859981536865234, 66.31694793701172, 72.77391052246094, 79.23087310791016, 85.68783569335938, 92.14480590820312, 98.60176849365234, 105.05873107910156, 111.51569366455078, 117.97265625, 124.42962646484375, 130.8865966796875, 137.3435516357422, 143.80052185058594, 150.25747680664062, 156.71444702148438, 163.17141723632812, 169.6283721923828, 176.0853271484375, 182.54229736328125, 188.99925231933594, 195.4562225341797, 201.91317749023438, 208.37014770507812, 214.82711791992188, 221.28407287597656, 227.7410430908203, 234.19801330566406, 240.65496826171875, 247.1119384765625, 253.5688934326172, 260.02587890625, 266.4828186035156, 272.9397888183594, 279.3967590332031]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 7.0, 11.0, 12.0, 25.0, 35.0, 65.0, 82.0, 181.0, 287.0, 535.0, 1074.0, 2373.0, 5658.0, 15999.0, 68953.0, 3617705.0, 433198.0, 31257.0, 9389.0, 3708.0, 1634.0, 848.0, 467.0, 248.0, 159.0, 127.0, 55.0, 44.0, 37.0, 30.0, 21.0, 15.0, 10.0, 8.0, 3.0, 5.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.703125, -20.94921875, -20.1953125, -19.44140625, -18.6875, -17.93359375, -17.1796875, -16.42578125, -15.671875, -14.91796875, -14.1640625, -13.41015625, -12.65625, -11.90234375, -11.1484375, -10.39453125, -9.640625, -8.88671875, -8.1328125, -7.37890625, -6.625, -5.87109375, -5.1171875, -4.36328125, -3.609375, -2.85546875, -2.1015625, -1.34765625, -0.59375, 0.16015625, 0.9140625, 1.66796875, 2.421875, 3.17578125, 3.9296875, 4.68359375, 5.4375, 6.19140625, 6.9453125, 7.69921875, 8.453125, 9.20703125, 9.9609375, 10.71484375, 11.46875, 12.22265625, 12.9765625, 13.73046875, 14.484375, 15.23828125, 15.9921875, 16.74609375, 17.5, 18.25390625, 19.0078125, 19.76171875, 20.515625, 21.26953125, 22.0234375, 22.77734375, 23.53125, 24.28515625, 25.0390625, 25.79296875, 26.546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 18.0, 21.0, 33.0, 54.0, 47.0, 65.0, 93.0, 87.0, 100.0, 109.0, 97.0, 74.0, 59.0, 46.0, 40.0, 21.0, 11.0, 11.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69921875, -6.27032470703125, -5.8414306640625, -5.41253662109375, -4.983642578125, -4.55474853515625, -4.1258544921875, -3.69696044921875, -3.26806640625, -2.83917236328125, -2.4102783203125, -1.98138427734375, -1.552490234375, -1.12359619140625, -0.6947021484375, -0.26580810546875, 0.1630859375, 0.59197998046875, 1.0208740234375, 1.44976806640625, 1.878662109375, 2.30755615234375, 2.7364501953125, 3.16534423828125, 3.59423828125, 4.02313232421875, 4.4520263671875, 4.88092041015625, 5.309814453125, 5.73870849609375, 6.1676025390625, 6.59649658203125, 7.025390625, 7.45428466796875, 7.8831787109375, 8.31207275390625, 8.740966796875, 9.16986083984375, 9.5987548828125, 10.02764892578125, 10.45654296875, 10.88543701171875, 11.3143310546875, 11.74322509765625, 12.172119140625, 12.60101318359375, 13.0299072265625, 13.45880126953125, 13.8876953125, 14.31658935546875, 14.7454833984375, 15.17437744140625, 15.603271484375, 16.03216552734375, 16.4610595703125, 16.88995361328125, 17.31884765625, 17.74774169921875, 18.1766357421875, 18.60552978515625, 19.034423828125, 19.46331787109375, 19.8922119140625, 20.32110595703125, 20.75]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 11.0, 5.0, 24.0, 21.0, 25.0, 37.0, 74.0, 105.0, 166.0, 281.0, 637.0, 1400.0, 3701.0, 11638.0, 43825.0, 541919.0, 3492180.0, 72586.0, 16748.0, 5299.0, 1954.0, 780.0, 368.0, 199.0, 102.0, 66.0, 39.0, 26.0, 15.0, 11.0, 9.0, 6.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.734375, -26.945556640625, -26.15673828125, -25.367919921875, -24.5791015625, -23.790283203125, -23.00146484375, -22.212646484375, -21.423828125, -20.635009765625, -19.84619140625, -19.057373046875, -18.2685546875, -17.479736328125, -16.69091796875, -15.902099609375, -15.11328125, -14.324462890625, -13.53564453125, -12.746826171875, -11.9580078125, -11.169189453125, -10.38037109375, -9.591552734375, -8.802734375, -8.013916015625, -7.22509765625, -6.436279296875, -5.6474609375, -4.858642578125, -4.06982421875, -3.281005859375, -2.4921875, -1.703369140625, -0.91455078125, -0.125732421875, 0.6630859375, 1.451904296875, 2.24072265625, 3.029541015625, 3.818359375, 4.607177734375, 5.39599609375, 6.184814453125, 6.9736328125, 7.762451171875, 8.55126953125, 9.340087890625, 10.12890625, 10.917724609375, 11.70654296875, 12.495361328125, 13.2841796875, 14.072998046875, 14.86181640625, 15.650634765625, 16.439453125, 17.228271484375, 18.01708984375, 18.805908203125, 19.5947265625, 20.383544921875, 21.17236328125, 21.961181640625, 22.75]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 8.0, 9.0, 7.0, 15.0, 15.0, 20.0, 46.0, 67.0, 87.0, 219.0, 847.0, 1860.0, 521.0, 132.0, 74.0, 41.0, 24.0, 23.0, 13.0, 14.0, 7.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.921875, -30.093505859375, -29.26513671875, -28.436767578125, -27.6083984375, -26.780029296875, -25.95166015625, -25.123291015625, -24.294921875, -23.466552734375, -22.63818359375, -21.809814453125, -20.9814453125, -20.153076171875, -19.32470703125, -18.496337890625, -17.66796875, -16.839599609375, -16.01123046875, -15.182861328125, -14.3544921875, -13.526123046875, -12.69775390625, -11.869384765625, -11.041015625, -10.212646484375, -9.38427734375, -8.555908203125, -7.7275390625, -6.899169921875, -6.07080078125, -5.242431640625, -4.4140625, -3.585693359375, -2.75732421875, -1.928955078125, -1.1005859375, -0.272216796875, 0.55615234375, 1.384521484375, 2.212890625, 3.041259765625, 3.86962890625, 4.697998046875, 5.5263671875, 6.354736328125, 7.18310546875, 8.011474609375, 8.83984375, 9.668212890625, 10.49658203125, 11.324951171875, 12.1533203125, 12.981689453125, 13.81005859375, 14.638427734375, 15.466796875, 16.295166015625, 17.12353515625, 17.951904296875, 18.7802734375, 19.608642578125, 20.43701171875, 21.265380859375, 22.09375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 5.0, 15.0, 20.0, 44.0, 71.0, 159.0, 184.0, 208.0, 132.0, 78.0, 23.0, 17.0, 10.0, 12.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-210.898193359375, -204.70199584960938, -198.50579833984375, -192.30960083007812, -186.11341857910156, -179.91722106933594, -173.7210235595703, -167.5248260498047, -161.32864379882812, -155.1324462890625, -148.93624877929688, -142.74005126953125, -136.5438690185547, -130.34767150878906, -124.15147399902344, -117.95527648925781, -111.75907897949219, -105.56288146972656, -99.36669158935547, -93.17049407958984, -86.97430419921875, -80.77810668945312, -74.5819091796875, -68.38571166992188, -62.18952178955078, -55.99332809448242, -49.79713439941406, -43.60093688964844, -37.40474319458008, -31.20854949951172, -25.012351989746094, -18.816158294677734, -12.619964599609375, -6.423769950866699, -0.22757530212402344, 5.968620300292969, 12.164813995361328, 18.361007690429688, 24.557205200195312, 30.753398895263672, 36.94959259033203, 43.14578628540039, 49.34197998046875, 55.538177490234375, 61.734371185302734, 67.9305648803711, 74.12676239013672, 80.32295227050781, 86.51914978027344, 92.71534729003906, 98.91153717041016, 105.10773468017578, 111.30392456054688, 117.5001220703125, 123.69631958007812, 129.89251708984375, 136.08871459960938, 142.284912109375, 148.48110961914062, 154.67730712890625, 160.8734893798828, 167.06968688964844, 173.26588439941406, 179.4620819091797, 185.65826416015625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 3.0, 4.0, 11.0, 7.0, 9.0, 18.0, 24.0, 30.0, 38.0, 39.0, 40.0, 53.0, 63.0, 59.0, 61.0, 68.0, 56.0, 40.0, 36.0, 64.0, 43.0, 48.0, 33.0, 30.0, 29.0, 18.0, 17.0, 14.0, 8.0, 7.0, 5.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-115.38067626953125, -111.9517822265625, -108.52289581298828, -105.09400177001953, -101.66510772705078, -98.23622131347656, -94.80732727050781, -91.37843322753906, -87.94954681396484, -84.5206527709961, -81.09176635742188, -77.66287231445312, -74.23397827148438, -70.80509185791016, -67.3761978149414, -63.94730758666992, -60.51841354370117, -57.08952331542969, -53.66062927246094, -50.23173904418945, -46.80284881591797, -43.37395477294922, -39.945064544677734, -36.51617431640625, -33.0872802734375, -29.658388137817383, -26.2294979095459, -22.80060577392578, -19.371715545654297, -15.94282341003418, -12.513931274414062, -9.085041046142578, -5.656150817871094, -2.227259397506714, 1.201632022857666, 4.630523681640625, 8.059414863586426, 11.488306045532227, 14.917198181152344, 18.346088409423828, 21.774980545043945, 25.203872680664062, 28.632762908935547, 32.06165313720703, 35.49054718017578, 38.919437408447266, 42.34832763671875, 45.7772216796875, 49.206111907958984, 52.63500213623047, 56.06389617919922, 59.4927864074707, 62.92167663574219, 66.35057067871094, 69.77946472167969, 73.2083511352539, 76.63724517822266, 80.0661392211914, 83.49502563476562, 86.92391967773438, 90.35281372070312, 93.78170013427734, 97.2105941772461, 100.63948059082031, 104.06837463378906]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 15.0, 24.0, 26.0, 32.0, 58.0, 94.0, 148.0, 277.0, 419.0, 800.0, 1571.0, 3457.0, 8771.0, 26079.0, 94247.0, 420317.0, 371447.0, 82992.0, 23209.0, 8062.0, 3223.0, 1442.0, 719.0, 426.0, 231.0, 165.0, 95.0, 59.0, 50.0, 17.0, 19.0, 12.0, 9.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.375, -16.77490234375, -16.1748046875, -15.57470703125, -14.974609375, -14.37451171875, -13.7744140625, -13.17431640625, -12.57421875, -11.97412109375, -11.3740234375, -10.77392578125, -10.173828125, -9.57373046875, -8.9736328125, -8.37353515625, -7.7734375, -7.17333984375, -6.5732421875, -5.97314453125, -5.373046875, -4.77294921875, -4.1728515625, -3.57275390625, -2.97265625, -2.37255859375, -1.7724609375, -1.17236328125, -0.572265625, 0.02783203125, 0.6279296875, 1.22802734375, 1.828125, 2.42822265625, 3.0283203125, 3.62841796875, 4.228515625, 4.82861328125, 5.4287109375, 6.02880859375, 6.62890625, 7.22900390625, 7.8291015625, 8.42919921875, 9.029296875, 9.62939453125, 10.2294921875, 10.82958984375, 11.4296875, 12.02978515625, 12.6298828125, 13.22998046875, 13.830078125, 14.43017578125, 15.0302734375, 15.63037109375, 16.23046875, 16.83056640625, 17.4306640625, 18.03076171875, 18.630859375, 19.23095703125, 19.8310546875, 20.43115234375, 21.03125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 3.0, 3.0, 7.0, 15.0, 15.0, 20.0, 45.0, 30.0, 34.0, 46.0, 41.0, 49.0, 53.0, 64.0, 66.0, 80.0, 67.0, 61.0, 55.0, 40.0, 40.0, 37.0, 31.0, 39.0, 15.0, 15.0, 13.0, 6.0, 9.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8203125, -6.556640625, -6.29296875, -6.029296875, -5.765625, -5.501953125, -5.23828125, -4.974609375, -4.7109375, -4.447265625, -4.18359375, -3.919921875, -3.65625, -3.392578125, -3.12890625, -2.865234375, -2.6015625, -2.337890625, -2.07421875, -1.810546875, -1.546875, -1.283203125, -1.01953125, -0.755859375, -0.4921875, -0.228515625, 0.03515625, 0.298828125, 0.5625, 0.826171875, 1.08984375, 1.353515625, 1.6171875, 1.880859375, 2.14453125, 2.408203125, 2.671875, 2.935546875, 3.19921875, 3.462890625, 3.7265625, 3.990234375, 4.25390625, 4.517578125, 4.78125, 5.044921875, 5.30859375, 5.572265625, 5.8359375, 6.099609375, 6.36328125, 6.626953125, 6.890625, 7.154296875, 7.41796875, 7.681640625, 7.9453125, 8.208984375, 8.47265625, 8.736328125, 9.0, 9.263671875, 9.52734375, 9.791015625, 10.0546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 4.0, 7.0, 9.0, 21.0, 30.0, 23.0, 45.0, 61.0, 112.0, 173.0, 317.0, 652.0, 1654.0, 6146.0, 65666.0, 894668.0, 69166.0, 6456.0, 1766.0, 689.0, 363.0, 174.0, 119.0, 74.0, 51.0, 33.0, 16.0, 20.0, 9.0, 8.0, 3.0, 6.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.84375, -33.529296875, -32.21484375, -30.900390625, -29.5859375, -28.271484375, -26.95703125, -25.642578125, -24.328125, -23.013671875, -21.69921875, -20.384765625, -19.0703125, -17.755859375, -16.44140625, -15.126953125, -13.8125, -12.498046875, -11.18359375, -9.869140625, -8.5546875, -7.240234375, -5.92578125, -4.611328125, -3.296875, -1.982421875, -0.66796875, 0.646484375, 1.9609375, 3.275390625, 4.58984375, 5.904296875, 7.21875, 8.533203125, 9.84765625, 11.162109375, 12.4765625, 13.791015625, 15.10546875, 16.419921875, 17.734375, 19.048828125, 20.36328125, 21.677734375, 22.9921875, 24.306640625, 25.62109375, 26.935546875, 28.25, 29.564453125, 30.87890625, 32.193359375, 33.5078125, 34.822265625, 36.13671875, 37.451171875, 38.765625, 40.080078125, 41.39453125, 42.708984375, 44.0234375, 45.337890625, 46.65234375, 47.966796875, 49.28125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 5.0, 1.0, 7.0, 7.0, 7.0, 20.0, 23.0, 23.0, 33.0, 42.0, 39.0, 42.0, 58.0, 52.0, 80.0, 64.0, 59.0, 65.0, 54.0, 42.0, 36.0, 50.0, 40.0, 33.0, 31.0, 17.0, 15.0, 13.0, 12.0, 9.0, 7.0, 2.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.203125, -29.157470703125, -28.11181640625, -27.066162109375, -26.0205078125, -24.974853515625, -23.92919921875, -22.883544921875, -21.837890625, -20.792236328125, -19.74658203125, -18.700927734375, -17.6552734375, -16.609619140625, -15.56396484375, -14.518310546875, -13.47265625, -12.427001953125, -11.38134765625, -10.335693359375, -9.2900390625, -8.244384765625, -7.19873046875, -6.153076171875, -5.107421875, -4.061767578125, -3.01611328125, -1.970458984375, -0.9248046875, 0.120849609375, 1.16650390625, 2.212158203125, 3.2578125, 4.303466796875, 5.34912109375, 6.394775390625, 7.4404296875, 8.486083984375, 9.53173828125, 10.577392578125, 11.623046875, 12.668701171875, 13.71435546875, 14.760009765625, 15.8056640625, 16.851318359375, 17.89697265625, 18.942626953125, 19.98828125, 21.033935546875, 22.07958984375, 23.125244140625, 24.1708984375, 25.216552734375, 26.26220703125, 27.307861328125, 28.353515625, 29.399169921875, 30.44482421875, 31.490478515625, 32.5361328125, 33.581787109375, 34.62744140625, 35.673095703125, 36.71875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 7.0, 4.0, 10.0, 10.0, 24.0, 30.0, 48.0, 51.0, 86.0, 142.0, 296.0, 741.0, 2001.0, 8513.0, 80542.0, 879736.0, 65448.0, 7636.0, 1911.0, 633.0, 236.0, 131.0, 96.0, 62.0, 41.0, 34.0, 21.0, 14.0, 6.0, 6.0, 3.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.34375, -13.8729248046875, -13.402099609375, -12.9312744140625, -12.46044921875, -11.9896240234375, -11.518798828125, -11.0479736328125, -10.5771484375, -10.1063232421875, -9.635498046875, -9.1646728515625, -8.69384765625, -8.2230224609375, -7.752197265625, -7.2813720703125, -6.810546875, -6.3397216796875, -5.868896484375, -5.3980712890625, -4.92724609375, -4.4564208984375, -3.985595703125, -3.5147705078125, -3.0439453125, -2.5731201171875, -2.102294921875, -1.6314697265625, -1.16064453125, -0.6898193359375, -0.218994140625, 0.2518310546875, 0.72265625, 1.1934814453125, 1.664306640625, 2.1351318359375, 2.60595703125, 3.0767822265625, 3.547607421875, 4.0184326171875, 4.4892578125, 4.9600830078125, 5.430908203125, 5.9017333984375, 6.37255859375, 6.8433837890625, 7.314208984375, 7.7850341796875, 8.255859375, 8.7266845703125, 9.197509765625, 9.6683349609375, 10.13916015625, 10.6099853515625, 11.080810546875, 11.5516357421875, 12.0224609375, 12.4932861328125, 12.964111328125, 13.4349365234375, 13.90576171875, 14.3765869140625, 14.847412109375, 15.3182373046875, 15.7890625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 10.0, 6.0, 9.0, 6.0, 9.0, 14.0, 18.0, 15.0, 25.0, 28.0, 38.0, 44.0, 58.0, 82.0, 122.0, 111.0, 89.0, 60.0, 43.0, 41.0, 27.0, 31.0, 21.0, 19.0, 8.0, 10.0, 8.0, 5.0, 10.0, 6.0, 6.0, 9.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011005401611328125, -0.0010582506656646729, -0.0010159611701965332, -0.0009736716747283936, -0.0009313821792602539, -0.0008890926837921143, -0.0008468031883239746, -0.000804513692855835, -0.0007622241973876953, -0.0007199347019195557, -0.000677645206451416, -0.0006353557109832764, -0.0005930662155151367, -0.0005507767200469971, -0.0005084872245788574, -0.0004661977291107178, -0.0004239082336425781, -0.0003816187381744385, -0.00033932924270629883, -0.0002970397472381592, -0.00025475025177001953, -0.00021246075630187988, -0.00017017126083374023, -0.00012788176536560059, -8.559226989746094e-05, -4.330277442932129e-05, -1.0132789611816406e-06, 4.127621650695801e-05, 8.356571197509766e-05, 0.0001258552074432373, 0.00016814470291137695, 0.0002104341983795166, 0.00025272369384765625, 0.0002950131893157959, 0.00033730268478393555, 0.0003795921802520752, 0.00042188167572021484, 0.0004641711711883545, 0.0005064606666564941, 0.0005487501621246338, 0.0005910396575927734, 0.0006333291530609131, 0.0006756186485290527, 0.0007179081439971924, 0.000760197639465332, 0.0008024871349334717, 0.0008447766304016113, 0.000887066125869751, 0.0009293556213378906, 0.0009716451168060303, 0.00101393461227417, 0.0010562241077423096, 0.0010985136032104492, 0.0011408030986785889, 0.0011830925941467285, 0.0012253820896148682, 0.0012676715850830078, 0.0013099610805511475, 0.0013522505760192871, 0.0013945400714874268, 0.0014368295669555664, 0.001479119062423706, 0.0015214085578918457, 0.0015636980533599854, 0.001605987548828125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 3.0, 6.0, 7.0, 16.0, 28.0, 51.0, 61.0, 125.0, 231.0, 467.0, 1174.0, 3406.0, 15375.0, 204996.0, 775104.0, 38377.0, 6068.0, 1680.0, 666.0, 321.0, 165.0, 90.0, 54.0, 30.0, 12.0, 7.0, 8.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7109375, -15.2379150390625, -14.764892578125, -14.2918701171875, -13.81884765625, -13.3458251953125, -12.872802734375, -12.3997802734375, -11.9267578125, -11.4537353515625, -10.980712890625, -10.5076904296875, -10.03466796875, -9.5616455078125, -9.088623046875, -8.6156005859375, -8.142578125, -7.6695556640625, -7.196533203125, -6.7235107421875, -6.25048828125, -5.7774658203125, -5.304443359375, -4.8314208984375, -4.3583984375, -3.8853759765625, -3.412353515625, -2.9393310546875, -2.46630859375, -1.9932861328125, -1.520263671875, -1.0472412109375, -0.57421875, -0.1011962890625, 0.371826171875, 0.8448486328125, 1.31787109375, 1.7908935546875, 2.263916015625, 2.7369384765625, 3.2099609375, 3.6829833984375, 4.156005859375, 4.6290283203125, 5.10205078125, 5.5750732421875, 6.048095703125, 6.5211181640625, 6.994140625, 7.4671630859375, 7.940185546875, 8.4132080078125, 8.88623046875, 9.3592529296875, 9.832275390625, 10.3052978515625, 10.7783203125, 11.2513427734375, 11.724365234375, 12.1973876953125, 12.67041015625, 13.1434326171875, 13.616455078125, 14.0894775390625, 14.5625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 9.0, 8.0, 10.0, 23.0, 21.0, 21.0, 25.0, 59.0, 73.0, 89.0, 129.0, 106.0, 91.0, 94.0, 56.0, 35.0, 32.0, 20.0, 18.0, 15.0, 17.0, 5.0, 7.0, 7.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4140625, -10.1021728515625, -9.790283203125, -9.4783935546875, -9.16650390625, -8.8546142578125, -8.542724609375, -8.2308349609375, -7.9189453125, -7.6070556640625, -7.295166015625, -6.9832763671875, -6.67138671875, -6.3594970703125, -6.047607421875, -5.7357177734375, -5.423828125, -5.1119384765625, -4.800048828125, -4.4881591796875, -4.17626953125, -3.8643798828125, -3.552490234375, -3.2406005859375, -2.9287109375, -2.6168212890625, -2.304931640625, -1.9930419921875, -1.68115234375, -1.3692626953125, -1.057373046875, -0.7454833984375, -0.43359375, -0.1217041015625, 0.190185546875, 0.5020751953125, 0.81396484375, 1.1258544921875, 1.437744140625, 1.7496337890625, 2.0615234375, 2.3734130859375, 2.685302734375, 2.9971923828125, 3.30908203125, 3.6209716796875, 3.932861328125, 4.2447509765625, 4.556640625, 4.8685302734375, 5.180419921875, 5.4923095703125, 5.80419921875, 6.1160888671875, 6.427978515625, 6.7398681640625, 7.0517578125, 7.3636474609375, 7.675537109375, 7.9874267578125, 8.29931640625, 8.6112060546875, 8.923095703125, 9.2349853515625, 9.546875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 8.0, 8.0, 15.0, 31.0, 50.0, 102.0, 179.0, 217.0, 164.0, 108.0, 62.0, 26.0, 10.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.73257446289062, -216.55422973632812, -210.37588500976562, -204.19754028320312, -198.01918029785156, -191.84083557128906, -185.66249084472656, -179.48414611816406, -173.3057861328125, -167.12744140625, -160.9490966796875, -154.770751953125, -148.59239196777344, -142.41404724121094, -136.23570251464844, -130.05735778808594, -123.87901306152344, -117.70066833496094, -111.5223159790039, -105.3439712524414, -99.16561889648438, -92.98727416992188, -86.80892944335938, -80.63058471679688, -74.45223236083984, -68.27388763427734, -62.09553527832031, -55.91719055175781, -49.73884201049805, -43.56049346923828, -37.38214874267578, -31.203800201416016, -25.02545166015625, -18.847103118896484, -12.668756484985352, -6.490409851074219, -0.3120613098144531, 5.8662872314453125, 12.044631958007812, 18.222980499267578, 24.401329040527344, 30.57967758178711, 36.758026123046875, 42.936370849609375, 49.11471939086914, 55.293067932128906, 61.471412658691406, 67.64976501464844, 73.82810974121094, 80.00645446777344, 86.18480682373047, 92.36315155029297, 98.54150390625, 104.7198486328125, 110.898193359375, 117.0765380859375, 123.25489044189453, 129.43324279785156, 135.61158752441406, 141.78993225097656, 147.96827697753906, 154.14663696289062, 160.32498168945312, 166.50332641601562, 172.68167114257812]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 3.0, 7.0, 8.0, 8.0, 14.0, 17.0, 23.0, 25.0, 34.0, 47.0, 57.0, 64.0, 74.0, 80.0, 91.0, 81.0, 72.0, 63.0, 44.0, 49.0, 37.0, 32.0, 21.0, 17.0, 14.0, 5.0, 5.0, 3.0, 4.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-206.20257568359375, -201.12625122070312, -196.0499267578125, -190.97360229492188, -185.89727783203125, -180.8209686279297, -175.74464416503906, -170.66831970214844, -165.5919952392578, -160.5156707763672, -155.43934631347656, -150.36302185058594, -145.28671264648438, -140.21038818359375, -135.13406372070312, -130.0577392578125, -124.98141479492188, -119.90509033203125, -114.82876586914062, -109.75244903564453, -104.6761245727539, -99.59980010986328, -94.52348327636719, -89.44715881347656, -84.37083435058594, -79.29450988769531, -74.21818542480469, -69.1418685913086, -64.06554412841797, -58.989219665527344, -53.912899017333984, -48.836578369140625, -43.76025390625, -38.683929443359375, -33.607608795166016, -28.531286239624023, -23.45496368408203, -18.37864112854004, -13.302318572998047, -8.225997924804688, -3.1496734619140625, 1.9266490936279297, 7.002971649169922, 12.079294204711914, 17.155616760253906, 22.2319393157959, 27.30826187133789, 32.38458251953125, 37.460906982421875, 42.5372314453125, 47.61355209350586, 52.68987274169922, 57.766197204589844, 62.84252166748047, 67.91883850097656, 72.99516296386719, 78.07148742675781, 83.14781188964844, 88.22413635253906, 93.30045318603516, 98.37677764892578, 103.4531021118164, 108.5294189453125, 113.60574340820312, 118.68206787109375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 9.0, 7.0, 19.0, 34.0, 40.0, 71.0, 118.0, 206.0, 458.0, 967.0, 2929.0, 11894.0, 140581.0, 3970465.0, 55340.0, 7440.0, 2101.0, 744.0, 349.0, 174.0, 110.0, 73.0, 49.0, 23.0, 23.0, 13.0, 11.0, 11.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.28125, -29.25, -28.21875, -27.1875, -26.15625, -25.125, -24.09375, -23.0625, -22.03125, -21.0, -19.96875, -18.9375, -17.90625, -16.875, -15.84375, -14.8125, -13.78125, -12.75, -11.71875, -10.6875, -9.65625, -8.625, -7.59375, -6.5625, -5.53125, -4.5, -3.46875, -2.4375, -1.40625, -0.375, 0.65625, 1.6875, 2.71875, 3.75, 4.78125, 5.8125, 6.84375, 7.875, 8.90625, 9.9375, 10.96875, 12.0, 13.03125, 14.0625, 15.09375, 16.125, 17.15625, 18.1875, 19.21875, 20.25, 21.28125, 22.3125, 23.34375, 24.375, 25.40625, 26.4375, 27.46875, 28.5, 29.53125, 30.5625, 31.59375, 32.625, 33.65625, 34.6875, 35.71875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 8.0, 9.0, 5.0, 23.0, 24.0, 36.0, 42.0, 60.0, 55.0, 68.0, 68.0, 90.0, 94.0, 85.0, 71.0, 64.0, 56.0, 40.0, 30.0, 20.0, 21.0, 8.0, 8.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-14.2109375, -13.89422607421875, -13.5775146484375, -13.26080322265625, -12.944091796875, -12.62738037109375, -12.3106689453125, -11.99395751953125, -11.67724609375, -11.36053466796875, -11.0438232421875, -10.72711181640625, -10.410400390625, -10.09368896484375, -9.7769775390625, -9.46026611328125, -9.1435546875, -8.82684326171875, -8.5101318359375, -8.19342041015625, -7.876708984375, -7.55999755859375, -7.2432861328125, -6.92657470703125, -6.60986328125, -6.29315185546875, -5.9764404296875, -5.65972900390625, -5.343017578125, -5.02630615234375, -4.7095947265625, -4.39288330078125, -4.076171875, -3.75946044921875, -3.4427490234375, -3.12603759765625, -2.809326171875, -2.49261474609375, -2.1759033203125, -1.85919189453125, -1.54248046875, -1.22576904296875, -0.9090576171875, -0.59234619140625, -0.275634765625, 0.04107666015625, 0.3577880859375, 0.67449951171875, 0.9912109375, 1.30792236328125, 1.6246337890625, 1.94134521484375, 2.258056640625, 2.57476806640625, 2.8914794921875, 3.20819091796875, 3.52490234375, 3.84161376953125, 4.1583251953125, 4.47503662109375, 4.791748046875, 5.10845947265625, 5.4251708984375, 5.74188232421875, 6.05859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 7.0, 4.0, 10.0, 13.0, 21.0, 54.0, 72.0, 138.0, 293.0, 601.0, 1444.0, 4044.0, 12984.0, 60942.0, 2966794.0, 1087368.0, 43231.0, 10255.0, 3404.0, 1391.0, 628.0, 239.0, 158.0, 88.0, 41.0, 20.0, 13.0, 9.0, 6.0, 6.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.0, -22.279296875, -21.55859375, -20.837890625, -20.1171875, -19.396484375, -18.67578125, -17.955078125, -17.234375, -16.513671875, -15.79296875, -15.072265625, -14.3515625, -13.630859375, -12.91015625, -12.189453125, -11.46875, -10.748046875, -10.02734375, -9.306640625, -8.5859375, -7.865234375, -7.14453125, -6.423828125, -5.703125, -4.982421875, -4.26171875, -3.541015625, -2.8203125, -2.099609375, -1.37890625, -0.658203125, 0.0625, 0.783203125, 1.50390625, 2.224609375, 2.9453125, 3.666015625, 4.38671875, 5.107421875, 5.828125, 6.548828125, 7.26953125, 7.990234375, 8.7109375, 9.431640625, 10.15234375, 10.873046875, 11.59375, 12.314453125, 13.03515625, 13.755859375, 14.4765625, 15.197265625, 15.91796875, 16.638671875, 17.359375, 18.080078125, 18.80078125, 19.521484375, 20.2421875, 20.962890625, 21.68359375, 22.404296875, 23.125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 3.0, 2.0, 6.0, 14.0, 13.0, 12.0, 13.0, 22.0, 24.0, 53.0, 65.0, 88.0, 167.0, 360.0, 740.0, 1092.0, 646.0, 321.0, 143.0, 79.0, 62.0, 28.0, 16.0, 26.0, 11.0, 11.0, 12.0, 11.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.6484375, -12.218017578125, -11.78759765625, -11.357177734375, -10.9267578125, -10.496337890625, -10.06591796875, -9.635498046875, -9.205078125, -8.774658203125, -8.34423828125, -7.913818359375, -7.4833984375, -7.052978515625, -6.62255859375, -6.192138671875, -5.76171875, -5.331298828125, -4.90087890625, -4.470458984375, -4.0400390625, -3.609619140625, -3.17919921875, -2.748779296875, -2.318359375, -1.887939453125, -1.45751953125, -1.027099609375, -0.5966796875, -0.166259765625, 0.26416015625, 0.694580078125, 1.125, 1.555419921875, 1.98583984375, 2.416259765625, 2.8466796875, 3.277099609375, 3.70751953125, 4.137939453125, 4.568359375, 4.998779296875, 5.42919921875, 5.859619140625, 6.2900390625, 6.720458984375, 7.15087890625, 7.581298828125, 8.01171875, 8.442138671875, 8.87255859375, 9.302978515625, 9.7333984375, 10.163818359375, 10.59423828125, 11.024658203125, 11.455078125, 11.885498046875, 12.31591796875, 12.746337890625, 13.1767578125, 13.607177734375, 14.03759765625, 14.468017578125, 14.8984375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 10.0, 22.0, 42.0, 66.0, 155.0, 258.0, 211.0, 135.0, 44.0, 26.0, 9.0, 6.0, 3.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-261.2809143066406, -255.47645568847656, -249.6719970703125, -243.86753845214844, -238.06307983398438, -232.25863647460938, -226.45416259765625, -220.64971923828125, -214.8452606201172, -209.04080200195312, -203.23634338378906, -197.431884765625, -191.62742614746094, -185.82296752929688, -180.01852416992188, -174.2140655517578, -168.40960693359375, -162.6051483154297, -156.80068969726562, -150.99623107910156, -145.1917724609375, -139.3873291015625, -133.58285522460938, -127.77841186523438, -121.97393798828125, -116.16947937011719, -110.36502075195312, -104.56056213378906, -98.75611114501953, -92.95165252685547, -87.1471939086914, -81.34274291992188, -75.53828430175781, -69.73382568359375, -63.92937088012695, -58.12491226196289, -52.320457458496094, -46.51599884033203, -40.71154022216797, -34.90708541870117, -29.10262680053711, -23.29817008972168, -17.49371337890625, -11.689254760742188, -5.884798049926758, -0.08034133911132812, 5.724117279052734, 11.528572082519531, 17.333030700683594, 23.137487411499023, 28.941944122314453, 34.746402740478516, 40.55085754394531, 46.355316162109375, 52.15977478027344, 57.964229583740234, 63.7686882019043, 69.5731430053711, 75.37760162353516, 81.18206024169922, 86.98651885986328, 92.79096984863281, 98.59542846679688, 104.39988708496094, 110.204345703125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 7.0, 7.0, 11.0, 10.0, 19.0, 23.0, 15.0, 25.0, 25.0, 43.0, 40.0, 41.0, 45.0, 62.0, 48.0, 58.0, 51.0, 55.0, 46.0, 46.0, 48.0, 47.0, 32.0, 31.0, 30.0, 25.0, 18.0, 17.0, 15.0, 15.0, 7.0, 6.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.83555603027344, -48.87010955810547, -46.904666900634766, -44.9392204284668, -42.973777770996094, -41.008331298828125, -39.042884826660156, -37.07744216918945, -35.111995697021484, -33.146549224853516, -31.181106567382812, -29.215660095214844, -27.250215530395508, -25.284770965576172, -23.319326400756836, -21.3538818359375, -19.388437271118164, -17.422992706298828, -15.457547187805176, -13.49210262298584, -11.526657104492188, -9.561212539672852, -7.595767974853516, -5.630322456359863, -3.6648778915405273, -1.6994329690933228, 0.26601195335388184, 2.231456756591797, 4.196901798248291, 6.162346839904785, 8.127791404724121, 10.093236923217773, 12.05868148803711, 14.024126052856445, 15.989571571350098, 17.95501708984375, 19.920461654663086, 21.885906219482422, 23.851350784301758, 25.816795349121094, 27.782241821289062, 29.7476863861084, 31.713130950927734, 33.6785774230957, 35.644020080566406, 37.609466552734375, 39.574913024902344, 41.54035568237305, 43.50579833984375, 45.47124481201172, 47.43668746948242, 49.40213394165039, 51.367576599121094, 53.33302307128906, 55.29846954345703, 57.263912200927734, 59.2293586730957, 61.19480514526367, 63.160247802734375, 65.12569427490234, 67.09114074707031, 69.05657958984375, 71.02202606201172, 72.98747253417969, 74.95291900634766]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 10.0, 9.0, 13.0, 14.0, 35.0, 42.0, 71.0, 101.0, 164.0, 237.0, 364.0, 633.0, 1159.0, 2017.0, 3926.0, 8150.0, 18284.0, 47478.0, 147117.0, 446995.0, 249752.0, 73039.0, 26518.0, 11097.0, 5199.0, 2657.0, 1408.0, 761.0, 449.0, 291.0, 185.0, 104.0, 82.0, 55.0, 33.0, 31.0, 20.0, 13.0, 14.0, 5.0, 1.0, 4.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-14.6171875, -14.1834716796875, -13.749755859375, -13.3160400390625, -12.88232421875, -12.4486083984375, -12.014892578125, -11.5811767578125, -11.1474609375, -10.7137451171875, -10.280029296875, -9.8463134765625, -9.41259765625, -8.9788818359375, -8.545166015625, -8.1114501953125, -7.677734375, -7.2440185546875, -6.810302734375, -6.3765869140625, -5.94287109375, -5.5091552734375, -5.075439453125, -4.6417236328125, -4.2080078125, -3.7742919921875, -3.340576171875, -2.9068603515625, -2.47314453125, -2.0394287109375, -1.605712890625, -1.1719970703125, -0.73828125, -0.3045654296875, 0.129150390625, 0.5628662109375, 0.99658203125, 1.4302978515625, 1.864013671875, 2.2977294921875, 2.7314453125, 3.1651611328125, 3.598876953125, 4.0325927734375, 4.46630859375, 4.9000244140625, 5.333740234375, 5.7674560546875, 6.201171875, 6.6348876953125, 7.068603515625, 7.5023193359375, 7.93603515625, 8.3697509765625, 8.803466796875, 9.2371826171875, 9.6708984375, 10.1046142578125, 10.538330078125, 10.9720458984375, 11.40576171875, 11.8394775390625, 12.273193359375, 12.7069091796875, 13.140625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 9.0, 13.0, 16.0, 12.0, 17.0, 25.0, 22.0, 29.0, 21.0, 44.0, 35.0, 40.0, 43.0, 44.0, 58.0, 51.0, 45.0, 66.0, 46.0, 50.0, 44.0, 54.0, 38.0, 27.0, 24.0, 23.0, 17.0, 14.0, 13.0, 10.0, 9.0, 4.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.85546875, -6.65728759765625, -6.4591064453125, -6.26092529296875, -6.062744140625, -5.86456298828125, -5.6663818359375, -5.46820068359375, -5.27001953125, -5.07183837890625, -4.8736572265625, -4.67547607421875, -4.477294921875, -4.27911376953125, -4.0809326171875, -3.88275146484375, -3.6845703125, -3.48638916015625, -3.2882080078125, -3.09002685546875, -2.891845703125, -2.69366455078125, -2.4954833984375, -2.29730224609375, -2.09912109375, -1.90093994140625, -1.7027587890625, -1.50457763671875, -1.306396484375, -1.10821533203125, -0.9100341796875, -0.71185302734375, -0.513671875, -0.31549072265625, -0.1173095703125, 0.08087158203125, 0.279052734375, 0.47723388671875, 0.6754150390625, 0.87359619140625, 1.07177734375, 1.26995849609375, 1.4681396484375, 1.66632080078125, 1.864501953125, 2.06268310546875, 2.2608642578125, 2.45904541015625, 2.6572265625, 2.85540771484375, 3.0535888671875, 3.25177001953125, 3.449951171875, 3.64813232421875, 3.8463134765625, 4.04449462890625, 4.24267578125, 4.44085693359375, 4.6390380859375, 4.83721923828125, 5.035400390625, 5.23358154296875, 5.4317626953125, 5.62994384765625, 5.828125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 5.0, 20.0, 18.0, 21.0, 37.0, 31.0, 47.0, 54.0, 102.0, 144.0, 235.0, 375.0, 615.0, 1207.0, 2851.0, 7666.0, 27542.0, 134999.0, 675531.0, 152526.0, 30094.0, 8316.0, 3021.0, 1257.0, 656.0, 377.0, 236.0, 138.0, 97.0, 89.0, 55.0, 47.0, 23.0, 27.0, 23.0, 13.0, 16.0, 5.0, 6.0, 2.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.8125, -17.188232421875, -16.56396484375, -15.939697265625, -15.3154296875, -14.691162109375, -14.06689453125, -13.442626953125, -12.818359375, -12.194091796875, -11.56982421875, -10.945556640625, -10.3212890625, -9.697021484375, -9.07275390625, -8.448486328125, -7.82421875, -7.199951171875, -6.57568359375, -5.951416015625, -5.3271484375, -4.702880859375, -4.07861328125, -3.454345703125, -2.830078125, -2.205810546875, -1.58154296875, -0.957275390625, -0.3330078125, 0.291259765625, 0.91552734375, 1.539794921875, 2.1640625, 2.788330078125, 3.41259765625, 4.036865234375, 4.6611328125, 5.285400390625, 5.90966796875, 6.533935546875, 7.158203125, 7.782470703125, 8.40673828125, 9.031005859375, 9.6552734375, 10.279541015625, 10.90380859375, 11.528076171875, 12.15234375, 12.776611328125, 13.40087890625, 14.025146484375, 14.6494140625, 15.273681640625, 15.89794921875, 16.522216796875, 17.146484375, 17.770751953125, 18.39501953125, 19.019287109375, 19.6435546875, 20.267822265625, 20.89208984375, 21.516357421875, 22.140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 3.0, 14.0, 7.0, 13.0, 9.0, 15.0, 16.0, 19.0, 18.0, 29.0, 22.0, 28.0, 32.0, 42.0, 42.0, 43.0, 51.0, 45.0, 59.0, 59.0, 44.0, 46.0, 34.0, 43.0, 32.0, 28.0, 30.0, 26.0, 17.0, 15.0, 18.0, 18.0, 16.0, 9.0, 7.0, 9.0, 4.0, 5.0, 11.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-21.421875, -20.7216796875, -20.021484375, -19.3212890625, -18.62109375, -17.9208984375, -17.220703125, -16.5205078125, -15.8203125, -15.1201171875, -14.419921875, -13.7197265625, -13.01953125, -12.3193359375, -11.619140625, -10.9189453125, -10.21875, -9.5185546875, -8.818359375, -8.1181640625, -7.41796875, -6.7177734375, -6.017578125, -5.3173828125, -4.6171875, -3.9169921875, -3.216796875, -2.5166015625, -1.81640625, -1.1162109375, -0.416015625, 0.2841796875, 0.984375, 1.6845703125, 2.384765625, 3.0849609375, 3.78515625, 4.4853515625, 5.185546875, 5.8857421875, 6.5859375, 7.2861328125, 7.986328125, 8.6865234375, 9.38671875, 10.0869140625, 10.787109375, 11.4873046875, 12.1875, 12.8876953125, 13.587890625, 14.2880859375, 14.98828125, 15.6884765625, 16.388671875, 17.0888671875, 17.7890625, 18.4892578125, 19.189453125, 19.8896484375, 20.58984375, 21.2900390625, 21.990234375, 22.6904296875, 23.390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 9.0, 12.0, 27.0, 52.0, 152.0, 564.0, 3288.0, 144580.0, 888656.0, 9858.0, 960.0, 225.0, 73.0, 40.0, 23.0, 12.0, 9.0, 5.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.578125, -21.8046875, -21.03125, -20.2578125, -19.484375, -18.7109375, -17.9375, -17.1640625, -16.390625, -15.6171875, -14.84375, -14.0703125, -13.296875, -12.5234375, -11.75, -10.9765625, -10.203125, -9.4296875, -8.65625, -7.8828125, -7.109375, -6.3359375, -5.5625, -4.7890625, -4.015625, -3.2421875, -2.46875, -1.6953125, -0.921875, -0.1484375, 0.625, 1.3984375, 2.171875, 2.9453125, 3.71875, 4.4921875, 5.265625, 6.0390625, 6.8125, 7.5859375, 8.359375, 9.1328125, 9.90625, 10.6796875, 11.453125, 12.2265625, 13.0, 13.7734375, 14.546875, 15.3203125, 16.09375, 16.8671875, 17.640625, 18.4140625, 19.1875, 19.9609375, 20.734375, 21.5078125, 22.28125, 23.0546875, 23.828125, 24.6015625, 25.375, 26.1484375, 26.921875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 4.0, 5.0, 6.0, 16.0, 18.0, 21.0, 36.0, 69.0, 138.0, 253.0, 191.0, 102.0, 57.0, 23.0, 19.0, 11.0, 9.0, 7.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0031261444091796875, -0.003033250570297241, -0.002940356731414795, -0.0028474628925323486, -0.0027545690536499023, -0.002661675214767456, -0.0025687813758850098, -0.0024758875370025635, -0.002382993698120117, -0.002290099859237671, -0.0021972060203552246, -0.0021043121814727783, -0.002011418342590332, -0.0019185245037078857, -0.0018256306648254395, -0.0017327368259429932, -0.0016398429870605469, -0.0015469491481781006, -0.0014540553092956543, -0.001361161470413208, -0.0012682676315307617, -0.0011753737926483154, -0.0010824799537658691, -0.0009895861148834229, -0.0008966922760009766, -0.0008037984371185303, -0.000710904598236084, -0.0006180107593536377, -0.0005251169204711914, -0.0004322230815887451, -0.00033932924270629883, -0.00024643540382385254, -0.00015354156494140625, -6.064772605895996e-05, 3.224611282348633e-05, 0.00012513995170593262, 0.0002180337905883789, 0.0003109276294708252, 0.0004038214683532715, 0.0004967153072357178, 0.0005896091461181641, 0.0006825029850006104, 0.0007753968238830566, 0.0008682906627655029, 0.0009611845016479492, 0.0010540783405303955, 0.0011469721794128418, 0.001239866018295288, 0.0013327598571777344, 0.0014256536960601807, 0.001518547534942627, 0.0016114413738250732, 0.0017043352127075195, 0.0017972290515899658, 0.0018901228904724121, 0.0019830167293548584, 0.0020759105682373047, 0.002168804407119751, 0.0022616982460021973, 0.0023545920848846436, 0.00244748592376709, 0.002540379762649536, 0.0026332736015319824, 0.0027261674404144287, 0.002819061279296875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 15.0, 9.0, 4.0, 19.0, 24.0, 31.0, 68.0, 119.0, 222.0, 568.0, 1451.0, 5218.0, 35020.0, 702531.0, 279887.0, 18034.0, 3418.0, 1047.0, 423.0, 188.0, 103.0, 55.0, 38.0, 19.0, 9.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.25, -12.833984375, -12.41796875, -12.001953125, -11.5859375, -11.169921875, -10.75390625, -10.337890625, -9.921875, -9.505859375, -9.08984375, -8.673828125, -8.2578125, -7.841796875, -7.42578125, -7.009765625, -6.59375, -6.177734375, -5.76171875, -5.345703125, -4.9296875, -4.513671875, -4.09765625, -3.681640625, -3.265625, -2.849609375, -2.43359375, -2.017578125, -1.6015625, -1.185546875, -0.76953125, -0.353515625, 0.0625, 0.478515625, 0.89453125, 1.310546875, 1.7265625, 2.142578125, 2.55859375, 2.974609375, 3.390625, 3.806640625, 4.22265625, 4.638671875, 5.0546875, 5.470703125, 5.88671875, 6.302734375, 6.71875, 7.134765625, 7.55078125, 7.966796875, 8.3828125, 8.798828125, 9.21484375, 9.630859375, 10.046875, 10.462890625, 10.87890625, 11.294921875, 11.7109375, 12.126953125, 12.54296875, 12.958984375, 13.375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 6.0, 2.0, 5.0, 7.0, 12.0, 25.0, 32.0, 43.0, 64.0, 96.0, 148.0, 151.0, 136.0, 98.0, 67.0, 40.0, 25.0, 21.0, 11.0, 9.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.96875, -10.5521240234375, -10.135498046875, -9.7188720703125, -9.30224609375, -8.8856201171875, -8.468994140625, -8.0523681640625, -7.6357421875, -7.2191162109375, -6.802490234375, -6.3858642578125, -5.96923828125, -5.5526123046875, -5.135986328125, -4.7193603515625, -4.302734375, -3.8861083984375, -3.469482421875, -3.0528564453125, -2.63623046875, -2.2196044921875, -1.802978515625, -1.3863525390625, -0.9697265625, -0.5531005859375, -0.136474609375, 0.2801513671875, 0.69677734375, 1.1134033203125, 1.530029296875, 1.9466552734375, 2.36328125, 2.7799072265625, 3.196533203125, 3.6131591796875, 4.02978515625, 4.4464111328125, 4.863037109375, 5.2796630859375, 5.6962890625, 6.1129150390625, 6.529541015625, 6.9461669921875, 7.36279296875, 7.7794189453125, 8.196044921875, 8.6126708984375, 9.029296875, 9.4459228515625, 9.862548828125, 10.2791748046875, 10.69580078125, 11.1124267578125, 11.529052734375, 11.9456787109375, 12.3623046875, 12.7789306640625, 13.195556640625, 13.6121826171875, 14.02880859375, 14.4454345703125, 14.862060546875, 15.2786865234375, 15.6953125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 0.0, 6.0, 5.0, 11.0, 6.0, 36.0, 90.0, 140.0, 300.0, 236.0, 106.0, 46.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-352.2567138671875, -344.4075927734375, -336.5585021972656, -328.7093811035156, -320.86029052734375, -313.01116943359375, -305.1620788574219, -297.3129577636719, -289.4638671875, -281.61474609375, -273.7656555175781, -265.9165344238281, -258.06744384765625, -250.2183380126953, -242.36923217773438, -234.52012634277344, -226.6710205078125, -218.82191467285156, -210.97280883789062, -203.1237030029297, -195.27459716796875, -187.4254913330078, -179.57638549804688, -171.72727966308594, -163.87815856933594, -156.029052734375, -148.17994689941406, -140.33084106445312, -132.4817352294922, -124.63262939453125, -116.78352355957031, -108.93441772460938, -101.08531188964844, -93.2362060546875, -85.38710021972656, -77.53799438476562, -69.68888854980469, -61.839778900146484, -53.99067306518555, -46.14156723022461, -38.29246139526367, -30.443355560302734, -22.594249725341797, -14.745141983032227, -6.896036148071289, 0.9530715942382812, 8.802177429199219, 16.651283264160156, 24.500389099121094, 32.34949493408203, 40.19860076904297, 48.047706604003906, 55.896812438964844, 63.74592208862305, 71.59503173828125, 79.44413757324219, 87.29324340820312, 95.14234924316406, 102.991455078125, 110.84056091308594, 118.68966674804688, 126.53877258300781, 134.38787841796875, 142.2369842529297, 150.08609008789062]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 11.0, 12.0, 21.0, 22.0, 24.0, 25.0, 41.0, 50.0, 56.0, 72.0, 81.0, 97.0, 76.0, 65.0, 59.0, 62.0, 49.0, 40.0, 30.0, 27.0, 14.0, 18.0, 12.0, 9.0, 12.0, 2.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.99954223632812, -118.40872955322266, -113.81791687011719, -109.22710418701172, -104.63629150390625, -100.04547882080078, -95.45466613769531, -90.86386108398438, -86.27304077148438, -81.6822280883789, -77.09141540527344, -72.50060272216797, -67.9097900390625, -63.31897735595703, -58.72816848754883, -54.13735580444336, -49.546546936035156, -44.95573425292969, -40.36492156982422, -35.77410888671875, -31.183298110961914, -26.592485427856445, -22.00167465209961, -17.41086196899414, -12.820049285888672, -8.229236602783203, -3.638424873352051, 0.9523868560791016, 5.54319953918457, 10.134012222290039, 14.724822998046875, 19.315635681152344, 23.906448364257812, 28.49726104736328, 33.08807373046875, 37.67888641357422, 42.26969909667969, 46.860511779785156, 51.45132064819336, 56.04213333129883, 60.6329460144043, 65.2237548828125, 69.81456756591797, 74.40538024902344, 78.9961929321289, 83.58700561523438, 88.17781829833984, 92.76863098144531, 97.35944366455078, 101.95025634765625, 106.54106903076172, 111.13188171386719, 115.72269439697266, 120.31350708007812, 124.90431213378906, 129.49513244628906, 134.0859375, 138.67674255371094, 143.26756286621094, 147.85836791992188, 152.44918823242188, 157.0399932861328, 161.6308135986328, 166.22161865234375, 170.81243896484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 10.0, 21.0, 30.0, 41.0, 87.0, 134.0, 212.0, 401.0, 767.0, 1267.0, 2537.0, 5197.0, 11541.0, 30937.0, 123526.0, 1876090.0, 1962731.0, 127095.0, 30253.0, 10822.0, 4796.0, 2475.0, 1315.0, 733.0, 445.0, 270.0, 162.0, 112.0, 85.0, 57.0, 30.0, 23.0, 16.0, 18.0, 11.0, 13.0, 6.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59375, -9.1767578125, -8.759765625, -8.3427734375, -7.92578125, -7.5087890625, -7.091796875, -6.6748046875, -6.2578125, -5.8408203125, -5.423828125, -5.0068359375, -4.58984375, -4.1728515625, -3.755859375, -3.3388671875, -2.921875, -2.5048828125, -2.087890625, -1.6708984375, -1.25390625, -0.8369140625, -0.419921875, -0.0029296875, 0.4140625, 0.8310546875, 1.248046875, 1.6650390625, 2.08203125, 2.4990234375, 2.916015625, 3.3330078125, 3.75, 4.1669921875, 4.583984375, 5.0009765625, 5.41796875, 5.8349609375, 6.251953125, 6.6689453125, 7.0859375, 7.5029296875, 7.919921875, 8.3369140625, 8.75390625, 9.1708984375, 9.587890625, 10.0048828125, 10.421875, 10.8388671875, 11.255859375, 11.6728515625, 12.08984375, 12.5068359375, 12.923828125, 13.3408203125, 13.7578125, 14.1748046875, 14.591796875, 15.0087890625, 15.42578125, 15.8427734375, 16.259765625, 16.6767578125, 17.09375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 17.0, 24.0, 32.0, 45.0, 49.0, 87.0, 80.0, 108.0, 122.0, 91.0, 96.0, 63.0, 67.0, 40.0, 22.0, 23.0, 16.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.90234375, -6.54803466796875, -6.1937255859375, -5.83941650390625, -5.485107421875, -5.13079833984375, -4.7764892578125, -4.42218017578125, -4.06787109375, -3.71356201171875, -3.3592529296875, -3.00494384765625, -2.650634765625, -2.29632568359375, -1.9420166015625, -1.58770751953125, -1.2333984375, -0.87908935546875, -0.5247802734375, -0.17047119140625, 0.183837890625, 0.53814697265625, 0.8924560546875, 1.24676513671875, 1.60107421875, 1.95538330078125, 2.3096923828125, 2.66400146484375, 3.018310546875, 3.37261962890625, 3.7269287109375, 4.08123779296875, 4.435546875, 4.78985595703125, 5.1441650390625, 5.49847412109375, 5.852783203125, 6.20709228515625, 6.5614013671875, 6.91571044921875, 7.27001953125, 7.62432861328125, 7.9786376953125, 8.33294677734375, 8.687255859375, 9.04156494140625, 9.3958740234375, 9.75018310546875, 10.1044921875, 10.45880126953125, 10.8131103515625, 11.16741943359375, 11.521728515625, 11.87603759765625, 12.2303466796875, 12.58465576171875, 12.93896484375, 13.29327392578125, 13.6475830078125, 14.00189208984375, 14.356201171875, 14.71051025390625, 15.0648193359375, 15.41912841796875, 15.7734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 6.0, 7.0, 8.0, 15.0, 16.0, 18.0, 36.0, 75.0, 152.0, 394.0, 1135.0, 3930.0, 18790.0, 223679.0, 3811652.0, 116652.0, 13351.0, 2876.0, 858.0, 329.0, 130.0, 60.0, 37.0, 19.0, 9.0, 15.0, 5.0, 4.0, 3.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.40625, -31.49072265625, -30.5751953125, -29.65966796875, -28.744140625, -27.82861328125, -26.9130859375, -25.99755859375, -25.08203125, -24.16650390625, -23.2509765625, -22.33544921875, -21.419921875, -20.50439453125, -19.5888671875, -18.67333984375, -17.7578125, -16.84228515625, -15.9267578125, -15.01123046875, -14.095703125, -13.18017578125, -12.2646484375, -11.34912109375, -10.43359375, -9.51806640625, -8.6025390625, -7.68701171875, -6.771484375, -5.85595703125, -4.9404296875, -4.02490234375, -3.109375, -2.19384765625, -1.2783203125, -0.36279296875, 0.552734375, 1.46826171875, 2.3837890625, 3.29931640625, 4.21484375, 5.13037109375, 6.0458984375, 6.96142578125, 7.876953125, 8.79248046875, 9.7080078125, 10.62353515625, 11.5390625, 12.45458984375, 13.3701171875, 14.28564453125, 15.201171875, 16.11669921875, 17.0322265625, 17.94775390625, 18.86328125, 19.77880859375, 20.6943359375, 21.60986328125, 22.525390625, 23.44091796875, 24.3564453125, 25.27197265625, 26.1875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 7.0, 6.0, 10.0, 6.0, 11.0, 16.0, 26.0, 28.0, 38.0, 50.0, 70.0, 109.0, 156.0, 323.0, 622.0, 999.0, 698.0, 308.0, 175.0, 119.0, 74.0, 69.0, 40.0, 17.0, 28.0, 16.0, 17.0, 7.0, 11.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.015625, -15.491455078125, -14.96728515625, -14.443115234375, -13.9189453125, -13.394775390625, -12.87060546875, -12.346435546875, -11.822265625, -11.298095703125, -10.77392578125, -10.249755859375, -9.7255859375, -9.201416015625, -8.67724609375, -8.153076171875, -7.62890625, -7.104736328125, -6.58056640625, -6.056396484375, -5.5322265625, -5.008056640625, -4.48388671875, -3.959716796875, -3.435546875, -2.911376953125, -2.38720703125, -1.863037109375, -1.3388671875, -0.814697265625, -0.29052734375, 0.233642578125, 0.7578125, 1.281982421875, 1.80615234375, 2.330322265625, 2.8544921875, 3.378662109375, 3.90283203125, 4.427001953125, 4.951171875, 5.475341796875, 5.99951171875, 6.523681640625, 7.0478515625, 7.572021484375, 8.09619140625, 8.620361328125, 9.14453125, 9.668701171875, 10.19287109375, 10.717041015625, 11.2412109375, 11.765380859375, 12.28955078125, 12.813720703125, 13.337890625, 13.862060546875, 14.38623046875, 14.910400390625, 15.4345703125, 15.958740234375, 16.48291015625, 17.007080078125, 17.53125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 5.0, 15.0, 26.0, 39.0, 74.0, 133.0, 178.0, 184.0, 145.0, 87.0, 49.0, 20.0, 16.0, 9.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-185.03176879882812, -179.73724365234375, -174.44273376464844, -169.14820861816406, -163.85369873046875, -158.55917358398438, -153.2646484375, -147.9701385498047, -142.6756134033203, -137.38108825683594, -132.08657836914062, -126.79205322265625, -121.4975357055664, -116.20301818847656, -110.90850067138672, -105.61398315429688, -100.31946563720703, -95.02494812011719, -89.73043060302734, -84.4359130859375, -79.14138793945312, -73.84687042236328, -68.55235290527344, -63.25783157348633, -57.963314056396484, -52.66879653930664, -47.37427520751953, -42.07975769042969, -36.785240173339844, -31.490718841552734, -26.19620132446289, -20.90167999267578, -15.607162475585938, -10.312643051147461, -5.018124580383301, 0.2763938903808594, 5.570913314819336, 10.865432739257812, 16.159950256347656, 21.454471588134766, 26.74898910522461, 32.04350662231445, 37.33802795410156, 42.632545471191406, 47.92706298828125, 53.22158432006836, 58.5161018371582, 63.81062316894531, 69.10514068603516, 74.399658203125, 79.69417572021484, 84.98869323730469, 90.28321838378906, 95.5777359008789, 100.87225341796875, 106.16677856445312, 111.46128845214844, 116.75580596923828, 122.05032348632812, 127.3448486328125, 132.6393585205078, 137.9338836669922, 143.2283935546875, 148.52291870117188, 153.81744384765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 10.0, 17.0, 21.0, 40.0, 32.0, 48.0, 42.0, 66.0, 75.0, 75.0, 92.0, 78.0, 77.0, 67.0, 55.0, 57.0, 37.0, 33.0, 23.0, 13.0, 16.0, 7.0, 10.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.98085021972656, -152.24644470214844, -148.5120391845703, -144.7776336669922, -141.04322814941406, -137.30882263183594, -133.5744171142578, -129.8400115966797, -126.10560607910156, -122.37120056152344, -118.63679504394531, -114.90238952636719, -111.16798400878906, -107.43357849121094, -103.69917297363281, -99.96476745605469, -96.2303695678711, -92.49596405029297, -88.76155853271484, -85.02715301513672, -81.2927474975586, -77.55834197998047, -73.82394409179688, -70.08953857421875, -66.35513305664062, -62.6207275390625, -58.886322021484375, -55.15191650390625, -51.417510986328125, -47.68310546875, -43.94870376586914, -40.214298248291016, -36.479896545410156, -32.74549102783203, -29.011085510253906, -25.276681900024414, -21.54227638244629, -17.807870864868164, -14.073467254638672, -10.339061737060547, -6.604656219482422, -2.870251178741455, 0.8641538619995117, 4.59855842590332, 8.332963943481445, 12.06736946105957, 15.801773071289062, 19.536178588867188, 23.270584106445312, 27.004989624023438, 30.739395141601562, 34.47380065917969, 38.20820617675781, 41.94261169433594, 45.6770133972168, 49.41141891479492, 53.14582443237305, 56.88022994995117, 60.6146354675293, 64.34903717041016, 68.08344268798828, 71.8178482055664, 75.55225372314453, 79.28665924072266, 83.02106475830078]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 8.0, 7.0, 12.0, 30.0, 31.0, 46.0, 80.0, 144.0, 223.0, 447.0, 764.0, 1741.0, 4221.0, 12233.0, 42061.0, 160038.0, 491133.0, 244939.0, 62792.0, 17496.0, 5732.0, 2183.0, 985.0, 503.0, 281.0, 167.0, 83.0, 55.0, 33.0, 16.0, 21.0, 15.0, 11.0, 6.0, 5.0, 1.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6328125, -15.138916015625, -14.64501953125, -14.151123046875, -13.6572265625, -13.163330078125, -12.66943359375, -12.175537109375, -11.681640625, -11.187744140625, -10.69384765625, -10.199951171875, -9.7060546875, -9.212158203125, -8.71826171875, -8.224365234375, -7.73046875, -7.236572265625, -6.74267578125, -6.248779296875, -5.7548828125, -5.260986328125, -4.76708984375, -4.273193359375, -3.779296875, -3.285400390625, -2.79150390625, -2.297607421875, -1.8037109375, -1.309814453125, -0.81591796875, -0.322021484375, 0.171875, 0.665771484375, 1.15966796875, 1.653564453125, 2.1474609375, 2.641357421875, 3.13525390625, 3.629150390625, 4.123046875, 4.616943359375, 5.11083984375, 5.604736328125, 6.0986328125, 6.592529296875, 7.08642578125, 7.580322265625, 8.07421875, 8.568115234375, 9.06201171875, 9.555908203125, 10.0498046875, 10.543701171875, 11.03759765625, 11.531494140625, 12.025390625, 12.519287109375, 13.01318359375, 13.507080078125, 14.0009765625, 14.494873046875, 14.98876953125, 15.482666015625, 15.9765625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 8.0, 4.0, 15.0, 13.0, 10.0, 24.0, 22.0, 25.0, 25.0, 49.0, 44.0, 45.0, 37.0, 55.0, 42.0, 61.0, 42.0, 64.0, 50.0, 47.0, 57.0, 39.0, 37.0, 33.0, 31.0, 26.0, 20.0, 16.0, 11.0, 6.0, 9.0, 6.0, 8.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.8828125, -6.69757080078125, -6.5123291015625, -6.32708740234375, -6.141845703125, -5.95660400390625, -5.7713623046875, -5.58612060546875, -5.40087890625, -5.21563720703125, -5.0303955078125, -4.84515380859375, -4.659912109375, -4.47467041015625, -4.2894287109375, -4.10418701171875, -3.9189453125, -3.73370361328125, -3.5484619140625, -3.36322021484375, -3.177978515625, -2.99273681640625, -2.8074951171875, -2.62225341796875, -2.43701171875, -2.25177001953125, -2.0665283203125, -1.88128662109375, -1.696044921875, -1.51080322265625, -1.3255615234375, -1.14031982421875, -0.955078125, -0.76983642578125, -0.5845947265625, -0.39935302734375, -0.214111328125, -0.02886962890625, 0.1563720703125, 0.34161376953125, 0.52685546875, 0.71209716796875, 0.8973388671875, 1.08258056640625, 1.267822265625, 1.45306396484375, 1.6383056640625, 1.82354736328125, 2.0087890625, 2.19403076171875, 2.3792724609375, 2.56451416015625, 2.749755859375, 2.93499755859375, 3.1202392578125, 3.30548095703125, 3.49072265625, 3.67596435546875, 3.8612060546875, 4.04644775390625, 4.231689453125, 4.41693115234375, 4.6021728515625, 4.78741455078125, 4.97265625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 7.0, 10.0, 11.0, 13.0, 29.0, 29.0, 50.0, 51.0, 78.0, 117.0, 202.0, 306.0, 471.0, 730.0, 1200.0, 2272.0, 5707.0, 25398.0, 194499.0, 706200.0, 88739.0, 13915.0, 3968.0, 1774.0, 1007.0, 624.0, 390.0, 265.0, 155.0, 100.0, 60.0, 59.0, 26.0, 38.0, 12.0, 9.0, 10.0, 6.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.21875, -21.53125, -20.84375, -20.15625, -19.46875, -18.78125, -18.09375, -17.40625, -16.71875, -16.03125, -15.34375, -14.65625, -13.96875, -13.28125, -12.59375, -11.90625, -11.21875, -10.53125, -9.84375, -9.15625, -8.46875, -7.78125, -7.09375, -6.40625, -5.71875, -5.03125, -4.34375, -3.65625, -2.96875, -2.28125, -1.59375, -0.90625, -0.21875, 0.46875, 1.15625, 1.84375, 2.53125, 3.21875, 3.90625, 4.59375, 5.28125, 5.96875, 6.65625, 7.34375, 8.03125, 8.71875, 9.40625, 10.09375, 10.78125, 11.46875, 12.15625, 12.84375, 13.53125, 14.21875, 14.90625, 15.59375, 16.28125, 16.96875, 17.65625, 18.34375, 19.03125, 19.71875, 20.40625, 21.09375, 21.78125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 6.0, 4.0, 12.0, 6.0, 13.0, 18.0, 18.0, 14.0, 24.0, 21.0, 23.0, 29.0, 27.0, 44.0, 40.0, 35.0, 35.0, 39.0, 38.0, 40.0, 40.0, 42.0, 44.0, 36.0, 40.0, 31.0, 44.0, 35.0, 27.0, 28.0, 32.0, 21.0, 12.0, 14.0, 15.0, 15.0, 8.0, 3.0, 9.0, 5.0, 2.0, 6.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.6875, -21.031494140625, -20.37548828125, -19.719482421875, -19.0634765625, -18.407470703125, -17.75146484375, -17.095458984375, -16.439453125, -15.783447265625, -15.12744140625, -14.471435546875, -13.8154296875, -13.159423828125, -12.50341796875, -11.847412109375, -11.19140625, -10.535400390625, -9.87939453125, -9.223388671875, -8.5673828125, -7.911376953125, -7.25537109375, -6.599365234375, -5.943359375, -5.287353515625, -4.63134765625, -3.975341796875, -3.3193359375, -2.663330078125, -2.00732421875, -1.351318359375, -0.6953125, -0.039306640625, 0.61669921875, 1.272705078125, 1.9287109375, 2.584716796875, 3.24072265625, 3.896728515625, 4.552734375, 5.208740234375, 5.86474609375, 6.520751953125, 7.1767578125, 7.832763671875, 8.48876953125, 9.144775390625, 9.80078125, 10.456787109375, 11.11279296875, 11.768798828125, 12.4248046875, 13.080810546875, 13.73681640625, 14.392822265625, 15.048828125, 15.704833984375, 16.36083984375, 17.016845703125, 17.6728515625, 18.328857421875, 18.98486328125, 19.640869140625, 20.296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 8.0, 10.0, 23.0, 24.0, 35.0, 53.0, 71.0, 115.0, 245.0, 530.0, 1279.0, 4832.0, 37147.0, 754116.0, 229547.0, 15981.0, 2772.0, 878.0, 385.0, 186.0, 108.0, 67.0, 38.0, 35.0, 22.0, 13.0, 9.0, 6.0, 10.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -9.011962890625, -8.68798828125, -8.364013671875, -8.0400390625, -7.716064453125, -7.39208984375, -7.068115234375, -6.744140625, -6.420166015625, -6.09619140625, -5.772216796875, -5.4482421875, -5.124267578125, -4.80029296875, -4.476318359375, -4.15234375, -3.828369140625, -3.50439453125, -3.180419921875, -2.8564453125, -2.532470703125, -2.20849609375, -1.884521484375, -1.560546875, -1.236572265625, -0.91259765625, -0.588623046875, -0.2646484375, 0.059326171875, 0.38330078125, 0.707275390625, 1.03125, 1.355224609375, 1.67919921875, 2.003173828125, 2.3271484375, 2.651123046875, 2.97509765625, 3.299072265625, 3.623046875, 3.947021484375, 4.27099609375, 4.594970703125, 4.9189453125, 5.242919921875, 5.56689453125, 5.890869140625, 6.21484375, 6.538818359375, 6.86279296875, 7.186767578125, 7.5107421875, 7.834716796875, 8.15869140625, 8.482666015625, 8.806640625, 9.130615234375, 9.45458984375, 9.778564453125, 10.1025390625, 10.426513671875, 10.75048828125, 11.074462890625, 11.3984375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 2.0, 8.0, 5.0, 12.0, 13.0, 13.0, 19.0, 26.0, 28.0, 37.0, 36.0, 60.0, 84.0, 110.0, 111.0, 112.0, 68.0, 50.0, 36.0, 28.0, 37.0, 20.0, 13.0, 11.0, 10.0, 9.0, 7.0, 4.0, 4.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00138092041015625, -0.0013353228569030762, -0.0012897253036499023, -0.0012441277503967285, -0.0011985301971435547, -0.0011529326438903809, -0.001107335090637207, -0.0010617375373840332, -0.0010161399841308594, -0.0009705424308776855, -0.0009249448776245117, -0.0008793473243713379, -0.0008337497711181641, -0.0007881522178649902, -0.0007425546646118164, -0.0006969571113586426, -0.0006513595581054688, -0.0006057620048522949, -0.0005601644515991211, -0.0005145668983459473, -0.00046896934509277344, -0.0004233717918395996, -0.0003777742385864258, -0.00033217668533325195, -0.0002865791320800781, -0.0002409815788269043, -0.00019538402557373047, -0.00014978647232055664, -0.00010418891906738281, -5.8591365814208984e-05, -1.2993812561035156e-05, 3.260374069213867e-05, 7.82012939453125e-05, 0.00012379884719848633, 0.00016939640045166016, 0.00021499395370483398, 0.0002605915069580078, 0.00030618906021118164, 0.00035178661346435547, 0.0003973841667175293, 0.0004429817199707031, 0.000488579273223877, 0.0005341768264770508, 0.0005797743797302246, 0.0006253719329833984, 0.0006709694862365723, 0.0007165670394897461, 0.0007621645927429199, 0.0008077621459960938, 0.0008533596992492676, 0.0008989572525024414, 0.0009445548057556152, 0.000990152359008789, 0.0010357499122619629, 0.0010813474655151367, 0.0011269450187683105, 0.0011725425720214844, 0.0012181401252746582, 0.001263737678527832, 0.0013093352317810059, 0.0013549327850341797, 0.0014005303382873535, 0.0014461278915405273, 0.0014917254447937012, 0.001537322998046875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 9.0, 9.0, 14.0, 22.0, 32.0, 49.0, 73.0, 123.0, 190.0, 335.0, 730.0, 1454.0, 4293.0, 16710.0, 118258.0, 790114.0, 95051.0, 14318.0, 3891.0, 1424.0, 653.0, 315.0, 163.0, 126.0, 73.0, 33.0, 25.0, 18.0, 15.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.1171875, -10.82037353515625, -10.5235595703125, -10.22674560546875, -9.929931640625, -9.63311767578125, -9.3363037109375, -9.03948974609375, -8.74267578125, -8.44586181640625, -8.1490478515625, -7.85223388671875, -7.555419921875, -7.25860595703125, -6.9617919921875, -6.66497802734375, -6.3681640625, -6.07135009765625, -5.7745361328125, -5.47772216796875, -5.180908203125, -4.88409423828125, -4.5872802734375, -4.29046630859375, -3.99365234375, -3.69683837890625, -3.4000244140625, -3.10321044921875, -2.806396484375, -2.50958251953125, -2.2127685546875, -1.91595458984375, -1.619140625, -1.32232666015625, -1.0255126953125, -0.72869873046875, -0.431884765625, -0.13507080078125, 0.1617431640625, 0.45855712890625, 0.75537109375, 1.05218505859375, 1.3489990234375, 1.64581298828125, 1.942626953125, 2.23944091796875, 2.5362548828125, 2.83306884765625, 3.1298828125, 3.42669677734375, 3.7235107421875, 4.02032470703125, 4.317138671875, 4.61395263671875, 4.9107666015625, 5.20758056640625, 5.50439453125, 5.80120849609375, 6.0980224609375, 6.39483642578125, 6.691650390625, 6.98846435546875, 7.2852783203125, 7.58209228515625, 7.87890625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 4.0, 13.0, 22.0, 32.0, 38.0, 50.0, 57.0, 78.0, 106.0, 140.0, 113.0, 98.0, 60.0, 48.0, 46.0, 27.0, 18.0, 17.0, 7.0, 1.0, 2.0, 9.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23828125, -5.96002197265625, -5.6817626953125, -5.40350341796875, -5.125244140625, -4.84698486328125, -4.5687255859375, -4.29046630859375, -4.01220703125, -3.73394775390625, -3.4556884765625, -3.17742919921875, -2.899169921875, -2.62091064453125, -2.3426513671875, -2.06439208984375, -1.7861328125, -1.50787353515625, -1.2296142578125, -0.95135498046875, -0.673095703125, -0.39483642578125, -0.1165771484375, 0.16168212890625, 0.43994140625, 0.71820068359375, 0.9964599609375, 1.27471923828125, 1.552978515625, 1.83123779296875, 2.1094970703125, 2.38775634765625, 2.666015625, 2.94427490234375, 3.2225341796875, 3.50079345703125, 3.779052734375, 4.05731201171875, 4.3355712890625, 4.61383056640625, 4.89208984375, 5.17034912109375, 5.4486083984375, 5.72686767578125, 6.005126953125, 6.28338623046875, 6.5616455078125, 6.83990478515625, 7.1181640625, 7.39642333984375, 7.6746826171875, 7.95294189453125, 8.231201171875, 8.50946044921875, 8.7877197265625, 9.06597900390625, 9.34423828125, 9.62249755859375, 9.9007568359375, 10.17901611328125, 10.457275390625, 10.73553466796875, 11.0137939453125, 11.29205322265625, 11.5703125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 1.0, 6.0, 9.0, 17.0, 39.0, 90.0, 207.0, 306.0, 194.0, 68.0, 33.0, 18.0, 5.0, 4.0, 0.0, 1.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.74072265625, -131.2911376953125, -124.84156799316406, -118.39198303222656, -111.9424057006836, -105.49282836914062, -99.04324340820312, -92.59366607666016, -86.14408874511719, -79.69451141357422, -73.24493408203125, -66.79534912109375, -60.34577178955078, -53.89619445800781, -47.44661331176758, -40.997032165527344, -34.547454833984375, -28.097875595092773, -21.648296356201172, -15.19871711730957, -8.749137878417969, -2.299560546875, 4.150020599365234, 10.599601745605469, 17.049179077148438, 23.49875831604004, 29.94833755493164, 36.397918701171875, 42.847496032714844, 49.29707336425781, 55.74665451049805, 62.19623565673828, 68.64581298828125, 75.09539031982422, 81.54496765136719, 87.99455261230469, 94.44412994384766, 100.89370727539062, 107.34329223632812, 113.7928695678711, 120.24244689941406, 126.69202423095703, 133.1416015625, 139.5911865234375, 146.040771484375, 152.49034118652344, 158.93992614746094, 165.38949584960938, 171.83908081054688, 178.28866577148438, 184.7382354736328, 191.1878204345703, 197.63739013671875, 204.08697509765625, 210.53656005859375, 216.98614501953125, 223.4357147216797, 229.8852996826172, 236.33486938476562, 242.78445434570312, 249.23403930664062, 255.68360900878906, 262.1331787109375, 268.582763671875, 275.0323486328125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 6.0, 7.0, 3.0, 15.0, 6.0, 13.0, 22.0, 26.0, 22.0, 22.0, 27.0, 39.0, 39.0, 39.0, 52.0, 53.0, 73.0, 83.0, 60.0, 72.0, 37.0, 36.0, 49.0, 24.0, 28.0, 13.0, 20.0, 18.0, 20.0, 10.0, 10.0, 11.0, 9.0, 8.0, 9.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-117.97502136230469, -114.72610473632812, -111.47718048095703, -108.22826385498047, -104.9793472290039, -101.73042297363281, -98.48150634765625, -95.23258972167969, -91.98367309570312, -88.73475646972656, -85.48583221435547, -82.2369155883789, -78.98799896240234, -75.73907470703125, -72.49015808105469, -69.24124145507812, -65.99232482910156, -62.743404388427734, -59.49448776245117, -56.245567321777344, -52.99665069580078, -49.74773025512695, -46.498809814453125, -43.24989318847656, -40.00096893310547, -36.75204849243164, -33.50313186645508, -30.25421142578125, -27.005294799804688, -23.75637435913086, -20.507455825805664, -17.25853729248047, -14.009620666503906, -10.760702133178711, -7.511783123016357, -4.262864112854004, -1.0139455795288086, 2.234973907470703, 5.483892440795898, 8.732810974121094, 11.981729507446289, 15.230648040771484, 18.47956657409668, 21.728485107421875, 24.977405548095703, 28.2263240814209, 31.475242614746094, 34.724159240722656, 37.973079681396484, 41.22200012207031, 44.470916748046875, 47.7198371887207, 50.968753814697266, 54.217674255371094, 57.466590881347656, 60.715511322021484, 63.96443176269531, 67.21334838867188, 70.46227264404297, 73.71118927001953, 76.9601058959961, 80.20903015136719, 83.45794677734375, 86.70686340332031, 89.95578002929688]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 11.0, 12.0, 16.0, 17.0, 41.0, 62.0, 103.0, 170.0, 308.0, 493.0, 1030.0, 1870.0, 3977.0, 10851.0, 35322.0, 204270.0, 2938493.0, 886046.0, 79676.0, 19145.0, 6627.0, 2685.0, 1296.0, 676.0, 396.0, 241.0, 145.0, 98.0, 52.0, 44.0, 32.0, 17.0, 9.0, 12.0, 12.0, 8.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.140625, -10.7784423828125, -10.416259765625, -10.0540771484375, -9.69189453125, -9.3297119140625, -8.967529296875, -8.6053466796875, -8.2431640625, -7.8809814453125, -7.518798828125, -7.1566162109375, -6.79443359375, -6.4322509765625, -6.070068359375, -5.7078857421875, -5.345703125, -4.9835205078125, -4.621337890625, -4.2591552734375, -3.89697265625, -3.5347900390625, -3.172607421875, -2.8104248046875, -2.4482421875, -2.0860595703125, -1.723876953125, -1.3616943359375, -0.99951171875, -0.6373291015625, -0.275146484375, 0.0870361328125, 0.44921875, 0.8114013671875, 1.173583984375, 1.5357666015625, 1.89794921875, 2.2601318359375, 2.622314453125, 2.9844970703125, 3.3466796875, 3.7088623046875, 4.071044921875, 4.4332275390625, 4.79541015625, 5.1575927734375, 5.519775390625, 5.8819580078125, 6.244140625, 6.6063232421875, 6.968505859375, 7.3306884765625, 7.69287109375, 8.0550537109375, 8.417236328125, 8.7794189453125, 9.1416015625, 9.5037841796875, 9.865966796875, 10.2281494140625, 10.59033203125, 10.9525146484375, 11.314697265625, 11.6768798828125, 12.0390625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 13.0, 19.0, 22.0, 38.0, 53.0, 63.0, 61.0, 78.0, 94.0, 80.0, 99.0, 89.0, 71.0, 61.0, 50.0, 41.0, 22.0, 13.0, 16.0, 9.0, 0.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.5390625, -14.23284912109375, -13.9266357421875, -13.62042236328125, -13.314208984375, -13.00799560546875, -12.7017822265625, -12.39556884765625, -12.08935546875, -11.78314208984375, -11.4769287109375, -11.17071533203125, -10.864501953125, -10.55828857421875, -10.2520751953125, -9.94586181640625, -9.6396484375, -9.33343505859375, -9.0272216796875, -8.72100830078125, -8.414794921875, -8.10858154296875, -7.8023681640625, -7.49615478515625, -7.18994140625, -6.88372802734375, -6.5775146484375, -6.27130126953125, -5.965087890625, -5.65887451171875, -5.3526611328125, -5.04644775390625, -4.740234375, -4.43402099609375, -4.1278076171875, -3.82159423828125, -3.515380859375, -3.20916748046875, -2.9029541015625, -2.59674072265625, -2.29052734375, -1.98431396484375, -1.6781005859375, -1.37188720703125, -1.065673828125, -0.75946044921875, -0.4532470703125, -0.14703369140625, 0.1591796875, 0.46539306640625, 0.7716064453125, 1.07781982421875, 1.384033203125, 1.69024658203125, 1.9964599609375, 2.30267333984375, 2.60888671875, 2.91510009765625, 3.2213134765625, 3.52752685546875, 3.833740234375, 4.13995361328125, 4.4461669921875, 4.75238037109375, 5.05859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 9.0, 8.0, 18.0, 27.0, 43.0, 76.0, 176.0, 412.0, 1137.0, 4294.0, 30487.0, 1579879.0, 2535735.0, 35324.0, 4677.0, 1172.0, 426.0, 161.0, 95.0, 49.0, 24.0, 17.0, 10.0, 4.0, 3.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.59375, -24.76904296875, -23.9443359375, -23.11962890625, -22.294921875, -21.47021484375, -20.6455078125, -19.82080078125, -18.99609375, -18.17138671875, -17.3466796875, -16.52197265625, -15.697265625, -14.87255859375, -14.0478515625, -13.22314453125, -12.3984375, -11.57373046875, -10.7490234375, -9.92431640625, -9.099609375, -8.27490234375, -7.4501953125, -6.62548828125, -5.80078125, -4.97607421875, -4.1513671875, -3.32666015625, -2.501953125, -1.67724609375, -0.8525390625, -0.02783203125, 0.796875, 1.62158203125, 2.4462890625, 3.27099609375, 4.095703125, 4.92041015625, 5.7451171875, 6.56982421875, 7.39453125, 8.21923828125, 9.0439453125, 9.86865234375, 10.693359375, 11.51806640625, 12.3427734375, 13.16748046875, 13.9921875, 14.81689453125, 15.6416015625, 16.46630859375, 17.291015625, 18.11572265625, 18.9404296875, 19.76513671875, 20.58984375, 21.41455078125, 22.2392578125, 23.06396484375, 23.888671875, 24.71337890625, 25.5380859375, 26.36279296875, 27.1875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 8.0, 11.0, 15.0, 29.0, 31.0, 65.0, 115.0, 208.0, 565.0, 1343.0, 998.0, 324.0, 161.0, 76.0, 47.0, 27.0, 19.0, 9.0, 8.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.59375, -18.886962890625, -18.18017578125, -17.473388671875, -16.7666015625, -16.059814453125, -15.35302734375, -14.646240234375, -13.939453125, -13.232666015625, -12.52587890625, -11.819091796875, -11.1123046875, -10.405517578125, -9.69873046875, -8.991943359375, -8.28515625, -7.578369140625, -6.87158203125, -6.164794921875, -5.4580078125, -4.751220703125, -4.04443359375, -3.337646484375, -2.630859375, -1.924072265625, -1.21728515625, -0.510498046875, 0.1962890625, 0.903076171875, 1.60986328125, 2.316650390625, 3.0234375, 3.730224609375, 4.43701171875, 5.143798828125, 5.8505859375, 6.557373046875, 7.26416015625, 7.970947265625, 8.677734375, 9.384521484375, 10.09130859375, 10.798095703125, 11.5048828125, 12.211669921875, 12.91845703125, 13.625244140625, 14.33203125, 15.038818359375, 15.74560546875, 16.452392578125, 17.1591796875, 17.865966796875, 18.57275390625, 19.279541015625, 19.986328125, 20.693115234375, 21.39990234375, 22.106689453125, 22.8134765625, 23.520263671875, 24.22705078125, 24.933837890625, 25.640625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 4.0, 5.0, 11.0, 18.0, 30.0, 67.0, 111.0, 196.0, 195.0, 167.0, 86.0, 50.0, 24.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.5552978515625, -112.13999938964844, -107.72470092773438, -103.30941009521484, -98.89411163330078, -94.47881317138672, -90.06352233886719, -85.64822387695312, -81.23292541503906, -76.817626953125, -72.40232849121094, -67.9870376586914, -63.571739196777344, -59.15644073486328, -54.741146087646484, -50.32585144042969, -45.910552978515625, -41.49525451660156, -37.079959869384766, -32.66466522216797, -28.249366760253906, -23.834070205688477, -19.418773651123047, -15.003477096557617, -10.588180541992188, -6.172883987426758, -1.7575874328613281, 2.6577091217041016, 7.073005676269531, 11.488302230834961, 15.90359878540039, 20.31889533996582, 24.734207153320312, 29.149503707885742, 33.56480026245117, 37.98009490966797, 42.39539337158203, 46.810691833496094, 51.22598648071289, 55.64128112792969, 60.05657958984375, 64.47187805175781, 68.88717651367188, 73.3024673461914, 77.71776580810547, 82.13306427001953, 86.54835510253906, 90.96365356445312, 95.37895202636719, 99.79425048828125, 104.20954895019531, 108.62483978271484, 113.0401382446289, 117.45543670654297, 121.8707275390625, 126.28602600097656, 130.70132446289062, 135.1166229248047, 139.53192138671875, 143.9472198486328, 148.36251831054688, 152.77780151367188, 157.19309997558594, 161.6083984375, 166.02369689941406]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 5.0, 8.0, 14.0, 15.0, 19.0, 24.0, 19.0, 33.0, 27.0, 47.0, 53.0, 34.0, 47.0, 41.0, 59.0, 48.0, 62.0, 47.0, 61.0, 31.0, 37.0, 43.0, 44.0, 30.0, 24.0, 34.0, 15.0, 16.0, 13.0, 11.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.84131622314453, -49.76218032836914, -47.683040618896484, -45.603904724121094, -43.52476501464844, -41.44562911987305, -39.366493225097656, -37.287353515625, -35.20821762084961, -33.12908172607422, -31.049942016601562, -28.970806121826172, -26.89166831970215, -24.812530517578125, -22.733394622802734, -20.65425682067871, -18.575119018554688, -16.495981216430664, -14.416844367980957, -12.33770751953125, -10.258569717407227, -8.179431915283203, -6.100295066833496, -4.021158218383789, -1.9420204162597656, 0.1371169090270996, 2.216254234313965, 4.29539155960083, 6.374528884887695, 8.453666687011719, 10.532803535461426, 12.611940383911133, 14.691085815429688, 16.77022361755371, 18.849361419677734, 20.928497314453125, 23.00763511657715, 25.086772918701172, 27.165908813476562, 29.245046615600586, 31.32418441772461, 33.4033203125, 35.482460021972656, 37.56159591674805, 39.64073181152344, 41.719871520996094, 43.799007415771484, 45.878143310546875, 47.95728302001953, 50.03641891479492, 52.11555862426758, 54.19469451904297, 56.273834228515625, 58.352970123291016, 60.432106018066406, 62.51124572753906, 64.59037780761719, 66.66951751708984, 68.74864959716797, 70.82778930664062, 72.90692901611328, 74.98606872558594, 77.06520080566406, 79.14434051513672, 81.22348022460938]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 3.0, 9.0, 12.0, 15.0, 12.0, 34.0, 35.0, 46.0, 69.0, 90.0, 150.0, 236.0, 361.0, 522.0, 939.0, 1546.0, 2881.0, 5574.0, 11128.0, 23618.0, 53783.0, 130836.0, 329238.0, 288671.0, 110558.0, 46346.0, 20751.0, 9872.0, 4881.0, 2600.0, 1494.0, 875.0, 471.0, 285.0, 189.0, 122.0, 84.0, 59.0, 37.0, 29.0, 26.0, 21.0, 10.0, 10.0, 6.0, 9.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.828125, -9.5201416015625, -9.212158203125, -8.9041748046875, -8.59619140625, -8.2882080078125, -7.980224609375, -7.6722412109375, -7.3642578125, -7.0562744140625, -6.748291015625, -6.4403076171875, -6.13232421875, -5.8243408203125, -5.516357421875, -5.2083740234375, -4.900390625, -4.5924072265625, -4.284423828125, -3.9764404296875, -3.66845703125, -3.3604736328125, -3.052490234375, -2.7445068359375, -2.4365234375, -2.1285400390625, -1.820556640625, -1.5125732421875, -1.20458984375, -0.8966064453125, -0.588623046875, -0.2806396484375, 0.02734375, 0.3353271484375, 0.643310546875, 0.9512939453125, 1.25927734375, 1.5672607421875, 1.875244140625, 2.1832275390625, 2.4912109375, 2.7991943359375, 3.107177734375, 3.4151611328125, 3.72314453125, 4.0311279296875, 4.339111328125, 4.6470947265625, 4.955078125, 5.2630615234375, 5.571044921875, 5.8790283203125, 6.18701171875, 6.4949951171875, 6.802978515625, 7.1109619140625, 7.4189453125, 7.7269287109375, 8.034912109375, 8.3428955078125, 8.65087890625, 8.9588623046875, 9.266845703125, 9.5748291015625, 9.8828125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 16.0, 10.0, 6.0, 16.0, 22.0, 21.0, 24.0, 25.0, 38.0, 42.0, 35.0, 44.0, 37.0, 56.0, 52.0, 62.0, 59.0, 64.0, 66.0, 47.0, 44.0, 36.0, 33.0, 25.0, 29.0, 21.0, 9.0, 15.0, 11.0, 11.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76171875, -6.5760498046875, -6.390380859375, -6.2047119140625, -6.01904296875, -5.8333740234375, -5.647705078125, -5.4620361328125, -5.2763671875, -5.0906982421875, -4.905029296875, -4.7193603515625, -4.53369140625, -4.3480224609375, -4.162353515625, -3.9766845703125, -3.791015625, -3.6053466796875, -3.419677734375, -3.2340087890625, -3.04833984375, -2.8626708984375, -2.677001953125, -2.4913330078125, -2.3056640625, -2.1199951171875, -1.934326171875, -1.7486572265625, -1.56298828125, -1.3773193359375, -1.191650390625, -1.0059814453125, -0.8203125, -0.6346435546875, -0.448974609375, -0.2633056640625, -0.07763671875, 0.1080322265625, 0.293701171875, 0.4793701171875, 0.6650390625, 0.8507080078125, 1.036376953125, 1.2220458984375, 1.40771484375, 1.5933837890625, 1.779052734375, 1.9647216796875, 2.150390625, 2.3360595703125, 2.521728515625, 2.7073974609375, 2.89306640625, 3.0787353515625, 3.264404296875, 3.4500732421875, 3.6357421875, 3.8214111328125, 4.007080078125, 4.1927490234375, 4.37841796875, 4.5640869140625, 4.749755859375, 4.9354248046875, 5.12109375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 7.0, 5.0, 9.0, 17.0, 23.0, 43.0, 95.0, 147.0, 287.0, 556.0, 1233.0, 3532.0, 20745.0, 599411.0, 398213.0, 18558.0, 3298.0, 1216.0, 595.0, 247.0, 138.0, 81.0, 41.0, 21.0, 17.0, 11.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.25, -35.18310546875, -34.1162109375, -33.04931640625, -31.982421875, -30.91552734375, -29.8486328125, -28.78173828125, -27.71484375, -26.64794921875, -25.5810546875, -24.51416015625, -23.447265625, -22.38037109375, -21.3134765625, -20.24658203125, -19.1796875, -18.11279296875, -17.0458984375, -15.97900390625, -14.912109375, -13.84521484375, -12.7783203125, -11.71142578125, -10.64453125, -9.57763671875, -8.5107421875, -7.44384765625, -6.376953125, -5.31005859375, -4.2431640625, -3.17626953125, -2.109375, -1.04248046875, 0.0244140625, 1.09130859375, 2.158203125, 3.22509765625, 4.2919921875, 5.35888671875, 6.42578125, 7.49267578125, 8.5595703125, 9.62646484375, 10.693359375, 11.76025390625, 12.8271484375, 13.89404296875, 14.9609375, 16.02783203125, 17.0947265625, 18.16162109375, 19.228515625, 20.29541015625, 21.3623046875, 22.42919921875, 23.49609375, 24.56298828125, 25.6298828125, 26.69677734375, 27.763671875, 28.83056640625, 29.8974609375, 30.96435546875, 32.03125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 8.0, 6.0, 3.0, 13.0, 4.0, 7.0, 8.0, 22.0, 19.0, 20.0, 27.0, 21.0, 40.0, 43.0, 40.0, 31.0, 42.0, 48.0, 40.0, 56.0, 55.0, 53.0, 41.0, 41.0, 46.0, 43.0, 28.0, 34.0, 33.0, 27.0, 18.0, 14.0, 20.0, 15.0, 5.0, 7.0, 8.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.46875, -19.8642578125, -19.259765625, -18.6552734375, -18.05078125, -17.4462890625, -16.841796875, -16.2373046875, -15.6328125, -15.0283203125, -14.423828125, -13.8193359375, -13.21484375, -12.6103515625, -12.005859375, -11.4013671875, -10.796875, -10.1923828125, -9.587890625, -8.9833984375, -8.37890625, -7.7744140625, -7.169921875, -6.5654296875, -5.9609375, -5.3564453125, -4.751953125, -4.1474609375, -3.54296875, -2.9384765625, -2.333984375, -1.7294921875, -1.125, -0.5205078125, 0.083984375, 0.6884765625, 1.29296875, 1.8974609375, 2.501953125, 3.1064453125, 3.7109375, 4.3154296875, 4.919921875, 5.5244140625, 6.12890625, 6.7333984375, 7.337890625, 7.9423828125, 8.546875, 9.1513671875, 9.755859375, 10.3603515625, 10.96484375, 11.5693359375, 12.173828125, 12.7783203125, 13.3828125, 13.9873046875, 14.591796875, 15.1962890625, 15.80078125, 16.4052734375, 17.009765625, 17.6142578125, 18.21875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 7.0, 9.0, 11.0, 17.0, 21.0, 30.0, 42.0, 63.0, 110.0, 207.0, 431.0, 1345.0, 8272.0, 176340.0, 839462.0, 18529.0, 2365.0, 654.0, 251.0, 136.0, 70.0, 45.0, 32.0, 32.0, 18.0, 9.0, 7.0, 4.0, 4.0, 4.0, 4.0, 3.0, 0.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-17.09375, -16.6339111328125, -16.174072265625, -15.7142333984375, -15.25439453125, -14.7945556640625, -14.334716796875, -13.8748779296875, -13.4150390625, -12.9552001953125, -12.495361328125, -12.0355224609375, -11.57568359375, -11.1158447265625, -10.656005859375, -10.1961669921875, -9.736328125, -9.2764892578125, -8.816650390625, -8.3568115234375, -7.89697265625, -7.4371337890625, -6.977294921875, -6.5174560546875, -6.0576171875, -5.5977783203125, -5.137939453125, -4.6781005859375, -4.21826171875, -3.7584228515625, -3.298583984375, -2.8387451171875, -2.37890625, -1.9190673828125, -1.459228515625, -0.9993896484375, -0.53955078125, -0.0797119140625, 0.380126953125, 0.8399658203125, 1.2998046875, 1.7596435546875, 2.219482421875, 2.6793212890625, 3.13916015625, 3.5989990234375, 4.058837890625, 4.5186767578125, 4.978515625, 5.4383544921875, 5.898193359375, 6.3580322265625, 6.81787109375, 7.2777099609375, 7.737548828125, 8.1973876953125, 8.6572265625, 9.1170654296875, 9.576904296875, 10.0367431640625, 10.49658203125, 10.9564208984375, 11.416259765625, 11.8760986328125, 12.3359375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 10.0, 12.0, 15.0, 23.0, 22.0, 35.0, 49.0, 81.0, 122.0, 185.0, 153.0, 78.0, 58.0, 36.0, 24.0, 15.0, 21.0, 19.0, 8.0, 5.0, 6.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00225830078125, -0.002193272113800049, -0.0021282434463500977, -0.0020632147789001465, -0.0019981861114501953, -0.0019331574440002441, -0.001868128776550293, -0.0018031001091003418, -0.0017380714416503906, -0.0016730427742004395, -0.0016080141067504883, -0.0015429854393005371, -0.001477956771850586, -0.0014129281044006348, -0.0013478994369506836, -0.0012828707695007324, -0.0012178421020507812, -0.00115281343460083, -0.001087784767150879, -0.0010227560997009277, -0.0009577274322509766, -0.0008926987648010254, -0.0008276700973510742, -0.000762641429901123, -0.0006976127624511719, -0.0006325840950012207, -0.0005675554275512695, -0.0005025267601013184, -0.0004374980926513672, -0.000372469425201416, -0.00030744075775146484, -0.00024241209030151367, -0.0001773834228515625, -0.00011235475540161133, -4.7326087951660156e-05, 1.7702579498291016e-05, 8.273124694824219e-05, 0.00014775991439819336, 0.00021278858184814453, 0.0002778172492980957, 0.0003428459167480469, 0.00040787458419799805, 0.0004729032516479492, 0.0005379319190979004, 0.0006029605865478516, 0.0006679892539978027, 0.0007330179214477539, 0.0007980465888977051, 0.0008630752563476562, 0.0009281039237976074, 0.0009931325912475586, 0.0010581612586975098, 0.001123189926147461, 0.0011882185935974121, 0.0012532472610473633, 0.0013182759284973145, 0.0013833045959472656, 0.0014483332633972168, 0.001513361930847168, 0.0015783905982971191, 0.0016434192657470703, 0.0017084479331970215, 0.0017734766006469727, 0.0018385052680969238, 0.001903533935546875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 5.0, 5.0, 11.0, 11.0, 13.0, 28.0, 36.0, 58.0, 115.0, 146.0, 244.0, 467.0, 832.0, 1720.0, 3957.0, 12426.0, 62560.0, 721865.0, 205757.0, 26098.0, 6931.0, 2598.0, 1190.0, 600.0, 332.0, 203.0, 126.0, 69.0, 51.0, 28.0, 23.0, 17.0, 9.0, 6.0, 9.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.08984375, -6.8665771484375, -6.643310546875, -6.4200439453125, -6.19677734375, -5.9735107421875, -5.750244140625, -5.5269775390625, -5.3037109375, -5.0804443359375, -4.857177734375, -4.6339111328125, -4.41064453125, -4.1873779296875, -3.964111328125, -3.7408447265625, -3.517578125, -3.2943115234375, -3.071044921875, -2.8477783203125, -2.62451171875, -2.4012451171875, -2.177978515625, -1.9547119140625, -1.7314453125, -1.5081787109375, -1.284912109375, -1.0616455078125, -0.83837890625, -0.6151123046875, -0.391845703125, -0.1685791015625, 0.0546875, 0.2779541015625, 0.501220703125, 0.7244873046875, 0.94775390625, 1.1710205078125, 1.394287109375, 1.6175537109375, 1.8408203125, 2.0640869140625, 2.287353515625, 2.5106201171875, 2.73388671875, 2.9571533203125, 3.180419921875, 3.4036865234375, 3.626953125, 3.8502197265625, 4.073486328125, 4.2967529296875, 4.52001953125, 4.7432861328125, 4.966552734375, 5.1898193359375, 5.4130859375, 5.6363525390625, 5.859619140625, 6.0828857421875, 6.30615234375, 6.5294189453125, 6.752685546875, 6.9759521484375, 7.19921875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 5.0, 5.0, 6.0, 5.0, 4.0, 7.0, 10.0, 18.0, 23.0, 19.0, 23.0, 41.0, 56.0, 88.0, 105.0, 118.0, 107.0, 97.0, 68.0, 44.0, 35.0, 26.0, 16.0, 19.0, 11.0, 10.0, 10.0, 7.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.80517578125, -4.6259765625, -4.44677734375, -4.267578125, -4.08837890625, -3.9091796875, -3.72998046875, -3.55078125, -3.37158203125, -3.1923828125, -3.01318359375, -2.833984375, -2.65478515625, -2.4755859375, -2.29638671875, -2.1171875, -1.93798828125, -1.7587890625, -1.57958984375, -1.400390625, -1.22119140625, -1.0419921875, -0.86279296875, -0.68359375, -0.50439453125, -0.3251953125, -0.14599609375, 0.033203125, 0.21240234375, 0.3916015625, 0.57080078125, 0.75, 0.92919921875, 1.1083984375, 1.28759765625, 1.466796875, 1.64599609375, 1.8251953125, 2.00439453125, 2.18359375, 2.36279296875, 2.5419921875, 2.72119140625, 2.900390625, 3.07958984375, 3.2587890625, 3.43798828125, 3.6171875, 3.79638671875, 3.9755859375, 4.15478515625, 4.333984375, 4.51318359375, 4.6923828125, 4.87158203125, 5.05078125, 5.22998046875, 5.4091796875, 5.58837890625, 5.767578125, 5.94677734375, 6.1259765625, 6.30517578125, 6.484375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 9.0, 27.0, 96.0, 320.0, 370.0, 123.0, 32.0, 15.0, 2.0, 6.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.9695281982422, -161.98699951171875, -153.00448608398438, -144.02195739746094, -135.03944396972656, -126.05691528320312, -117.07439422607422, -108.09187316894531, -99.1093521118164, -90.1268310546875, -81.1443099975586, -72.16178894042969, -63.179264068603516, -54.19674301147461, -45.21421813964844, -36.23169708251953, -27.249176025390625, -18.26665496826172, -9.28413200378418, -0.3016090393066406, 8.680912017822266, 17.663433074951172, 26.645957946777344, 35.62847900390625, 44.611000061035156, 53.59352111816406, 62.57604217529297, 71.55856323242188, 80.54109191894531, 89.52360534667969, 98.50613403320312, 107.48865509033203, 116.47119140625, 125.4537124633789, 134.4362335205078, 143.41876220703125, 152.40127563476562, 161.38380432128906, 170.3663330078125, 179.34884643554688, 188.33135986328125, 197.3138885498047, 206.29640197753906, 215.2789306640625, 224.26144409179688, 233.2439727783203, 242.22650146484375, 251.20901489257812, 260.1915283203125, 269.1740417480469, 278.1565856933594, 287.13909912109375, 296.1216125488281, 305.1041259765625, 314.086669921875, 323.0691833496094, 332.0517272949219, 341.03424072265625, 350.01678466796875, 358.9992980957031, 367.9818115234375, 376.9643249511719, 385.9468688964844, 394.92938232421875, 403.9118957519531]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 6.0, 0.0, 1.0, 5.0, 3.0, 6.0, 4.0, 8.0, 7.0, 7.0, 23.0, 14.0, 16.0, 9.0, 18.0, 25.0, 22.0, 27.0, 26.0, 24.0, 30.0, 38.0, 49.0, 45.0, 65.0, 51.0, 62.0, 47.0, 35.0, 40.0, 33.0, 31.0, 31.0, 26.0, 23.0, 17.0, 19.0, 21.0, 19.0, 14.0, 8.0, 10.0, 12.0, 7.0, 7.0, 1.0, 5.0, 8.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.10136413574219, -62.89226531982422, -60.68316650390625, -58.47406768798828, -56.26496887207031, -54.055870056152344, -51.846771240234375, -49.637672424316406, -47.42857360839844, -45.21947479248047, -43.0103759765625, -40.80127716064453, -38.59217834472656, -36.383079528808594, -34.173980712890625, -31.964881896972656, -29.755783081054688, -27.54668426513672, -25.33758544921875, -23.12848663330078, -20.919387817382812, -18.710289001464844, -16.501190185546875, -14.292091369628906, -12.082992553710938, -9.873893737792969, -7.664794921875, -5.455696105957031, -3.2465972900390625, -1.0374984741210938, 1.171600341796875, 3.3806991577148438, 5.5897979736328125, 7.798896789550781, 10.00799560546875, 12.217094421386719, 14.426193237304688, 16.635292053222656, 18.844390869140625, 21.053489685058594, 23.262588500976562, 25.47168731689453, 27.6807861328125, 29.88988494873047, 32.09898376464844, 34.308082580566406, 36.517181396484375, 38.726280212402344, 40.93537902832031, 43.14447784423828, 45.35357666015625, 47.56267547607422, 49.77177429199219, 51.980873107910156, 54.189971923828125, 56.399070739746094, 58.60816955566406, 60.81726837158203, 63.0263671875, 65.23546600341797, 67.44456481933594, 69.6536636352539, 71.86276245117188, 74.07186126708984, 76.28096008300781]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 5.0, 0.0, 8.0, 8.0, 8.0, 16.0, 37.0, 65.0, 89.0, 162.0, 259.0, 437.0, 737.0, 1449.0, 3023.0, 6906.0, 21752.0, 132968.0, 3038851.0, 911631.0, 53647.0, 12611.0, 4676.0, 2178.0, 1083.0, 626.0, 358.0, 223.0, 162.0, 88.0, 55.0, 44.0, 45.0, 20.0, 15.0, 16.0, 10.0, 7.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3984375, -7.9945068359375, -7.590576171875, -7.1866455078125, -6.78271484375, -6.3787841796875, -5.974853515625, -5.5709228515625, -5.1669921875, -4.7630615234375, -4.359130859375, -3.9552001953125, -3.55126953125, -3.1473388671875, -2.743408203125, -2.3394775390625, -1.935546875, -1.5316162109375, -1.127685546875, -0.7237548828125, -0.31982421875, 0.0841064453125, 0.488037109375, 0.8919677734375, 1.2958984375, 1.6998291015625, 2.103759765625, 2.5076904296875, 2.91162109375, 3.3155517578125, 3.719482421875, 4.1234130859375, 4.52734375, 4.9312744140625, 5.335205078125, 5.7391357421875, 6.14306640625, 6.5469970703125, 6.950927734375, 7.3548583984375, 7.7587890625, 8.1627197265625, 8.566650390625, 8.9705810546875, 9.37451171875, 9.7784423828125, 10.182373046875, 10.5863037109375, 10.990234375, 11.3941650390625, 11.798095703125, 12.2020263671875, 12.60595703125, 13.0098876953125, 13.413818359375, 13.8177490234375, 14.2216796875, 14.6256103515625, 15.029541015625, 15.4334716796875, 15.83740234375, 16.2413330078125, 16.645263671875, 17.0491943359375, 17.453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 9.0, 6.0, 8.0, 15.0, 19.0, 29.0, 36.0, 42.0, 46.0, 52.0, 58.0, 76.0, 83.0, 74.0, 81.0, 71.0, 54.0, 47.0, 44.0, 36.0, 20.0, 26.0, 23.0, 13.0, 11.0, 8.0, 7.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3046875, -8.09332275390625, -7.8819580078125, -7.67059326171875, -7.459228515625, -7.24786376953125, -7.0364990234375, -6.82513427734375, -6.61376953125, -6.40240478515625, -6.1910400390625, -5.97967529296875, -5.768310546875, -5.55694580078125, -5.3455810546875, -5.13421630859375, -4.9228515625, -4.71148681640625, -4.5001220703125, -4.28875732421875, -4.077392578125, -3.86602783203125, -3.6546630859375, -3.44329833984375, -3.23193359375, -3.02056884765625, -2.8092041015625, -2.59783935546875, -2.386474609375, -2.17510986328125, -1.9637451171875, -1.75238037109375, -1.541015625, -1.32965087890625, -1.1182861328125, -0.90692138671875, -0.695556640625, -0.48419189453125, -0.2728271484375, -0.06146240234375, 0.14990234375, 0.36126708984375, 0.5726318359375, 0.78399658203125, 0.995361328125, 1.20672607421875, 1.4180908203125, 1.62945556640625, 1.8408203125, 2.05218505859375, 2.2635498046875, 2.47491455078125, 2.686279296875, 2.89764404296875, 3.1090087890625, 3.32037353515625, 3.53173828125, 3.74310302734375, 3.9544677734375, 4.16583251953125, 4.377197265625, 4.58856201171875, 4.7999267578125, 5.01129150390625, 5.22265625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 8.0, 6.0, 8.0, 21.0, 15.0, 34.0, 60.0, 72.0, 118.0, 224.0, 502.0, 1156.0, 3358.0, 12203.0, 89408.0, 3699827.0, 353648.0, 23973.0, 5811.0, 1986.0, 853.0, 428.0, 217.0, 119.0, 77.0, 50.0, 27.0, 22.0, 5.0, 12.0, 8.0, 9.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.21875, -16.59716796875, -15.9755859375, -15.35400390625, -14.732421875, -14.11083984375, -13.4892578125, -12.86767578125, -12.24609375, -11.62451171875, -11.0029296875, -10.38134765625, -9.759765625, -9.13818359375, -8.5166015625, -7.89501953125, -7.2734375, -6.65185546875, -6.0302734375, -5.40869140625, -4.787109375, -4.16552734375, -3.5439453125, -2.92236328125, -2.30078125, -1.67919921875, -1.0576171875, -0.43603515625, 0.185546875, 0.80712890625, 1.4287109375, 2.05029296875, 2.671875, 3.29345703125, 3.9150390625, 4.53662109375, 5.158203125, 5.77978515625, 6.4013671875, 7.02294921875, 7.64453125, 8.26611328125, 8.8876953125, 9.50927734375, 10.130859375, 10.75244140625, 11.3740234375, 11.99560546875, 12.6171875, 13.23876953125, 13.8603515625, 14.48193359375, 15.103515625, 15.72509765625, 16.3466796875, 16.96826171875, 17.58984375, 18.21142578125, 18.8330078125, 19.45458984375, 20.076171875, 20.69775390625, 21.3193359375, 21.94091796875, 22.5625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 8.0, 11.0, 20.0, 25.0, 42.0, 73.0, 131.0, 245.0, 562.0, 1136.0, 1020.0, 394.0, 163.0, 93.0, 44.0, 29.0, 23.0, 17.0, 11.0, 3.0, 8.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.46875, -11.921875, -11.375, -10.828125, -10.28125, -9.734375, -9.1875, -8.640625, -8.09375, -7.546875, -7.0, -6.453125, -5.90625, -5.359375, -4.8125, -4.265625, -3.71875, -3.171875, -2.625, -2.078125, -1.53125, -0.984375, -0.4375, 0.109375, 0.65625, 1.203125, 1.75, 2.296875, 2.84375, 3.390625, 3.9375, 4.484375, 5.03125, 5.578125, 6.125, 6.671875, 7.21875, 7.765625, 8.3125, 8.859375, 9.40625, 9.953125, 10.5, 11.046875, 11.59375, 12.140625, 12.6875, 13.234375, 13.78125, 14.328125, 14.875, 15.421875, 15.96875, 16.515625, 17.0625, 17.609375, 18.15625, 18.703125, 19.25, 19.796875, 20.34375, 20.890625, 21.4375, 21.984375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 7.0, 6.0, 20.0, 16.0, 68.0, 140.0, 246.0, 260.0, 133.0, 46.0, 25.0, 10.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.8594207763672, -143.5474853515625, -138.2355499267578, -132.92361450195312, -127.61167907714844, -122.29974365234375, -116.9878158569336, -111.6758804321289, -106.36394500732422, -101.05200958251953, -95.74007415771484, -90.42813873291016, -85.1162109375, -79.80427551269531, -74.49234008789062, -69.18040466308594, -63.86846923828125, -58.55653381347656, -53.244598388671875, -47.93266677856445, -42.620731353759766, -37.30879592895508, -31.996862411499023, -26.68492889404297, -21.37299346923828, -16.061058044433594, -10.749124526977539, -5.437190055847168, -0.12525558471679688, 5.186679840087891, 10.498613357543945, 15.810546875, 21.122467041015625, 26.434402465820312, 31.746335983276367, 37.05826950073242, 42.37020492553711, 47.6821403503418, 52.99407196044922, 58.306007385253906, 63.617942810058594, 68.92987823486328, 74.24181365966797, 79.55374908447266, 84.86567687988281, 90.1776123046875, 95.48954772949219, 100.80148315429688, 106.11341857910156, 111.42535400390625, 116.73728942871094, 122.04922485351562, 127.36116027832031, 132.673095703125, 137.9850311279297, 143.29696655273438, 148.60888671875, 153.9208221435547, 159.23275756835938, 164.54469299316406, 169.85662841796875, 175.16856384277344, 180.48049926757812, 185.79241943359375, 191.1043701171875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 7.0, 10.0, 21.0, 19.0, 33.0, 40.0, 47.0, 72.0, 90.0, 80.0, 89.0, 83.0, 85.0, 72.0, 73.0, 47.0, 37.0, 26.0, 17.0, 17.0, 11.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.43803405761719, -74.84020233154297, -72.24237823486328, -69.64454650878906, -67.04672241210938, -64.44889068603516, -61.85105895996094, -59.253231048583984, -56.65540313720703, -54.05757522583008, -51.459747314453125, -48.861915588378906, -46.26408767700195, -43.666259765625, -41.06842803955078, -38.47060012817383, -35.872772216796875, -33.27494430541992, -30.677114486694336, -28.07928466796875, -25.481456756591797, -22.883628845214844, -20.285799026489258, -17.687969207763672, -15.090141296386719, -12.49231243133545, -9.89448356628418, -7.29665470123291, -4.698825836181641, -2.100996971130371, 0.49683189392089844, 3.0946617126464844, 5.6924896240234375, 8.290318489074707, 10.888147354125977, 13.485976219177246, 16.083805084228516, 18.68163299560547, 21.279462814331055, 23.87729263305664, 26.475120544433594, 29.072948455810547, 31.670778274536133, 34.26860809326172, 36.86643600463867, 39.464263916015625, 42.062095642089844, 44.6599235534668, 47.25775146484375, 49.8555793762207, 52.453407287597656, 55.051239013671875, 57.64906692504883, 60.24689483642578, 62.8447265625, 65.44255065917969, 68.0403823852539, 70.63821411132812, 73.23603820800781, 75.83386993408203, 78.43170166015625, 81.02952575683594, 83.62735748291016, 86.22518920898438, 88.82301330566406]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 16.0, 33.0, 51.0, 99.0, 216.0, 498.0, 1116.0, 3138.0, 10522.0, 46584.0, 292704.0, 557867.0, 107225.0, 19961.0, 5416.0, 1751.0, 675.0, 308.0, 146.0, 100.0, 53.0, 25.0, 12.0, 9.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0546875, -12.5159912109375, -11.977294921875, -11.4385986328125, -10.89990234375, -10.3612060546875, -9.822509765625, -9.2838134765625, -8.7451171875, -8.2064208984375, -7.667724609375, -7.1290283203125, -6.59033203125, -6.0516357421875, -5.512939453125, -4.9742431640625, -4.435546875, -3.8968505859375, -3.358154296875, -2.8194580078125, -2.28076171875, -1.7420654296875, -1.203369140625, -0.6646728515625, -0.1259765625, 0.4127197265625, 0.951416015625, 1.4901123046875, 2.02880859375, 2.5675048828125, 3.106201171875, 3.6448974609375, 4.18359375, 4.7222900390625, 5.260986328125, 5.7996826171875, 6.33837890625, 6.8770751953125, 7.415771484375, 7.9544677734375, 8.4931640625, 9.0318603515625, 9.570556640625, 10.1092529296875, 10.64794921875, 11.1866455078125, 11.725341796875, 12.2640380859375, 12.802734375, 13.3414306640625, 13.880126953125, 14.4188232421875, 14.95751953125, 15.4962158203125, 16.034912109375, 16.5736083984375, 17.1123046875, 17.6510009765625, 18.189697265625, 18.7283935546875, 19.26708984375, 19.8057861328125, 20.344482421875, 20.8831787109375, 21.421875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 10.0, 9.0, 13.0, 17.0, 20.0, 31.0, 42.0, 55.0, 59.0, 65.0, 69.0, 72.0, 91.0, 78.0, 67.0, 66.0, 48.0, 52.0, 38.0, 32.0, 20.0, 10.0, 16.0, 7.0, 9.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.7265625, -9.49658203125, -9.2666015625, -9.03662109375, -8.806640625, -8.57666015625, -8.3466796875, -8.11669921875, -7.88671875, -7.65673828125, -7.4267578125, -7.19677734375, -6.966796875, -6.73681640625, -6.5068359375, -6.27685546875, -6.046875, -5.81689453125, -5.5869140625, -5.35693359375, -5.126953125, -4.89697265625, -4.6669921875, -4.43701171875, -4.20703125, -3.97705078125, -3.7470703125, -3.51708984375, -3.287109375, -3.05712890625, -2.8271484375, -2.59716796875, -2.3671875, -2.13720703125, -1.9072265625, -1.67724609375, -1.447265625, -1.21728515625, -0.9873046875, -0.75732421875, -0.52734375, -0.29736328125, -0.0673828125, 0.16259765625, 0.392578125, 0.62255859375, 0.8525390625, 1.08251953125, 1.3125, 1.54248046875, 1.7724609375, 2.00244140625, 2.232421875, 2.46240234375, 2.6923828125, 2.92236328125, 3.15234375, 3.38232421875, 3.6123046875, 3.84228515625, 4.072265625, 4.30224609375, 4.5322265625, 4.76220703125, 4.9921875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 13.0, 10.0, 26.0, 34.0, 37.0, 70.0, 103.0, 165.0, 346.0, 730.0, 2013.0, 7905.0, 44910.0, 512349.0, 424829.0, 43707.0, 7742.0, 2025.0, 694.0, 334.0, 186.0, 95.0, 73.0, 42.0, 31.0, 19.0, 17.0, 10.0, 7.0, 3.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.453125, -18.880859375, -18.30859375, -17.736328125, -17.1640625, -16.591796875, -16.01953125, -15.447265625, -14.875, -14.302734375, -13.73046875, -13.158203125, -12.5859375, -12.013671875, -11.44140625, -10.869140625, -10.296875, -9.724609375, -9.15234375, -8.580078125, -8.0078125, -7.435546875, -6.86328125, -6.291015625, -5.71875, -5.146484375, -4.57421875, -4.001953125, -3.4296875, -2.857421875, -2.28515625, -1.712890625, -1.140625, -0.568359375, 0.00390625, 0.576171875, 1.1484375, 1.720703125, 2.29296875, 2.865234375, 3.4375, 4.009765625, 4.58203125, 5.154296875, 5.7265625, 6.298828125, 6.87109375, 7.443359375, 8.015625, 8.587890625, 9.16015625, 9.732421875, 10.3046875, 10.876953125, 11.44921875, 12.021484375, 12.59375, 13.166015625, 13.73828125, 14.310546875, 14.8828125, 15.455078125, 16.02734375, 16.599609375, 17.171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 11.0, 11.0, 7.0, 13.0, 18.0, 19.0, 32.0, 21.0, 30.0, 28.0, 35.0, 41.0, 58.0, 48.0, 47.0, 49.0, 45.0, 50.0, 54.0, 42.0, 41.0, 39.0, 27.0, 42.0, 34.0, 22.0, 23.0, 17.0, 17.0, 16.0, 10.0, 16.0, 5.0, 5.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9453125, -15.4278564453125, -14.910400390625, -14.3929443359375, -13.87548828125, -13.3580322265625, -12.840576171875, -12.3231201171875, -11.8056640625, -11.2882080078125, -10.770751953125, -10.2532958984375, -9.73583984375, -9.2183837890625, -8.700927734375, -8.1834716796875, -7.666015625, -7.1485595703125, -6.631103515625, -6.1136474609375, -5.59619140625, -5.0787353515625, -4.561279296875, -4.0438232421875, -3.5263671875, -3.0089111328125, -2.491455078125, -1.9739990234375, -1.45654296875, -0.9390869140625, -0.421630859375, 0.0958251953125, 0.61328125, 1.1307373046875, 1.648193359375, 2.1656494140625, 2.68310546875, 3.2005615234375, 3.718017578125, 4.2354736328125, 4.7529296875, 5.2703857421875, 5.787841796875, 6.3052978515625, 6.82275390625, 7.3402099609375, 7.857666015625, 8.3751220703125, 8.892578125, 9.4100341796875, 9.927490234375, 10.4449462890625, 10.96240234375, 11.4798583984375, 11.997314453125, 12.5147705078125, 13.0322265625, 13.5496826171875, 14.067138671875, 14.5845947265625, 15.10205078125, 15.6195068359375, 16.136962890625, 16.6544189453125, 17.171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 8.0, 3.0, 13.0, 16.0, 23.0, 26.0, 60.0, 111.0, 196.0, 431.0, 1049.0, 2910.0, 9241.0, 39477.0, 244440.0, 650571.0, 77251.0, 15577.0, 4467.0, 1469.0, 612.0, 280.0, 141.0, 77.0, 32.0, 30.0, 13.0, 11.0, 11.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.21484375, -4.05987548828125, -3.9049072265625, -3.74993896484375, -3.594970703125, -3.44000244140625, -3.2850341796875, -3.13006591796875, -2.97509765625, -2.82012939453125, -2.6651611328125, -2.51019287109375, -2.355224609375, -2.20025634765625, -2.0452880859375, -1.89031982421875, -1.7353515625, -1.58038330078125, -1.4254150390625, -1.27044677734375, -1.115478515625, -0.96051025390625, -0.8055419921875, -0.65057373046875, -0.49560546875, -0.34063720703125, -0.1856689453125, -0.03070068359375, 0.124267578125, 0.27923583984375, 0.4342041015625, 0.58917236328125, 0.744140625, 0.89910888671875, 1.0540771484375, 1.20904541015625, 1.364013671875, 1.51898193359375, 1.6739501953125, 1.82891845703125, 1.98388671875, 2.13885498046875, 2.2938232421875, 2.44879150390625, 2.603759765625, 2.75872802734375, 2.9136962890625, 3.06866455078125, 3.2236328125, 3.37860107421875, 3.5335693359375, 3.68853759765625, 3.843505859375, 3.99847412109375, 4.1534423828125, 4.30841064453125, 4.46337890625, 4.61834716796875, 4.7733154296875, 4.92828369140625, 5.083251953125, 5.23822021484375, 5.3931884765625, 5.54815673828125, 5.703125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 6.0, 11.0, 10.0, 17.0, 25.0, 18.0, 36.0, 48.0, 50.0, 79.0, 85.0, 125.0, 129.0, 85.0, 70.0, 49.0, 31.0, 26.0, 18.0, 16.0, 11.0, 10.0, 5.0, 2.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0012149810791015625, -0.001180984079837799, -0.0011469870805740356, -0.0011129900813102722, -0.0010789930820465088, -0.0010449960827827454, -0.001010999083518982, -0.0009770020842552185, -0.0009430050849914551, -0.0009090080857276917, -0.0008750110864639282, -0.0008410140872001648, -0.0008070170879364014, -0.0007730200886726379, -0.0007390230894088745, -0.0007050260901451111, -0.0006710290908813477, -0.0006370320916175842, -0.0006030350923538208, -0.0005690380930900574, -0.0005350410938262939, -0.0005010440945625305, -0.0004670470952987671, -0.00043305009603500366, -0.00039905309677124023, -0.0003650560975074768, -0.0003310590982437134, -0.00029706209897994995, -0.0002630650997161865, -0.0002290681004524231, -0.00019507110118865967, -0.00016107410192489624, -0.0001270771026611328, -9.308010339736938e-05, -5.908310413360596e-05, -2.508610486984253e-05, 8.910894393920898e-06, 4.2907893657684326e-05, 7.690489292144775e-05, 0.00011090189218521118, 0.0001448988914489746, 0.00017889589071273804, 0.00021289288997650146, 0.0002468898892402649, 0.0002808868885040283, 0.00031488388776779175, 0.0003488808870315552, 0.0003828778862953186, 0.00041687488555908203, 0.00045087188482284546, 0.0004848688840866089, 0.0005188658833503723, 0.0005528628826141357, 0.0005868598818778992, 0.0006208568811416626, 0.000654853880405426, 0.0006888508796691895, 0.0007228478789329529, 0.0007568448781967163, 0.0007908418774604797, 0.0008248388767242432, 0.0008588358759880066, 0.00089283287525177, 0.0009268298745155334, 0.0009608268737792969]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 12.0, 18.0, 41.0, 49.0, 111.0, 248.0, 628.0, 2483.0, 17643.0, 262423.0, 723781.0, 35360.0, 4254.0, 871.0, 314.0, 145.0, 78.0, 35.0, 18.0, 13.0, 12.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5625, -8.296142578125, -8.02978515625, -7.763427734375, -7.4970703125, -7.230712890625, -6.96435546875, -6.697998046875, -6.431640625, -6.165283203125, -5.89892578125, -5.632568359375, -5.3662109375, -5.099853515625, -4.83349609375, -4.567138671875, -4.30078125, -4.034423828125, -3.76806640625, -3.501708984375, -3.2353515625, -2.968994140625, -2.70263671875, -2.436279296875, -2.169921875, -1.903564453125, -1.63720703125, -1.370849609375, -1.1044921875, -0.838134765625, -0.57177734375, -0.305419921875, -0.0390625, 0.227294921875, 0.49365234375, 0.760009765625, 1.0263671875, 1.292724609375, 1.55908203125, 1.825439453125, 2.091796875, 2.358154296875, 2.62451171875, 2.890869140625, 3.1572265625, 3.423583984375, 3.68994140625, 3.956298828125, 4.22265625, 4.489013671875, 4.75537109375, 5.021728515625, 5.2880859375, 5.554443359375, 5.82080078125, 6.087158203125, 6.353515625, 6.619873046875, 6.88623046875, 7.152587890625, 7.4189453125, 7.685302734375, 7.95166015625, 8.218017578125, 8.484375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 8.0, 19.0, 22.0, 33.0, 55.0, 104.0, 110.0, 160.0, 145.0, 126.0, 72.0, 40.0, 38.0, 21.0, 17.0, 11.0, 3.0, 5.0, 2.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.265625, -6.0411376953125, -5.816650390625, -5.5921630859375, -5.36767578125, -5.1431884765625, -4.918701171875, -4.6942138671875, -4.4697265625, -4.2452392578125, -4.020751953125, -3.7962646484375, -3.57177734375, -3.3472900390625, -3.122802734375, -2.8983154296875, -2.673828125, -2.4493408203125, -2.224853515625, -2.0003662109375, -1.77587890625, -1.5513916015625, -1.326904296875, -1.1024169921875, -0.8779296875, -0.6534423828125, -0.428955078125, -0.2044677734375, 0.02001953125, 0.2445068359375, 0.468994140625, 0.6934814453125, 0.91796875, 1.1424560546875, 1.366943359375, 1.5914306640625, 1.81591796875, 2.0404052734375, 2.264892578125, 2.4893798828125, 2.7138671875, 2.9383544921875, 3.162841796875, 3.3873291015625, 3.61181640625, 3.8363037109375, 4.060791015625, 4.2852783203125, 4.509765625, 4.7342529296875, 4.958740234375, 5.1832275390625, 5.40771484375, 5.6322021484375, 5.856689453125, 6.0811767578125, 6.3056640625, 6.5301513671875, 6.754638671875, 6.9791259765625, 7.20361328125, 7.4281005859375, 7.652587890625, 7.8770751953125, 8.1015625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 9.0, 7.0, 14.0, 32.0, 45.0, 97.0, 160.0, 280.0, 157.0, 88.0, 51.0, 31.0, 11.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.98385620117188, -131.5725555419922, -128.16127014160156, -124.7499771118164, -121.33868408203125, -117.9273910522461, -114.51609802246094, -111.10480499267578, -107.69351196289062, -104.28221893310547, -100.87092590332031, -97.45963287353516, -94.04833984375, -90.63704681396484, -87.22575378417969, -83.81446075439453, -80.40316772460938, -76.99187469482422, -73.58058166503906, -70.1692886352539, -66.75799560546875, -63.346702575683594, -59.93540954589844, -56.52411651611328, -53.112815856933594, -49.70152282714844, -46.29022979736328, -42.878936767578125, -39.46764373779297, -36.05635070800781, -32.645057678222656, -29.233762741088867, -25.822471618652344, -22.411178588867188, -18.99988555908203, -15.588591575622559, -12.177298545837402, -8.76600456237793, -5.354711532592773, -1.9434185028076172, 1.467874526977539, 4.879167556762695, 8.290460586547852, 11.701754570007324, 15.11304759979248, 18.524341583251953, 21.93563461303711, 25.346927642822266, 28.758220672607422, 32.16951370239258, 35.580806732177734, 38.99209976196289, 42.40339279174805, 45.81468963623047, 49.225982666015625, 52.63727569580078, 56.04856872558594, 59.459861755371094, 62.87115478515625, 66.2824478149414, 69.69374084472656, 73.10503387451172, 76.51632690429688, 79.92761993408203, 83.33891296386719]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 2.0, 7.0, 8.0, 7.0, 14.0, 14.0, 11.0, 10.0, 14.0, 18.0, 20.0, 19.0, 31.0, 30.0, 30.0, 25.0, 34.0, 62.0, 69.0, 73.0, 72.0, 60.0, 34.0, 33.0, 28.0, 41.0, 33.0, 25.0, 24.0, 30.0, 17.0, 19.0, 14.0, 12.0, 13.0, 7.0, 7.0, 19.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-63.28192138671875, -61.413936614990234, -59.545955657958984, -57.67797088623047, -55.80998611450195, -53.94200134277344, -52.07402038574219, -50.20603561401367, -48.338050842285156, -46.47006607055664, -44.60208511352539, -42.734100341796875, -40.86611557006836, -38.998130798339844, -37.130149841308594, -35.26216506958008, -33.39418411254883, -31.526201248168945, -29.65821647644043, -27.790233612060547, -25.92224884033203, -24.05426597595215, -22.186283111572266, -20.31829833984375, -18.450315475463867, -16.582332611083984, -14.714347839355469, -12.846364974975586, -10.978381156921387, -9.110397338867188, -7.242414474487305, -5.3744306564331055, -3.5064430236816406, -1.6384594440460205, 0.2295241355895996, 2.0975074768066406, 3.96549129486084, 5.833475112915039, 7.701457977294922, 9.569441795349121, 11.43742561340332, 13.30540943145752, 15.173393249511719, 17.0413761138916, 18.909358978271484, 20.77734375, 22.645326614379883, 24.513309478759766, 26.38129425048828, 28.249277114868164, 30.11726188659668, 31.985244750976562, 33.85322952270508, 35.721214294433594, 37.589195251464844, 39.45718002319336, 41.325164794921875, 43.19314956665039, 45.06113052368164, 46.929115295410156, 48.79710006713867, 50.66508483886719, 52.53306579589844, 54.40105056762695, 56.2690315246582]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 8.0, 9.0, 13.0, 21.0, 27.0, 31.0, 49.0, 69.0, 93.0, 144.0, 239.0, 409.0, 619.0, 1181.0, 2405.0, 5789.0, 19620.0, 153836.0, 3571117.0, 396118.0, 28746.0, 7288.0, 2921.0, 1340.0, 762.0, 484.0, 293.0, 190.0, 115.0, 88.0, 66.0, 54.0, 30.0, 28.0, 16.0, 16.0, 12.0, 11.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.34375, -12.877685546875, -12.41162109375, -11.945556640625, -11.4794921875, -11.013427734375, -10.54736328125, -10.081298828125, -9.615234375, -9.149169921875, -8.68310546875, -8.217041015625, -7.7509765625, -7.284912109375, -6.81884765625, -6.352783203125, -5.88671875, -5.420654296875, -4.95458984375, -4.488525390625, -4.0224609375, -3.556396484375, -3.09033203125, -2.624267578125, -2.158203125, -1.692138671875, -1.22607421875, -0.760009765625, -0.2939453125, 0.172119140625, 0.63818359375, 1.104248046875, 1.5703125, 2.036376953125, 2.50244140625, 2.968505859375, 3.4345703125, 3.900634765625, 4.36669921875, 4.832763671875, 5.298828125, 5.764892578125, 6.23095703125, 6.697021484375, 7.1630859375, 7.629150390625, 8.09521484375, 8.561279296875, 9.02734375, 9.493408203125, 9.95947265625, 10.425537109375, 10.8916015625, 11.357666015625, 11.82373046875, 12.289794921875, 12.755859375, 13.221923828125, 13.68798828125, 14.154052734375, 14.6201171875, 15.086181640625, 15.55224609375, 16.018310546875, 16.484375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 6.0, 8.0, 7.0, 21.0, 16.0, 29.0, 29.0, 40.0, 59.0, 56.0, 80.0, 78.0, 87.0, 88.0, 61.0, 71.0, 57.0, 49.0, 48.0, 22.0, 21.0, 27.0, 13.0, 10.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.792724609375, -8.57763671875, -8.362548828125, -8.1474609375, -7.932373046875, -7.71728515625, -7.502197265625, -7.287109375, -7.072021484375, -6.85693359375, -6.641845703125, -6.4267578125, -6.211669921875, -5.99658203125, -5.781494140625, -5.56640625, -5.351318359375, -5.13623046875, -4.921142578125, -4.7060546875, -4.490966796875, -4.27587890625, -4.060791015625, -3.845703125, -3.630615234375, -3.41552734375, -3.200439453125, -2.9853515625, -2.770263671875, -2.55517578125, -2.340087890625, -2.125, -1.909912109375, -1.69482421875, -1.479736328125, -1.2646484375, -1.049560546875, -0.83447265625, -0.619384765625, -0.404296875, -0.189208984375, 0.02587890625, 0.240966796875, 0.4560546875, 0.671142578125, 0.88623046875, 1.101318359375, 1.31640625, 1.531494140625, 1.74658203125, 1.961669921875, 2.1767578125, 2.391845703125, 2.60693359375, 2.822021484375, 3.037109375, 3.252197265625, 3.46728515625, 3.682373046875, 3.8974609375, 4.112548828125, 4.32763671875, 4.542724609375, 4.7578125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 6.0, 6.0, 3.0, 7.0, 19.0, 18.0, 39.0, 40.0, 77.0, 113.0, 207.0, 358.0, 775.0, 1874.0, 5556.0, 22034.0, 178407.0, 3672364.0, 274080.0, 27315.0, 6656.0, 2305.0, 931.0, 507.0, 233.0, 119.0, 60.0, 39.0, 24.0, 33.0, 17.0, 11.0, 9.0, 3.0, 5.0, 5.0, 3.0, 8.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0859375, -12.6112060546875, -12.136474609375, -11.6617431640625, -11.18701171875, -10.7122802734375, -10.237548828125, -9.7628173828125, -9.2880859375, -8.8133544921875, -8.338623046875, -7.8638916015625, -7.38916015625, -6.9144287109375, -6.439697265625, -5.9649658203125, -5.490234375, -5.0155029296875, -4.540771484375, -4.0660400390625, -3.59130859375, -3.1165771484375, -2.641845703125, -2.1671142578125, -1.6923828125, -1.2176513671875, -0.742919921875, -0.2681884765625, 0.20654296875, 0.6812744140625, 1.156005859375, 1.6307373046875, 2.10546875, 2.5802001953125, 3.054931640625, 3.5296630859375, 4.00439453125, 4.4791259765625, 4.953857421875, 5.4285888671875, 5.9033203125, 6.3780517578125, 6.852783203125, 7.3275146484375, 7.80224609375, 8.2769775390625, 8.751708984375, 9.2264404296875, 9.701171875, 10.1759033203125, 10.650634765625, 11.1253662109375, 11.60009765625, 12.0748291015625, 12.549560546875, 13.0242919921875, 13.4990234375, 13.9737548828125, 14.448486328125, 14.9232177734375, 15.39794921875, 15.8726806640625, 16.347412109375, 16.8221435546875, 17.296875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 3.0, 8.0, 10.0, 10.0, 19.0, 21.0, 29.0, 25.0, 71.0, 94.0, 147.0, 204.0, 425.0, 744.0, 814.0, 568.0, 302.0, 181.0, 101.0, 73.0, 52.0, 46.0, 32.0, 14.0, 16.0, 7.0, 9.0, 5.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.0625, -8.728515625, -8.39453125, -8.060546875, -7.7265625, -7.392578125, -7.05859375, -6.724609375, -6.390625, -6.056640625, -5.72265625, -5.388671875, -5.0546875, -4.720703125, -4.38671875, -4.052734375, -3.71875, -3.384765625, -3.05078125, -2.716796875, -2.3828125, -2.048828125, -1.71484375, -1.380859375, -1.046875, -0.712890625, -0.37890625, -0.044921875, 0.2890625, 0.623046875, 0.95703125, 1.291015625, 1.625, 1.958984375, 2.29296875, 2.626953125, 2.9609375, 3.294921875, 3.62890625, 3.962890625, 4.296875, 4.630859375, 4.96484375, 5.298828125, 5.6328125, 5.966796875, 6.30078125, 6.634765625, 6.96875, 7.302734375, 7.63671875, 7.970703125, 8.3046875, 8.638671875, 8.97265625, 9.306640625, 9.640625, 9.974609375, 10.30859375, 10.642578125, 10.9765625, 11.310546875, 11.64453125, 11.978515625, 12.3125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 14.0, 46.0, 221.0, 393.0, 215.0, 81.0, 24.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.633544921875, -125.03172302246094, -117.42990112304688, -109.82808685302734, -102.22626495361328, -94.62444305419922, -87.02262878417969, -79.42080688476562, -71.81898498535156, -64.2171630859375, -56.6153450012207, -49.013526916503906, -41.411705017089844, -33.80988311767578, -26.208065032958984, -18.606246948242188, -11.004425048828125, -3.4026050567626953, 4.199214935302734, 11.801034927368164, 19.402854919433594, 27.004676818847656, 34.60649490356445, 42.20831298828125, 49.81013488769531, 57.411956787109375, 65.01377868652344, 72.61559295654297, 80.21741485595703, 87.8192367553711, 95.42105102539062, 103.02287292480469, 110.62469482421875, 118.22651672363281, 125.82833862304688, 133.43016052246094, 141.031982421875, 148.6337890625, 156.23561096191406, 163.83743286132812, 171.4392547607422, 179.04107666015625, 186.6428985595703, 194.24472045898438, 201.84652709960938, 209.4483642578125, 217.0501708984375, 224.65199279785156, 232.25381469726562, 239.8556365966797, 247.45745849609375, 255.0592803955078, 262.6611022949219, 270.2629089355469, 277.86474609375, 285.466552734375, 293.068359375, 300.670166015625, 308.2720031738281, 315.8738098144531, 323.47564697265625, 331.07745361328125, 338.6792907714844, 346.2810974121094, 353.8829345703125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 7.0, 4.0, 5.0, 5.0, 12.0, 13.0, 24.0, 23.0, 21.0, 24.0, 19.0, 32.0, 40.0, 40.0, 35.0, 46.0, 33.0, 48.0, 45.0, 39.0, 44.0, 42.0, 34.0, 36.0, 44.0, 32.0, 39.0, 39.0, 32.0, 22.0, 31.0, 23.0, 17.0, 14.0, 9.0, 8.0, 6.0, 2.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.04206848144531, -50.46010971069336, -48.878150939941406, -47.29619216918945, -45.7142333984375, -44.13227844238281, -42.55031967163086, -40.968360900878906, -39.38640213012695, -37.804443359375, -36.22248458862305, -34.640525817871094, -33.058570861816406, -31.47661018371582, -29.8946533203125, -28.312694549560547, -26.730735778808594, -25.14877700805664, -23.566818237304688, -21.984861373901367, -20.402902603149414, -18.82094383239746, -17.23898696899414, -15.657028198242188, -14.075069427490234, -12.493110656738281, -10.911152839660645, -9.329195022583008, -7.747236251831055, -6.16527795791626, -4.583319664001465, -3.001361846923828, -1.419403076171875, 0.16255521774291992, 1.7445135116577148, 3.3264718055725098, 4.908430099487305, 6.4903883934021, 8.072346687316895, 9.654304504394531, 11.236263275146484, 12.818222045898438, 14.400179862976074, 15.982137680053711, 17.564096450805664, 19.146055221557617, 20.728012084960938, 22.30997085571289, 23.891929626464844, 25.473888397216797, 27.05584716796875, 28.63780403137207, 30.219762802124023, 31.801721572875977, 33.3836784362793, 34.96563720703125, 36.5475959777832, 38.129554748535156, 39.71151351928711, 41.29347229003906, 42.87542724609375, 44.4573860168457, 46.039344787597656, 47.62130355834961, 49.20326232910156]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 5.0, 2.0, 2.0, 4.0, 5.0, 7.0, 12.0, 16.0, 16.0, 23.0, 44.0, 44.0, 87.0, 112.0, 196.0, 262.0, 505.0, 914.0, 1608.0, 3190.0, 6533.0, 15080.0, 38743.0, 114374.0, 343775.0, 342243.0, 113705.0, 38708.0, 14858.0, 6416.0, 3103.0, 1664.0, 855.0, 541.0, 306.0, 204.0, 155.0, 77.0, 41.0, 39.0, 34.0, 16.0, 12.0, 4.0, 8.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 3.0], "bins": [-9.9921875, -9.72210693359375, -9.4520263671875, -9.18194580078125, -8.911865234375, -8.64178466796875, -8.3717041015625, -8.10162353515625, -7.83154296875, -7.56146240234375, -7.2913818359375, -7.02130126953125, -6.751220703125, -6.48114013671875, -6.2110595703125, -5.94097900390625, -5.6708984375, -5.40081787109375, -5.1307373046875, -4.86065673828125, -4.590576171875, -4.32049560546875, -4.0504150390625, -3.78033447265625, -3.51025390625, -3.24017333984375, -2.9700927734375, -2.70001220703125, -2.429931640625, -2.15985107421875, -1.8897705078125, -1.61968994140625, -1.349609375, -1.07952880859375, -0.8094482421875, -0.53936767578125, -0.269287109375, 0.00079345703125, 0.2708740234375, 0.54095458984375, 0.81103515625, 1.08111572265625, 1.3511962890625, 1.62127685546875, 1.891357421875, 2.16143798828125, 2.4315185546875, 2.70159912109375, 2.9716796875, 3.24176025390625, 3.5118408203125, 3.78192138671875, 4.052001953125, 4.32208251953125, 4.5921630859375, 4.86224365234375, 5.13232421875, 5.40240478515625, 5.6724853515625, 5.94256591796875, 6.212646484375, 6.48272705078125, 6.7528076171875, 7.02288818359375, 7.29296875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 9.0, 10.0, 10.0, 16.0, 15.0, 32.0, 33.0, 46.0, 50.0, 60.0, 63.0, 72.0, 57.0, 76.0, 71.0, 52.0, 68.0, 51.0, 51.0, 44.0, 28.0, 23.0, 20.0, 13.0, 8.0, 7.0, 4.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.90625, -8.6904296875, -8.474609375, -8.2587890625, -8.04296875, -7.8271484375, -7.611328125, -7.3955078125, -7.1796875, -6.9638671875, -6.748046875, -6.5322265625, -6.31640625, -6.1005859375, -5.884765625, -5.6689453125, -5.453125, -5.2373046875, -5.021484375, -4.8056640625, -4.58984375, -4.3740234375, -4.158203125, -3.9423828125, -3.7265625, -3.5107421875, -3.294921875, -3.0791015625, -2.86328125, -2.6474609375, -2.431640625, -2.2158203125, -2.0, -1.7841796875, -1.568359375, -1.3525390625, -1.13671875, -0.9208984375, -0.705078125, -0.4892578125, -0.2734375, -0.0576171875, 0.158203125, 0.3740234375, 0.58984375, 0.8056640625, 1.021484375, 1.2373046875, 1.453125, 1.6689453125, 1.884765625, 2.1005859375, 2.31640625, 2.5322265625, 2.748046875, 2.9638671875, 3.1796875, 3.3955078125, 3.611328125, 3.8271484375, 4.04296875, 4.2587890625, 4.474609375, 4.6904296875, 4.90625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 9.0, 15.0, 10.0, 28.0, 40.0, 49.0, 81.0, 145.0, 232.0, 364.0, 658.0, 1290.0, 4254.0, 25257.0, 334500.0, 642058.0, 31554.0, 4893.0, 1476.0, 679.0, 353.0, 214.0, 114.0, 104.0, 48.0, 39.0, 34.0, 15.0, 11.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.9375, -18.32763671875, -17.7177734375, -17.10791015625, -16.498046875, -15.88818359375, -15.2783203125, -14.66845703125, -14.05859375, -13.44873046875, -12.8388671875, -12.22900390625, -11.619140625, -11.00927734375, -10.3994140625, -9.78955078125, -9.1796875, -8.56982421875, -7.9599609375, -7.35009765625, -6.740234375, -6.13037109375, -5.5205078125, -4.91064453125, -4.30078125, -3.69091796875, -3.0810546875, -2.47119140625, -1.861328125, -1.25146484375, -0.6416015625, -0.03173828125, 0.578125, 1.18798828125, 1.7978515625, 2.40771484375, 3.017578125, 3.62744140625, 4.2373046875, 4.84716796875, 5.45703125, 6.06689453125, 6.6767578125, 7.28662109375, 7.896484375, 8.50634765625, 9.1162109375, 9.72607421875, 10.3359375, 10.94580078125, 11.5556640625, 12.16552734375, 12.775390625, 13.38525390625, 13.9951171875, 14.60498046875, 15.21484375, 15.82470703125, 16.4345703125, 17.04443359375, 17.654296875, 18.26416015625, 18.8740234375, 19.48388671875, 20.09375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 7.0, 7.0, 7.0, 6.0, 16.0, 10.0, 13.0, 19.0, 25.0, 28.0, 27.0, 34.0, 33.0, 35.0, 40.0, 57.0, 40.0, 49.0, 44.0, 45.0, 42.0, 48.0, 44.0, 41.0, 43.0, 45.0, 28.0, 28.0, 22.0, 23.0, 19.0, 11.0, 13.0, 6.0, 7.0, 8.0, 3.0, 2.0, 5.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-17.109375, -16.62060546875, -16.1318359375, -15.64306640625, -15.154296875, -14.66552734375, -14.1767578125, -13.68798828125, -13.19921875, -12.71044921875, -12.2216796875, -11.73291015625, -11.244140625, -10.75537109375, -10.2666015625, -9.77783203125, -9.2890625, -8.80029296875, -8.3115234375, -7.82275390625, -7.333984375, -6.84521484375, -6.3564453125, -5.86767578125, -5.37890625, -4.89013671875, -4.4013671875, -3.91259765625, -3.423828125, -2.93505859375, -2.4462890625, -1.95751953125, -1.46875, -0.97998046875, -0.4912109375, -0.00244140625, 0.486328125, 0.97509765625, 1.4638671875, 1.95263671875, 2.44140625, 2.93017578125, 3.4189453125, 3.90771484375, 4.396484375, 4.88525390625, 5.3740234375, 5.86279296875, 6.3515625, 6.84033203125, 7.3291015625, 7.81787109375, 8.306640625, 8.79541015625, 9.2841796875, 9.77294921875, 10.26171875, 10.75048828125, 11.2392578125, 11.72802734375, 12.216796875, 12.70556640625, 13.1943359375, 13.68310546875, 14.171875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 8.0, 11.0, 18.0, 27.0, 47.0, 68.0, 165.0, 375.0, 1146.0, 4407.0, 24078.0, 348898.0, 635457.0, 26956.0, 4856.0, 1206.0, 418.0, 159.0, 95.0, 50.0, 35.0, 18.0, 11.0, 14.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-8.9453125, -8.7100830078125, -8.474853515625, -8.2396240234375, -8.00439453125, -7.7691650390625, -7.533935546875, -7.2987060546875, -7.0634765625, -6.8282470703125, -6.593017578125, -6.3577880859375, -6.12255859375, -5.8873291015625, -5.652099609375, -5.4168701171875, -5.181640625, -4.9464111328125, -4.711181640625, -4.4759521484375, -4.24072265625, -4.0054931640625, -3.770263671875, -3.5350341796875, -3.2998046875, -3.0645751953125, -2.829345703125, -2.5941162109375, -2.35888671875, -2.1236572265625, -1.888427734375, -1.6531982421875, -1.41796875, -1.1827392578125, -0.947509765625, -0.7122802734375, -0.47705078125, -0.2418212890625, -0.006591796875, 0.2286376953125, 0.4638671875, 0.6990966796875, 0.934326171875, 1.1695556640625, 1.40478515625, 1.6400146484375, 1.875244140625, 2.1104736328125, 2.345703125, 2.5809326171875, 2.816162109375, 3.0513916015625, 3.28662109375, 3.5218505859375, 3.757080078125, 3.9923095703125, 4.2275390625, 4.4627685546875, 4.697998046875, 4.9332275390625, 5.16845703125, 5.4036865234375, 5.638916015625, 5.8741455078125, 6.109375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 4.0, 4.0, 5.0, 8.0, 8.0, 20.0, 33.0, 40.0, 71.0, 99.0, 185.0, 184.0, 113.0, 77.0, 43.0, 29.0, 25.0, 16.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001995086669921875, -0.0019441097974777222, -0.0018931329250335693, -0.0018421560525894165, -0.0017911791801452637, -0.0017402023077011108, -0.001689225435256958, -0.0016382485628128052, -0.0015872716903686523, -0.0015362948179244995, -0.0014853179454803467, -0.0014343410730361938, -0.001383364200592041, -0.0013323873281478882, -0.0012814104557037354, -0.0012304335832595825, -0.0011794567108154297, -0.0011284798383712769, -0.001077502965927124, -0.0010265260934829712, -0.0009755492210388184, -0.0009245723485946655, -0.0008735954761505127, -0.0008226186037063599, -0.000771641731262207, -0.0007206648588180542, -0.0006696879863739014, -0.0006187111139297485, -0.0005677342414855957, -0.0005167573690414429, -0.00046578049659729004, -0.0004148036241531372, -0.0003638267517089844, -0.00031284987926483154, -0.0002618730068206787, -0.00021089613437652588, -0.00015991926193237305, -0.00010894238948822021, -5.796551704406738e-05, -6.988644599914551e-06, 4.398822784423828e-05, 9.496510028839111e-05, 0.00014594197273254395, 0.00019691884517669678, 0.0002478957176208496, 0.00029887259006500244, 0.0003498494625091553, 0.0004008263349533081, 0.00045180320739746094, 0.0005027800798416138, 0.0005537569522857666, 0.0006047338247299194, 0.0006557106971740723, 0.0007066875696182251, 0.0007576644420623779, 0.0008086413145065308, 0.0008596181869506836, 0.0009105950593948364, 0.0009615719318389893, 0.001012548804283142, 0.001063525676727295, 0.0011145025491714478, 0.0011654794216156006, 0.0012164562940597534, 0.0012674331665039062]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 7.0, 6.0, 5.0, 4.0, 16.0, 15.0, 26.0, 29.0, 44.0, 78.0, 144.0, 188.0, 350.0, 688.0, 1491.0, 3877.0, 11839.0, 58203.0, 704022.0, 224028.0, 30753.0, 7686.0, 2582.0, 1094.0, 560.0, 305.0, 181.0, 103.0, 65.0, 58.0, 30.0, 18.0, 12.0, 20.0, 7.0, 9.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.96917724609375, -5.7977294921875, -5.62628173828125, -5.454833984375, -5.28338623046875, -5.1119384765625, -4.94049072265625, -4.76904296875, -4.59759521484375, -4.4261474609375, -4.25469970703125, -4.083251953125, -3.91180419921875, -3.7403564453125, -3.56890869140625, -3.3974609375, -3.22601318359375, -3.0545654296875, -2.88311767578125, -2.711669921875, -2.54022216796875, -2.3687744140625, -2.19732666015625, -2.02587890625, -1.85443115234375, -1.6829833984375, -1.51153564453125, -1.340087890625, -1.16864013671875, -0.9971923828125, -0.82574462890625, -0.654296875, -0.48284912109375, -0.3114013671875, -0.13995361328125, 0.031494140625, 0.20294189453125, 0.3743896484375, 0.54583740234375, 0.71728515625, 0.88873291015625, 1.0601806640625, 1.23162841796875, 1.403076171875, 1.57452392578125, 1.7459716796875, 1.91741943359375, 2.0888671875, 2.26031494140625, 2.4317626953125, 2.60321044921875, 2.774658203125, 2.94610595703125, 3.1175537109375, 3.28900146484375, 3.46044921875, 3.63189697265625, 3.8033447265625, 3.97479248046875, 4.146240234375, 4.31768798828125, 4.4891357421875, 4.66058349609375, 4.83203125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 10.0, 8.0, 17.0, 15.0, 17.0, 22.0, 27.0, 28.0, 58.0, 74.0, 98.0, 122.0, 118.0, 101.0, 63.0, 48.0, 34.0, 31.0, 15.0, 19.0, 13.0, 11.0, 4.0, 9.0, 8.0, 4.0, 4.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-4.203125, -4.067138671875, -3.93115234375, -3.795166015625, -3.6591796875, -3.523193359375, -3.38720703125, -3.251220703125, -3.115234375, -2.979248046875, -2.84326171875, -2.707275390625, -2.5712890625, -2.435302734375, -2.29931640625, -2.163330078125, -2.02734375, -1.891357421875, -1.75537109375, -1.619384765625, -1.4833984375, -1.347412109375, -1.21142578125, -1.075439453125, -0.939453125, -0.803466796875, -0.66748046875, -0.531494140625, -0.3955078125, -0.259521484375, -0.12353515625, 0.012451171875, 0.1484375, 0.284423828125, 0.42041015625, 0.556396484375, 0.6923828125, 0.828369140625, 0.96435546875, 1.100341796875, 1.236328125, 1.372314453125, 1.50830078125, 1.644287109375, 1.7802734375, 1.916259765625, 2.05224609375, 2.188232421875, 2.32421875, 2.460205078125, 2.59619140625, 2.732177734375, 2.8681640625, 3.004150390625, 3.14013671875, 3.276123046875, 3.412109375, 3.548095703125, 3.68408203125, 3.820068359375, 3.9560546875, 4.092041015625, 4.22802734375, 4.364013671875, 4.5]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 7.0, 12.0, 23.0, 54.0, 98.0, 245.0, 276.0, 139.0, 56.0, 35.0, 19.0, 8.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-70.0380859375, -66.36478424072266, -62.69148254394531, -59.018184661865234, -55.34488296508789, -51.67158126831055, -47.99828338623047, -44.324981689453125, -40.65167999267578, -36.97837829589844, -33.305076599121094, -29.631778717041016, -25.958477020263672, -22.285175323486328, -18.611875534057617, -14.938575744628906, -11.265274047851562, -7.591973304748535, -3.918672561645508, -0.24537181854248047, 3.427928924560547, 7.101230621337891, 10.774530410766602, 14.447830200195312, 18.121131896972656, 21.79443359375, 25.46773338317871, 29.141033172607422, 32.814334869384766, 36.48763656616211, 40.16093444824219, 43.83423614501953, 47.507537841796875, 51.18083953857422, 54.85414123535156, 58.52743911743164, 62.200740814208984, 65.87403869628906, 69.5473403930664, 73.22064208984375, 76.8939437866211, 80.56724548339844, 84.24054718017578, 87.91384887695312, 91.58714294433594, 95.26045227050781, 98.93374633789062, 102.60704803466797, 106.28034973144531, 109.95365142822266, 113.626953125, 117.30025482177734, 120.97355651855469, 124.6468505859375, 128.32015991210938, 131.9934539794922, 135.666748046875, 139.3400421142578, 143.0133514404297, 146.6866455078125, 150.35995483398438, 154.0332489013672, 157.70655822753906, 161.37985229492188, 165.05316162109375]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 13.0, 12.0, 7.0, 4.0, 6.0, 15.0, 12.0, 18.0, 23.0, 25.0, 24.0, 31.0, 31.0, 28.0, 48.0, 48.0, 72.0, 107.0, 80.0, 64.0, 44.0, 39.0, 37.0, 34.0, 22.0, 21.0, 18.0, 19.0, 11.0, 13.0, 7.0, 9.0, 7.0, 6.0, 7.0, 6.0, 7.0, 2.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.684410095214844, -59.739498138427734, -57.79458236694336, -55.84967041015625, -53.904754638671875, -51.959842681884766, -50.014930725097656, -48.07001495361328, -46.12510299682617, -44.18019104003906, -42.23527526855469, -40.29036331176758, -38.34545135498047, -36.400535583496094, -34.455623626708984, -32.510711669921875, -30.5657958984375, -28.620882034301758, -26.675968170166016, -24.731056213378906, -22.786142349243164, -20.841228485107422, -18.896316528320312, -16.95140266418457, -15.006488800048828, -13.061574935913086, -11.11666202545166, -9.171749114990234, -7.226835250854492, -5.28192138671875, -3.337008476257324, -1.3920955657958984, 0.5528182983398438, 2.4977316856384277, 4.442645072937012, 6.387558460235596, 8.33247184753418, 10.277385711669922, 12.222298622131348, 14.167211532592773, 16.112125396728516, 18.057039260864258, 20.001953125, 21.94686508178711, 23.89177894592285, 25.836692810058594, 27.781604766845703, 29.726518630981445, 31.671432495117188, 33.6163444519043, 35.56126022338867, 37.50617218017578, 39.451087951660156, 41.395999908447266, 43.340911865234375, 45.28582763671875, 47.23073959350586, 49.17565155029297, 51.120567321777344, 53.06547927856445, 55.01039123535156, 56.95530700683594, 58.90021896362305, 60.845130920410156, 62.79004669189453]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 5.0, 11.0, 15.0, 22.0, 50.0, 84.0, 124.0, 208.0, 362.0, 670.0, 1198.0, 2736.0, 7762.0, 35614.0, 600523.0, 3348691.0, 168782.0, 18194.0, 4893.0, 1992.0, 1023.0, 485.0, 293.0, 174.0, 118.0, 79.0, 38.0, 23.0, 23.0, 24.0, 17.0, 13.0, 11.0, 8.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.734375, -12.28466796875, -11.8349609375, -11.38525390625, -10.935546875, -10.48583984375, -10.0361328125, -9.58642578125, -9.13671875, -8.68701171875, -8.2373046875, -7.78759765625, -7.337890625, -6.88818359375, -6.4384765625, -5.98876953125, -5.5390625, -5.08935546875, -4.6396484375, -4.18994140625, -3.740234375, -3.29052734375, -2.8408203125, -2.39111328125, -1.94140625, -1.49169921875, -1.0419921875, -0.59228515625, -0.142578125, 0.30712890625, 0.7568359375, 1.20654296875, 1.65625, 2.10595703125, 2.5556640625, 3.00537109375, 3.455078125, 3.90478515625, 4.3544921875, 4.80419921875, 5.25390625, 5.70361328125, 6.1533203125, 6.60302734375, 7.052734375, 7.50244140625, 7.9521484375, 8.40185546875, 8.8515625, 9.30126953125, 9.7509765625, 10.20068359375, 10.650390625, 11.10009765625, 11.5498046875, 11.99951171875, 12.44921875, 12.89892578125, 13.3486328125, 13.79833984375, 14.248046875, 14.69775390625, 15.1474609375, 15.59716796875, 16.046875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 10.0, 7.0, 13.0, 11.0, 23.0, 27.0, 24.0, 39.0, 43.0, 59.0, 54.0, 63.0, 59.0, 70.0, 62.0, 56.0, 54.0, 56.0, 41.0, 47.0, 38.0, 28.0, 31.0, 22.0, 10.0, 8.0, 11.0, 10.0, 4.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.2734375, -6.09466552734375, -5.9158935546875, -5.73712158203125, -5.558349609375, -5.37957763671875, -5.2008056640625, -5.02203369140625, -4.84326171875, -4.66448974609375, -4.4857177734375, -4.30694580078125, -4.128173828125, -3.94940185546875, -3.7706298828125, -3.59185791015625, -3.4130859375, -3.23431396484375, -3.0555419921875, -2.87677001953125, -2.697998046875, -2.51922607421875, -2.3404541015625, -2.16168212890625, -1.98291015625, -1.80413818359375, -1.6253662109375, -1.44659423828125, -1.267822265625, -1.08905029296875, -0.9102783203125, -0.73150634765625, -0.552734375, -0.37396240234375, -0.1951904296875, -0.01641845703125, 0.162353515625, 0.34112548828125, 0.5198974609375, 0.69866943359375, 0.87744140625, 1.05621337890625, 1.2349853515625, 1.41375732421875, 1.592529296875, 1.77130126953125, 1.9500732421875, 2.12884521484375, 2.3076171875, 2.48638916015625, 2.6651611328125, 2.84393310546875, 3.022705078125, 3.20147705078125, 3.3802490234375, 3.55902099609375, 3.73779296875, 3.91656494140625, 4.0953369140625, 4.27410888671875, 4.452880859375, 4.63165283203125, 4.8104248046875, 4.98919677734375, 5.16796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 6.0, 8.0, 9.0, 10.0, 14.0, 19.0, 33.0, 63.0, 143.0, 298.0, 728.0, 2452.0, 9777.0, 80224.0, 3671474.0, 400551.0, 22085.0, 4310.0, 1259.0, 411.0, 164.0, 81.0, 55.0, 31.0, 18.0, 15.0, 7.0, 7.0, 9.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-21.15625, -20.56396484375, -19.9716796875, -19.37939453125, -18.787109375, -18.19482421875, -17.6025390625, -17.01025390625, -16.41796875, -15.82568359375, -15.2333984375, -14.64111328125, -14.048828125, -13.45654296875, -12.8642578125, -12.27197265625, -11.6796875, -11.08740234375, -10.4951171875, -9.90283203125, -9.310546875, -8.71826171875, -8.1259765625, -7.53369140625, -6.94140625, -6.34912109375, -5.7568359375, -5.16455078125, -4.572265625, -3.97998046875, -3.3876953125, -2.79541015625, -2.203125, -1.61083984375, -1.0185546875, -0.42626953125, 0.166015625, 0.75830078125, 1.3505859375, 1.94287109375, 2.53515625, 3.12744140625, 3.7197265625, 4.31201171875, 4.904296875, 5.49658203125, 6.0888671875, 6.68115234375, 7.2734375, 7.86572265625, 8.4580078125, 9.05029296875, 9.642578125, 10.23486328125, 10.8271484375, 11.41943359375, 12.01171875, 12.60400390625, 13.1962890625, 13.78857421875, 14.380859375, 14.97314453125, 15.5654296875, 16.15771484375, 16.75]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 11.0, 4.0, 11.0, 8.0, 12.0, 21.0, 27.0, 33.0, 39.0, 68.0, 123.0, 176.0, 320.0, 590.0, 769.0, 694.0, 426.0, 271.0, 148.0, 105.0, 52.0, 36.0, 31.0, 27.0, 13.0, 12.0, 18.0, 4.0, 5.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.5625, -13.1832275390625, -12.803955078125, -12.4246826171875, -12.04541015625, -11.6661376953125, -11.286865234375, -10.9075927734375, -10.5283203125, -10.1490478515625, -9.769775390625, -9.3905029296875, -9.01123046875, -8.6319580078125, -8.252685546875, -7.8734130859375, -7.494140625, -7.1148681640625, -6.735595703125, -6.3563232421875, -5.97705078125, -5.5977783203125, -5.218505859375, -4.8392333984375, -4.4599609375, -4.0806884765625, -3.701416015625, -3.3221435546875, -2.94287109375, -2.5635986328125, -2.184326171875, -1.8050537109375, -1.42578125, -1.0465087890625, -0.667236328125, -0.2879638671875, 0.09130859375, 0.4705810546875, 0.849853515625, 1.2291259765625, 1.6083984375, 1.9876708984375, 2.366943359375, 2.7462158203125, 3.12548828125, 3.5047607421875, 3.884033203125, 4.2633056640625, 4.642578125, 5.0218505859375, 5.401123046875, 5.7803955078125, 6.15966796875, 6.5389404296875, 6.918212890625, 7.2974853515625, 7.6767578125, 8.0560302734375, 8.435302734375, 8.8145751953125, 9.19384765625, 9.5731201171875, 9.952392578125, 10.3316650390625, 10.7109375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 5.0, 3.0, 3.0, 11.0, 21.0, 25.0, 54.0, 108.0, 188.0, 185.0, 153.0, 114.0, 59.0, 28.0, 12.0, 9.0, 8.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-162.49269104003906, -158.9102325439453, -155.32777404785156, -151.7453155517578, -148.16285705566406, -144.5803985595703, -140.99794006347656, -137.41546630859375, -133.8330078125, -130.25054931640625, -126.6680908203125, -123.08563232421875, -119.503173828125, -115.92071533203125, -112.33824920654297, -108.75579071044922, -105.17333984375, -101.59088134765625, -98.0084228515625, -94.42596435546875, -90.843505859375, -87.26104736328125, -83.67858123779297, -80.09612274169922, -76.51366424560547, -72.93120574951172, -69.34874725341797, -65.76628875732422, -62.1838264465332, -58.60136795043945, -55.01890563964844, -51.43644714355469, -47.85398864746094, -44.27153015136719, -40.68907165527344, -37.10660934448242, -33.52415084838867, -29.941692352294922, -26.35923194885254, -22.776771545410156, -19.194313049316406, -15.61185359954834, -12.029394149780273, -8.446934700012207, -4.864475250244141, -1.2820167541503906, 2.300443649291992, 5.882904052734375, 9.465362548828125, 13.047821998596191, 16.630281448364258, 20.21274185180664, 23.79520034790039, 27.37765884399414, 30.960119247436523, 34.542579650878906, 38.125038146972656, 41.707496643066406, 45.289955139160156, 48.87241744995117, 52.45487594604492, 56.03733444213867, 59.61979675292969, 63.20225524902344, 66.78471374511719]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 8.0, 5.0, 2.0, 9.0, 15.0, 16.0, 18.0, 19.0, 30.0, 20.0, 26.0, 36.0, 34.0, 32.0, 46.0, 46.0, 55.0, 43.0, 47.0, 51.0, 53.0, 42.0, 53.0, 37.0, 35.0, 25.0, 37.0, 28.0, 27.0, 16.0, 19.0, 13.0, 11.0, 8.0, 4.0, 9.0, 6.0, 1.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.50724792480469, -40.9830436706543, -39.45883560180664, -37.93463134765625, -36.41042709350586, -34.88622283935547, -33.36201477050781, -31.837810516357422, -30.31360626220703, -28.789400100708008, -27.265195846557617, -25.740989685058594, -24.216785430908203, -22.69257926940918, -21.168373107910156, -19.644168853759766, -18.119962692260742, -16.59575653076172, -15.071552276611328, -13.547346115112305, -12.023141860961914, -10.49893569946289, -8.974730491638184, -7.450525283813477, -5.9263200759887695, -4.4021148681640625, -2.8779094219207764, -1.3537039756774902, 0.1705012321472168, 1.6947064399719238, 3.218912124633789, 4.743117332458496, 6.267322540283203, 7.79152774810791, 9.315732955932617, 10.83993911743164, 12.364143371582031, 13.888349533081055, 15.412554740905762, 16.93675994873047, 18.46096420288086, 19.985170364379883, 21.509374618530273, 23.033580780029297, 24.557785034179688, 26.08199119567871, 27.606197357177734, 29.130401611328125, 30.65460777282715, 32.17881393432617, 33.70301818847656, 35.22722244262695, 36.75143051147461, 38.275634765625, 39.79983901977539, 41.32404327392578, 42.84825134277344, 44.37245559692383, 45.896663665771484, 47.420867919921875, 48.945072174072266, 50.469276428222656, 51.99348449707031, 53.5176887512207, 55.041893005371094]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 8.0, 10.0, 12.0, 18.0, 19.0, 30.0, 49.0, 57.0, 103.0, 156.0, 258.0, 397.0, 675.0, 1186.0, 2244.0, 4478.0, 9580.0, 22281.0, 60420.0, 201298.0, 463594.0, 185680.0, 56575.0, 21180.0, 8872.0, 4326.0, 2072.0, 1187.0, 691.0, 388.0, 239.0, 133.0, 90.0, 75.0, 48.0, 47.0, 18.0, 15.0, 17.0, 7.0, 11.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.568603515625, -8.27783203125, -7.987060546875, -7.6962890625, -7.405517578125, -7.11474609375, -6.823974609375, -6.533203125, -6.242431640625, -5.95166015625, -5.660888671875, -5.3701171875, -5.079345703125, -4.78857421875, -4.497802734375, -4.20703125, -3.916259765625, -3.62548828125, -3.334716796875, -3.0439453125, -2.753173828125, -2.46240234375, -2.171630859375, -1.880859375, -1.590087890625, -1.29931640625, -1.008544921875, -0.7177734375, -0.427001953125, -0.13623046875, 0.154541015625, 0.4453125, 0.736083984375, 1.02685546875, 1.317626953125, 1.6083984375, 1.899169921875, 2.18994140625, 2.480712890625, 2.771484375, 3.062255859375, 3.35302734375, 3.643798828125, 3.9345703125, 4.225341796875, 4.51611328125, 4.806884765625, 5.09765625, 5.388427734375, 5.67919921875, 5.969970703125, 6.2607421875, 6.551513671875, 6.84228515625, 7.133056640625, 7.423828125, 7.714599609375, 8.00537109375, 8.296142578125, 8.5869140625, 8.877685546875, 9.16845703125, 9.459228515625, 9.75]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 2.0, 6.0, 9.0, 11.0, 12.0, 17.0, 18.0, 22.0, 27.0, 33.0, 39.0, 48.0, 47.0, 44.0, 76.0, 45.0, 65.0, 41.0, 52.0, 49.0, 49.0, 46.0, 46.0, 48.0, 27.0, 24.0, 23.0, 16.0, 12.0, 8.0, 7.0, 10.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.22265625, -6.043701171875, -5.86474609375, -5.685791015625, -5.5068359375, -5.327880859375, -5.14892578125, -4.969970703125, -4.791015625, -4.612060546875, -4.43310546875, -4.254150390625, -4.0751953125, -3.896240234375, -3.71728515625, -3.538330078125, -3.359375, -3.180419921875, -3.00146484375, -2.822509765625, -2.6435546875, -2.464599609375, -2.28564453125, -2.106689453125, -1.927734375, -1.748779296875, -1.56982421875, -1.390869140625, -1.2119140625, -1.032958984375, -0.85400390625, -0.675048828125, -0.49609375, -0.317138671875, -0.13818359375, 0.040771484375, 0.2197265625, 0.398681640625, 0.57763671875, 0.756591796875, 0.935546875, 1.114501953125, 1.29345703125, 1.472412109375, 1.6513671875, 1.830322265625, 2.00927734375, 2.188232421875, 2.3671875, 2.546142578125, 2.72509765625, 2.904052734375, 3.0830078125, 3.261962890625, 3.44091796875, 3.619873046875, 3.798828125, 3.977783203125, 4.15673828125, 4.335693359375, 4.5146484375, 4.693603515625, 4.87255859375, 5.051513671875, 5.23046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 8.0, 8.0, 7.0, 10.0, 14.0, 27.0, 25.0, 34.0, 42.0, 65.0, 80.0, 110.0, 129.0, 195.0, 263.0, 407.0, 651.0, 1065.0, 2149.0, 5484.0, 21913.0, 158752.0, 770156.0, 66381.0, 12310.0, 3817.0, 1571.0, 989.0, 542.0, 353.0, 278.0, 185.0, 139.0, 88.0, 80.0, 76.0, 37.0, 25.0, 20.0, 17.0, 8.0, 12.0, 6.0, 7.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-15.4375, -14.9739990234375, -14.510498046875, -14.0469970703125, -13.58349609375, -13.1199951171875, -12.656494140625, -12.1929931640625, -11.7294921875, -11.2659912109375, -10.802490234375, -10.3389892578125, -9.87548828125, -9.4119873046875, -8.948486328125, -8.4849853515625, -8.021484375, -7.5579833984375, -7.094482421875, -6.6309814453125, -6.16748046875, -5.7039794921875, -5.240478515625, -4.7769775390625, -4.3134765625, -3.8499755859375, -3.386474609375, -2.9229736328125, -2.45947265625, -1.9959716796875, -1.532470703125, -1.0689697265625, -0.60546875, -0.1419677734375, 0.321533203125, 0.7850341796875, 1.24853515625, 1.7120361328125, 2.175537109375, 2.6390380859375, 3.1025390625, 3.5660400390625, 4.029541015625, 4.4930419921875, 4.95654296875, 5.4200439453125, 5.883544921875, 6.3470458984375, 6.810546875, 7.2740478515625, 7.737548828125, 8.2010498046875, 8.66455078125, 9.1280517578125, 9.591552734375, 10.0550537109375, 10.5185546875, 10.9820556640625, 11.445556640625, 11.9090576171875, 12.37255859375, 12.8360595703125, 13.299560546875, 13.7630615234375, 14.2265625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 9.0, 7.0, 8.0, 7.0, 12.0, 10.0, 20.0, 18.0, 30.0, 29.0, 26.0, 29.0, 45.0, 50.0, 58.0, 57.0, 56.0, 43.0, 54.0, 54.0, 43.0, 37.0, 46.0, 41.0, 37.0, 33.0, 17.0, 21.0, 21.0, 17.0, 11.0, 10.0, 10.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.125, -19.51708984375, -18.9091796875, -18.30126953125, -17.693359375, -17.08544921875, -16.4775390625, -15.86962890625, -15.26171875, -14.65380859375, -14.0458984375, -13.43798828125, -12.830078125, -12.22216796875, -11.6142578125, -11.00634765625, -10.3984375, -9.79052734375, -9.1826171875, -8.57470703125, -7.966796875, -7.35888671875, -6.7509765625, -6.14306640625, -5.53515625, -4.92724609375, -4.3193359375, -3.71142578125, -3.103515625, -2.49560546875, -1.8876953125, -1.27978515625, -0.671875, -0.06396484375, 0.5439453125, 1.15185546875, 1.759765625, 2.36767578125, 2.9755859375, 3.58349609375, 4.19140625, 4.79931640625, 5.4072265625, 6.01513671875, 6.623046875, 7.23095703125, 7.8388671875, 8.44677734375, 9.0546875, 9.66259765625, 10.2705078125, 10.87841796875, 11.486328125, 12.09423828125, 12.7021484375, 13.31005859375, 13.91796875, 14.52587890625, 15.1337890625, 15.74169921875, 16.349609375, 16.95751953125, 17.5654296875, 18.17333984375, 18.78125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 8.0, 2.0, 6.0, 2.0, 12.0, 13.0, 10.0, 18.0, 23.0, 20.0, 40.0, 38.0, 54.0, 80.0, 133.0, 205.0, 288.0, 514.0, 993.0, 2042.0, 4626.0, 12177.0, 46938.0, 652184.0, 272051.0, 37385.0, 10591.0, 4096.0, 1808.0, 876.0, 495.0, 272.0, 164.0, 98.0, 87.0, 45.0, 29.0, 29.0, 25.0, 16.0, 18.0, 9.0, 8.0, 10.0, 8.0, 3.0, 0.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.94140625, -3.81396484375, -3.6865234375, -3.55908203125, -3.431640625, -3.30419921875, -3.1767578125, -3.04931640625, -2.921875, -2.79443359375, -2.6669921875, -2.53955078125, -2.412109375, -2.28466796875, -2.1572265625, -2.02978515625, -1.90234375, -1.77490234375, -1.6474609375, -1.52001953125, -1.392578125, -1.26513671875, -1.1376953125, -1.01025390625, -0.8828125, -0.75537109375, -0.6279296875, -0.50048828125, -0.373046875, -0.24560546875, -0.1181640625, 0.00927734375, 0.13671875, 0.26416015625, 0.3916015625, 0.51904296875, 0.646484375, 0.77392578125, 0.9013671875, 1.02880859375, 1.15625, 1.28369140625, 1.4111328125, 1.53857421875, 1.666015625, 1.79345703125, 1.9208984375, 2.04833984375, 2.17578125, 2.30322265625, 2.4306640625, 2.55810546875, 2.685546875, 2.81298828125, 2.9404296875, 3.06787109375, 3.1953125, 3.32275390625, 3.4501953125, 3.57763671875, 3.705078125, 3.83251953125, 3.9599609375, 4.08740234375, 4.21484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 7.0, 8.0, 7.0, 12.0, 17.0, 15.0, 14.0, 21.0, 40.0, 48.0, 88.0, 140.0, 147.0, 125.0, 83.0, 60.0, 44.0, 28.0, 14.0, 22.0, 9.0, 6.0, 6.0, 9.0, 2.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0011501312255859375, -0.0011111795902252197, -0.001072227954864502, -0.0010332763195037842, -0.0009943246841430664, -0.0009553730487823486, -0.0009164214134216309, -0.0008774697780609131, -0.0008385181427001953, -0.0007995665073394775, -0.0007606148719787598, -0.000721663236618042, -0.0006827116012573242, -0.0006437599658966064, -0.0006048083305358887, -0.0005658566951751709, -0.0005269050598144531, -0.00048795342445373535, -0.0004490017890930176, -0.0004100501537322998, -0.00037109851837158203, -0.00033214688301086426, -0.0002931952476501465, -0.0002542436122894287, -0.00021529197692871094, -0.00017634034156799316, -0.0001373887062072754, -9.843707084655762e-05, -5.9485435485839844e-05, -2.053380012512207e-05, 1.8417835235595703e-05, 5.7369470596313477e-05, 9.632110595703125e-05, 0.00013527274131774902, 0.0001742243766784668, 0.00021317601203918457, 0.00025212764739990234, 0.0002910792827606201, 0.0003300309181213379, 0.00036898255348205566, 0.00040793418884277344, 0.0004468858242034912, 0.000485837459564209, 0.0005247890949249268, 0.0005637407302856445, 0.0006026923656463623, 0.0006416440010070801, 0.0006805956363677979, 0.0007195472717285156, 0.0007584989070892334, 0.0007974505424499512, 0.0008364021778106689, 0.0008753538131713867, 0.0009143054485321045, 0.0009532570838928223, 0.00099220871925354, 0.0010311603546142578, 0.0010701119899749756, 0.0011090636253356934, 0.0011480152606964111, 0.001186966896057129, 0.0012259185314178467, 0.0012648701667785645, 0.0013038218021392822, 0.0013427734375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 2.0, 5.0, 11.0, 19.0, 13.0, 37.0, 53.0, 76.0, 96.0, 124.0, 184.0, 317.0, 481.0, 813.0, 1594.0, 3040.0, 6600.0, 17065.0, 55590.0, 261469.0, 596098.0, 69322.0, 20279.0, 7650.0, 3404.0, 1693.0, 889.0, 569.0, 352.0, 205.0, 146.0, 93.0, 77.0, 46.0, 31.0, 24.0, 23.0, 14.0, 16.0, 8.0, 7.0, 3.0, 5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.859375, -2.764312744140625, -2.66925048828125, -2.574188232421875, -2.4791259765625, -2.384063720703125, -2.28900146484375, -2.193939208984375, -2.098876953125, -2.003814697265625, -1.90875244140625, -1.813690185546875, -1.7186279296875, -1.623565673828125, -1.52850341796875, -1.433441162109375, -1.33837890625, -1.243316650390625, -1.14825439453125, -1.053192138671875, -0.9581298828125, -0.863067626953125, -0.76800537109375, -0.672943115234375, -0.577880859375, -0.482818603515625, -0.38775634765625, -0.292694091796875, -0.1976318359375, -0.102569580078125, -0.00750732421875, 0.087554931640625, 0.1826171875, 0.277679443359375, 0.37274169921875, 0.467803955078125, 0.5628662109375, 0.657928466796875, 0.75299072265625, 0.848052978515625, 0.943115234375, 1.038177490234375, 1.13323974609375, 1.228302001953125, 1.3233642578125, 1.418426513671875, 1.51348876953125, 1.608551025390625, 1.70361328125, 1.798675537109375, 1.89373779296875, 1.988800048828125, 2.0838623046875, 2.178924560546875, 2.27398681640625, 2.369049072265625, 2.464111328125, 2.559173583984375, 2.65423583984375, 2.749298095703125, 2.8443603515625, 2.939422607421875, 3.03448486328125, 3.129547119140625, 3.224609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 1.0, 8.0, 6.0, 15.0, 14.0, 19.0, 23.0, 22.0, 38.0, 32.0, 43.0, 37.0, 68.0, 62.0, 73.0, 87.0, 81.0, 64.0, 63.0, 44.0, 40.0, 35.0, 23.0, 19.0, 15.0, 21.0, 15.0, 6.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.501953125, -2.394866943359375, -2.28778076171875, -2.180694580078125, -2.0736083984375, -1.966522216796875, -1.85943603515625, -1.752349853515625, -1.645263671875, -1.538177490234375, -1.43109130859375, -1.324005126953125, -1.2169189453125, -1.109832763671875, -1.00274658203125, -0.895660400390625, -0.78857421875, -0.681488037109375, -0.57440185546875, -0.467315673828125, -0.3602294921875, -0.253143310546875, -0.14605712890625, -0.038970947265625, 0.068115234375, 0.175201416015625, 0.28228759765625, 0.389373779296875, 0.4964599609375, 0.603546142578125, 0.71063232421875, 0.817718505859375, 0.9248046875, 1.031890869140625, 1.13897705078125, 1.246063232421875, 1.3531494140625, 1.460235595703125, 1.56732177734375, 1.674407958984375, 1.781494140625, 1.888580322265625, 1.99566650390625, 2.102752685546875, 2.2098388671875, 2.316925048828125, 2.42401123046875, 2.531097412109375, 2.63818359375, 2.745269775390625, 2.85235595703125, 2.959442138671875, 3.0665283203125, 3.173614501953125, 3.28070068359375, 3.387786865234375, 3.494873046875, 3.601959228515625, 3.70904541015625, 3.816131591796875, 3.9232177734375, 4.030303955078125, 4.13739013671875, 4.244476318359375, 4.3515625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 9.0, 19.0, 39.0, 115.0, 374.0, 242.0, 106.0, 48.0, 16.0, 13.0, 11.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-174.19482421875, -169.34356689453125, -164.49232482910156, -159.64108276367188, -154.78982543945312, -149.93856811523438, -145.0873260498047, -140.236083984375, -135.38482666015625, -130.5335693359375, -125.68232727050781, -120.8310775756836, -115.97982788085938, -111.12857818603516, -106.27732849121094, -101.42607879638672, -96.5748291015625, -91.72357940673828, -86.87232971191406, -82.02108001708984, -77.16983032226562, -72.3185806274414, -67.46733093261719, -62.61608123779297, -57.76483154296875, -52.91358184814453, -48.06233215332031, -43.211082458496094, -38.359832763671875, -33.508583068847656, -28.657333374023438, -23.80608367919922, -18.954849243164062, -14.103599548339844, -9.252349853515625, -4.401100158691406, 0.4501495361328125, 5.301399230957031, 10.15264892578125, 15.003898620605469, 19.855148315429688, 24.706398010253906, 29.557647705078125, 34.408897399902344, 39.26014709472656, 44.11139678955078, 48.962646484375, 53.81389617919922, 58.66514587402344, 63.516395568847656, 68.36764526367188, 73.2188949584961, 78.07014465332031, 82.92139434814453, 87.77264404296875, 92.62389373779297, 97.47514343261719, 102.3263931274414, 107.17764282226562, 112.02889251708984, 116.88014221191406, 121.73139190673828, 126.5826416015625, 131.43389892578125, 136.28514099121094]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 5.0, 7.0, 10.0, 13.0, 10.0, 11.0, 18.0, 24.0, 23.0, 27.0, 27.0, 34.0, 38.0, 37.0, 70.0, 156.0, 139.0, 47.0, 44.0, 35.0, 26.0, 24.0, 32.0, 27.0, 27.0, 21.0, 14.0, 6.0, 14.0, 8.0, 6.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.88471221923828, -79.38744354248047, -76.89017486572266, -74.39290618896484, -71.89564514160156, -69.39837646484375, -66.90110778808594, -64.40383911132812, -61.90657043457031, -59.4093017578125, -56.91203308105469, -54.41476821899414, -51.91749954223633, -49.420230865478516, -46.92296600341797, -44.425697326660156, -41.928428649902344, -39.43115997314453, -36.93389129638672, -34.43662643432617, -31.93935775756836, -29.442089080810547, -26.944822311401367, -24.447555541992188, -21.950286865234375, -19.453018188476562, -16.955751419067383, -14.458483695983887, -11.96121597290039, -9.463948249816895, -6.966680526733398, -4.469413757324219, -1.972137451171875, 0.5251302719116211, 3.022397994995117, 5.519665718078613, 8.01693344116211, 10.514201164245605, 13.011468887329102, 15.508735656738281, 18.006004333496094, 20.503273010253906, 23.000539779663086, 25.497806549072266, 27.995075225830078, 30.49234390258789, 32.98960876464844, 35.48687744140625, 37.98414611816406, 40.481414794921875, 42.97868347167969, 45.475948333740234, 47.97321701049805, 50.47048568725586, 52.967750549316406, 55.46501922607422, 57.96228790283203, 60.459556579589844, 62.956825256347656, 65.45409393310547, 67.95135498046875, 70.44862365722656, 72.94589233398438, 75.44316101074219, 77.9404296875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 2.0, 6.0, 12.0, 22.0, 36.0, 59.0, 87.0, 131.0, 217.0, 358.0, 561.0, 937.0, 1709.0, 3067.0, 6135.0, 14528.0, 48351.0, 346586.0, 2567203.0, 1059102.0, 103798.0, 23294.0, 8557.0, 4072.0, 2155.0, 1238.0, 724.0, 424.0, 272.0, 169.0, 139.0, 67.0, 74.0, 49.0, 31.0, 15.0, 26.0, 18.0, 17.0, 9.0, 4.0, 4.0, 5.0, 9.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.1953125, -11.7984619140625, -11.401611328125, -11.0047607421875, -10.60791015625, -10.2110595703125, -9.814208984375, -9.4173583984375, -9.0205078125, -8.6236572265625, -8.226806640625, -7.8299560546875, -7.43310546875, -7.0362548828125, -6.639404296875, -6.2425537109375, -5.845703125, -5.4488525390625, -5.052001953125, -4.6551513671875, -4.25830078125, -3.8614501953125, -3.464599609375, -3.0677490234375, -2.6708984375, -2.2740478515625, -1.877197265625, -1.4803466796875, -1.08349609375, -0.6866455078125, -0.289794921875, 0.1070556640625, 0.50390625, 0.9007568359375, 1.297607421875, 1.6944580078125, 2.09130859375, 2.4881591796875, 2.885009765625, 3.2818603515625, 3.6787109375, 4.0755615234375, 4.472412109375, 4.8692626953125, 5.26611328125, 5.6629638671875, 6.059814453125, 6.4566650390625, 6.853515625, 7.2503662109375, 7.647216796875, 8.0440673828125, 8.44091796875, 8.8377685546875, 9.234619140625, 9.6314697265625, 10.0283203125, 10.4251708984375, 10.822021484375, 11.2188720703125, 11.61572265625, 12.0125732421875, 12.409423828125, 12.8062744140625, 13.203125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 14.0, 10.0, 8.0, 9.0, 24.0, 25.0, 24.0, 45.0, 52.0, 51.0, 48.0, 49.0, 58.0, 62.0, 49.0, 59.0, 57.0, 71.0, 33.0, 40.0, 37.0, 49.0, 27.0, 17.0, 24.0, 16.0, 10.0, 3.0, 6.0, 5.0, 5.0, 6.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.34765625, -6.16845703125, -5.9892578125, -5.81005859375, -5.630859375, -5.45166015625, -5.2724609375, -5.09326171875, -4.9140625, -4.73486328125, -4.5556640625, -4.37646484375, -4.197265625, -4.01806640625, -3.8388671875, -3.65966796875, -3.48046875, -3.30126953125, -3.1220703125, -2.94287109375, -2.763671875, -2.58447265625, -2.4052734375, -2.22607421875, -2.046875, -1.86767578125, -1.6884765625, -1.50927734375, -1.330078125, -1.15087890625, -0.9716796875, -0.79248046875, -0.61328125, -0.43408203125, -0.2548828125, -0.07568359375, 0.103515625, 0.28271484375, 0.4619140625, 0.64111328125, 0.8203125, 0.99951171875, 1.1787109375, 1.35791015625, 1.537109375, 1.71630859375, 1.8955078125, 2.07470703125, 2.25390625, 2.43310546875, 2.6123046875, 2.79150390625, 2.970703125, 3.14990234375, 3.3291015625, 3.50830078125, 3.6875, 3.86669921875, 4.0458984375, 4.22509765625, 4.404296875, 4.58349609375, 4.7626953125, 4.94189453125, 5.12109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 4.0, 1.0, 8.0, 14.0, 17.0, 29.0, 47.0, 50.0, 99.0, 122.0, 284.0, 556.0, 1438.0, 5365.0, 42697.0, 3845235.0, 280583.0, 13191.0, 2695.0, 911.0, 401.0, 198.0, 122.0, 79.0, 39.0, 31.0, 26.0, 17.0, 6.0, 10.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.96875, -31.82177734375, -30.6748046875, -29.52783203125, -28.380859375, -27.23388671875, -26.0869140625, -24.93994140625, -23.79296875, -22.64599609375, -21.4990234375, -20.35205078125, -19.205078125, -18.05810546875, -16.9111328125, -15.76416015625, -14.6171875, -13.47021484375, -12.3232421875, -11.17626953125, -10.029296875, -8.88232421875, -7.7353515625, -6.58837890625, -5.44140625, -4.29443359375, -3.1474609375, -2.00048828125, -0.853515625, 0.29345703125, 1.4404296875, 2.58740234375, 3.734375, 4.88134765625, 6.0283203125, 7.17529296875, 8.322265625, 9.46923828125, 10.6162109375, 11.76318359375, 12.91015625, 14.05712890625, 15.2041015625, 16.35107421875, 17.498046875, 18.64501953125, 19.7919921875, 20.93896484375, 22.0859375, 23.23291015625, 24.3798828125, 25.52685546875, 26.673828125, 27.82080078125, 28.9677734375, 30.11474609375, 31.26171875, 32.40869140625, 33.5556640625, 34.70263671875, 35.849609375, 36.99658203125, 38.1435546875, 39.29052734375, 40.4375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 9.0, 11.0, 12.0, 19.0, 25.0, 26.0, 47.0, 71.0, 113.0, 164.0, 293.0, 423.0, 702.0, 776.0, 505.0, 302.0, 176.0, 114.0, 82.0, 65.0, 40.0, 21.0, 22.0, 17.0, 7.0, 11.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.359375, -23.662109375, -22.96484375, -22.267578125, -21.5703125, -20.873046875, -20.17578125, -19.478515625, -18.78125, -18.083984375, -17.38671875, -16.689453125, -15.9921875, -15.294921875, -14.59765625, -13.900390625, -13.203125, -12.505859375, -11.80859375, -11.111328125, -10.4140625, -9.716796875, -9.01953125, -8.322265625, -7.625, -6.927734375, -6.23046875, -5.533203125, -4.8359375, -4.138671875, -3.44140625, -2.744140625, -2.046875, -1.349609375, -0.65234375, 0.044921875, 0.7421875, 1.439453125, 2.13671875, 2.833984375, 3.53125, 4.228515625, 4.92578125, 5.623046875, 6.3203125, 7.017578125, 7.71484375, 8.412109375, 9.109375, 9.806640625, 10.50390625, 11.201171875, 11.8984375, 12.595703125, 13.29296875, 13.990234375, 14.6875, 15.384765625, 16.08203125, 16.779296875, 17.4765625, 18.173828125, 18.87109375, 19.568359375, 20.265625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 14.0, 13.0, 36.0, 68.0, 161.0, 323.0, 206.0, 89.0, 40.0, 20.0, 8.0, 6.0, 9.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.24046325683594, -161.1050262451172, -149.9696044921875, -138.83416748046875, -127.69873046875, -116.56330108642578, -105.42787170410156, -94.29243469238281, -83.1570053100586, -72.02157592773438, -60.886138916015625, -49.750709533691406, -38.61527633666992, -27.479843139648438, -16.34441375732422, -5.208976745605469, 5.92645263671875, 17.061885833740234, 28.197317123413086, 39.33274841308594, 50.46818161010742, 61.603614807128906, 72.73904418945312, 83.87448120117188, 95.0099105834961, 106.14533996582031, 117.28077697753906, 128.41619873046875, 139.5516357421875, 150.68707275390625, 161.822509765625, 172.95794677734375, 184.09335327148438, 195.22879028320312, 206.3642120361328, 217.49964904785156, 228.6350860595703, 239.7705078125, 250.90594482421875, 262.0413818359375, 273.17681884765625, 284.312255859375, 295.44769287109375, 306.5831298828125, 317.7185363769531, 328.8539733886719, 339.9894104003906, 351.1248474121094, 362.26025390625, 373.39569091796875, 384.5311279296875, 395.66656494140625, 406.8019714355469, 417.9374084472656, 429.0728454589844, 440.2082824707031, 451.3437194824219, 462.4791564941406, 473.6145935058594, 484.75, 495.88543701171875, 507.0208740234375, 518.1563110351562, 529.291748046875, 540.4271850585938]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 5.0, 4.0, 5.0, 6.0, 3.0, 8.0, 10.0, 12.0, 16.0, 24.0, 21.0, 23.0, 25.0, 29.0, 27.0, 36.0, 43.0, 45.0, 49.0, 57.0, 64.0, 61.0, 54.0, 43.0, 60.0, 44.0, 31.0, 26.0, 24.0, 25.0, 17.0, 22.0, 12.0, 18.0, 18.0, 6.0, 4.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.39584350585938, -107.88689422607422, -104.37794494628906, -100.8689956665039, -97.36004638671875, -93.8510971069336, -90.34214782714844, -86.83319854736328, -83.32424926757812, -79.81529998779297, -76.30635070800781, -72.79740142822266, -69.2884521484375, -65.77950286865234, -62.27055358886719, -58.76160430908203, -55.252655029296875, -51.74370574951172, -48.23475646972656, -44.725807189941406, -41.21685791015625, -37.707908630371094, -34.19895935058594, -30.69001007080078, -27.181060791015625, -23.67211151123047, -20.163162231445312, -16.654212951660156, -13.145263671875, -9.636314392089844, -6.1273651123046875, -2.6184158325195312, 0.8905410766601562, 4.3994903564453125, 7.908439636230469, 11.417388916015625, 14.926338195800781, 18.435287475585938, 21.944236755371094, 25.45318603515625, 28.962135314941406, 32.47108459472656, 35.98003387451172, 39.488983154296875, 42.99793243408203, 46.50688171386719, 50.015830993652344, 53.5247802734375, 57.033729553222656, 60.54267883300781, 64.05162811279297, 67.56057739257812, 71.06952667236328, 74.57847595214844, 78.0874252319336, 81.59637451171875, 85.1053237915039, 88.61427307128906, 92.12322235107422, 95.63217163085938, 99.14112091064453, 102.65007019042969, 106.15901947021484, 109.66796875, 113.17691802978516]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 5.0, 3.0, 4.0, 5.0, 18.0, 22.0, 23.0, 42.0, 71.0, 90.0, 159.0, 251.0, 457.0, 905.0, 1928.0, 4635.0, 12690.0, 45957.0, 361189.0, 540462.0, 55601.0, 14594.0, 5067.0, 2127.0, 993.0, 503.0, 292.0, 170.0, 96.0, 62.0, 46.0, 29.0, 12.0, 12.0, 10.0, 3.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5390625, -10.1763916015625, -9.813720703125, -9.4510498046875, -9.08837890625, -8.7257080078125, -8.363037109375, -8.0003662109375, -7.6376953125, -7.2750244140625, -6.912353515625, -6.5496826171875, -6.18701171875, -5.8243408203125, -5.461669921875, -5.0989990234375, -4.736328125, -4.3736572265625, -4.010986328125, -3.6483154296875, -3.28564453125, -2.9229736328125, -2.560302734375, -2.1976318359375, -1.8349609375, -1.4722900390625, -1.109619140625, -0.7469482421875, -0.38427734375, -0.0216064453125, 0.341064453125, 0.7037353515625, 1.06640625, 1.4290771484375, 1.791748046875, 2.1544189453125, 2.51708984375, 2.8797607421875, 3.242431640625, 3.6051025390625, 3.9677734375, 4.3304443359375, 4.693115234375, 5.0557861328125, 5.41845703125, 5.7811279296875, 6.143798828125, 6.5064697265625, 6.869140625, 7.2318115234375, 7.594482421875, 7.9571533203125, 8.31982421875, 8.6824951171875, 9.045166015625, 9.4078369140625, 9.7705078125, 10.1331787109375, 10.495849609375, 10.8585205078125, 11.22119140625, 11.5838623046875, 11.946533203125, 12.3092041015625, 12.671875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 4.0, 7.0, 6.0, 11.0, 10.0, 18.0, 17.0, 20.0, 35.0, 39.0, 35.0, 50.0, 46.0, 42.0, 61.0, 49.0, 71.0, 55.0, 46.0, 56.0, 53.0, 61.0, 36.0, 33.0, 27.0, 17.0, 21.0, 16.0, 12.0, 9.0, 7.0, 5.0, 8.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53515625, -6.30535888671875, -6.0755615234375, -5.84576416015625, -5.615966796875, -5.38616943359375, -5.1563720703125, -4.92657470703125, -4.69677734375, -4.46697998046875, -4.2371826171875, -4.00738525390625, -3.777587890625, -3.54779052734375, -3.3179931640625, -3.08819580078125, -2.8583984375, -2.62860107421875, -2.3988037109375, -2.16900634765625, -1.939208984375, -1.70941162109375, -1.4796142578125, -1.24981689453125, -1.02001953125, -0.79022216796875, -0.5604248046875, -0.33062744140625, -0.100830078125, 0.12896728515625, 0.3587646484375, 0.58856201171875, 0.818359375, 1.04815673828125, 1.2779541015625, 1.50775146484375, 1.737548828125, 1.96734619140625, 2.1971435546875, 2.42694091796875, 2.65673828125, 2.88653564453125, 3.1163330078125, 3.34613037109375, 3.575927734375, 3.80572509765625, 4.0355224609375, 4.26531982421875, 4.4951171875, 4.72491455078125, 4.9547119140625, 5.18450927734375, 5.414306640625, 5.64410400390625, 5.8739013671875, 6.10369873046875, 6.33349609375, 6.56329345703125, 6.7930908203125, 7.02288818359375, 7.252685546875, 7.48248291015625, 7.7122802734375, 7.94207763671875, 8.171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 3.0, 8.0, 8.0, 11.0, 16.0, 19.0, 25.0, 32.0, 62.0, 71.0, 96.0, 142.0, 219.0, 402.0, 668.0, 1364.0, 3681.0, 15499.0, 170925.0, 823036.0, 23927.0, 4798.0, 1589.0, 764.0, 402.0, 246.0, 138.0, 109.0, 78.0, 55.0, 36.0, 31.0, 26.0, 14.0, 15.0, 8.0, 9.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.6015625, -14.197265625, -13.79296875, -13.388671875, -12.984375, -12.580078125, -12.17578125, -11.771484375, -11.3671875, -10.962890625, -10.55859375, -10.154296875, -9.75, -9.345703125, -8.94140625, -8.537109375, -8.1328125, -7.728515625, -7.32421875, -6.919921875, -6.515625, -6.111328125, -5.70703125, -5.302734375, -4.8984375, -4.494140625, -4.08984375, -3.685546875, -3.28125, -2.876953125, -2.47265625, -2.068359375, -1.6640625, -1.259765625, -0.85546875, -0.451171875, -0.046875, 0.357421875, 0.76171875, 1.166015625, 1.5703125, 1.974609375, 2.37890625, 2.783203125, 3.1875, 3.591796875, 3.99609375, 4.400390625, 4.8046875, 5.208984375, 5.61328125, 6.017578125, 6.421875, 6.826171875, 7.23046875, 7.634765625, 8.0390625, 8.443359375, 8.84765625, 9.251953125, 9.65625, 10.060546875, 10.46484375, 10.869140625, 11.2734375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 14.0, 10.0, 6.0, 10.0, 17.0, 14.0, 24.0, 17.0, 26.0, 30.0, 33.0, 44.0, 60.0, 70.0, 70.0, 84.0, 95.0, 50.0, 57.0, 35.0, 38.0, 39.0, 29.0, 23.0, 11.0, 14.0, 17.0, 12.0, 7.0, 10.0, 7.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.90625, -27.119384765625, -26.33251953125, -25.545654296875, -24.7587890625, -23.971923828125, -23.18505859375, -22.398193359375, -21.611328125, -20.824462890625, -20.03759765625, -19.250732421875, -18.4638671875, -17.677001953125, -16.89013671875, -16.103271484375, -15.31640625, -14.529541015625, -13.74267578125, -12.955810546875, -12.1689453125, -11.382080078125, -10.59521484375, -9.808349609375, -9.021484375, -8.234619140625, -7.44775390625, -6.660888671875, -5.8740234375, -5.087158203125, -4.30029296875, -3.513427734375, -2.7265625, -1.939697265625, -1.15283203125, -0.365966796875, 0.4208984375, 1.207763671875, 1.99462890625, 2.781494140625, 3.568359375, 4.355224609375, 5.14208984375, 5.928955078125, 6.7158203125, 7.502685546875, 8.28955078125, 9.076416015625, 9.86328125, 10.650146484375, 11.43701171875, 12.223876953125, 13.0107421875, 13.797607421875, 14.58447265625, 15.371337890625, 16.158203125, 16.945068359375, 17.73193359375, 18.518798828125, 19.3056640625, 20.092529296875, 20.87939453125, 21.666259765625, 22.453125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 10.0, 18.0, 16.0, 28.0, 22.0, 39.0, 67.0, 66.0, 116.0, 234.0, 415.0, 806.0, 2121.0, 5810.0, 25944.0, 749342.0, 232497.0, 22131.0, 5288.0, 1799.0, 803.0, 354.0, 204.0, 120.0, 90.0, 51.0, 42.0, 28.0, 20.0, 13.0, 17.0, 9.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.451171875, -2.38104248046875, -2.3109130859375, -2.24078369140625, -2.170654296875, -2.10052490234375, -2.0303955078125, -1.96026611328125, -1.89013671875, -1.82000732421875, -1.7498779296875, -1.67974853515625, -1.609619140625, -1.53948974609375, -1.4693603515625, -1.39923095703125, -1.3291015625, -1.25897216796875, -1.1888427734375, -1.11871337890625, -1.048583984375, -0.97845458984375, -0.9083251953125, -0.83819580078125, -0.76806640625, -0.69793701171875, -0.6278076171875, -0.55767822265625, -0.487548828125, -0.41741943359375, -0.3472900390625, -0.27716064453125, -0.20703125, -0.13690185546875, -0.0667724609375, 0.00335693359375, 0.073486328125, 0.14361572265625, 0.2137451171875, 0.28387451171875, 0.35400390625, 0.42413330078125, 0.4942626953125, 0.56439208984375, 0.634521484375, 0.70465087890625, 0.7747802734375, 0.84490966796875, 0.9150390625, 0.98516845703125, 1.0552978515625, 1.12542724609375, 1.195556640625, 1.26568603515625, 1.3358154296875, 1.40594482421875, 1.47607421875, 1.54620361328125, 1.6163330078125, 1.68646240234375, 1.756591796875, 1.82672119140625, 1.8968505859375, 1.96697998046875, 2.037109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 8.0, 13.0, 10.0, 15.0, 32.0, 44.0, 47.0, 61.0, 82.0, 117.0, 120.0, 123.0, 82.0, 65.0, 33.0, 29.0, 29.0, 14.0, 16.0, 11.0, 7.0, 13.0, 4.0, 1.0, 9.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004901885986328125, -0.0004759691655635834, -0.00046174973249435425, -0.0004475302994251251, -0.000433310866355896, -0.00041909143328666687, -0.00040487200021743774, -0.0003906525671482086, -0.0003764331340789795, -0.00036221370100975037, -0.00034799426794052124, -0.0003337748348712921, -0.000319555401802063, -0.00030533596873283386, -0.00029111653566360474, -0.0002768971025943756, -0.0002626776695251465, -0.00024845823645591736, -0.00023423880338668823, -0.0002200193703174591, -0.00020579993724822998, -0.00019158050417900085, -0.00017736107110977173, -0.0001631416380405426, -0.00014892220497131348, -0.00013470277190208435, -0.00012048333883285522, -0.0001062639057636261, -9.204447269439697e-05, -7.782503962516785e-05, -6.360560655593872e-05, -4.9386173486709595e-05, -3.516674041748047e-05, -2.0947307348251343e-05, -6.727874279022217e-06, 7.491558790206909e-06, 2.1710991859436035e-05, 3.593042492866516e-05, 5.014985799789429e-05, 6.436929106712341e-05, 7.858872413635254e-05, 9.280815720558167e-05, 0.00010702759027481079, 0.00012124702334403992, 0.00013546645641326904, 0.00014968588948249817, 0.0001639053225517273, 0.00017812475562095642, 0.00019234418869018555, 0.00020656362175941467, 0.0002207830548286438, 0.00023500248789787292, 0.00024922192096710205, 0.0002634413540363312, 0.0002776607871055603, 0.00029188022017478943, 0.00030609965324401855, 0.0003203190863132477, 0.0003345385193824768, 0.00034875795245170593, 0.00036297738552093506, 0.0003771968185901642, 0.0003914162516593933, 0.00040563568472862244, 0.00041985511779785156]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 9.0, 11.0, 17.0, 34.0, 43.0, 63.0, 140.0, 254.0, 566.0, 1220.0, 3501.0, 11962.0, 70989.0, 885370.0, 58344.0, 10558.0, 3063.0, 1229.0, 541.0, 285.0, 136.0, 73.0, 50.0, 26.0, 27.0, 14.0, 8.0, 5.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.450775146484375, -2.37030029296875, -2.289825439453125, -2.2093505859375, -2.128875732421875, -2.04840087890625, -1.967926025390625, -1.887451171875, -1.806976318359375, -1.72650146484375, -1.646026611328125, -1.5655517578125, -1.485076904296875, -1.40460205078125, -1.324127197265625, -1.24365234375, -1.163177490234375, -1.08270263671875, -1.002227783203125, -0.9217529296875, -0.841278076171875, -0.76080322265625, -0.680328369140625, -0.599853515625, -0.519378662109375, -0.43890380859375, -0.358428955078125, -0.2779541015625, -0.197479248046875, -0.11700439453125, -0.036529541015625, 0.0439453125, 0.124420166015625, 0.20489501953125, 0.285369873046875, 0.3658447265625, 0.446319580078125, 0.52679443359375, 0.607269287109375, 0.687744140625, 0.768218994140625, 0.84869384765625, 0.929168701171875, 1.0096435546875, 1.090118408203125, 1.17059326171875, 1.251068115234375, 1.33154296875, 1.412017822265625, 1.49249267578125, 1.572967529296875, 1.6534423828125, 1.733917236328125, 1.81439208984375, 1.894866943359375, 1.975341796875, 2.055816650390625, 2.13629150390625, 2.216766357421875, 2.2972412109375, 2.377716064453125, 2.45819091796875, 2.538665771484375, 2.619140625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 4.0, 4.0, 5.0, 5.0, 7.0, 11.0, 15.0, 29.0, 30.0, 26.0, 29.0, 50.0, 58.0, 58.0, 103.0, 103.0, 93.0, 68.0, 59.0, 50.0, 25.0, 26.0, 18.0, 27.0, 12.0, 17.0, 6.0, 17.0, 8.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.73046875, -1.6731719970703125, -1.615875244140625, -1.5585784912109375, -1.50128173828125, -1.4439849853515625, -1.386688232421875, -1.3293914794921875, -1.2720947265625, -1.2147979736328125, -1.157501220703125, -1.1002044677734375, -1.04290771484375, -0.9856109619140625, -0.928314208984375, -0.8710174560546875, -0.813720703125, -0.7564239501953125, -0.699127197265625, -0.6418304443359375, -0.58453369140625, -0.5272369384765625, -0.469940185546875, -0.4126434326171875, -0.3553466796875, -0.2980499267578125, -0.240753173828125, -0.1834564208984375, -0.12615966796875, -0.0688629150390625, -0.011566162109375, 0.0457305908203125, 0.10302734375, 0.1603240966796875, 0.217620849609375, 0.2749176025390625, 0.33221435546875, 0.3895111083984375, 0.446807861328125, 0.5041046142578125, 0.5614013671875, 0.6186981201171875, 0.675994873046875, 0.7332916259765625, 0.79058837890625, 0.8478851318359375, 0.905181884765625, 0.9624786376953125, 1.019775390625, 1.0770721435546875, 1.134368896484375, 1.1916656494140625, 1.24896240234375, 1.3062591552734375, 1.363555908203125, 1.4208526611328125, 1.4781494140625, 1.5354461669921875, 1.592742919921875, 1.6500396728515625, 1.70733642578125, 1.7646331787109375, 1.821929931640625, 1.8792266845703125, 1.9365234375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 21.0, 39.0, 115.0, 593.0, 150.0, 45.0, 18.0, 13.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.4081573486328, -153.24716186523438, -148.08615112304688, -142.92515563964844, -137.76414489746094, -132.6031494140625, -127.44214630126953, -122.28114318847656, -117.1201400756836, -111.95913696289062, -106.79813385009766, -101.63713073730469, -96.47613525390625, -91.31512451171875, -86.15412902832031, -80.99312591552734, -75.83212280273438, -70.6711196899414, -65.51011657714844, -60.349117279052734, -55.188114166259766, -50.0271110534668, -44.866111755371094, -39.705108642578125, -34.544105529785156, -29.383102416992188, -24.22210121154785, -19.061100006103516, -13.900096893310547, -8.739093780517578, -3.578092575073242, 1.5829086303710938, 6.743927001953125, 11.904929161071777, 17.06593132019043, 22.226932525634766, 27.387935638427734, 32.5489387512207, 37.709938049316406, 42.870941162109375, 48.031944274902344, 53.19294738769531, 58.35395050048828, 63.514949798583984, 68.67594909667969, 73.83695983886719, 78.99795532226562, 84.1589584350586, 89.31996154785156, 94.48096466064453, 99.6419677734375, 104.80297088623047, 109.96397399902344, 115.12496948242188, 120.28597259521484, 125.44697570800781, 130.60797119140625, 135.7689666748047, 140.9299774169922, 146.09097290039062, 151.25198364257812, 156.41297912597656, 161.57398986816406, 166.7349853515625, 171.89599609375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 4.0, 5.0, 6.0, 3.0, 6.0, 3.0, 11.0, 9.0, 9.0, 12.0, 14.0, 14.0, 16.0, 18.0, 24.0, 19.0, 23.0, 23.0, 24.0, 70.0, 223.0, 177.0, 74.0, 26.0, 16.0, 18.0, 23.0, 15.0, 11.0, 12.0, 13.0, 18.0, 10.0, 8.0, 2.0, 8.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.091651916503906, -54.33134460449219, -52.57103729248047, -50.81072998046875, -49.0504264831543, -47.29011917114258, -45.52981185913086, -43.76950454711914, -42.00920104980469, -40.24889373779297, -38.48858642578125, -36.72827911376953, -34.96797561645508, -33.20766830444336, -31.44736099243164, -29.687053680419922, -27.926746368408203, -26.166439056396484, -24.4061336517334, -22.64582633972168, -20.885520935058594, -19.125213623046875, -17.364906311035156, -15.604599952697754, -13.844293594360352, -12.08398723602295, -10.323680877685547, -8.563373565673828, -6.803067207336426, -5.042760848999023, -3.2824535369873047, -1.5221471786499023, 0.23816299438476562, 1.998469591140747, 3.7587761878967285, 5.519083023071289, 7.279389381408691, 9.039695739746094, 10.800003051757812, 12.560309410095215, 14.320615768432617, 16.080923080444336, 17.841228485107422, 19.60153579711914, 21.36184310913086, 23.122148513793945, 24.882455825805664, 26.64276123046875, 28.40306854248047, 30.163375854492188, 31.923681259155273, 33.683990478515625, 35.44429397583008, 37.2046012878418, 38.964908599853516, 40.725215911865234, 42.48551940917969, 44.245826721191406, 46.006134033203125, 47.766441345214844, 49.5267448425293, 51.287052154541016, 53.047359466552734, 54.80766677856445, 56.56797409057617]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 10.0, 5.0, 7.0, 11.0, 7.0, 16.0, 17.0, 17.0, 14.0, 15.0, 23.0, 40.0, 24.0, 33.0, 49.0, 114.0, 239.0, 65.0, 36.0, 35.0, 23.0, 27.0, 21.0, 18.0, 17.0, 27.0, 10.0, 12.0, 9.0, 12.0, 13.0, 4.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-6.33984375, -6.16998291015625, -6.0001220703125, -5.83026123046875, -5.660400390625, -5.49053955078125, -5.3206787109375, -5.15081787109375, -4.98095703125, -4.81109619140625, -4.6412353515625, -4.47137451171875, -4.301513671875, -4.13165283203125, -3.9617919921875, -3.79193115234375, -3.6220703125, -3.45220947265625, -3.2823486328125, -3.11248779296875, -2.942626953125, -2.77276611328125, -2.6029052734375, -2.43304443359375, -2.26318359375, -2.09332275390625, -1.9234619140625, -1.75360107421875, -1.583740234375, -1.41387939453125, -1.2440185546875, -1.07415771484375, -0.904296875, -0.73443603515625, -0.5645751953125, -0.39471435546875, -0.224853515625, -0.05499267578125, 0.1148681640625, 0.28472900390625, 0.45458984375, 0.62445068359375, 0.7943115234375, 0.96417236328125, 1.134033203125, 1.30389404296875, 1.4737548828125, 1.64361572265625, 1.8134765625, 1.98333740234375, 2.1531982421875, 2.32305908203125, 2.492919921875, 2.66278076171875, 2.8326416015625, 3.00250244140625, 3.17236328125, 3.34222412109375, 3.5120849609375, 3.68194580078125, 3.851806640625, 4.02166748046875, 4.1915283203125, 4.36138916015625, 4.53125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 12.0, 5.0, 8.0, 11.0, 7.0, 13.0, 16.0, 24.0, 28.0, 54.0, 88.0, 180.0, 330.0, 858.0, 2339.0, 9095.0, 8297883.0, 69186.0, 5443.0, 1649.0, 632.0, 306.0, 164.0, 106.0, 43.0, 30.0, 23.0, 16.0, 10.0, 7.0, 8.0, 2.0, 1.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.49687194824219, -64.64118194580078, -62.78549575805664, -60.9298095703125, -59.074119567871094, -57.21843338012695, -55.36274719238281, -53.507057189941406, -51.651371002197266, -49.795684814453125, -47.93999481201172, -46.08430862426758, -44.22862243652344, -42.37293243408203, -40.51724624633789, -38.66156005859375, -36.805870056152344, -34.9501838684082, -33.0944938659668, -31.238807678222656, -29.383119583129883, -27.52743148803711, -25.67174530029297, -23.816057205200195, -21.960369110107422, -20.10468101501465, -18.248992919921875, -16.393306732177734, -14.537618637084961, -12.681930541992188, -10.82624340057373, -8.970556259155273, -7.114871978759766, -5.25918436050415, -3.403496742248535, -1.54780912399292, 0.3078784942626953, 2.1635665893554688, 4.019253730773926, 5.874940872192383, 7.730628967285156, 9.58631706237793, 11.442004203796387, 13.297691345214844, 15.153379440307617, 17.00906753540039, 18.86475372314453, 20.720441818237305, 22.576129913330078, 24.43181800842285, 26.287506103515625, 28.143192291259766, 29.99888038635254, 31.854568481445312, 33.71025466918945, 35.565940856933594, 37.421630859375, 39.27731704711914, 41.13300704956055, 42.98869323730469, 44.844383239746094, 46.700069427490234, 48.555755615234375, 50.41144561767578, 52.26713180541992]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 10.0, 4.0, 4.0, 2.0, 7.0, 5.0, 7.0, 6.0, 11.0, 6.0, 8.0, 1.0, 4.0, 4.0, 7.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-102.57066345214844, -99.26937866210938, -95.96809387207031, -92.66680908203125, -89.36552429199219, -86.06423950195312, -82.7629623413086, -79.46167755126953, -76.16039276123047, -72.8591079711914, -69.55782318115234, -66.25653839111328, -62.955257415771484, -59.65397262573242, -56.352691650390625, -53.05140686035156, -49.7501220703125, -46.44883728027344, -43.147552490234375, -39.84627151489258, -36.544986724853516, -33.24370193481445, -29.942419052124023, -26.641136169433594, -23.33985137939453, -20.03856658935547, -16.73728370666504, -13.435999870300293, -10.134716033935547, -6.833431243896484, -3.5321483612060547, -0.230865478515625, 3.0704269409179688, 6.371710777282715, 9.672994613647461, 12.974278450012207, 16.275562286376953, 19.576847076416016, 22.878129959106445, 26.179412841796875, 29.480697631835938, 32.781982421875, 36.08326721191406, 39.38454818725586, 42.68583297729492, 45.987117767333984, 49.28839874267578, 52.589683532714844, 55.890968322753906, 59.19225311279297, 62.49353790283203, 65.7948226928711, 69.09609985351562, 72.39738464355469, 75.69866943359375, 78.99995422363281, 82.30123901367188, 85.60252380371094, 88.90380859375, 92.20509338378906, 95.50637817382812, 98.80766296386719, 102.10894012451172, 105.41022491455078, 108.71150970458984]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 11.0, 17.0, 7.0, 19.0, 34.0, 37.0, 79.0, 80.0, 148.0, 259.0, 425.0, 853.0, 1751.0, 4147.0, 11559.0, 38185.0, 139262.0, 221160.0, 73601.0, 20658.0, 6718.0, 2612.0, 1176.0, 572.0, 319.0, 204.0, 120.0, 79.0, 53.0, 32.0, 22.0, 16.0, 16.0, 5.0, 6.0, 4.0, 10.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.65625, -55.86865234375, -54.0810546875, -52.29345703125, -50.505859375, -48.71826171875, -46.9306640625, -45.14306640625, -43.35546875, -41.56787109375, -39.7802734375, -37.99267578125, -36.205078125, -34.41748046875, -32.6298828125, -30.84228515625, -29.0546875, -27.26708984375, -25.4794921875, -23.69189453125, -21.904296875, -20.11669921875, -18.3291015625, -16.54150390625, -14.75390625, -12.96630859375, -11.1787109375, -9.39111328125, -7.603515625, -5.81591796875, -4.0283203125, -2.24072265625, -0.453125, 1.33447265625, 3.1220703125, 4.90966796875, 6.697265625, 8.48486328125, 10.2724609375, 12.06005859375, 13.84765625, 15.63525390625, 17.4228515625, 19.21044921875, 20.998046875, 22.78564453125, 24.5732421875, 26.36083984375, 28.1484375, 29.93603515625, 31.7236328125, 33.51123046875, 35.298828125, 37.08642578125, 38.8740234375, 40.66162109375, 42.44921875, 44.23681640625, 46.0244140625, 47.81201171875, 49.599609375, 51.38720703125, 53.1748046875, 54.96240234375, 56.75]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 5.0, 7.0, 6.0, 8.0, 11.0, 18.0, 11.0, 15.0, 16.0, 23.0, 39.0, 50.0, 40.0, 55.0, 70.0, 60.0, 64.0, 61.0, 70.0, 69.0, 56.0, 42.0, 37.0, 32.0, 29.0, 24.0, 13.0, 14.0, 18.0, 11.0, 6.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4765625, -6.2684326171875, -6.060302734375, -5.8521728515625, -5.64404296875, -5.4359130859375, -5.227783203125, -5.0196533203125, -4.8115234375, -4.6033935546875, -4.395263671875, -4.1871337890625, -3.97900390625, -3.7708740234375, -3.562744140625, -3.3546142578125, -3.146484375, -2.9383544921875, -2.730224609375, -2.5220947265625, -2.31396484375, -2.1058349609375, -1.897705078125, -1.6895751953125, -1.4814453125, -1.2733154296875, -1.065185546875, -0.8570556640625, -0.64892578125, -0.4407958984375, -0.232666015625, -0.0245361328125, 0.18359375, 0.3917236328125, 0.599853515625, 0.8079833984375, 1.01611328125, 1.2242431640625, 1.432373046875, 1.6405029296875, 1.8486328125, 2.0567626953125, 2.264892578125, 2.4730224609375, 2.68115234375, 2.8892822265625, 3.097412109375, 3.3055419921875, 3.513671875, 3.7218017578125, 3.929931640625, 4.1380615234375, 4.34619140625, 4.5543212890625, 4.762451171875, 4.9705810546875, 5.1787109375, 5.3868408203125, 5.594970703125, 5.8031005859375, 6.01123046875, 6.2193603515625, 6.427490234375, 6.6356201171875, 6.84375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 4.0, 26.0, 47.0, 95.0, 120.0, 60.0, 41.0, 14.0, 19.0, 6.0, 7.0, 9.0, 6.0, 5.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.663326263427734, -37.947410583496094, -36.23149108886719, -34.51557540893555, -32.79965591430664, -31.083740234375, -29.367822647094727, -27.651905059814453, -25.93598747253418, -24.220069885253906, -22.504152297973633, -20.78823471069336, -19.07231903076172, -17.356399536132812, -15.640483856201172, -13.924566268920898, -12.208648681640625, -10.492731094360352, -8.776813507080078, -7.060896873474121, -5.344979286193848, -3.629061698913574, -1.9131450653076172, -0.19722747802734375, 1.5186901092529297, 3.234607458114624, 4.950524806976318, 6.666441917419434, 8.382359504699707, 10.09827709197998, 11.814193725585938, 13.530111312866211, 15.24603271484375, 16.961950302124023, 18.677867889404297, 20.393783569335938, 22.109703063964844, 23.825618743896484, 25.541536331176758, 27.25745391845703, 28.973371505737305, 30.689289093017578, 32.40520477294922, 34.121124267578125, 35.837039947509766, 37.55295944213867, 39.26887512207031, 40.98479461669922, 42.70071029663086, 44.4166259765625, 46.132545471191406, 47.84846115112305, 49.56438064575195, 51.280296325683594, 52.9962158203125, 54.71213150024414, 56.42804718017578, 58.14396286010742, 59.85988235473633, 61.57579803466797, 63.291717529296875, 65.00763702392578, 66.72354888916016, 68.43946838378906, 70.15538787841797]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 2.0, 11.0, 2.0, 5.0, 17.0, 41.0, 84.0, 117.0, 79.0, 36.0, 18.0, 11.0, 9.0, 9.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.75114440917969, -46.61176681518555, -45.47239303588867, -44.33301544189453, -43.193641662597656, -42.054264068603516, -40.914886474609375, -39.7755126953125, -38.63613510131836, -37.49675750732422, -36.357383728027344, -35.2180061340332, -34.07863235473633, -32.93925476074219, -31.79987907409668, -30.660503387451172, -29.521127700805664, -28.381752014160156, -27.24237632751465, -26.10300064086914, -24.963623046875, -23.824247360229492, -22.684871673583984, -21.545495986938477, -20.40612030029297, -19.26674461364746, -18.127368927001953, -16.987991333007812, -15.848615646362305, -14.709239959716797, -13.569864273071289, -12.430488586425781, -11.291112899780273, -10.151737213134766, -9.012360572814941, -7.872984886169434, -6.733608722686768, -5.594232559204102, -4.454856872558594, -3.3154807090759277, -2.1761045455932617, -1.0367285013198853, 0.10264754295349121, 1.2420234680175781, 2.381399631500244, 3.52077579498291, 4.660151481628418, 5.799527645111084, 6.93890380859375, 8.078279495239258, 9.217656135559082, 10.35703182220459, 11.496408462524414, 12.635784149169922, 13.77515983581543, 14.914535522460938, 16.053913116455078, 17.193288803100586, 18.332664489746094, 19.472042083740234, 20.611417770385742, 21.75079345703125, 22.890169143676758, 24.029544830322266, 25.168920516967773]}, "eval/loss": 5.751396656036377, "eval/wer": 1.2104093497628827, "eval/runtime": 447.2057, "eval/samples_per_second": 5.908, "eval/steps_per_second": 0.371} \ No newline at end of file