{
  "best_metric": 2.132894992828369,
  "best_model_checkpoint": "/tmp/wandb/run-20240211_061007-slcnkgcr/files/train_output/checkpoint-10000",
  "epoch": 2.042133333333333,
  "eval_steps": 500,
  "global_step": 10000,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "MSE": 891.9713033040365,
      "MSE/layer0": 891.9713033040365,
      "dead_code_fraction": 0.1506,
      "dead_code_fraction/layer0": 0.1506,
      "epoch": 0.0,
      "input_norm": 31.997233708699547,
      "input_norm/layer0": 31.997233708699547,
      "learning_rate": 0.0005,
      "loss": 8.0845,
      "max_norm": 34.580135345458984,
      "max_norm/layer0": 34.580135345458984,
      "mean_norm": 31.989344596862793,
      "mean_norm/layer0": 31.989344596862793,
      "multicode_k": 1,
      "output_norm": 8.584638833999634,
      "output_norm/layer0": 8.584638833999634,
      "step": 1
    },
    {
      "MSE": 883.0105907414232,
      "MSE/layer0": 883.0105907414232,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.01,
      "input_norm": 31.99778711876902,
      "input_norm/layer0": 31.99778711876902,
      "learning_rate": 0.0005,
      "loss": 4.8444,
      "max_norm": 34.610191345214844,
      "max_norm/layer0": 34.610191345214844,
      "mean_norm": 32.02294731140137,
      "mean_norm/layer0": 32.02294731140137,
      "multicode_k": 1,
      "output_norm": 8.645599765842462,
      "output_norm/layer0": 8.645599765842462,
      "step": 50
    },
    {
      "MSE": 872.9267329915364,
      "MSE/layer0": 872.9267329915364,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.01,
      "input_norm": 31.998572165171304,
      "input_norm/layer0": 31.998572165171304,
      "learning_rate": 0.0005,
      "loss": 3.9294,
      "max_norm": 34.62763595581055,
      "max_norm/layer0": 34.62763595581055,
      "mean_norm": 32.06278419494629,
      "mean_norm/layer0": 32.06278419494629,
      "multicode_k": 1,
      "output_norm": 8.74148860613505,
      "output_norm/layer0": 8.74148860613505,
      "step": 100
    },
    {
      "MSE": 866.7590488688152,
      "MSE/layer0": 866.7590488688152,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.01,
      "input_norm": 31.99865425427754,
      "input_norm/layer0": 31.99865425427754,
      "learning_rate": 0.0005,
      "loss": 3.5413,
      "max_norm": 34.65019607543945,
      "max_norm/layer0": 34.65019607543945,
      "mean_norm": 32.1027717590332,
      "mean_norm/layer0": 32.1027717590332,
      "multicode_k": 1,
      "output_norm": 8.811674615542097,
      "output_norm/layer0": 8.811674615542097,
      "step": 150
    },
    {
      "MSE": 858.8314244588221,
      "MSE/layer0": 858.8314244588221,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.02,
      "input_norm": 31.998634125391646,
      "input_norm/layer0": 31.998634125391646,
      "learning_rate": 0.0005,
      "loss": 3.3381,
      "max_norm": 34.73014831542969,
      "max_norm/layer0": 34.73014831542969,
      "mean_norm": 32.17362403869629,
      "mean_norm/layer0": 32.17362403869629,
      "multicode_k": 1,
      "output_norm": 8.925555121103923,
      "output_norm/layer0": 8.925555121103923,
      "step": 200
    },
    {
      "MSE": 849.6408699544276,
      "MSE/layer0": 849.6408699544276,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.03,
      "input_norm": 31.9986141427358,
      "input_norm/layer0": 31.9986141427358,
      "learning_rate": 0.0005,
      "loss": 3.2486,
      "max_norm": 34.8281364440918,
      "max_norm/layer0": 34.8281364440918,
      "mean_norm": 32.26718330383301,
      "mean_norm/layer0": 32.26718330383301,
      "multicode_k": 1,
      "output_norm": 9.101092262268068,
      "output_norm/layer0": 9.101092262268068,
      "step": 250
    },
    {
      "MSE": 841.0051658121741,
      "MSE/layer0": 841.0051658121741,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.03,
      "input_norm": 31.99862952232361,
      "input_norm/layer0": 31.99862952232361,
      "learning_rate": 0.0005,
      "loss": 3.1503,
      "max_norm": 34.946006774902344,
      "max_norm/layer0": 34.946006774902344,
      "mean_norm": 32.361915588378906,
      "mean_norm/layer0": 32.361915588378906,
      "multicode_k": 1,
      "output_norm": 9.305952178637185,
      "output_norm/layer0": 9.305952178637185,
      "step": 300
    },
    {
      "MSE": 833.1103855387371,
      "MSE/layer0": 833.1103855387371,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.04,
      "input_norm": 31.998617506027223,
      "input_norm/layer0": 31.998617506027223,
      "learning_rate": 0.0005,
      "loss": 3.0966,
      "max_norm": 35.09696578979492,
      "max_norm/layer0": 35.09696578979492,
      "mean_norm": 32.463951110839844,
      "mean_norm/layer0": 32.463951110839844,
      "multicode_k": 1,
      "output_norm": 9.513547644615176,
      "output_norm/layer0": 9.513547644615176,
      "step": 350
    },
    {
      "MSE": 824.8635622151694,
      "MSE/layer0": 824.8635622151694,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.04,
      "input_norm": 31.998617092768363,
      "input_norm/layer0": 31.998617092768363,
      "learning_rate": 0.0005,
      "loss": 3.0998,
      "max_norm": 35.28767013549805,
      "max_norm/layer0": 35.28767013549805,
      "mean_norm": 32.571420669555664,
      "mean_norm/layer0": 32.571420669555664,
      "multicode_k": 1,
      "output_norm": 9.74717748324076,
      "output_norm/layer0": 9.74717748324076,
      "step": 400
    },
    {
      "MSE": 817.218793334961,
      "MSE/layer0": 817.218793334961,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.04,
      "input_norm": 31.99862334251403,
      "input_norm/layer0": 31.99862334251403,
      "learning_rate": 0.0005,
      "loss": 3.0603,
      "max_norm": 35.4771842956543,
      "max_norm/layer0": 35.4771842956543,
      "mean_norm": 32.68177795410156,
      "mean_norm/layer0": 32.68177795410156,
      "multicode_k": 1,
      "output_norm": 9.985308513641357,
      "output_norm/layer0": 9.985308513641357,
      "step": 450
    },
    {
      "MSE": 809.1558084106446,
      "MSE/layer0": 809.1558084106446,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.05,
      "input_norm": 31.998615137736,
      "input_norm/layer0": 31.998615137736,
      "learning_rate": 0.0005,
      "loss": 3.0494,
      "max_norm": 35.6486701965332,
      "max_norm/layer0": 35.6486701965332,
      "mean_norm": 32.793779373168945,
      "mean_norm/layer0": 32.793779373168945,
      "multicode_k": 1,
      "output_norm": 10.232081251144415,
      "output_norm/layer0": 10.232081251144415,
      "step": 500
    },
    {
      "epoch": 0.05,
      "eval_MSE/layer0": 805.1675846628777,
      "eval_accuracy": 0.41770872781318447,
      "eval_dead_code_fraction/layer0": 0.0,
      "eval_input_norm/layer0": 31.998606410347342,
      "eval_loss": 2.992654323577881,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 10.360000263063938,
      "eval_runtime": 159.8847,
      "eval_samples_per_second": 28.915,
      "eval_steps_per_second": 1.808,
      "step": 500
    },
    {
      "MSE": 801.7215725708003,
      "MSE/layer0": 801.7215725708003,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.06,
      "input_norm": 31.998598546981817,
      "input_norm/layer0": 31.998598546981817,
      "learning_rate": 0.0005,
      "loss": 2.9547,
      "max_norm": 35.86976623535156,
      "max_norm/layer0": 35.86976623535156,
      "mean_norm": 32.91193962097168,
      "mean_norm/layer0": 32.91193962097168,
      "multicode_k": 1,
      "output_norm": 10.47719025929769,
      "output_norm/layer0": 10.47719025929769,
      "step": 550
    },
    {
      "MSE": 794.043483174642,
      "MSE/layer0": 794.043483174642,
      "dead_code_fraction": 0.0,
      "dead_code_fraction/layer0": 0.0,
      "epoch": 0.06,
      "input_norm": 31.99859639167787,
      "input_norm/layer0": 31.99859639167787,
      "learning_rate": 0.0005,
      "loss": 2.9506,
      "max_norm": 36.08134078979492,
      "max_norm/layer0": 36.08134078979492,
      "mean_norm": 33.03110313415527,
      "mean_norm/layer0": 33.03110313415527,
      "multicode_k": 1,
      "output_norm": 10.729146582285566,
      "output_norm/layer0": 10.729146582285566,
      "step": 600
    },
    {
      "MSE": 786.3193520100913,
      "MSE/layer0": 786.3193520100913,
      "dead_code_fraction": 5e-05,
      "dead_code_fraction/layer0": 5e-05,
      "epoch": 0.07,
      "input_norm": 31.99857716878254,
      "input_norm/layer0": 31.99857716878254,
      "learning_rate": 0.0005,
      "loss": 2.8944,
      "max_norm": 36.33954620361328,
      "max_norm/layer0": 36.33954620361328,
      "mean_norm": 33.15106773376465,
      "mean_norm/layer0": 33.15106773376465,
      "multicode_k": 1,
      "output_norm": 10.987898168563845,
      "output_norm/layer0": 10.987898168563845,
      "step": 650
    },
    {
      "MSE": 780.0598099772137,
      "MSE/layer0": 780.0598099772137,
      "dead_code_fraction": 0.0001,
      "dead_code_fraction/layer0": 0.0001,
      "epoch": 0.07,
      "input_norm": 31.998565645217887,
      "input_norm/layer0": 31.998565645217887,
      "learning_rate": 0.0005,
      "loss": 2.8643,
      "max_norm": 36.55862808227539,
      "max_norm/layer0": 36.55862808227539,
      "mean_norm": 33.269744873046875,
      "mean_norm/layer0": 33.269744873046875,
      "multicode_k": 1,
      "output_norm": 11.218051005999246,
      "output_norm/layer0": 11.218051005999246,
      "step": 700
    },
    {
      "MSE": 772.4797055053714,
      "MSE/layer0": 772.4797055053714,
      "dead_code_fraction": 0.00045,
      "dead_code_fraction/layer0": 0.00045,
      "epoch": 0.07,
      "input_norm": 31.998559678395594,
      "input_norm/layer0": 31.998559678395594,
      "learning_rate": 0.0005,
      "loss": 2.8618,
      "max_norm": 36.793521881103516,
      "max_norm/layer0": 36.793521881103516,
      "mean_norm": 33.39421844482422,
      "mean_norm/layer0": 33.39421844482422,
      "multicode_k": 1,
      "output_norm": 11.470201053619387,
      "output_norm/layer0": 11.470201053619387,
      "step": 750
    },
    {
      "MSE": 766.037492879232,
      "MSE/layer0": 766.037492879232,
      "dead_code_fraction": 0.00055,
      "dead_code_fraction/layer0": 0.00055,
      "epoch": 0.08,
      "input_norm": 31.99854364713033,
      "input_norm/layer0": 31.99854364713033,
      "learning_rate": 0.0005,
      "loss": 2.8403,
      "max_norm": 37.0079231262207,
      "max_norm/layer0": 37.0079231262207,
      "mean_norm": 33.52132034301758,
      "mean_norm/layer0": 33.52132034301758,
      "multicode_k": 1,
      "output_norm": 11.711471532185875,
      "output_norm/layer0": 11.711471532185875,
      "step": 800
    },
    {
      "MSE": 759.9610600789387,
      "MSE/layer0": 759.9610600789387,
      "dead_code_fraction": 0.00135,
      "dead_code_fraction/layer0": 0.00135,
      "epoch": 0.09,
      "input_norm": 31.998529828389472,
      "input_norm/layer0": 31.998529828389472,
      "learning_rate": 0.0005,
      "loss": 2.7453,
      "max_norm": 37.20747375488281,
      "max_norm/layer0": 37.20747375488281,
      "mean_norm": 33.64577674865723,
      "mean_norm/layer0": 33.64577674865723,
      "multicode_k": 1,
      "output_norm": 11.93199801921844,
      "output_norm/layer0": 11.93199801921844,
      "step": 850
    },
    {
      "MSE": 753.5576912434896,
      "MSE/layer0": 753.5576912434896,
      "dead_code_fraction": 0.00205,
      "dead_code_fraction/layer0": 0.00205,
      "epoch": 0.09,
      "input_norm": 31.99852911949157,
      "input_norm/layer0": 31.99852911949157,
      "learning_rate": 0.0005,
      "loss": 2.7975,
      "max_norm": 37.432743072509766,
      "max_norm/layer0": 37.432743072509766,
      "mean_norm": 33.778066635131836,
      "mean_norm/layer0": 33.778066635131836,
      "multicode_k": 1,
      "output_norm": 12.165767738024394,
      "output_norm/layer0": 12.165767738024394,
      "step": 900
    },
    {
      "MSE": 747.6473927815753,
      "MSE/layer0": 747.6473927815753,
      "dead_code_fraction": 0.00335,
      "dead_code_fraction/layer0": 0.00335,
      "epoch": 0.1,
      "input_norm": 31.998517106374106,
      "input_norm/layer0": 31.998517106374106,
      "learning_rate": 0.0005,
      "loss": 2.7378,
      "max_norm": 37.62055969238281,
      "max_norm/layer0": 37.62055969238281,
      "mean_norm": 33.90963554382324,
      "mean_norm/layer0": 33.90963554382324,
      "multicode_k": 1,
      "output_norm": 12.390189347267153,
      "output_norm/layer0": 12.390189347267153,
      "step": 950
    },
    {
      "MSE": 742.6674826049805,
      "MSE/layer0": 742.6674826049805,
      "dead_code_fraction": 0.0048,
      "dead_code_fraction/layer0": 0.0048,
      "epoch": 0.1,
      "input_norm": 31.998499689102182,
      "input_norm/layer0": 31.998499689102182,
      "learning_rate": 0.0005,
      "loss": 2.6986,
      "max_norm": 37.880615234375,
      "max_norm/layer0": 37.880615234375,
      "mean_norm": 34.04428672790527,
      "mean_norm/layer0": 34.04428672790527,
      "multicode_k": 1,
      "output_norm": 12.59642965157827,
      "output_norm/layer0": 12.59642965157827,
      "step": 1000
    },
    {
      "epoch": 0.1,
      "eval_MSE/layer0": 739.3243520424373,
      "eval_accuracy": 0.44721058737930897,
      "eval_dead_code_fraction/layer0": 0.00845,
      "eval_input_norm/layer0": 31.998487053973697,
      "eval_loss": 2.707960367202759,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 12.71647696584792,
      "eval_runtime": 157.5908,
      "eval_samples_per_second": 29.335,
      "eval_steps_per_second": 1.834,
      "step": 1000
    },
    {
      "MSE": 736.2877898152667,
      "MSE/layer0": 736.2877898152667,
      "dead_code_fraction": 0.00735,
      "dead_code_fraction/layer0": 0.00735,
      "epoch": 0.1,
      "input_norm": 31.998484554290766,
      "input_norm/layer0": 31.998484554290766,
      "learning_rate": 0.0005,
      "loss": 2.7222,
      "max_norm": 38.21133804321289,
      "max_norm/layer0": 38.21133804321289,
      "mean_norm": 34.17984199523926,
      "mean_norm/layer0": 34.17984199523926,
      "multicode_k": 1,
      "output_norm": 12.82279133001963,
      "output_norm/layer0": 12.82279133001963,
      "step": 1050
    },
    {
      "MSE": 731.6754523722336,
      "MSE/layer0": 731.6754523722336,
      "dead_code_fraction": 0.01015,
      "dead_code_fraction/layer0": 0.01015,
      "epoch": 0.11,
      "input_norm": 31.998473711013787,
      "input_norm/layer0": 31.998473711013787,
      "learning_rate": 0.0005,
      "loss": 2.652,
      "max_norm": 38.533973693847656,
      "max_norm/layer0": 38.533973693847656,
      "mean_norm": 34.31424903869629,
      "mean_norm/layer0": 34.31424903869629,
      "multicode_k": 1,
      "output_norm": 13.017293116251633,
      "output_norm/layer0": 13.017293116251633,
      "step": 1100
    },
    {
      "MSE": 726.8081079101562,
      "MSE/layer0": 726.8081079101562,
      "dead_code_fraction": 0.013,
      "dead_code_fraction/layer0": 0.013,
      "epoch": 0.12,
      "input_norm": 31.99846080144247,
      "input_norm/layer0": 31.99846080144247,
      "learning_rate": 0.0005,
      "loss": 2.6519,
      "max_norm": 38.87154769897461,
      "max_norm/layer0": 38.87154769897461,
      "mean_norm": 34.454498291015625,
      "mean_norm/layer0": 34.454498291015625,
      "multicode_k": 1,
      "output_norm": 13.209378539721174,
      "output_norm/layer0": 13.209378539721174,
      "step": 1150
    },
    {
      "MSE": 722.3268162027996,
      "MSE/layer0": 722.3268162027996,
      "dead_code_fraction": 0.01565,
      "dead_code_fraction/layer0": 0.01565,
      "epoch": 0.12,
      "input_norm": 31.998446766535434,
      "input_norm/layer0": 31.998446766535434,
      "learning_rate": 0.0005,
      "loss": 2.6464,
      "max_norm": 39.23857879638672,
      "max_norm/layer0": 39.23857879638672,
      "mean_norm": 34.597312927246094,
      "mean_norm/layer0": 34.597312927246094,
      "multicode_k": 1,
      "output_norm": 13.40400979042053,
      "output_norm/layer0": 13.40400979042053,
      "step": 1200
    },
    {
      "MSE": 717.3231912231446,
      "MSE/layer0": 717.3231912231446,
      "dead_code_fraction": 0.0241,
      "dead_code_fraction/layer0": 0.0241,
      "epoch": 0.12,
      "input_norm": 31.998441489537555,
      "input_norm/layer0": 31.998441489537555,
      "learning_rate": 0.0005,
      "loss": 2.6563,
      "max_norm": 39.60569381713867,
      "max_norm/layer0": 39.60569381713867,
      "mean_norm": 34.73863220214844,
      "mean_norm/layer0": 34.73863220214844,
      "multicode_k": 1,
      "output_norm": 13.590513488451638,
      "output_norm/layer0": 13.590513488451638,
      "step": 1250
    },
    {
      "MSE": 713.6523872884117,
      "MSE/layer0": 713.6523872884117,
      "dead_code_fraction": 0.02485,
      "dead_code_fraction/layer0": 0.02485,
      "epoch": 0.13,
      "input_norm": 31.998419742584225,
      "input_norm/layer0": 31.998419742584225,
      "learning_rate": 0.0005,
      "loss": 2.5806,
      "max_norm": 39.939239501953125,
      "max_norm/layer0": 39.939239501953125,
      "mean_norm": 34.87986946105957,
      "mean_norm/layer0": 34.87986946105957,
      "multicode_k": 1,
      "output_norm": 13.766959317525227,
      "output_norm/layer0": 13.766959317525227,
      "step": 1300
    },
    {
      "MSE": 709.5852165730794,
      "MSE/layer0": 709.5852165730794,
      "dead_code_fraction": 0.02925,
      "dead_code_fraction/layer0": 0.02925,
      "epoch": 0.14,
      "input_norm": 31.998412898381545,
      "input_norm/layer0": 31.998412898381545,
      "learning_rate": 0.0005,
      "loss": 2.5789,
      "max_norm": 40.28993225097656,
      "max_norm/layer0": 40.28993225097656,
      "mean_norm": 35.022348403930664,
      "mean_norm/layer0": 35.022348403930664,
      "multicode_k": 1,
      "output_norm": 13.93345036347707,
      "output_norm/layer0": 13.93345036347707,
      "step": 1350
    },
    {
      "MSE": 705.2143248494463,
      "MSE/layer0": 705.2143248494463,
      "dead_code_fraction": 0.03375,
      "dead_code_fraction/layer0": 0.03375,
      "epoch": 0.14,
      "input_norm": 31.9984123802185,
      "input_norm/layer0": 31.9984123802185,
      "learning_rate": 0.0005,
      "loss": 2.5943,
      "max_norm": 40.63530349731445,
      "max_norm/layer0": 40.63530349731445,
      "mean_norm": 35.164276123046875,
      "mean_norm/layer0": 35.164276123046875,
      "multicode_k": 1,
      "output_norm": 14.105911358197524,
      "output_norm/layer0": 14.105911358197524,
      "step": 1400
    },
    {
      "MSE": 702.3593349202476,
      "MSE/layer0": 702.3593349202476,
      "dead_code_fraction": 0.0404,
      "dead_code_fraction/layer0": 0.0404,
      "epoch": 0.14,
      "input_norm": 31.99839937845865,
      "input_norm/layer0": 31.99839937845865,
      "learning_rate": 0.0005,
      "loss": 2.5407,
      "max_norm": 40.98182678222656,
      "max_norm/layer0": 40.98182678222656,
      "mean_norm": 35.30343246459961,
      "mean_norm/layer0": 35.30343246459961,
      "multicode_k": 1,
      "output_norm": 14.2450444761912,
      "output_norm/layer0": 14.2450444761912,
      "step": 1450
    },
    {
      "MSE": 699.0307844034837,
      "MSE/layer0": 699.0307844034837,
      "dead_code_fraction": 0.04535,
      "dead_code_fraction/layer0": 0.04535,
      "epoch": 0.15,
      "input_norm": 31.998390986124676,
      "input_norm/layer0": 31.998390986124676,
      "learning_rate": 0.0005,
      "loss": 2.5145,
      "max_norm": 41.328433990478516,
      "max_norm/layer0": 41.328433990478516,
      "mean_norm": 35.445411682128906,
      "mean_norm/layer0": 35.445411682128906,
      "multicode_k": 1,
      "output_norm": 14.399013953208918,
      "output_norm/layer0": 14.399013953208918,
      "step": 1500
    },
    {
      "epoch": 0.15,
      "eval_MSE/layer0": 697.1178701616536,
      "eval_accuracy": 0.4637486628652817,
      "eval_dead_code_fraction/layer0": 0.05465,
      "eval_input_norm/layer0": 31.99837304089923,
      "eval_loss": 2.525156259536743,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 14.48893911880305,
      "eval_runtime": 156.9005,
      "eval_samples_per_second": 29.465,
      "eval_steps_per_second": 1.842,
      "step": 1500
    },
    {
      "MSE": 696.0442759195965,
      "MSE/layer0": 696.0442759195965,
      "dead_code_fraction": 0.05145,
      "dead_code_fraction/layer0": 0.05145,
      "epoch": 0.15,
      "input_norm": 31.99836520512899,
      "input_norm/layer0": 31.99836520512899,
      "learning_rate": 0.0005,
      "loss": 2.4631,
      "max_norm": 41.6606559753418,
      "max_norm/layer0": 41.6606559753418,
      "mean_norm": 35.58424758911133,
      "mean_norm/layer0": 35.58424758911133,
      "multicode_k": 1,
      "output_norm": 14.54295777956645,
      "output_norm/layer0": 14.54295777956645,
      "step": 1550
    },
    {
      "MSE": 691.8516132609051,
      "MSE/layer0": 691.8516132609051,
      "dead_code_fraction": 0.0558,
      "dead_code_fraction/layer0": 0.0558,
      "epoch": 0.16,
      "input_norm": 31.998375968933097,
      "input_norm/layer0": 31.998375968933097,
      "learning_rate": 0.0005,
      "loss": 2.5501,
      "max_norm": 42.08574676513672,
      "max_norm/layer0": 42.08574676513672,
      "mean_norm": 35.72518730163574,
      "mean_norm/layer0": 35.72518730163574,
      "multicode_k": 1,
      "output_norm": 14.692513732910157,
      "output_norm/layer0": 14.692513732910157,
      "step": 1600
    },
    {
      "MSE": 688.7181396484375,
      "MSE/layer0": 688.7181396484375,
      "dead_code_fraction": 0.0595,
      "dead_code_fraction/layer0": 0.0595,
      "epoch": 0.17,
      "input_norm": 31.99835859616598,
      "input_norm/layer0": 31.99835859616598,
      "learning_rate": 0.0005,
      "loss": 2.4699,
      "max_norm": 42.610233306884766,
      "max_norm/layer0": 42.610233306884766,
      "mean_norm": 35.86595916748047,
      "mean_norm/layer0": 35.86595916748047,
      "multicode_k": 1,
      "output_norm": 14.833582207361854,
      "output_norm/layer0": 14.833582207361854,
      "step": 1650
    },
    {
      "MSE": 685.5445822143549,
      "MSE/layer0": 685.5445822143549,
      "dead_code_fraction": 0.06595,
      "dead_code_fraction/layer0": 0.06595,
      "epoch": 0.17,
      "input_norm": 31.99835782368978,
      "input_norm/layer0": 31.99835782368978,
      "learning_rate": 0.0005,
      "loss": 2.5014,
      "max_norm": 43.15216064453125,
      "max_norm/layer0": 43.15216064453125,
      "mean_norm": 36.00602149963379,
      "mean_norm/layer0": 36.00602149963379,
      "multicode_k": 1,
      "output_norm": 14.96381513118744,
      "output_norm/layer0": 14.96381513118744,
      "step": 1700
    },
    {
      "MSE": 683.2388099161783,
      "MSE/layer0": 683.2388099161783,
      "dead_code_fraction": 0.0708,
      "dead_code_fraction/layer0": 0.0708,
      "epoch": 0.17,
      "input_norm": 31.998353064854925,
      "input_norm/layer0": 31.998353064854925,
      "learning_rate": 0.0005,
      "loss": 2.4762,
      "max_norm": 43.683807373046875,
      "max_norm/layer0": 43.683807373046875,
      "mean_norm": 36.14344596862793,
      "mean_norm/layer0": 36.14344596862793,
      "multicode_k": 1,
      "output_norm": 15.08479848066965,
      "output_norm/layer0": 15.08479848066965,
      "step": 1750
    },
    {
      "MSE": 680.5147140502929,
      "MSE/layer0": 680.5147140502929,
      "dead_code_fraction": 0.0711,
      "dead_code_fraction/layer0": 0.0711,
      "epoch": 0.18,
      "input_norm": 31.998323942820228,
      "input_norm/layer0": 31.998323942820228,
      "learning_rate": 0.0005,
      "loss": 2.4017,
      "max_norm": 44.204158782958984,
      "max_norm/layer0": 44.204158782958984,
      "mean_norm": 36.281328201293945,
      "mean_norm/layer0": 36.281328201293945,
      "multicode_k": 1,
      "output_norm": 15.21150853157043,
      "output_norm/layer0": 15.21150853157043,
      "step": 1800
    },
    {
      "MSE": 677.8235699462891,
      "MSE/layer0": 677.8235699462891,
      "dead_code_fraction": 0.0789,
      "dead_code_fraction/layer0": 0.0789,
      "epoch": 0.18,
      "input_norm": 31.99832211176553,
      "input_norm/layer0": 31.99832211176553,
      "learning_rate": 0.0005,
      "loss": 2.4204,
      "max_norm": 44.73421096801758,
      "max_norm/layer0": 44.73421096801758,
      "mean_norm": 36.41860580444336,
      "mean_norm/layer0": 36.41860580444336,
      "multicode_k": 1,
      "output_norm": 15.32913914521535,
      "output_norm/layer0": 15.32913914521535,
      "step": 1850
    },
    {
      "MSE": 674.8260657755535,
      "MSE/layer0": 674.8260657755535,
      "dead_code_fraction": 0.0859,
      "dead_code_fraction/layer0": 0.0859,
      "epoch": 0.19,
      "input_norm": 31.998327109018952,
      "input_norm/layer0": 31.998327109018952,
      "learning_rate": 0.0005,
      "loss": 2.4612,
      "max_norm": 45.264217376708984,
      "max_norm/layer0": 45.264217376708984,
      "mean_norm": 36.55377197265625,
      "mean_norm/layer0": 36.55377197265625,
      "multicode_k": 1,
      "output_norm": 15.449233846664427,
      "output_norm/layer0": 15.449233846664427,
      "step": 1900
    },
    {
      "MSE": 672.4308366902667,
      "MSE/layer0": 672.4308366902667,
      "dead_code_fraction": 0.08975,
      "dead_code_fraction/layer0": 0.08975,
      "epoch": 0.2,
      "input_norm": 31.998313461939492,
      "input_norm/layer0": 31.998313461939492,
      "learning_rate": 0.0005,
      "loss": 2.413,
      "max_norm": 45.7476692199707,
      "max_norm/layer0": 45.7476692199707,
      "mean_norm": 36.687320709228516,
      "mean_norm/layer0": 36.687320709228516,
      "multicode_k": 1,
      "output_norm": 15.564360074996952,
      "output_norm/layer0": 15.564360074996952,
      "step": 1950
    },
    {
      "MSE": 669.9350853474932,
      "MSE/layer0": 669.9350853474932,
      "dead_code_fraction": 0.09495,
      "dead_code_fraction/layer0": 0.09495,
      "epoch": 0.2,
      "input_norm": 31.998307892481467,
      "input_norm/layer0": 31.998307892481467,
      "learning_rate": 0.0005,
      "loss": 2.4197,
      "max_norm": 46.2595100402832,
      "max_norm/layer0": 46.2595100402832,
      "mean_norm": 36.82127571105957,
      "mean_norm/layer0": 36.82127571105957,
      "multicode_k": 1,
      "output_norm": 15.671763955752056,
      "output_norm/layer0": 15.671763955752056,
      "step": 2000
    },
    {
      "epoch": 0.2,
      "eval_MSE/layer0": 670.0254334077002,
      "eval_accuracy": 0.47584128742153486,
      "eval_dead_code_fraction/layer0": 0.0988,
      "eval_input_norm/layer0": 31.99830309178647,
      "eval_loss": 2.409283399581909,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 15.728763990528059,
      "eval_runtime": 158.0617,
      "eval_samples_per_second": 29.248,
      "eval_steps_per_second": 1.828,
      "step": 2000
    },
    {
      "MSE": 667.9600658162435,
      "MSE/layer0": 667.9600658162435,
      "dead_code_fraction": 0.09825,
      "dead_code_fraction/layer0": 0.09825,
      "epoch": 0.2,
      "input_norm": 31.99829890569051,
      "input_norm/layer0": 31.99829890569051,
      "learning_rate": 0.0005,
      "loss": 2.3908,
      "max_norm": 46.76186752319336,
      "max_norm/layer0": 46.76186752319336,
      "mean_norm": 36.954044342041016,
      "mean_norm/layer0": 36.954044342041016,
      "multicode_k": 1,
      "output_norm": 15.786985732714339,
      "output_norm/layer0": 15.786985732714339,
      "step": 2050
    },
    {
      "MSE": 665.8677533976238,
      "MSE/layer0": 665.8677533976238,
      "dead_code_fraction": 0.10105,
      "dead_code_fraction/layer0": 0.10105,
      "epoch": 0.21,
      "input_norm": 31.998287776311233,
      "input_norm/layer0": 31.998287776311233,
      "learning_rate": 0.0005,
      "loss": 2.3532,
      "max_norm": 47.23879623413086,
      "max_norm/layer0": 47.23879623413086,
      "mean_norm": 37.08414268493652,
      "mean_norm/layer0": 37.08414268493652,
      "multicode_k": 1,
      "output_norm": 15.887771523793544,
      "output_norm/layer0": 15.887771523793544,
      "step": 2100
    },
    {
      "MSE": 664.0484969075521,
      "MSE/layer0": 664.0484969075521,
      "dead_code_fraction": 0.10515,
      "dead_code_fraction/layer0": 0.10515,
      "epoch": 0.21,
      "input_norm": 31.998289143244435,
      "input_norm/layer0": 31.998289143244435,
      "learning_rate": 0.0005,
      "loss": 2.3835,
      "max_norm": 47.72446823120117,
      "max_norm/layer0": 47.72446823120117,
      "mean_norm": 37.21368408203125,
      "mean_norm/layer0": 37.21368408203125,
      "multicode_k": 1,
      "output_norm": 15.987558364868171,
      "output_norm/layer0": 15.987558364868171,
      "step": 2150
    },
    {
      "MSE": 662.043323059082,
      "MSE/layer0": 662.043323059082,
      "dead_code_fraction": 0.11065,
      "dead_code_fraction/layer0": 0.11065,
      "epoch": 0.22,
      "input_norm": 31.998284489313747,
      "input_norm/layer0": 31.998284489313747,
      "learning_rate": 0.0005,
      "loss": 2.3711,
      "max_norm": 48.21998596191406,
      "max_norm/layer0": 48.21998596191406,
      "mean_norm": 37.34214973449707,
      "mean_norm/layer0": 37.34214973449707,
      "multicode_k": 1,
      "output_norm": 16.084624527295432,
      "output_norm/layer0": 16.084624527295432,
      "step": 2200
    },
    {
      "MSE": 660.071201883952,
      "MSE/layer0": 660.071201883952,
      "dead_code_fraction": 0.1138,
      "dead_code_fraction/layer0": 0.1138,
      "epoch": 0.23,
      "input_norm": 31.998274552027382,
      "input_norm/layer0": 31.998274552027382,
      "learning_rate": 0.0005,
      "loss": 2.3361,
      "max_norm": 48.656124114990234,
      "max_norm/layer0": 48.656124114990234,
      "mean_norm": 37.46707344055176,
      "mean_norm/layer0": 37.46707344055176,
      "multicode_k": 1,
      "output_norm": 16.1770029671987,
      "output_norm/layer0": 16.1770029671987,
      "step": 2250
    },
    {
      "MSE": 658.2848066202794,
      "MSE/layer0": 658.2848066202794,
      "dead_code_fraction": 0.11715,
      "dead_code_fraction/layer0": 0.11715,
      "epoch": 0.23,
      "input_norm": 31.998281342188513,
      "input_norm/layer0": 31.998281342188513,
      "learning_rate": 0.0005,
      "loss": 2.3697,
      "max_norm": 49.14850616455078,
      "max_norm/layer0": 49.14850616455078,
      "mean_norm": 37.592119216918945,
      "mean_norm/layer0": 37.592119216918945,
      "multicode_k": 1,
      "output_norm": 16.273267321586616,
      "output_norm/layer0": 16.273267321586616,
      "step": 2300
    },
    {
      "MSE": 656.6614913940434,
      "MSE/layer0": 656.6614913940434,
      "dead_code_fraction": 0.1208,
      "dead_code_fraction/layer0": 0.1208,
      "epoch": 0.23,
      "input_norm": 31.99827545166017,
      "input_norm/layer0": 31.99827545166017,
      "learning_rate": 0.0005,
      "loss": 2.3691,
      "max_norm": 49.611228942871094,
      "max_norm/layer0": 49.611228942871094,
      "mean_norm": 37.71496772766113,
      "mean_norm/layer0": 37.71496772766113,
      "multicode_k": 1,
      "output_norm": 16.361617434819536,
      "output_norm/layer0": 16.361617434819536,
      "step": 2350
    },
    {
      "MSE": 654.7551118977863,
      "MSE/layer0": 654.7551118977863,
      "dead_code_fraction": 0.12205,
      "dead_code_fraction/layer0": 0.12205,
      "epoch": 0.24,
      "input_norm": 31.998258228302007,
      "input_norm/layer0": 31.998258228302007,
      "learning_rate": 0.0005,
      "loss": 2.3413,
      "max_norm": 50.082008361816406,
      "max_norm/layer0": 50.082008361816406,
      "mean_norm": 37.836740493774414,
      "mean_norm/layer0": 37.836740493774414,
      "multicode_k": 1,
      "output_norm": 16.442067163785307,
      "output_norm/layer0": 16.442067163785307,
      "step": 2400
    },
    {
      "MSE": 653.2320398966472,
      "MSE/layer0": 653.2320398966472,
      "dead_code_fraction": 0.1261,
      "dead_code_fraction/layer0": 0.1261,
      "epoch": 0.24,
      "input_norm": 31.99826599121093,
      "input_norm/layer0": 31.99826599121093,
      "learning_rate": 0.0005,
      "loss": 2.3415,
      "max_norm": 50.542850494384766,
      "max_norm/layer0": 50.542850494384766,
      "mean_norm": 37.956573486328125,
      "mean_norm/layer0": 37.956573486328125,
      "multicode_k": 1,
      "output_norm": 16.545647277832018,
      "output_norm/layer0": 16.545647277832018,
      "step": 2450
    },
    {
      "MSE": 652.0689453124999,
      "MSE/layer0": 652.0689453124999,
      "dead_code_fraction": 0.1305,
      "dead_code_fraction/layer0": 0.1305,
      "epoch": 0.25,
      "input_norm": 31.998266054789227,
      "input_norm/layer0": 31.998266054789227,
      "learning_rate": 0.0005,
      "loss": 2.3541,
      "max_norm": 50.972904205322266,
      "max_norm/layer0": 50.972904205322266,
      "mean_norm": 38.07469177246094,
      "mean_norm/layer0": 38.07469177246094,
      "multicode_k": 1,
      "output_norm": 16.614015088081356,
      "output_norm/layer0": 16.614015088081356,
      "step": 2500
    },
    {
      "epoch": 0.25,
      "eval_MSE/layer0": 651.1296869864225,
      "eval_accuracy": 0.48371217143066175,
      "eval_dead_code_fraction/layer0": 0.1337,
      "eval_input_norm/layer0": 31.998264631048162,
      "eval_loss": 2.340399742126465,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 16.66022368217996,
      "eval_runtime": 157.8946,
      "eval_samples_per_second": 29.279,
      "eval_steps_per_second": 1.83,
      "step": 2500
    },
    {
      "MSE": 650.5154676310221,
      "MSE/layer0": 650.5154676310221,
      "dead_code_fraction": 0.1312,
      "dead_code_fraction/layer0": 0.1312,
      "epoch": 0.26,
      "input_norm": 31.99826429367065,
      "input_norm/layer0": 31.99826429367065,
      "learning_rate": 0.0005,
      "loss": 2.3374,
      "max_norm": 51.42794418334961,
      "max_norm/layer0": 51.42794418334961,
      "mean_norm": 38.19082260131836,
      "mean_norm/layer0": 38.19082260131836,
      "multicode_k": 1,
      "output_norm": 16.705677251815793,
      "output_norm/layer0": 16.705677251815793,
      "step": 2550
    },
    {
      "MSE": 649.4798397827149,
      "MSE/layer0": 649.4798397827149,
      "dead_code_fraction": 0.13625,
      "dead_code_fraction/layer0": 0.13625,
      "epoch": 0.26,
      "input_norm": 31.99826188405354,
      "input_norm/layer0": 31.99826188405354,
      "learning_rate": 0.0005,
      "loss": 2.3364,
      "max_norm": 51.84079360961914,
      "max_norm/layer0": 51.84079360961914,
      "mean_norm": 38.306650161743164,
      "mean_norm/layer0": 38.306650161743164,
      "multicode_k": 1,
      "output_norm": 16.774758176803587,
      "output_norm/layer0": 16.774758176803587,
      "step": 2600
    },
    {
      "MSE": 648.4373052978513,
      "MSE/layer0": 648.4373052978513,
      "dead_code_fraction": 0.13795,
      "dead_code_fraction/layer0": 0.13795,
      "epoch": 0.27,
      "input_norm": 31.998252007166542,
      "input_norm/layer0": 31.998252007166542,
      "learning_rate": 0.0005,
      "loss": 2.3162,
      "max_norm": 52.24661636352539,
      "max_norm/layer0": 52.24661636352539,
      "mean_norm": 38.41937828063965,
      "mean_norm/layer0": 38.41937828063965,
      "multicode_k": 1,
      "output_norm": 16.851604979832963,
      "output_norm/layer0": 16.851604979832963,
      "step": 2650
    },
    {
      "MSE": 647.0678014119467,
      "MSE/layer0": 647.0678014119467,
      "dead_code_fraction": 0.1397,
      "dead_code_fraction/layer0": 0.1397,
      "epoch": 0.27,
      "input_norm": 31.998265930811563,
      "input_norm/layer0": 31.998265930811563,
      "learning_rate": 0.0005,
      "loss": 2.3497,
      "max_norm": 52.66170120239258,
      "max_norm/layer0": 52.66170120239258,
      "mean_norm": 38.53024482727051,
      "mean_norm/layer0": 38.53024482727051,
      "multicode_k": 1,
      "output_norm": 16.925416787465398,
      "output_norm/layer0": 16.925416787465398,
      "step": 2700
    },
    {
      "MSE": 646.4085242716471,
      "MSE/layer0": 646.4085242716471,
      "dead_code_fraction": 0.14125,
      "dead_code_fraction/layer0": 0.14125,
      "epoch": 0.28,
      "input_norm": 31.99825245221455,
      "input_norm/layer0": 31.99825245221455,
      "learning_rate": 0.0005,
      "loss": 2.301,
      "max_norm": 53.03037643432617,
      "max_norm/layer0": 53.03037643432617,
      "mean_norm": 38.63713836669922,
      "mean_norm/layer0": 38.63713836669922,
      "multicode_k": 1,
      "output_norm": 16.985576423009235,
      "output_norm/layer0": 16.985576423009235,
      "step": 2750
    },
    {
      "MSE": 644.7344170125325,
      "MSE/layer0": 644.7344170125325,
      "dead_code_fraction": 0.14415,
      "dead_code_fraction/layer0": 0.14415,
      "epoch": 0.28,
      "input_norm": 31.998260081609082,
      "input_norm/layer0": 31.998260081609082,
      "learning_rate": 0.0005,
      "loss": 2.3395,
      "max_norm": 53.41487503051758,
      "max_norm/layer0": 53.41487503051758,
      "mean_norm": 38.74285697937012,
      "mean_norm/layer0": 38.74285697937012,
      "multicode_k": 1,
      "output_norm": 17.068980147043867,
      "output_norm/layer0": 17.068980147043867,
      "step": 2800
    },
    {
      "MSE": 644.636144104004,
      "MSE/layer0": 644.636144104004,
      "dead_code_fraction": 0.14565,
      "dead_code_fraction/layer0": 0.14565,
      "epoch": 0.28,
      "input_norm": 31.998243366877247,
      "input_norm/layer0": 31.998243366877247,
      "learning_rate": 0.0005,
      "loss": 2.2757,
      "max_norm": 53.792579650878906,
      "max_norm/layer0": 53.792579650878906,
      "mean_norm": 38.84635543823242,
      "mean_norm/layer0": 38.84635543823242,
      "multicode_k": 1,
      "output_norm": 17.124992834726967,
      "output_norm/layer0": 17.124992834726967,
      "step": 2850
    },
    {
      "MSE": 643.8843309529623,
      "MSE/layer0": 643.8843309529623,
      "dead_code_fraction": 0.14495,
      "dead_code_fraction/layer0": 0.14495,
      "epoch": 0.29,
      "input_norm": 31.998242295583093,
      "input_norm/layer0": 31.998242295583093,
      "learning_rate": 0.0005,
      "loss": 2.3057,
      "max_norm": 54.146453857421875,
      "max_norm/layer0": 54.146453857421875,
      "mean_norm": 38.947309494018555,
      "mean_norm/layer0": 38.947309494018555,
      "multicode_k": 1,
      "output_norm": 17.17694611549377,
      "output_norm/layer0": 17.17694611549377,
      "step": 2900
    },
    {
      "MSE": 642.6776557413741,
      "MSE/layer0": 642.6776557413741,
      "dead_code_fraction": 0.1504,
      "dead_code_fraction/layer0": 0.1504,
      "epoch": 0.29,
      "input_norm": 31.998272593816125,
      "input_norm/layer0": 31.998272593816125,
      "learning_rate": 0.0005,
      "loss": 2.3545,
      "max_norm": 54.51527404785156,
      "max_norm/layer0": 54.51527404785156,
      "mean_norm": 39.047607421875,
      "mean_norm/layer0": 39.047607421875,
      "multicode_k": 1,
      "output_norm": 17.240235595703133,
      "output_norm/layer0": 17.240235595703133,
      "step": 2950
    },
    {
      "MSE": 643.1047460937498,
      "MSE/layer0": 643.1047460937498,
      "dead_code_fraction": 0.1483,
      "dead_code_fraction/layer0": 0.1483,
      "epoch": 0.3,
      "input_norm": 31.998249003092454,
      "input_norm/layer0": 31.998249003092454,
      "learning_rate": 0.0005,
      "loss": 2.2742,
      "max_norm": 54.86568832397461,
      "max_norm/layer0": 54.86568832397461,
      "mean_norm": 39.14469337463379,
      "mean_norm/layer0": 39.14469337463379,
      "multicode_k": 1,
      "output_norm": 17.28876600265503,
      "output_norm/layer0": 17.28876600265503,
      "step": 3000
    },
    {
      "epoch": 0.3,
      "eval_MSE/layer0": 642.6360311704152,
      "eval_accuracy": 0.49030507287608877,
      "eval_dead_code_fraction/layer0": 0.14995,
      "eval_input_norm/layer0": 31.998255163205542,
      "eval_loss": 2.2907073497772217,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 17.324301861386118,
      "eval_runtime": 157.9262,
      "eval_samples_per_second": 29.273,
      "eval_steps_per_second": 1.83,
      "step": 3000
    },
    {
      "MSE": 641.9817254638668,
      "MSE/layer0": 641.9817254638668,
      "dead_code_fraction": 0.1511,
      "dead_code_fraction/layer0": 0.1511,
      "epoch": 0.3,
      "input_norm": 31.99826343536376,
      "input_norm/layer0": 31.99826343536376,
      "learning_rate": 0.0005,
      "loss": 2.3422,
      "max_norm": 55.2226676940918,
      "max_norm/layer0": 55.2226676940918,
      "mean_norm": 39.23999786376953,
      "mean_norm/layer0": 39.23999786376953,
      "multicode_k": 1,
      "output_norm": 17.350644410451252,
      "output_norm/layer0": 17.350644410451252,
      "step": 3050
    },
    {
      "MSE": 641.9993333943689,
      "MSE/layer0": 641.9993333943689,
      "dead_code_fraction": 0.1504,
      "dead_code_fraction/layer0": 0.1504,
      "epoch": 0.31,
      "input_norm": 31.998250141143807,
      "input_norm/layer0": 31.998250141143807,
      "learning_rate": 0.0005,
      "loss": 2.2814,
      "max_norm": 55.56163787841797,
      "max_norm/layer0": 55.56163787841797,
      "mean_norm": 39.33370780944824,
      "mean_norm/layer0": 39.33370780944824,
      "multicode_k": 1,
      "output_norm": 17.39312816301982,
      "output_norm/layer0": 17.39312816301982,
      "step": 3100
    },
    {
      "MSE": 641.5148900349936,
      "MSE/layer0": 641.5148900349936,
      "dead_code_fraction": 0.15185,
      "dead_code_fraction/layer0": 0.15185,
      "epoch": 0.32,
      "input_norm": 31.998260364532467,
      "input_norm/layer0": 31.998260364532467,
      "learning_rate": 0.0005,
      "loss": 2.3152,
      "max_norm": 55.8856315612793,
      "max_norm/layer0": 55.8856315612793,
      "mean_norm": 39.42481803894043,
      "mean_norm/layer0": 39.42481803894043,
      "multicode_k": 1,
      "output_norm": 17.44178107897441,
      "output_norm/layer0": 17.44178107897441,
      "step": 3150
    },
    {
      "MSE": 640.499552408854,
      "MSE/layer0": 640.499552408854,
      "dead_code_fraction": 0.1516,
      "dead_code_fraction/layer0": 0.1516,
      "epoch": 0.32,
      "input_norm": 31.99825292587281,
      "input_norm/layer0": 31.99825292587281,
      "learning_rate": 0.0005,
      "loss": 2.2462,
      "max_norm": 56.21445846557617,
      "max_norm/layer0": 56.21445846557617,
      "mean_norm": 39.51395606994629,
      "mean_norm/layer0": 39.51395606994629,
      "multicode_k": 1,
      "output_norm": 17.50789775530497,
      "output_norm/layer0": 17.50789775530497,
      "step": 3200
    },
    {
      "MSE": 640.565166829427,
      "MSE/layer0": 640.565166829427,
      "dead_code_fraction": 0.15285,
      "dead_code_fraction/layer0": 0.15285,
      "epoch": 0.33,
      "input_norm": 31.998250306447353,
      "input_norm/layer0": 31.998250306447353,
      "learning_rate": 0.0005,
      "loss": 2.2595,
      "max_norm": 56.526973724365234,
      "max_norm/layer0": 56.526973724365234,
      "mean_norm": 39.601173400878906,
      "mean_norm/layer0": 39.601173400878906,
      "multicode_k": 1,
      "output_norm": 17.54366443951924,
      "output_norm/layer0": 17.54366443951924,
      "step": 3250
    },
    {
      "MSE": 640.8991118367509,
      "MSE/layer0": 640.8991118367509,
      "dead_code_fraction": 0.1531,
      "dead_code_fraction/layer0": 0.1531,
      "epoch": 0.33,
      "input_norm": 31.998245798746755,
      "input_norm/layer0": 31.998245798746755,
      "learning_rate": 0.0005,
      "loss": 2.2326,
      "max_norm": 56.82651138305664,
      "max_norm/layer0": 56.82651138305664,
      "mean_norm": 39.684635162353516,
      "mean_norm/layer0": 39.684635162353516,
      "multicode_k": 1,
      "output_norm": 17.578553660710664,
      "output_norm/layer0": 17.578553660710664,
      "step": 3300
    },
    {
      "MSE": 640.486218770345,
      "MSE/layer0": 640.486218770345,
      "dead_code_fraction": 0.15345,
      "dead_code_fraction/layer0": 0.15345,
      "epoch": 0.34,
      "input_norm": 31.998255780537924,
      "input_norm/layer0": 31.998255780537924,
      "learning_rate": 0.0005,
      "loss": 2.2733,
      "max_norm": 57.12877655029297,
      "max_norm/layer0": 57.12877655029297,
      "mean_norm": 39.76711463928223,
      "mean_norm/layer0": 39.76711463928223,
      "multicode_k": 1,
      "output_norm": 17.619242086410516,
      "output_norm/layer0": 17.619242086410516,
      "step": 3350
    },
    {
      "MSE": 639.5240251668292,
      "MSE/layer0": 639.5240251668292,
      "dead_code_fraction": 0.15565,
      "dead_code_fraction/layer0": 0.15565,
      "epoch": 0.34,
      "input_norm": 31.998264500300095,
      "input_norm/layer0": 31.998264500300095,
      "learning_rate": 0.0005,
      "loss": 2.2633,
      "max_norm": 57.42041778564453,
      "max_norm/layer0": 57.42041778564453,
      "mean_norm": 39.84800338745117,
      "mean_norm/layer0": 39.84800338745117,
      "multicode_k": 1,
      "output_norm": 17.667484652201342,
      "output_norm/layer0": 17.667484652201342,
      "step": 3400
    },
    {
      "MSE": 639.2691174316408,
      "MSE/layer0": 639.2691174316408,
      "dead_code_fraction": 0.15605,
      "dead_code_fraction/layer0": 0.15605,
      "epoch": 0.34,
      "input_norm": 31.99825723965962,
      "input_norm/layer0": 31.99825723965962,
      "learning_rate": 0.0005,
      "loss": 2.2495,
      "max_norm": 57.706260681152344,
      "max_norm/layer0": 57.706260681152344,
      "mean_norm": 39.92698097229004,
      "mean_norm/layer0": 39.92698097229004,
      "multicode_k": 1,
      "output_norm": 17.705148900349947,
      "output_norm/layer0": 17.705148900349947,
      "step": 3450
    },
    {
      "MSE": 639.3908192952478,
      "MSE/layer0": 639.3908192952478,
      "dead_code_fraction": 0.15655,
      "dead_code_fraction/layer0": 0.15655,
      "epoch": 0.35,
      "input_norm": 31.9982618745168,
      "input_norm/layer0": 31.9982618745168,
      "learning_rate": 0.0005,
      "loss": 2.2488,
      "max_norm": 57.98209762573242,
      "max_norm/layer0": 57.98209762573242,
      "mean_norm": 40.005022048950195,
      "mean_norm/layer0": 40.005022048950195,
      "multicode_k": 1,
      "output_norm": 17.73683495521545,
      "output_norm/layer0": 17.73683495521545,
      "step": 3500
    },
    {
      "epoch": 0.35,
      "eval_MSE/layer0": 640.3158307464355,
      "eval_accuracy": 0.49451074349024987,
      "eval_dead_code_fraction/layer0": 0.1575,
      "eval_input_norm/layer0": 31.99825158244007,
      "eval_loss": 2.2564537525177,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 17.756634140179678,
      "eval_runtime": 157.599,
      "eval_samples_per_second": 29.334,
      "eval_steps_per_second": 1.834,
      "step": 3500
    },
    {
      "MSE": 639.6838141886391,
      "MSE/layer0": 639.6838141886391,
      "dead_code_fraction": 0.157,
      "dead_code_fraction/layer0": 0.157,
      "epoch": 0.35,
      "input_norm": 31.99826737085978,
      "input_norm/layer0": 31.99826737085978,
      "learning_rate": 0.0005,
      "loss": 2.2738,
      "max_norm": 58.24713897705078,
      "max_norm/layer0": 58.24713897705078,
      "mean_norm": 40.08023262023926,
      "mean_norm/layer0": 40.08023262023926,
      "multicode_k": 1,
      "output_norm": 17.755876312255864,
      "output_norm/layer0": 17.755876312255864,
      "step": 3550
    },
    {
      "MSE": 639.2954257202149,
      "MSE/layer0": 639.2954257202149,
      "dead_code_fraction": 0.1559,
      "dead_code_fraction/layer0": 0.1559,
      "epoch": 0.36,
      "input_norm": 31.998245531717938,
      "input_norm/layer0": 31.998245531717938,
      "learning_rate": 0.0005,
      "loss": 2.2036,
      "max_norm": 58.50635528564453,
      "max_norm/layer0": 58.50635528564453,
      "mean_norm": 40.15370178222656,
      "mean_norm/layer0": 40.15370178222656,
      "multicode_k": 1,
      "output_norm": 17.812968953450515,
      "output_norm/layer0": 17.812968953450515,
      "step": 3600
    },
    {
      "MSE": 639.3338773600263,
      "MSE/layer0": 639.3338773600263,
      "dead_code_fraction": 0.15905,
      "dead_code_fraction/layer0": 0.15905,
      "epoch": 0.36,
      "input_norm": 31.99827084223429,
      "input_norm/layer0": 31.99827084223429,
      "learning_rate": 0.0005,
      "loss": 2.2672,
      "max_norm": 58.76622009277344,
      "max_norm/layer0": 58.76622009277344,
      "mean_norm": 40.22719192504883,
      "mean_norm/layer0": 40.22719192504883,
      "multicode_k": 1,
      "output_norm": 17.821751413345332,
      "output_norm/layer0": 17.821751413345332,
      "step": 3650
    },
    {
      "MSE": 639.0531684366863,
      "MSE/layer0": 639.0531684366863,
      "dead_code_fraction": 0.15975,
      "dead_code_fraction/layer0": 0.15975,
      "epoch": 0.37,
      "input_norm": 31.99827636400858,
      "input_norm/layer0": 31.99827636400858,
      "learning_rate": 0.0005,
      "loss": 2.2444,
      "max_norm": 59.02393341064453,
      "max_norm/layer0": 59.02393341064453,
      "mean_norm": 40.298166275024414,
      "mean_norm/layer0": 40.298166275024414,
      "multicode_k": 1,
      "output_norm": 17.85403926849365,
      "output_norm/layer0": 17.85403926849365,
      "step": 3700
    },
    {
      "MSE": 638.9355230712894,
      "MSE/layer0": 638.9355230712894,
      "dead_code_fraction": 0.1605,
      "dead_code_fraction/layer0": 0.1605,
      "epoch": 0.38,
      "input_norm": 31.99827863057454,
      "input_norm/layer0": 31.99827863057454,
      "learning_rate": 0.0005,
      "loss": 2.2454,
      "max_norm": 59.28853225708008,
      "max_norm/layer0": 59.28853225708008,
      "mean_norm": 40.36880111694336,
      "mean_norm/layer0": 40.36880111694336,
      "multicode_k": 1,
      "output_norm": 17.88599282582601,
      "output_norm/layer0": 17.88599282582601,
      "step": 3750
    },
    {
      "MSE": 639.0086972045899,
      "MSE/layer0": 639.0086972045899,
      "dead_code_fraction": 0.16125,
      "dead_code_fraction/layer0": 0.16125,
      "epoch": 0.38,
      "input_norm": 31.9982850710551,
      "input_norm/layer0": 31.9982850710551,
      "learning_rate": 0.0005,
      "loss": 2.27,
      "max_norm": 59.546451568603516,
      "max_norm/layer0": 59.546451568603516,
      "mean_norm": 40.43776512145996,
      "mean_norm/layer0": 40.43776512145996,
      "multicode_k": 1,
      "output_norm": 17.90943570454915,
      "output_norm/layer0": 17.90943570454915,
      "step": 3800
    },
    {
      "MSE": 638.9462019856769,
      "MSE/layer0": 638.9462019856769,
      "dead_code_fraction": 0.1583,
      "dead_code_fraction/layer0": 0.1583,
      "epoch": 0.39,
      "input_norm": 31.998278980255122,
      "input_norm/layer0": 31.998278980255122,
      "learning_rate": 0.0005,
      "loss": 2.2438,
      "max_norm": 59.80894470214844,
      "max_norm/layer0": 59.80894470214844,
      "mean_norm": 40.50556945800781,
      "mean_norm/layer0": 40.50556945800781,
      "multicode_k": 1,
      "output_norm": 17.947645209630338,
      "output_norm/layer0": 17.947645209630338,
      "step": 3850
    },
    {
      "MSE": 639.4130173746743,
      "MSE/layer0": 639.4130173746743,
      "dead_code_fraction": 0.16135,
      "dead_code_fraction/layer0": 0.16135,
      "epoch": 0.39,
      "input_norm": 31.998284943898526,
      "input_norm/layer0": 31.998284943898526,
      "learning_rate": 0.0005,
      "loss": 2.2526,
      "max_norm": 60.04655075073242,
      "max_norm/layer0": 60.04655075073242,
      "mean_norm": 40.57136535644531,
      "mean_norm/layer0": 40.57136535644531,
      "multicode_k": 1,
      "output_norm": 17.960218969980872,
      "output_norm/layer0": 17.960218969980872,
      "step": 3900
    },
    {
      "MSE": 639.8756245930986,
      "MSE/layer0": 639.8756245930986,
      "dead_code_fraction": 0.15755,
      "dead_code_fraction/layer0": 0.15755,
      "epoch": 0.4,
      "input_norm": 31.998285398483272,
      "input_norm/layer0": 31.998285398483272,
      "learning_rate": 0.0005,
      "loss": 2.2266,
      "max_norm": 60.29011154174805,
      "max_norm/layer0": 60.29011154174805,
      "mean_norm": 40.63625144958496,
      "mean_norm/layer0": 40.63625144958496,
      "multicode_k": 1,
      "output_norm": 17.97526204744974,
      "output_norm/layer0": 17.97526204744974,
      "step": 3950
    },
    {
      "MSE": 640.046054585775,
      "MSE/layer0": 640.046054585775,
      "dead_code_fraction": 0.1605,
      "dead_code_fraction/layer0": 0.1605,
      "epoch": 0.4,
      "input_norm": 31.998285433451336,
      "input_norm/layer0": 31.998285433451336,
      "learning_rate": 0.0005,
      "loss": 2.2287,
      "max_norm": 60.52168655395508,
      "max_norm/layer0": 60.52168655395508,
      "mean_norm": 40.698753356933594,
      "mean_norm/layer0": 40.698753356933594,
      "multicode_k": 1,
      "output_norm": 17.997498016357426,
      "output_norm/layer0": 17.997498016357426,
      "step": 4000
    },
    {
      "epoch": 0.4,
      "eval_MSE/layer0": 638.8422855589264,
      "eval_accuracy": 0.49670513512593434,
      "eval_dead_code_fraction/layer0": 0.16135,
      "eval_input_norm/layer0": 31.99827300782795,
      "eval_loss": 2.2332887649536133,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 18.022313365115252,
      "eval_runtime": 158.1975,
      "eval_samples_per_second": 29.223,
      "eval_steps_per_second": 1.827,
      "step": 4000
    },
    {
      "MSE": 639.952128804525,
      "MSE/layer0": 639.952128804525,
      "dead_code_fraction": 0.16035,
      "dead_code_fraction/layer0": 0.16035,
      "epoch": 0.41,
      "input_norm": 31.998286927541105,
      "input_norm/layer0": 31.998286927541105,
      "learning_rate": 0.0005,
      "loss": 2.2193,
      "max_norm": 60.76009750366211,
      "max_norm/layer0": 60.76009750366211,
      "mean_norm": 40.75992393493652,
      "mean_norm/layer0": 40.75992393493652,
      "multicode_k": 1,
      "output_norm": 18.024092137018826,
      "output_norm/layer0": 18.024092137018826,
      "step": 4050
    },
    {
      "MSE": 640.5730131022133,
      "MSE/layer0": 640.5730131022133,
      "dead_code_fraction": 0.1634,
      "dead_code_fraction/layer0": 0.1634,
      "epoch": 0.41,
      "input_norm": 31.99828769365946,
      "input_norm/layer0": 31.99828769365946,
      "learning_rate": 0.0005,
      "loss": 2.2301,
      "max_norm": 60.98118591308594,
      "max_norm/layer0": 60.98118591308594,
      "mean_norm": 40.8208122253418,
      "mean_norm/layer0": 40.8208122253418,
      "multicode_k": 1,
      "output_norm": 18.02807092984518,
      "output_norm/layer0": 18.02807092984518,
      "step": 4100
    },
    {
      "MSE": 640.4258350626628,
      "MSE/layer0": 640.4258350626628,
      "dead_code_fraction": 0.1612,
      "dead_code_fraction/layer0": 0.1612,
      "epoch": 0.41,
      "input_norm": 31.998297268549607,
      "input_norm/layer0": 31.998297268549607,
      "learning_rate": 0.0005,
      "loss": 2.2307,
      "max_norm": 61.19542694091797,
      "max_norm/layer0": 61.19542694091797,
      "mean_norm": 40.88128852844238,
      "mean_norm/layer0": 40.88128852844238,
      "multicode_k": 1,
      "output_norm": 18.04158842404684,
      "output_norm/layer0": 18.04158842404684,
      "step": 4150
    },
    {
      "MSE": 639.5022987874349,
      "MSE/layer0": 639.5022987874349,
      "dead_code_fraction": 0.16015,
      "dead_code_fraction/layer0": 0.16015,
      "epoch": 0.42,
      "input_norm": 31.99830362319948,
      "input_norm/layer0": 31.99830362319948,
      "learning_rate": 0.0005,
      "loss": 2.247,
      "max_norm": 61.4282341003418,
      "max_norm/layer0": 61.4282341003418,
      "mean_norm": 40.941017150878906,
      "mean_norm/layer0": 40.941017150878906,
      "multicode_k": 1,
      "output_norm": 18.079462760289516,
      "output_norm/layer0": 18.079462760289516,
      "step": 4200
    },
    {
      "MSE": 640.0252755737306,
      "MSE/layer0": 640.0252755737306,
      "dead_code_fraction": 0.1604,
      "dead_code_fraction/layer0": 0.1604,
      "epoch": 0.42,
      "input_norm": 31.99830138524374,
      "input_norm/layer0": 31.99830138524374,
      "learning_rate": 0.0005,
      "loss": 2.2314,
      "max_norm": 61.648414611816406,
      "max_norm/layer0": 61.648414611816406,
      "mean_norm": 40.99977684020996,
      "mean_norm/layer0": 40.99977684020996,
      "multicode_k": 1,
      "output_norm": 18.09024664878845,
      "output_norm/layer0": 18.09024664878845,
      "step": 4250
    },
    {
      "MSE": 639.7621870930992,
      "MSE/layer0": 639.7621870930992,
      "dead_code_fraction": 0.16365,
      "dead_code_fraction/layer0": 0.16365,
      "epoch": 0.43,
      "input_norm": 31.99830169359842,
      "input_norm/layer0": 31.99830169359842,
      "learning_rate": 0.0005,
      "loss": 2.2144,
      "max_norm": 61.86562728881836,
      "max_norm/layer0": 61.86562728881836,
      "mean_norm": 41.05688667297363,
      "mean_norm/layer0": 41.05688667297363,
      "multicode_k": 1,
      "output_norm": 18.11899041493734,
      "output_norm/layer0": 18.11899041493734,
      "step": 4300
    },
    {
      "MSE": 640.3955947875975,
      "MSE/layer0": 640.3955947875975,
      "dead_code_fraction": 0.1592,
      "dead_code_fraction/layer0": 0.1592,
      "epoch": 0.43,
      "input_norm": 31.998302787144976,
      "input_norm/layer0": 31.998302787144976,
      "learning_rate": 0.0005,
      "loss": 2.2077,
      "max_norm": 62.060550689697266,
      "max_norm/layer0": 62.060550689697266,
      "mean_norm": 41.11246681213379,
      "mean_norm/layer0": 41.11246681213379,
      "multicode_k": 1,
      "output_norm": 18.121066271464024,
      "output_norm/layer0": 18.121066271464024,
      "step": 4350
    },
    {
      "MSE": 639.8066222127281,
      "MSE/layer0": 639.8066222127281,
      "dead_code_fraction": 0.1635,
      "dead_code_fraction/layer0": 0.1635,
      "epoch": 0.44,
      "input_norm": 31.998314228057872,
      "input_norm/layer0": 31.998314228057872,
      "learning_rate": 0.0005,
      "loss": 2.2287,
      "max_norm": 62.275943756103516,
      "max_norm/layer0": 62.275943756103516,
      "mean_norm": 41.167396545410156,
      "mean_norm/layer0": 41.167396545410156,
      "multicode_k": 1,
      "output_norm": 18.142933632532753,
      "output_norm/layer0": 18.142933632532753,
      "step": 4400
    },
    {
      "MSE": 639.8160334269206,
      "MSE/layer0": 639.8160334269206,
      "dead_code_fraction": 0.16385,
      "dead_code_fraction/layer0": 0.16385,
      "epoch": 0.45,
      "input_norm": 31.99831516901653,
      "input_norm/layer0": 31.99831516901653,
      "learning_rate": 0.0005,
      "loss": 2.215,
      "max_norm": 62.486793518066406,
      "max_norm/layer0": 62.486793518066406,
      "mean_norm": 41.221702575683594,
      "mean_norm/layer0": 41.221702575683594,
      "multicode_k": 1,
      "output_norm": 18.167670075098677,
      "output_norm/layer0": 18.167670075098677,
      "step": 4450
    },
    {
      "MSE": 640.1416244506836,
      "MSE/layer0": 640.1416244506836,
      "dead_code_fraction": 0.16675,
      "dead_code_fraction/layer0": 0.16675,
      "epoch": 0.45,
      "input_norm": 31.998327512741074,
      "input_norm/layer0": 31.998327512741074,
      "learning_rate": 0.0005,
      "loss": 2.2576,
      "max_norm": 62.67790222167969,
      "max_norm/layer0": 62.67790222167969,
      "mean_norm": 41.275705337524414,
      "mean_norm/layer0": 41.275705337524414,
      "multicode_k": 1,
      "output_norm": 18.162402251561495,
      "output_norm/layer0": 18.162402251561495,
      "step": 4500
    },
    {
      "epoch": 0.45,
      "eval_MSE/layer0": 639.7464034476376,
      "eval_accuracy": 0.49916912103175737,
      "eval_dead_code_fraction/layer0": 0.16755,
      "eval_input_norm/layer0": 31.998309449821527,
      "eval_loss": 2.215489387512207,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 18.191884751910905,
      "eval_runtime": 157.9108,
      "eval_samples_per_second": 29.276,
      "eval_steps_per_second": 1.83,
      "step": 4500
    },
    {
      "MSE": 640.4858755493162,
      "MSE/layer0": 640.4858755493162,
      "dead_code_fraction": 0.1633,
      "dead_code_fraction/layer0": 0.1633,
      "epoch": 0.46,
      "input_norm": 31.99831475257874,
      "input_norm/layer0": 31.99831475257874,
      "learning_rate": 0.0005,
      "loss": 2.1869,
      "max_norm": 62.88029861450195,
      "max_norm/layer0": 62.88029861450195,
      "mean_norm": 41.32845115661621,
      "mean_norm/layer0": 41.32845115661621,
      "multicode_k": 1,
      "output_norm": 18.18791744550069,
      "output_norm/layer0": 18.18791744550069,
      "step": 4550
    },
    {
      "MSE": 640.7411174519859,
      "MSE/layer0": 640.7411174519859,
      "dead_code_fraction": 0.16375,
      "dead_code_fraction/layer0": 0.16375,
      "epoch": 0.46,
      "input_norm": 31.998337395985924,
      "input_norm/layer0": 31.998337395985924,
      "learning_rate": 0.0005,
      "loss": 2.2426,
      "max_norm": 63.06687545776367,
      "max_norm/layer0": 63.06687545776367,
      "mean_norm": 41.38063049316406,
      "mean_norm/layer0": 41.38063049316406,
      "multicode_k": 1,
      "output_norm": 18.185693721771244,
      "output_norm/layer0": 18.185693721771244,
      "step": 4600
    },
    {
      "MSE": 640.3254055786131,
      "MSE/layer0": 640.3254055786131,
      "dead_code_fraction": 0.1637,
      "dead_code_fraction/layer0": 0.1637,
      "epoch": 0.47,
      "input_norm": 31.998331034978236,
      "input_norm/layer0": 31.998331034978236,
      "learning_rate": 0.0005,
      "loss": 2.2103,
      "max_norm": 63.24494171142578,
      "max_norm/layer0": 63.24494171142578,
      "mean_norm": 41.4316463470459,
      "mean_norm/layer0": 41.4316463470459,
      "multicode_k": 1,
      "output_norm": 18.215761318206788,
      "output_norm/layer0": 18.215761318206788,
      "step": 4650
    },
    {
      "MSE": 640.0117889404299,
      "MSE/layer0": 640.0117889404299,
      "dead_code_fraction": 0.1653,
      "dead_code_fraction/layer0": 0.1653,
      "epoch": 0.47,
      "input_norm": 31.998331683476753,
      "input_norm/layer0": 31.998331683476753,
      "learning_rate": 0.0005,
      "loss": 2.189,
      "max_norm": 63.429969787597656,
      "max_norm/layer0": 63.429969787597656,
      "mean_norm": 41.481590270996094,
      "mean_norm/layer0": 41.481590270996094,
      "multicode_k": 1,
      "output_norm": 18.22781534512837,
      "output_norm/layer0": 18.22781534512837,
      "step": 4700
    },
    {
      "MSE": 640.034366455078,
      "MSE/layer0": 640.034366455078,
      "dead_code_fraction": 0.16355,
      "dead_code_fraction/layer0": 0.16355,
      "epoch": 0.47,
      "input_norm": 31.998335037231442,
      "input_norm/layer0": 31.998335037231442,
      "learning_rate": 0.0005,
      "loss": 2.1746,
      "max_norm": 63.604644775390625,
      "max_norm/layer0": 63.604644775390625,
      "mean_norm": 41.530447006225586,
      "mean_norm/layer0": 41.530447006225586,
      "multicode_k": 1,
      "output_norm": 18.247568238576257,
      "output_norm/layer0": 18.247568238576257,
      "step": 4750
    },
    {
      "MSE": 641.3402144411094,
      "MSE/layer0": 641.3402144411094,
      "dead_code_fraction": 0.16465,
      "dead_code_fraction/layer0": 0.16465,
      "epoch": 1.0,
      "input_norm": 31.998328861016873,
      "input_norm/layer0": 31.998328861016873,
      "learning_rate": 0.0005,
      "loss": 2.1589,
      "max_norm": 63.7794303894043,
      "max_norm/layer0": 63.7794303894043,
      "mean_norm": 41.577613830566406,
      "mean_norm/layer0": 41.577613830566406,
      "multicode_k": 1,
      "output_norm": 18.227145007068557,
      "output_norm/layer0": 18.227145007068557,
      "step": 4800
    },
    {
      "MSE": 640.0454110717772,
      "MSE/layer0": 640.0454110717772,
      "dead_code_fraction": 0.16635,
      "dead_code_fraction/layer0": 0.16635,
      "epoch": 1.01,
      "input_norm": 31.998361120224008,
      "input_norm/layer0": 31.998361120224008,
      "learning_rate": 0.0005,
      "loss": 2.2585,
      "max_norm": 63.96126937866211,
      "max_norm/layer0": 63.96126937866211,
      "mean_norm": 41.62501525878906,
      "mean_norm/layer0": 41.62501525878906,
      "multicode_k": 1,
      "output_norm": 18.258941303888953,
      "output_norm/layer0": 18.258941303888953,
      "step": 4850
    },
    {
      "MSE": 640.0055624389651,
      "MSE/layer0": 640.0055624389651,
      "dead_code_fraction": 0.16515,
      "dead_code_fraction/layer0": 0.16515,
      "epoch": 1.01,
      "input_norm": 31.998340495427446,
      "input_norm/layer0": 31.998340495427446,
      "learning_rate": 0.0005,
      "loss": 2.1578,
      "max_norm": 64.13137817382812,
      "max_norm/layer0": 64.13137817382812,
      "mean_norm": 41.672542572021484,
      "mean_norm/layer0": 41.672542572021484,
      "multicode_k": 1,
      "output_norm": 18.272732003529867,
      "output_norm/layer0": 18.272732003529867,
      "step": 4900
    },
    {
      "MSE": 640.108183898926,
      "MSE/layer0": 640.108183898926,
      "dead_code_fraction": 0.1668,
      "dead_code_fraction/layer0": 0.1668,
      "epoch": 1.02,
      "input_norm": 31.998351519902535,
      "input_norm/layer0": 31.998351519902535,
      "learning_rate": 0.0005,
      "loss": 2.1809,
      "max_norm": 64.30120086669922,
      "max_norm/layer0": 64.30120086669922,
      "mean_norm": 41.71914291381836,
      "mean_norm/layer0": 41.71914291381836,
      "multicode_k": 1,
      "output_norm": 18.278290322621658,
      "output_norm/layer0": 18.278290322621658,
      "step": 4950
    },
    {
      "MSE": 639.8438139851887,
      "MSE/layer0": 639.8438139851887,
      "dead_code_fraction": 0.1671,
      "dead_code_fraction/layer0": 0.1671,
      "epoch": 1.02,
      "input_norm": 31.998358796437586,
      "input_norm/layer0": 31.998358796437586,
      "learning_rate": 0.0005,
      "loss": 2.1901,
      "max_norm": 64.4720230102539,
      "max_norm/layer0": 64.4720230102539,
      "mean_norm": 41.76571464538574,
      "mean_norm/layer0": 41.76571464538574,
      "multicode_k": 1,
      "output_norm": 18.29636260350546,
      "output_norm/layer0": 18.29636260350546,
      "step": 5000
    },
    {
      "epoch": 1.02,
      "eval_MSE/layer0": 638.1766108092672,
      "eval_accuracy": 0.5013711247409516,
      "eval_dead_code_fraction/layer0": 0.16955,
      "eval_input_norm/layer0": 31.99836045128427,
      "eval_loss": 2.202561616897583,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 18.311866774487846,
      "eval_runtime": 158.3836,
      "eval_samples_per_second": 29.189,
      "eval_steps_per_second": 1.825,
      "step": 5000
    },
    {
      "MSE": 639.5863418579103,
      "MSE/layer0": 639.5863418579103,
      "dead_code_fraction": 0.1675,
      "dead_code_fraction/layer0": 0.1675,
      "epoch": 1.03,
      "input_norm": 31.99836014429728,
      "input_norm/layer0": 31.99836014429728,
      "learning_rate": 0.0005,
      "loss": 2.1914,
      "max_norm": 64.65907287597656,
      "max_norm/layer0": 64.65907287597656,
      "mean_norm": 41.8120174407959,
      "mean_norm/layer0": 41.8120174407959,
      "multicode_k": 1,
      "output_norm": 18.301887426376346,
      "output_norm/layer0": 18.301887426376346,
      "step": 5050
    },
    {
      "MSE": 639.5830181884764,
      "MSE/layer0": 639.5830181884764,
      "dead_code_fraction": 0.16545,
      "dead_code_fraction/layer0": 0.16545,
      "epoch": 1.03,
      "input_norm": 31.998363596598292,
      "input_norm/layer0": 31.998363596598292,
      "learning_rate": 0.0005,
      "loss": 2.1503,
      "max_norm": 64.83207702636719,
      "max_norm/layer0": 64.83207702636719,
      "mean_norm": 41.85700988769531,
      "mean_norm/layer0": 41.85700988769531,
      "multicode_k": 1,
      "output_norm": 18.3204355875651,
      "output_norm/layer0": 18.3204355875651,
      "step": 5100
    },
    {
      "MSE": 640.3749603271485,
      "MSE/layer0": 640.3749603271485,
      "dead_code_fraction": 0.16725,
      "dead_code_fraction/layer0": 0.16725,
      "epoch": 1.04,
      "input_norm": 31.9983703358968,
      "input_norm/layer0": 31.9983703358968,
      "learning_rate": 0.0005,
      "loss": 2.1634,
      "max_norm": 65.003662109375,
      "max_norm/layer0": 65.003662109375,
      "mean_norm": 41.90180778503418,
      "mean_norm/layer0": 41.90180778503418,
      "multicode_k": 1,
      "output_norm": 18.316434319814057,
      "output_norm/layer0": 18.316434319814057,
      "step": 5150
    },
    {
      "MSE": 639.0211893717446,
      "MSE/layer0": 639.0211893717446,
      "dead_code_fraction": 0.16875,
      "dead_code_fraction/layer0": 0.16875,
      "epoch": 1.04,
      "input_norm": 31.998389561971024,
      "input_norm/layer0": 31.998389561971024,
      "learning_rate": 0.0005,
      "loss": 2.224,
      "max_norm": 65.19213104248047,
      "max_norm/layer0": 65.19213104248047,
      "mean_norm": 41.94645309448242,
      "mean_norm/layer0": 41.94645309448242,
      "multicode_k": 1,
      "output_norm": 18.33804360071819,
      "output_norm/layer0": 18.33804360071819,
      "step": 5200
    },
    {
      "MSE": 638.6207899983721,
      "MSE/layer0": 638.6207899983721,
      "dead_code_fraction": 0.17055,
      "dead_code_fraction/layer0": 0.17055,
      "epoch": 1.05,
      "input_norm": 31.998394203186038,
      "input_norm/layer0": 31.998394203186038,
      "learning_rate": 0.0005,
      "loss": 2.2235,
      "max_norm": 65.36846160888672,
      "max_norm/layer0": 65.36846160888672,
      "mean_norm": 41.991315841674805,
      "mean_norm/layer0": 41.991315841674805,
      "multicode_k": 1,
      "output_norm": 18.346421286265045,
      "output_norm/layer0": 18.346421286265045,
      "step": 5250
    },
    {
      "MSE": 638.3484961954751,
      "MSE/layer0": 638.3484961954751,
      "dead_code_fraction": 0.1704,
      "dead_code_fraction/layer0": 0.1704,
      "epoch": 1.05,
      "input_norm": 31.998402004241942,
      "input_norm/layer0": 31.998402004241942,
      "learning_rate": 0.0005,
      "loss": 2.209,
      "max_norm": 65.53041076660156,
      "max_norm/layer0": 65.53041076660156,
      "mean_norm": 42.0357780456543,
      "mean_norm/layer0": 42.0357780456543,
      "multicode_k": 1,
      "output_norm": 18.351918992996215,
      "output_norm/layer0": 18.351918992996215,
      "step": 5300
    },
    {
      "MSE": 638.9349023437496,
      "MSE/layer0": 638.9349023437496,
      "dead_code_fraction": 0.1671,
      "dead_code_fraction/layer0": 0.1671,
      "epoch": 1.06,
      "input_norm": 31.998392171859756,
      "input_norm/layer0": 31.998392171859756,
      "learning_rate": 0.0005,
      "loss": 2.1737,
      "max_norm": 65.69444274902344,
      "max_norm/layer0": 65.69444274902344,
      "mean_norm": 42.078935623168945,
      "mean_norm/layer0": 42.078935623168945,
      "multicode_k": 1,
      "output_norm": 18.365610707600908,
      "output_norm/layer0": 18.365610707600908,
      "step": 5350
    },
    {
      "MSE": 638.1850768025716,
      "MSE/layer0": 638.1850768025716,
      "dead_code_fraction": 0.17125,
      "dead_code_fraction/layer0": 0.17125,
      "epoch": 1.06,
      "input_norm": 31.99840373039246,
      "input_norm/layer0": 31.99840373039246,
      "learning_rate": 0.0005,
      "loss": 2.1904,
      "max_norm": 65.84613037109375,
      "max_norm/layer0": 65.84613037109375,
      "mean_norm": 42.122589111328125,
      "mean_norm/layer0": 42.122589111328125,
      "multicode_k": 1,
      "output_norm": 18.371175734202062,
      "output_norm/layer0": 18.371175734202062,
      "step": 5400
    },
    {
      "MSE": 637.5771400960282,
      "MSE/layer0": 637.5771400960282,
      "dead_code_fraction": 0.17005,
      "dead_code_fraction/layer0": 0.17005,
      "epoch": 1.07,
      "input_norm": 31.998408838907892,
      "input_norm/layer0": 31.998408838907892,
      "learning_rate": 0.0005,
      "loss": 2.2013,
      "max_norm": 66.00259399414062,
      "max_norm/layer0": 66.00259399414062,
      "mean_norm": 42.16551399230957,
      "mean_norm/layer0": 42.16551399230957,
      "multicode_k": 1,
      "output_norm": 18.396056934992465,
      "output_norm/layer0": 18.396056934992465,
      "step": 5450
    },
    {
      "MSE": 637.4973764038084,
      "MSE/layer0": 637.4973764038084,
      "dead_code_fraction": 0.17135,
      "dead_code_fraction/layer0": 0.17135,
      "epoch": 1.07,
      "input_norm": 31.998402996063238,
      "input_norm/layer0": 31.998402996063238,
      "learning_rate": 0.0005,
      "loss": 2.1686,
      "max_norm": 66.15951538085938,
      "max_norm/layer0": 66.15951538085938,
      "mean_norm": 42.207963943481445,
      "mean_norm/layer0": 42.207963943481445,
      "multicode_k": 1,
      "output_norm": 18.402882191340133,
      "output_norm/layer0": 18.402882191340133,
      "step": 5500
    },
    {
      "epoch": 1.07,
      "eval_MSE/layer0": 638.6084431543663,
      "eval_accuracy": 0.5026125270625071,
      "eval_dead_code_fraction/layer0": 0.17165,
      "eval_input_norm/layer0": 31.99841410479916,
      "eval_loss": 2.1934523582458496,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 18.401259186926417,
      "eval_runtime": 158.4926,
      "eval_samples_per_second": 29.169,
      "eval_steps_per_second": 1.823,
      "step": 5500
    },
    {
      "MSE": 637.3816906738282,
      "MSE/layer0": 637.3816906738282,
      "dead_code_fraction": 0.17125,
      "dead_code_fraction/layer0": 0.17125,
      "epoch": 1.08,
      "input_norm": 31.998415158589676,
      "input_norm/layer0": 31.998415158589676,
      "learning_rate": 0.0005,
      "loss": 2.2097,
      "max_norm": 66.32366180419922,
      "max_norm/layer0": 66.32366180419922,
      "mean_norm": 42.25027084350586,
      "mean_norm/layer0": 42.25027084350586,
      "multicode_k": 1,
      "output_norm": 18.40568763732911,
      "output_norm/layer0": 18.40568763732911,
      "step": 5550
    },
    {
      "MSE": 636.5928268432615,
      "MSE/layer0": 636.5928268432615,
      "dead_code_fraction": 0.1711,
      "dead_code_fraction/layer0": 0.1711,
      "epoch": 1.08,
      "input_norm": 31.99841807047526,
      "input_norm/layer0": 31.99841807047526,
      "learning_rate": 0.0005,
      "loss": 2.1987,
      "max_norm": 66.49840545654297,
      "max_norm/layer0": 66.49840545654297,
      "mean_norm": 42.29284858703613,
      "mean_norm/layer0": 42.29284858703613,
      "multicode_k": 1,
      "output_norm": 18.424939454396565,
      "output_norm/layer0": 18.424939454396565,
      "step": 5600
    },
    {
      "MSE": 637.195534973145,
      "MSE/layer0": 637.195534973145,
      "dead_code_fraction": 0.17175,
      "dead_code_fraction/layer0": 0.17175,
      "epoch": 1.09,
      "input_norm": 31.99841377894082,
      "input_norm/layer0": 31.99841377894082,
      "learning_rate": 0.0005,
      "loss": 2.1571,
      "max_norm": 66.6655502319336,
      "max_norm/layer0": 66.6655502319336,
      "mean_norm": 42.33401679992676,
      "mean_norm/layer0": 42.33401679992676,
      "multicode_k": 1,
      "output_norm": 18.427337226867675,
      "output_norm/layer0": 18.427337226867675,
      "step": 5650
    },
    {
      "MSE": 635.8865025838217,
      "MSE/layer0": 635.8865025838217,
      "dead_code_fraction": 0.1736,
      "dead_code_fraction/layer0": 0.1736,
      "epoch": 1.09,
      "input_norm": 31.998435058593753,
      "input_norm/layer0": 31.998435058593753,
      "learning_rate": 0.0005,
      "loss": 2.2146,
      "max_norm": 66.82868957519531,
      "max_norm/layer0": 66.82868957519531,
      "mean_norm": 42.37582206726074,
      "mean_norm/layer0": 42.37582206726074,
      "multicode_k": 1,
      "output_norm": 18.443573204676298,
      "output_norm/layer0": 18.443573204676298,
      "step": 5700
    },
    {
      "MSE": 636.1581252034503,
      "MSE/layer0": 636.1581252034503,
      "dead_code_fraction": 0.17225,
      "dead_code_fraction/layer0": 0.17225,
      "epoch": 1.1,
      "input_norm": 31.998433354695635,
      "input_norm/layer0": 31.998433354695635,
      "learning_rate": 0.0005,
      "loss": 2.171,
      "max_norm": 66.9796371459961,
      "max_norm/layer0": 66.9796371459961,
      "mean_norm": 42.41728591918945,
      "mean_norm/layer0": 42.41728591918945,
      "multicode_k": 1,
      "output_norm": 18.440257479349775,
      "output_norm/layer0": 18.440257479349775,
      "step": 5750
    },
    {
      "MSE": 636.7286339314779,
      "MSE/layer0": 636.7286339314779,
      "dead_code_fraction": 0.1738,
      "dead_code_fraction/layer0": 0.1738,
      "epoch": 1.1,
      "input_norm": 31.998429416020713,
      "input_norm/layer0": 31.998429416020713,
      "learning_rate": 0.0005,
      "loss": 2.1502,
      "max_norm": 67.13478088378906,
      "max_norm/layer0": 67.13478088378906,
      "mean_norm": 42.45817756652832,
      "mean_norm/layer0": 42.45817756652832,
      "multicode_k": 1,
      "output_norm": 18.442232058842986,
      "output_norm/layer0": 18.442232058842986,
      "step": 5800
    },
    {
      "MSE": 635.2576449584958,
      "MSE/layer0": 635.2576449584958,
      "dead_code_fraction": 0.17405,
      "dead_code_fraction/layer0": 0.17405,
      "epoch": 1.11,
      "input_norm": 31.99844219843547,
      "input_norm/layer0": 31.99844219843547,
      "learning_rate": 0.0005,
      "loss": 2.2067,
      "max_norm": 67.28919982910156,
      "max_norm/layer0": 67.28919982910156,
      "mean_norm": 42.49948501586914,
      "mean_norm/layer0": 42.49948501586914,
      "multicode_k": 1,
      "output_norm": 18.46717386881511,
      "output_norm/layer0": 18.46717386881511,
      "step": 5850
    },
    {
      "MSE": 636.0759664916989,
      "MSE/layer0": 636.0759664916989,
      "dead_code_fraction": 0.17355,
      "dead_code_fraction/layer0": 0.17355,
      "epoch": 1.11,
      "input_norm": 31.998439470926915,
      "input_norm/layer0": 31.998439470926915,
      "learning_rate": 0.0005,
      "loss": 2.1543,
      "max_norm": 67.44383239746094,
      "max_norm/layer0": 67.44383239746094,
      "mean_norm": 42.53946495056152,
      "mean_norm/layer0": 42.53946495056152,
      "multicode_k": 1,
      "output_norm": 18.469777971903483,
      "output_norm/layer0": 18.469777971903483,
      "step": 5900
    },
    {
      "MSE": 635.3813305664057,
      "MSE/layer0": 635.3813305664057,
      "dead_code_fraction": 0.17405,
      "dead_code_fraction/layer0": 0.17405,
      "epoch": 1.12,
      "input_norm": 31.99844372113545,
      "input_norm/layer0": 31.99844372113545,
      "learning_rate": 0.0005,
      "loss": 2.1846,
      "max_norm": 67.59025573730469,
      "max_norm/layer0": 67.59025573730469,
      "mean_norm": 42.58071327209473,
      "mean_norm/layer0": 42.58071327209473,
      "multicode_k": 1,
      "output_norm": 18.477715517679847,
      "output_norm/layer0": 18.477715517679847,
      "step": 5950
    },
    {
      "MSE": 634.5524212646484,
      "MSE/layer0": 634.5524212646484,
      "dead_code_fraction": 0.17535,
      "dead_code_fraction/layer0": 0.17535,
      "epoch": 1.12,
      "input_norm": 31.998457225163776,
      "input_norm/layer0": 31.998457225163776,
      "learning_rate": 0.0005,
      "loss": 2.2158,
      "max_norm": 67.7379379272461,
      "max_norm/layer0": 67.7379379272461,
      "mean_norm": 42.62178421020508,
      "mean_norm/layer0": 42.62178421020508,
      "multicode_k": 1,
      "output_norm": 18.489366165796913,
      "output_norm/layer0": 18.489366165796913,
      "step": 6000
    },
    {
      "epoch": 1.12,
      "eval_MSE/layer0": 632.9325560995336,
      "eval_accuracy": 0.5036799089257694,
      "eval_dead_code_fraction/layer0": 0.17795,
      "eval_input_norm/layer0": 31.998461353451354,
      "eval_loss": 2.1832942962646484,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 18.51493810096293,
      "eval_runtime": 158.8489,
      "eval_samples_per_second": 29.103,
      "eval_steps_per_second": 1.819,
      "step": 6000
    },
    {
      "MSE": 634.7784757486979,
      "MSE/layer0": 634.7784757486979,
      "dead_code_fraction": 0.1755,
      "dead_code_fraction/layer0": 0.1755,
      "epoch": 1.13,
      "input_norm": 31.99845712025961,
      "input_norm/layer0": 31.99845712025961,
      "learning_rate": 0.0005,
      "loss": 2.1789,
      "max_norm": 67.8902816772461,
      "max_norm/layer0": 67.8902816772461,
      "mean_norm": 42.66269874572754,
      "mean_norm/layer0": 42.66269874572754,
      "multicode_k": 1,
      "output_norm": 18.49625307718913,
      "output_norm/layer0": 18.49625307718913,
      "step": 6050
    },
    {
      "MSE": 634.5078458658851,
      "MSE/layer0": 634.5078458658851,
      "dead_code_fraction": 0.17445,
      "dead_code_fraction/layer0": 0.17445,
      "epoch": 1.13,
      "input_norm": 31.99845917383831,
      "input_norm/layer0": 31.99845917383831,
      "learning_rate": 0.0005,
      "loss": 2.2009,
      "max_norm": 68.04124450683594,
      "max_norm/layer0": 68.04124450683594,
      "mean_norm": 42.70250701904297,
      "mean_norm/layer0": 42.70250701904297,
      "multicode_k": 1,
      "output_norm": 18.514623686472582,
      "output_norm/layer0": 18.514623686472582,
      "step": 6100
    },
    {
      "MSE": 634.443066914876,
      "MSE/layer0": 634.443066914876,
      "dead_code_fraction": 0.17575,
      "dead_code_fraction/layer0": 0.17575,
      "epoch": 1.14,
      "input_norm": 31.99845913887024,
      "input_norm/layer0": 31.99845913887024,
      "learning_rate": 0.0005,
      "loss": 2.1623,
      "max_norm": 68.17865753173828,
      "max_norm/layer0": 68.17865753173828,
      "mean_norm": 42.742488861083984,
      "mean_norm/layer0": 42.742488861083984,
      "multicode_k": 1,
      "output_norm": 18.513023862838743,
      "output_norm/layer0": 18.513023862838743,
      "step": 6150
    },
    {
      "MSE": 633.6522382609048,
      "MSE/layer0": 633.6522382609048,
      "dead_code_fraction": 0.17475,
      "dead_code_fraction/layer0": 0.17475,
      "epoch": 1.14,
      "input_norm": 31.998471844991045,
      "input_norm/layer0": 31.998471844991045,
      "learning_rate": 0.0005,
      "loss": 2.1824,
      "max_norm": 68.31253051757812,
      "max_norm/layer0": 68.31253051757812,
      "mean_norm": 42.782148361206055,
      "mean_norm/layer0": 42.782148361206055,
      "multicode_k": 1,
      "output_norm": 18.529316590627033,
      "output_norm/layer0": 18.529316590627033,
      "step": 6200
    },
    {
      "MSE": 634.0474910481774,
      "MSE/layer0": 634.0474910481774,
      "dead_code_fraction": 0.1771,
      "dead_code_fraction/layer0": 0.1771,
      "epoch": 1.15,
      "input_norm": 31.998480736414585,
      "input_norm/layer0": 31.998480736414585,
      "learning_rate": 0.0005,
      "loss": 2.1948,
      "max_norm": 68.44271850585938,
      "max_norm/layer0": 68.44271850585938,
      "mean_norm": 42.82079887390137,
      "mean_norm/layer0": 42.82079887390137,
      "multicode_k": 1,
      "output_norm": 18.524528849919633,
      "output_norm/layer0": 18.524528849919633,
      "step": 6250
    },
    {
      "MSE": 633.648407084147,
      "MSE/layer0": 633.648407084147,
      "dead_code_fraction": 0.1745,
      "dead_code_fraction/layer0": 0.1745,
      "epoch": 1.15,
      "input_norm": 31.998468182881673,
      "input_norm/layer0": 31.998468182881673,
      "learning_rate": 0.0005,
      "loss": 2.1145,
      "max_norm": 68.57721710205078,
      "max_norm/layer0": 68.57721710205078,
      "mean_norm": 42.859825134277344,
      "mean_norm/layer0": 42.859825134277344,
      "multicode_k": 1,
      "output_norm": 18.540853935877482,
      "output_norm/layer0": 18.540853935877482,
      "step": 6300
    },
    {
      "MSE": 633.5945191446937,
      "MSE/layer0": 633.5945191446937,
      "dead_code_fraction": 0.17705,
      "dead_code_fraction/layer0": 0.17705,
      "epoch": 1.16,
      "input_norm": 31.99847273508707,
      "input_norm/layer0": 31.99847273508707,
      "learning_rate": 0.0005,
      "loss": 2.1507,
      "max_norm": 68.7186050415039,
      "max_norm/layer0": 68.7186050415039,
      "mean_norm": 42.897830963134766,
      "mean_norm/layer0": 42.897830963134766,
      "multicode_k": 1,
      "output_norm": 18.55124579429626,
      "output_norm/layer0": 18.55124579429626,
      "step": 6350
    },
    {
      "MSE": 632.1478841145836,
      "MSE/layer0": 632.1478841145836,
      "dead_code_fraction": 0.1775,
      "dead_code_fraction/layer0": 0.1775,
      "epoch": 1.16,
      "input_norm": 31.9984964243571,
      "input_norm/layer0": 31.9984964243571,
      "learning_rate": 0.0005,
      "loss": 2.1962,
      "max_norm": 68.85418701171875,
      "max_norm/layer0": 68.85418701171875,
      "mean_norm": 42.937448501586914,
      "mean_norm/layer0": 42.937448501586914,
      "multicode_k": 1,
      "output_norm": 18.5615934785207,
      "output_norm/layer0": 18.5615934785207,
      "step": 6400
    },
    {
      "MSE": 632.57952931722,
      "MSE/layer0": 632.57952931722,
      "dead_code_fraction": 0.1777,
      "dead_code_fraction/layer0": 0.1777,
      "epoch": 1.17,
      "input_norm": 31.998487294514977,
      "input_norm/layer0": 31.998487294514977,
      "learning_rate": 0.0005,
      "loss": 2.1627,
      "max_norm": 69.0008316040039,
      "max_norm/layer0": 69.0008316040039,
      "mean_norm": 42.97622108459473,
      "mean_norm/layer0": 42.97622108459473,
      "multicode_k": 1,
      "output_norm": 18.57248200734457,
      "output_norm/layer0": 18.57248200734457,
      "step": 6450
    },
    {
      "MSE": 631.0360174560547,
      "MSE/layer0": 631.0360174560547,
      "dead_code_fraction": 0.1784,
      "dead_code_fraction/layer0": 0.1784,
      "epoch": 1.17,
      "input_norm": 31.998495709101356,
      "input_norm/layer0": 31.998495709101356,
      "learning_rate": 0.0005,
      "loss": 2.1843,
      "max_norm": 69.13652038574219,
      "max_norm/layer0": 69.13652038574219,
      "mean_norm": 43.01558876037598,
      "mean_norm/layer0": 43.01558876037598,
      "multicode_k": 1,
      "output_norm": 18.591586551666268,
      "output_norm/layer0": 18.591586551666268,
      "step": 6500
    },
    {
      "epoch": 1.17,
      "eval_MSE/layer0": 631.2925020152297,
      "eval_accuracy": 0.5039093283634951,
      "eval_dead_code_fraction/layer0": 0.1797,
      "eval_input_norm/layer0": 31.99848882414009,
      "eval_loss": 2.175981044769287,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 18.598594732777567,
      "eval_runtime": 158.1453,
      "eval_samples_per_second": 29.233,
      "eval_steps_per_second": 1.827,
      "step": 6500
    },
    {
      "MSE": 631.294188741048,
      "MSE/layer0": 631.294188741048,
      "dead_code_fraction": 0.1796,
      "dead_code_fraction/layer0": 0.1796,
      "epoch": 1.18,
      "input_norm": 31.998505541483564,
      "input_norm/layer0": 31.998505541483564,
      "learning_rate": 0.0005,
      "loss": 2.1855,
      "max_norm": 69.26646423339844,
      "max_norm/layer0": 69.26646423339844,
      "mean_norm": 43.0548152923584,
      "mean_norm/layer0": 43.0548152923584,
      "multicode_k": 1,
      "output_norm": 18.585241152445477,
      "output_norm/layer0": 18.585241152445477,
      "step": 6550
    },
    {
      "MSE": 631.297376505534,
      "MSE/layer0": 631.297376505534,
      "dead_code_fraction": 0.1779,
      "dead_code_fraction/layer0": 0.1779,
      "epoch": 1.18,
      "input_norm": 31.998487745920816,
      "input_norm/layer0": 31.998487745920816,
      "learning_rate": 0.0005,
      "loss": 2.1197,
      "max_norm": 69.3987808227539,
      "max_norm/layer0": 69.3987808227539,
      "mean_norm": 43.093589782714844,
      "mean_norm/layer0": 43.093589782714844,
      "multicode_k": 1,
      "output_norm": 18.605287278493257,
      "output_norm/layer0": 18.605287278493257,
      "step": 6600
    },
    {
      "MSE": 630.8991915893555,
      "MSE/layer0": 630.8991915893555,
      "dead_code_fraction": 0.17815,
      "dead_code_fraction/layer0": 0.17815,
      "epoch": 1.19,
      "input_norm": 31.99848988215129,
      "input_norm/layer0": 31.99848988215129,
      "learning_rate": 0.0005,
      "loss": 2.1248,
      "max_norm": 69.52507019042969,
      "max_norm/layer0": 69.52507019042969,
      "mean_norm": 43.132524490356445,
      "mean_norm/layer0": 43.132524490356445,
      "multicode_k": 1,
      "output_norm": 18.61235850652059,
      "output_norm/layer0": 18.61235850652059,
      "step": 6650
    },
    {
      "MSE": 629.604686584473,
      "MSE/layer0": 629.604686584473,
      "dead_code_fraction": 0.17965,
      "dead_code_fraction/layer0": 0.17965,
      "epoch": 1.19,
      "input_norm": 31.99852681477865,
      "input_norm/layer0": 31.99852681477865,
      "learning_rate": 0.0005,
      "loss": 2.2265,
      "max_norm": 69.66030883789062,
      "max_norm/layer0": 69.66030883789062,
      "mean_norm": 43.17206573486328,
      "mean_norm/layer0": 43.17206573486328,
      "multicode_k": 1,
      "output_norm": 18.626948499679564,
      "output_norm/layer0": 18.626948499679564,
      "step": 6700
    },
    {
      "MSE": 629.7875715128578,
      "MSE/layer0": 629.7875715128578,
      "dead_code_fraction": 0.1802,
      "dead_code_fraction/layer0": 0.1802,
      "epoch": 1.2,
      "input_norm": 31.998509550094596,
      "input_norm/layer0": 31.998509550094596,
      "learning_rate": 0.0005,
      "loss": 2.1432,
      "max_norm": 69.78119659423828,
      "max_norm/layer0": 69.78119659423828,
      "mean_norm": 43.21029472351074,
      "mean_norm/layer0": 43.21029472351074,
      "multicode_k": 1,
      "output_norm": 18.639319947560622,
      "output_norm/layer0": 18.639319947560622,
      "step": 6750
    },
    {
      "MSE": 629.3708419799802,
      "MSE/layer0": 629.3708419799802,
      "dead_code_fraction": 0.18015,
      "dead_code_fraction/layer0": 0.18015,
      "epoch": 1.2,
      "input_norm": 31.99851152102152,
      "input_norm/layer0": 31.99851152102152,
      "learning_rate": 0.0005,
      "loss": 2.1606,
      "max_norm": 69.91252899169922,
      "max_norm/layer0": 69.91252899169922,
      "mean_norm": 43.24948692321777,
      "mean_norm/layer0": 43.24948692321777,
      "multicode_k": 1,
      "output_norm": 18.64606482187906,
      "output_norm/layer0": 18.64606482187906,
      "step": 6800
    },
    {
      "MSE": 628.4038922119142,
      "MSE/layer0": 628.4038922119142,
      "dead_code_fraction": 0.1806,
      "dead_code_fraction/layer0": 0.1806,
      "epoch": 1.21,
      "input_norm": 31.998516721725462,
      "input_norm/layer0": 31.998516721725462,
      "learning_rate": 0.0005,
      "loss": 2.1582,
      "max_norm": 70.04332733154297,
      "max_norm/layer0": 70.04332733154297,
      "mean_norm": 43.28862762451172,
      "mean_norm/layer0": 43.28862762451172,
      "multicode_k": 1,
      "output_norm": 18.669758415222162,
      "output_norm/layer0": 18.669758415222162,
      "step": 6850
    },
    {
      "MSE": 628.1812467447919,
      "MSE/layer0": 628.1812467447919,
      "dead_code_fraction": 0.18055,
      "dead_code_fraction/layer0": 0.18055,
      "epoch": 1.21,
      "input_norm": 31.998515844345086,
      "input_norm/layer0": 31.998515844345086,
      "learning_rate": 0.0005,
      "loss": 2.1433,
      "max_norm": 70.16979217529297,
      "max_norm/layer0": 70.16979217529297,
      "mean_norm": 43.327192306518555,
      "mean_norm/layer0": 43.327192306518555,
      "multicode_k": 1,
      "output_norm": 18.674684073130294,
      "output_norm/layer0": 18.674684073130294,
      "step": 6900
    },
    {
      "MSE": 628.1862957763672,
      "MSE/layer0": 628.1862957763672,
      "dead_code_fraction": 0.18045,
      "dead_code_fraction/layer0": 0.18045,
      "epoch": 1.22,
      "input_norm": 31.99852259953816,
      "input_norm/layer0": 31.99852259953816,
      "learning_rate": 0.0005,
      "loss": 2.1458,
      "max_norm": 70.29747772216797,
      "max_norm/layer0": 70.29747772216797,
      "mean_norm": 43.36609077453613,
      "mean_norm/layer0": 43.36609077453613,
      "multicode_k": 1,
      "output_norm": 18.682749029795335,
      "output_norm/layer0": 18.682749029795335,
      "step": 6950
    },
    {
      "MSE": 627.7981392415361,
      "MSE/layer0": 627.7981392415361,
      "dead_code_fraction": 0.18045,
      "dead_code_fraction/layer0": 0.18045,
      "epoch": 1.22,
      "input_norm": 31.998523871103927,
      "input_norm/layer0": 31.998523871103927,
      "learning_rate": 0.0005,
      "loss": 2.1339,
      "max_norm": 70.425537109375,
      "max_norm/layer0": 70.425537109375,
      "mean_norm": 43.40445899963379,
      "mean_norm/layer0": 43.40445899963379,
      "multicode_k": 1,
      "output_norm": 18.696380834579458,
      "output_norm/layer0": 18.696380834579458,
      "step": 7000
    },
    {
      "epoch": 1.22,
      "eval_MSE/layer0": 627.9790743019787,
      "eval_accuracy": 0.5048263717749389,
      "eval_dead_code_fraction/layer0": 0.1819,
      "eval_input_norm/layer0": 31.998524618592334,
      "eval_loss": 2.1696202754974365,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 18.705300997223095,
      "eval_runtime": 159.1692,
      "eval_samples_per_second": 29.045,
      "eval_steps_per_second": 1.816,
      "step": 7000
    },
    {
      "MSE": 627.3165437825519,
      "MSE/layer0": 627.3165437825519,
      "dead_code_fraction": 0.1822,
      "dead_code_fraction/layer0": 0.1822,
      "epoch": 1.23,
      "input_norm": 31.99852600097656,
      "input_norm/layer0": 31.99852600097656,
      "learning_rate": 0.0005,
      "loss": 2.1483,
      "max_norm": 70.54450988769531,
      "max_norm/layer0": 70.54450988769531,
      "mean_norm": 43.442848205566406,
      "mean_norm/layer0": 43.442848205566406,
      "multicode_k": 1,
      "output_norm": 18.700957148869843,
      "output_norm/layer0": 18.700957148869843,
      "step": 7050
    },
    {
      "MSE": 626.7479965209961,
      "MSE/layer0": 626.7479965209961,
      "dead_code_fraction": 0.1804,
      "dead_code_fraction/layer0": 0.1804,
      "epoch": 1.23,
      "input_norm": 31.998541386922206,
      "input_norm/layer0": 31.998541386922206,
      "learning_rate": 0.0005,
      "loss": 2.1512,
      "max_norm": 70.66608428955078,
      "max_norm/layer0": 70.66608428955078,
      "mean_norm": 43.48159599304199,
      "mean_norm/layer0": 43.48159599304199,
      "multicode_k": 1,
      "output_norm": 18.714396947224948,
      "output_norm/layer0": 18.714396947224948,
      "step": 7100
    },
    {
      "MSE": 626.4450497436519,
      "MSE/layer0": 626.4450497436519,
      "dead_code_fraction": 0.1823,
      "dead_code_fraction/layer0": 0.1823,
      "epoch": 1.24,
      "input_norm": 31.998545411427806,
      "input_norm/layer0": 31.998545411427806,
      "learning_rate": 0.0005,
      "loss": 2.1586,
      "max_norm": 70.7937240600586,
      "max_norm/layer0": 70.7937240600586,
      "mean_norm": 43.5198860168457,
      "mean_norm/layer0": 43.5198860168457,
      "multicode_k": 1,
      "output_norm": 18.726943721771242,
      "output_norm/layer0": 18.726943721771242,
      "step": 7150
    },
    {
      "MSE": 626.1652618408202,
      "MSE/layer0": 626.1652618408202,
      "dead_code_fraction": 0.1814,
      "dead_code_fraction/layer0": 0.1814,
      "epoch": 1.24,
      "input_norm": 31.998541978200272,
      "input_norm/layer0": 31.998541978200272,
      "learning_rate": 0.0005,
      "loss": 2.1552,
      "max_norm": 70.90862274169922,
      "max_norm/layer0": 70.90862274169922,
      "mean_norm": 43.55833053588867,
      "mean_norm/layer0": 43.55833053588867,
      "multicode_k": 1,
      "output_norm": 18.731371542612706,
      "output_norm/layer0": 18.731371542612706,
      "step": 7200
    },
    {
      "MSE": 625.2572497558597,
      "MSE/layer0": 625.2572497558597,
      "dead_code_fraction": 0.1839,
      "dead_code_fraction/layer0": 0.1839,
      "epoch": 1.25,
      "input_norm": 31.998552770614626,
      "input_norm/layer0": 31.998552770614626,
      "learning_rate": 0.0005,
      "loss": 2.1673,
      "max_norm": 71.0332260131836,
      "max_norm/layer0": 71.0332260131836,
      "mean_norm": 43.5967960357666,
      "mean_norm/layer0": 43.5967960357666,
      "multicode_k": 1,
      "output_norm": 18.756609748204536,
      "output_norm/layer0": 18.756609748204536,
      "step": 7250
    },
    {
      "MSE": 624.7860372924804,
      "MSE/layer0": 624.7860372924804,
      "dead_code_fraction": 0.1831,
      "dead_code_fraction/layer0": 0.1831,
      "epoch": 1.25,
      "input_norm": 31.998555002212534,
      "input_norm/layer0": 31.998555002212534,
      "learning_rate": 0.0005,
      "loss": 2.1575,
      "max_norm": 71.15364837646484,
      "max_norm/layer0": 71.15364837646484,
      "mean_norm": 43.63525199890137,
      "mean_norm/layer0": 43.63525199890137,
      "multicode_k": 1,
      "output_norm": 18.767410192489628,
      "output_norm/layer0": 18.767410192489628,
      "step": 7300
    },
    {
      "MSE": 624.7060753377278,
      "MSE/layer0": 624.7060753377278,
      "dead_code_fraction": 0.18335,
      "dead_code_fraction/layer0": 0.18335,
      "epoch": 1.26,
      "input_norm": 31.99856230099995,
      "input_norm/layer0": 31.99856230099995,
      "learning_rate": 0.0005,
      "loss": 2.1622,
      "max_norm": 71.2812271118164,
      "max_norm/layer0": 71.2812271118164,
      "mean_norm": 43.67383575439453,
      "mean_norm/layer0": 43.67383575439453,
      "multicode_k": 1,
      "output_norm": 18.77556623776755,
      "output_norm/layer0": 18.77556623776755,
      "step": 7350
    },
    {
      "MSE": 623.9612900797528,
      "MSE/layer0": 623.9612900797528,
      "dead_code_fraction": 0.1834,
      "dead_code_fraction/layer0": 0.1834,
      "epoch": 1.26,
      "input_norm": 31.998564265569062,
      "input_norm/layer0": 31.998564265569062,
      "learning_rate": 0.0005,
      "loss": 2.1721,
      "max_norm": 71.4082260131836,
      "max_norm/layer0": 71.4082260131836,
      "mean_norm": 43.71280097961426,
      "mean_norm/layer0": 43.71280097961426,
      "multicode_k": 1,
      "output_norm": 18.78839166323344,
      "output_norm/layer0": 18.78839166323344,
      "step": 7400
    },
    {
      "MSE": 623.9870674641929,
      "MSE/layer0": 623.9870674641929,
      "dead_code_fraction": 0.18355,
      "dead_code_fraction/layer0": 0.18355,
      "epoch": 1.27,
      "input_norm": 31.998560991287228,
      "input_norm/layer0": 31.998560991287228,
      "learning_rate": 0.0005,
      "loss": 2.1424,
      "max_norm": 71.52973937988281,
      "max_norm/layer0": 71.52973937988281,
      "mean_norm": 43.75117111206055,
      "mean_norm/layer0": 43.75117111206055,
      "multicode_k": 1,
      "output_norm": 18.79942525227863,
      "output_norm/layer0": 18.79942525227863,
      "step": 7450
    },
    {
      "MSE": 622.7629538981118,
      "MSE/layer0": 622.7629538981118,
      "dead_code_fraction": 0.1844,
      "dead_code_fraction/layer0": 0.1844,
      "epoch": 1.27,
      "input_norm": 31.998580735524506,
      "input_norm/layer0": 31.998580735524506,
      "learning_rate": 0.0005,
      "loss": 2.187,
      "max_norm": 71.64968872070312,
      "max_norm/layer0": 71.64968872070312,
      "mean_norm": 43.790061950683594,
      "mean_norm/layer0": 43.790061950683594,
      "multicode_k": 1,
      "output_norm": 18.81509483655294,
      "output_norm/layer0": 18.81509483655294,
      "step": 7500
    },
    {
      "epoch": 1.27,
      "eval_MSE/layer0": 622.122652727573,
      "eval_accuracy": 0.5062701283839631,
      "eval_dead_code_fraction/layer0": 0.18665,
      "eval_input_norm/layer0": 31.998566619663464,
      "eval_loss": 2.1583967208862305,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 18.83381110374323,
      "eval_runtime": 158.6442,
      "eval_samples_per_second": 29.141,
      "eval_steps_per_second": 1.822,
      "step": 7500
    },
    {
      "MSE": 622.9042826334635,
      "MSE/layer0": 622.9042826334635,
      "dead_code_fraction": 0.1841,
      "dead_code_fraction/layer0": 0.1841,
      "epoch": 1.28,
      "input_norm": 31.998572101593023,
      "input_norm/layer0": 31.998572101593023,
      "learning_rate": 0.0005,
      "loss": 2.1434,
      "max_norm": 71.76019287109375,
      "max_norm/layer0": 71.76019287109375,
      "mean_norm": 43.828460693359375,
      "mean_norm/layer0": 43.828460693359375,
      "multicode_k": 1,
      "output_norm": 18.82229045232136,
      "output_norm/layer0": 18.82229045232136,
      "step": 7550
    },
    {
      "MSE": 621.695281575521,
      "MSE/layer0": 621.695281575521,
      "dead_code_fraction": 0.1854,
      "dead_code_fraction/layer0": 0.1854,
      "epoch": 1.28,
      "input_norm": 31.998584995269773,
      "input_norm/layer0": 31.998584995269773,
      "learning_rate": 0.0005,
      "loss": 2.1712,
      "max_norm": 71.87606048583984,
      "max_norm/layer0": 71.87606048583984,
      "mean_norm": 43.867136001586914,
      "mean_norm/layer0": 43.867136001586914,
      "multicode_k": 1,
      "output_norm": 18.84749958992006,
      "output_norm/layer0": 18.84749958992006,
      "step": 7600
    },
    {
      "MSE": 622.6274766031902,
      "MSE/layer0": 622.6274766031902,
      "dead_code_fraction": 0.18355,
      "dead_code_fraction/layer0": 0.18355,
      "epoch": 1.29,
      "input_norm": 31.998571812311802,
      "input_norm/layer0": 31.998571812311802,
      "learning_rate": 0.0005,
      "loss": 2.1412,
      "max_norm": 71.98139953613281,
      "max_norm/layer0": 71.98139953613281,
      "mean_norm": 43.90544891357422,
      "mean_norm/layer0": 43.90544891357422,
      "multicode_k": 1,
      "output_norm": 18.83851943016053,
      "output_norm/layer0": 18.83851943016053,
      "step": 7650
    },
    {
      "MSE": 621.3046355183919,
      "MSE/layer0": 621.3046355183919,
      "dead_code_fraction": 0.18495,
      "dead_code_fraction/layer0": 0.18495,
      "epoch": 1.29,
      "input_norm": 31.998585087458295,
      "input_norm/layer0": 31.998585087458295,
      "learning_rate": 0.0005,
      "loss": 2.1711,
      "max_norm": 72.08447265625,
      "max_norm/layer0": 72.08447265625,
      "mean_norm": 43.94407653808594,
      "mean_norm/layer0": 43.94407653808594,
      "multicode_k": 1,
      "output_norm": 18.86037411053976,
      "output_norm/layer0": 18.86037411053976,
      "step": 7700
    },
    {
      "MSE": 620.5873645019533,
      "MSE/layer0": 620.5873645019533,
      "dead_code_fraction": 0.18485,
      "dead_code_fraction/layer0": 0.18485,
      "epoch": 1.3,
      "input_norm": 31.998606751759848,
      "input_norm/layer0": 31.998606751759848,
      "learning_rate": 0.0005,
      "loss": 2.2069,
      "max_norm": 72.18034362792969,
      "max_norm/layer0": 72.18034362792969,
      "mean_norm": 43.9833927154541,
      "mean_norm/layer0": 43.9833927154541,
      "multicode_k": 1,
      "output_norm": 18.87507179578146,
      "output_norm/layer0": 18.87507179578146,
      "step": 7750
    },
    {
      "MSE": 621.2272378540041,
      "MSE/layer0": 621.2272378540041,
      "dead_code_fraction": 0.18385,
      "dead_code_fraction/layer0": 0.18385,
      "epoch": 1.3,
      "input_norm": 31.998583949406935,
      "input_norm/layer0": 31.998583949406935,
      "learning_rate": 0.0005,
      "loss": 2.1217,
      "max_norm": 72.27928924560547,
      "max_norm/layer0": 72.27928924560547,
      "mean_norm": 44.021806716918945,
      "mean_norm/layer0": 44.021806716918945,
      "multicode_k": 1,
      "output_norm": 18.877027104695642,
      "output_norm/layer0": 18.877027104695642,
      "step": 7800
    },
    {
      "MSE": 620.067134602865,
      "MSE/layer0": 620.067134602865,
      "dead_code_fraction": 0.18535,
      "dead_code_fraction/layer0": 0.18535,
      "epoch": 1.31,
      "input_norm": 31.998594888051343,
      "input_norm/layer0": 31.998594888051343,
      "learning_rate": 0.0005,
      "loss": 2.1753,
      "max_norm": 72.39033508300781,
      "max_norm/layer0": 72.39033508300781,
      "mean_norm": 44.060611724853516,
      "mean_norm/layer0": 44.060611724853516,
      "multicode_k": 1,
      "output_norm": 18.89820697466533,
      "output_norm/layer0": 18.89820697466533,
      "step": 7850
    },
    {
      "MSE": 620.6704218546549,
      "MSE/layer0": 620.6704218546549,
      "dead_code_fraction": 0.18735,
      "dead_code_fraction/layer0": 0.18735,
      "epoch": 1.31,
      "input_norm": 31.998597246805822,
      "input_norm/layer0": 31.998597246805822,
      "learning_rate": 0.0005,
      "loss": 2.1778,
      "max_norm": 72.4916000366211,
      "max_norm/layer0": 72.4916000366211,
      "mean_norm": 44.09913635253906,
      "mean_norm/layer0": 44.09913635253906,
      "multicode_k": 1,
      "output_norm": 18.890051161448145,
      "output_norm/layer0": 18.890051161448145,
      "step": 7900
    },
    {
      "MSE": 619.2155123901367,
      "MSE/layer0": 619.2155123901367,
      "dead_code_fraction": 0.1863,
      "dead_code_fraction/layer0": 0.1863,
      "epoch": 1.32,
      "input_norm": 31.99860541343688,
      "input_norm/layer0": 31.99860541343688,
      "learning_rate": 0.0005,
      "loss": 2.1684,
      "max_norm": 72.59037017822266,
      "max_norm/layer0": 72.59037017822266,
      "mean_norm": 44.13744926452637,
      "mean_norm/layer0": 44.13744926452637,
      "multicode_k": 1,
      "output_norm": 18.920912733078,
      "output_norm/layer0": 18.920912733078,
      "step": 7950
    },
    {
      "MSE": 618.8985408528646,
      "MSE/layer0": 618.8985408528646,
      "dead_code_fraction": 0.1867,
      "dead_code_fraction/layer0": 0.1867,
      "epoch": 1.32,
      "input_norm": 31.998596220016488,
      "input_norm/layer0": 31.998596220016488,
      "learning_rate": 0.0005,
      "loss": 2.1302,
      "max_norm": 72.69281768798828,
      "max_norm/layer0": 72.69281768798828,
      "mean_norm": 44.176042556762695,
      "mean_norm/layer0": 44.176042556762695,
      "multicode_k": 1,
      "output_norm": 18.93559975624085,
      "output_norm/layer0": 18.93559975624085,
      "step": 8000
    },
    {
      "epoch": 1.32,
      "eval_MSE/layer0": 617.7161538934592,
      "eval_accuracy": 0.5071360017457022,
      "eval_dead_code_fraction/layer0": 0.18755,
      "eval_input_norm/layer0": 31.99860155017712,
      "eval_loss": 2.150786876678467,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 18.949325338731256,
      "eval_runtime": 158.4669,
      "eval_samples_per_second": 29.173,
      "eval_steps_per_second": 1.824,
      "step": 8000
    },
    {
      "MSE": 619.1937561035155,
      "MSE/layer0": 619.1937561035155,
      "dead_code_fraction": 0.18685,
      "dead_code_fraction/layer0": 0.18685,
      "epoch": 1.33,
      "input_norm": 31.998596970240285,
      "input_norm/layer0": 31.998596970240285,
      "learning_rate": 0.0005,
      "loss": 2.1279,
      "max_norm": 72.79032135009766,
      "max_norm/layer0": 72.79032135009766,
      "mean_norm": 44.21445846557617,
      "mean_norm/layer0": 44.21445846557617,
      "multicode_k": 1,
      "output_norm": 18.93686810175578,
      "output_norm/layer0": 18.93686810175578,
      "step": 8050
    },
    {
      "MSE": 619.539402567546,
      "MSE/layer0": 619.539402567546,
      "dead_code_fraction": 0.18665,
      "dead_code_fraction/layer0": 0.18665,
      "epoch": 1.33,
      "input_norm": 31.998598492940268,
      "input_norm/layer0": 31.998598492940268,
      "learning_rate": 0.0005,
      "loss": 2.1113,
      "max_norm": 72.88322448730469,
      "max_norm/layer0": 72.88322448730469,
      "mean_norm": 44.251609802246094,
      "mean_norm/layer0": 44.251609802246094,
      "multicode_k": 1,
      "output_norm": 18.939144274393726,
      "output_norm/layer0": 18.939144274393726,
      "step": 8100
    },
    {
      "MSE": 617.7248203531905,
      "MSE/layer0": 617.7248203531905,
      "dead_code_fraction": 0.18555,
      "dead_code_fraction/layer0": 0.18555,
      "epoch": 1.34,
      "input_norm": 31.99861437161764,
      "input_norm/layer0": 31.99861437161764,
      "learning_rate": 0.0005,
      "loss": 2.1592,
      "max_norm": 72.97504425048828,
      "max_norm/layer0": 72.97504425048828,
      "mean_norm": 44.289913177490234,
      "mean_norm/layer0": 44.289913177490234,
      "multicode_k": 1,
      "output_norm": 18.963457323710102,
      "output_norm/layer0": 18.963457323710102,
      "step": 8150
    },
    {
      "MSE": 617.1626446533202,
      "MSE/layer0": 617.1626446533202,
      "dead_code_fraction": 0.1856,
      "dead_code_fraction/layer0": 0.1856,
      "epoch": 1.34,
      "input_norm": 31.998610553741443,
      "input_norm/layer0": 31.998610553741443,
      "learning_rate": 0.0005,
      "loss": 2.1339,
      "max_norm": 73.06546020507812,
      "max_norm/layer0": 73.06546020507812,
      "mean_norm": 44.32819747924805,
      "mean_norm/layer0": 44.32819747924805,
      "multicode_k": 1,
      "output_norm": 18.980771627426144,
      "output_norm/layer0": 18.980771627426144,
      "step": 8200
    },
    {
      "MSE": 616.5359758504233,
      "MSE/layer0": 616.5359758504233,
      "dead_code_fraction": 0.18785,
      "dead_code_fraction/layer0": 0.18785,
      "epoch": 1.35,
      "input_norm": 31.99861484845479,
      "input_norm/layer0": 31.99861484845479,
      "learning_rate": 0.0005,
      "loss": 2.1287,
      "max_norm": 73.1684341430664,
      "max_norm/layer0": 73.1684341430664,
      "mean_norm": 44.36627197265625,
      "mean_norm/layer0": 44.36627197265625,
      "multicode_k": 1,
      "output_norm": 19.002285525004055,
      "output_norm/layer0": 19.002285525004055,
      "step": 8250
    },
    {
      "MSE": 616.9324924723311,
      "MSE/layer0": 616.9324924723311,
      "dead_code_fraction": 0.18715,
      "dead_code_fraction/layer0": 0.18715,
      "epoch": 1.35,
      "input_norm": 31.998625895182286,
      "input_norm/layer0": 31.998625895182286,
      "learning_rate": 0.0005,
      "loss": 2.1575,
      "max_norm": 73.259521484375,
      "max_norm/layer0": 73.259521484375,
      "mean_norm": 44.40446090698242,
      "mean_norm/layer0": 44.40446090698242,
      "multicode_k": 1,
      "output_norm": 18.992992315292362,
      "output_norm/layer0": 18.992992315292362,
      "step": 8300
    },
    {
      "MSE": 616.2650039672851,
      "MSE/layer0": 616.2650039672851,
      "dead_code_fraction": 0.18655,
      "dead_code_fraction/layer0": 0.18655,
      "epoch": 1.36,
      "input_norm": 31.99862662315369,
      "input_norm/layer0": 31.99862662315369,
      "learning_rate": 0.0005,
      "loss": 2.139,
      "max_norm": 73.36270141601562,
      "max_norm/layer0": 73.36270141601562,
      "mean_norm": 44.44254493713379,
      "mean_norm/layer0": 44.44254493713379,
      "multicode_k": 1,
      "output_norm": 19.00672375679015,
      "output_norm/layer0": 19.00672375679015,
      "step": 8350
    },
    {
      "MSE": 615.5159185791019,
      "MSE/layer0": 615.5159185791019,
      "dead_code_fraction": 0.18685,
      "dead_code_fraction/layer0": 0.18685,
      "epoch": 1.36,
      "input_norm": 31.998618663152055,
      "input_norm/layer0": 31.998618663152055,
      "learning_rate": 0.0005,
      "loss": 2.1207,
      "max_norm": 73.45561981201172,
      "max_norm/layer0": 73.45561981201172,
      "mean_norm": 44.48077201843262,
      "mean_norm/layer0": 44.48077201843262,
      "multicode_k": 1,
      "output_norm": 19.030768597920748,
      "output_norm/layer0": 19.030768597920748,
      "step": 8400
    },
    {
      "MSE": 615.7112675984704,
      "MSE/layer0": 615.7112675984704,
      "dead_code_fraction": 0.18675,
      "dead_code_fraction/layer0": 0.18675,
      "epoch": 1.37,
      "input_norm": 31.99863114674885,
      "input_norm/layer0": 31.99863114674885,
      "learning_rate": 0.0005,
      "loss": 2.1394,
      "max_norm": 73.54468536376953,
      "max_norm/layer0": 73.54468536376953,
      "mean_norm": 44.5194206237793,
      "mean_norm/layer0": 44.5194206237793,
      "multicode_k": 1,
      "output_norm": 19.03362373669942,
      "output_norm/layer0": 19.03362373669942,
      "step": 8450
    },
    {
      "MSE": 615.0864140828453,
      "MSE/layer0": 615.0864140828453,
      "dead_code_fraction": 0.1866,
      "dead_code_fraction/layer0": 0.1866,
      "epoch": 1.37,
      "input_norm": 31.9986399269104,
      "input_norm/layer0": 31.9986399269104,
      "learning_rate": 0.0005,
      "loss": 2.1471,
      "max_norm": 73.64068603515625,
      "max_norm/layer0": 73.64068603515625,
      "mean_norm": 44.55780220031738,
      "mean_norm/layer0": 44.55780220031738,
      "multicode_k": 1,
      "output_norm": 19.04360143979391,
      "output_norm/layer0": 19.04360143979391,
      "step": 8500
    },
    {
      "epoch": 1.37,
      "eval_MSE/layer0": 613.7248421548741,
      "eval_accuracy": 0.5081896395873495,
      "eval_dead_code_fraction/layer0": 0.1885,
      "eval_input_norm/layer0": 31.998632826486393,
      "eval_loss": 2.1443779468536377,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 19.066619998676906,
      "eval_runtime": 158.5923,
      "eval_samples_per_second": 29.15,
      "eval_steps_per_second": 1.822,
      "step": 8500
    },
    {
      "MSE": 614.1585445149744,
      "MSE/layer0": 614.1585445149744,
      "dead_code_fraction": 0.18715,
      "dead_code_fraction/layer0": 0.18715,
      "epoch": 1.38,
      "input_norm": 31.99863867441813,
      "input_norm/layer0": 31.99863867441813,
      "learning_rate": 0.0005,
      "loss": 2.1506,
      "max_norm": 73.73002624511719,
      "max_norm/layer0": 73.73002624511719,
      "mean_norm": 44.597002029418945,
      "mean_norm/layer0": 44.597002029418945,
      "multicode_k": 1,
      "output_norm": 19.06499721844991,
      "output_norm/layer0": 19.06499721844991,
      "step": 8550
    },
    {
      "MSE": 614.256539204915,
      "MSE/layer0": 614.256539204915,
      "dead_code_fraction": 0.1879,
      "dead_code_fraction/layer0": 0.1879,
      "epoch": 1.38,
      "input_norm": 31.998648173014317,
      "input_norm/layer0": 31.998648173014317,
      "learning_rate": 0.0005,
      "loss": 2.1643,
      "max_norm": 73.80333709716797,
      "max_norm/layer0": 73.80333709716797,
      "mean_norm": 44.63543891906738,
      "mean_norm/layer0": 44.63543891906738,
      "multicode_k": 1,
      "output_norm": 19.078293412526467,
      "output_norm/layer0": 19.078293412526467,
      "step": 8600
    },
    {
      "MSE": 613.3546946207681,
      "MSE/layer0": 613.3546946207681,
      "dead_code_fraction": 0.1879,
      "dead_code_fraction/layer0": 0.1879,
      "epoch": 1.39,
      "input_norm": 31.99864864667257,
      "input_norm/layer0": 31.99864864667257,
      "learning_rate": 0.0005,
      "loss": 2.1535,
      "max_norm": 73.89517974853516,
      "max_norm/layer0": 73.89517974853516,
      "mean_norm": 44.674211502075195,
      "mean_norm/layer0": 44.674211502075195,
      "multicode_k": 1,
      "output_norm": 19.09559381167095,
      "output_norm/layer0": 19.09559381167095,
      "step": 8650
    },
    {
      "MSE": 613.6053087361654,
      "MSE/layer0": 613.6053087361654,
      "dead_code_fraction": 0.18645,
      "dead_code_fraction/layer0": 0.18645,
      "epoch": 1.39,
      "input_norm": 31.998652140299477,
      "input_norm/layer0": 31.998652140299477,
      "learning_rate": 0.0005,
      "loss": 2.137,
      "max_norm": 73.9770736694336,
      "max_norm/layer0": 73.9770736694336,
      "mean_norm": 44.71265983581543,
      "mean_norm/layer0": 44.71265983581543,
      "multicode_k": 1,
      "output_norm": 19.098618446985878,
      "output_norm/layer0": 19.098618446985878,
      "step": 8700
    },
    {
      "MSE": 613.292506408691,
      "MSE/layer0": 613.292506408691,
      "dead_code_fraction": 0.1876,
      "dead_code_fraction/layer0": 0.1876,
      "epoch": 1.4,
      "input_norm": 31.998654588063562,
      "input_norm/layer0": 31.998654588063562,
      "learning_rate": 0.0005,
      "loss": 2.1482,
      "max_norm": 74.05269622802734,
      "max_norm/layer0": 74.05269622802734,
      "mean_norm": 44.750946044921875,
      "mean_norm/layer0": 44.750946044921875,
      "multicode_k": 1,
      "output_norm": 19.104494848251342,
      "output_norm/layer0": 19.104494848251342,
      "step": 8750
    },
    {
      "MSE": 613.8824895222986,
      "MSE/layer0": 613.8824895222986,
      "dead_code_fraction": 0.1868,
      "dead_code_fraction/layer0": 0.1868,
      "epoch": 1.4,
      "input_norm": 31.998655049006146,
      "input_norm/layer0": 31.998655049006146,
      "learning_rate": 0.0005,
      "loss": 2.1331,
      "max_norm": 74.12651824951172,
      "max_norm/layer0": 74.12651824951172,
      "mean_norm": 44.7886848449707,
      "mean_norm/layer0": 44.7886848449707,
      "multicode_k": 1,
      "output_norm": 19.110120385487882,
      "output_norm/layer0": 19.110120385487882,
      "step": 8800
    },
    {
      "MSE": 613.8568901570636,
      "MSE/layer0": 613.8568901570636,
      "dead_code_fraction": 0.18675,
      "dead_code_fraction/layer0": 0.18675,
      "epoch": 1.41,
      "input_norm": 31.99864878336588,
      "input_norm/layer0": 31.99864878336588,
      "learning_rate": 0.0005,
      "loss": 2.1038,
      "max_norm": 74.20288848876953,
      "max_norm/layer0": 74.20288848876953,
      "mean_norm": 44.82563400268555,
      "mean_norm/layer0": 44.82563400268555,
      "multicode_k": 1,
      "output_norm": 19.120709832509363,
      "output_norm/layer0": 19.120709832509363,
      "step": 8850
    },
    {
      "MSE": 612.8203454589843,
      "MSE/layer0": 612.8203454589843,
      "dead_code_fraction": 0.18635,
      "dead_code_fraction/layer0": 0.18635,
      "epoch": 1.41,
      "input_norm": 31.99866209030152,
      "input_norm/layer0": 31.99866209030152,
      "learning_rate": 0.0005,
      "loss": 2.1619,
      "max_norm": 74.27029418945312,
      "max_norm/layer0": 74.27029418945312,
      "mean_norm": 44.863847732543945,
      "mean_norm/layer0": 44.863847732543945,
      "multicode_k": 1,
      "output_norm": 19.13362557093303,
      "output_norm/layer0": 19.13362557093303,
      "step": 8900
    },
    {
      "MSE": 612.7508836873369,
      "MSE/layer0": 612.7508836873369,
      "dead_code_fraction": 0.1865,
      "dead_code_fraction/layer0": 0.1865,
      "epoch": 1.42,
      "input_norm": 31.998662964502977,
      "input_norm/layer0": 31.998662964502977,
      "learning_rate": 0.0005,
      "loss": 2.1274,
      "max_norm": 74.35165405273438,
      "max_norm/layer0": 74.35165405273438,
      "mean_norm": 44.90276908874512,
      "mean_norm/layer0": 44.90276908874512,
      "multicode_k": 1,
      "output_norm": 19.13368027687074,
      "output_norm/layer0": 19.13368027687074,
      "step": 8950
    },
    {
      "MSE": 611.3088948567707,
      "MSE/layer0": 611.3088948567707,
      "dead_code_fraction": 0.18625,
      "dead_code_fraction/layer0": 0.18625,
      "epoch": 1.42,
      "input_norm": 31.998670199712116,
      "input_norm/layer0": 31.998670199712116,
      "learning_rate": 0.0005,
      "loss": 2.1556,
      "max_norm": 74.43575286865234,
      "max_norm/layer0": 74.43575286865234,
      "mean_norm": 44.94179916381836,
      "mean_norm/layer0": 44.94179916381836,
      "multicode_k": 1,
      "output_norm": 19.165478760401413,
      "output_norm/layer0": 19.165478760401413,
      "step": 9000
    },
    {
      "epoch": 1.42,
      "eval_MSE/layer0": 610.3757424029645,
      "eval_accuracy": 0.5087341142897861,
      "eval_dead_code_fraction/layer0": 0.18805,
      "eval_input_norm/layer0": 31.998659288421646,
      "eval_loss": 2.139230489730835,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 19.181722183648382,
      "eval_runtime": 158.0526,
      "eval_samples_per_second": 29.25,
      "eval_steps_per_second": 1.829,
      "step": 9000
    },
    {
      "MSE": 611.2356985473632,
      "MSE/layer0": 611.2356985473632,
      "dead_code_fraction": 0.1879,
      "dead_code_fraction/layer0": 0.1879,
      "epoch": 1.43,
      "input_norm": 31.998666836420703,
      "input_norm/layer0": 31.998666836420703,
      "learning_rate": 0.0005,
      "loss": 2.1388,
      "max_norm": 74.51050567626953,
      "max_norm/layer0": 74.51050567626953,
      "mean_norm": 44.98063850402832,
      "mean_norm/layer0": 44.98063850402832,
      "multicode_k": 1,
      "output_norm": 19.177389281590777,
      "output_norm/layer0": 19.177389281590777,
      "step": 9050
    },
    {
      "MSE": 610.8344569905598,
      "MSE/layer0": 610.8344569905598,
      "dead_code_fraction": 0.18865,
      "dead_code_fraction/layer0": 0.18865,
      "epoch": 1.43,
      "input_norm": 31.99867141723631,
      "input_norm/layer0": 31.99867141723631,
      "learning_rate": 0.0005,
      "loss": 2.1328,
      "max_norm": 74.59440612792969,
      "max_norm/layer0": 74.59440612792969,
      "mean_norm": 45.01910400390625,
      "mean_norm/layer0": 45.01910400390625,
      "multicode_k": 1,
      "output_norm": 19.185275354385375,
      "output_norm/layer0": 19.185275354385375,
      "step": 9100
    },
    {
      "MSE": 610.7402758789062,
      "MSE/layer0": 610.7402758789062,
      "dead_code_fraction": 0.1871,
      "dead_code_fraction/layer0": 0.1871,
      "epoch": 1.44,
      "input_norm": 31.99866997400921,
      "input_norm/layer0": 31.99866997400921,
      "learning_rate": 0.0005,
      "loss": 2.117,
      "max_norm": 74.67122650146484,
      "max_norm/layer0": 74.67122650146484,
      "mean_norm": 45.05727577209473,
      "mean_norm/layer0": 45.05727577209473,
      "multicode_k": 1,
      "output_norm": 19.190109596252437,
      "output_norm/layer0": 19.190109596252437,
      "step": 9150
    },
    {
      "MSE": 610.1339531453451,
      "MSE/layer0": 610.1339531453451,
      "dead_code_fraction": 0.18745,
      "dead_code_fraction/layer0": 0.18745,
      "epoch": 1.44,
      "input_norm": 31.998679358164473,
      "input_norm/layer0": 31.998679358164473,
      "learning_rate": 0.0005,
      "loss": 2.1459,
      "max_norm": 74.7430419921875,
      "max_norm/layer0": 74.7430419921875,
      "mean_norm": 45.095571517944336,
      "mean_norm/layer0": 45.095571517944336,
      "multicode_k": 1,
      "output_norm": 19.203376553853335,
      "output_norm/layer0": 19.203376553853335,
      "step": 9200
    },
    {
      "MSE": 609.6957601928709,
      "MSE/layer0": 609.6957601928709,
      "dead_code_fraction": 0.1878,
      "dead_code_fraction/layer0": 0.1878,
      "epoch": 1.45,
      "input_norm": 31.99868172009785,
      "input_norm/layer0": 31.99868172009785,
      "learning_rate": 0.0005,
      "loss": 2.142,
      "max_norm": 74.8177490234375,
      "max_norm/layer0": 74.8177490234375,
      "mean_norm": 45.133853912353516,
      "mean_norm/layer0": 45.133853912353516,
      "multicode_k": 1,
      "output_norm": 19.22210531552632,
      "output_norm/layer0": 19.22210531552632,
      "step": 9250
    },
    {
      "MSE": 609.5997785441082,
      "MSE/layer0": 609.5997785441082,
      "dead_code_fraction": 0.18805,
      "dead_code_fraction/layer0": 0.18805,
      "epoch": 1.45,
      "input_norm": 31.998693205515544,
      "input_norm/layer0": 31.998693205515544,
      "learning_rate": 0.0005,
      "loss": 2.18,
      "max_norm": 74.87744140625,
      "max_norm/layer0": 74.87744140625,
      "mean_norm": 45.172555923461914,
      "mean_norm/layer0": 45.172555923461914,
      "multicode_k": 1,
      "output_norm": 19.226630802154542,
      "output_norm/layer0": 19.226630802154542,
      "step": 9300
    },
    {
      "MSE": 609.8342389933271,
      "MSE/layer0": 609.8342389933271,
      "dead_code_fraction": 0.18735,
      "dead_code_fraction/layer0": 0.18735,
      "epoch": 1.46,
      "input_norm": 31.998687505722053,
      "input_norm/layer0": 31.998687505722053,
      "learning_rate": 0.0005,
      "loss": 2.1164,
      "max_norm": 74.94609069824219,
      "max_norm/layer0": 74.94609069824219,
      "mean_norm": 45.21059799194336,
      "mean_norm/layer0": 45.21059799194336,
      "multicode_k": 1,
      "output_norm": 19.234882882436114,
      "output_norm/layer0": 19.234882882436114,
      "step": 9350
    },
    {
      "MSE": 609.2034523518882,
      "MSE/layer0": 609.2034523518882,
      "dead_code_fraction": 0.1869,
      "dead_code_fraction/layer0": 0.1869,
      "epoch": 1.46,
      "input_norm": 31.99869050979616,
      "input_norm/layer0": 31.99869050979616,
      "learning_rate": 0.0005,
      "loss": 2.1316,
      "max_norm": 75.01142883300781,
      "max_norm/layer0": 75.01142883300781,
      "mean_norm": 45.248979568481445,
      "mean_norm/layer0": 45.248979568481445,
      "multicode_k": 1,
      "output_norm": 19.247848326365144,
      "output_norm/layer0": 19.247848326365144,
      "step": 9400
    },
    {
      "MSE": 609.0324313354497,
      "MSE/layer0": 609.0324313354497,
      "dead_code_fraction": 0.18745,
      "dead_code_fraction/layer0": 0.18745,
      "epoch": 1.47,
      "input_norm": 31.99869132041931,
      "input_norm/layer0": 31.99869132041931,
      "learning_rate": 0.0005,
      "loss": 2.1214,
      "max_norm": 75.07112121582031,
      "max_norm/layer0": 75.07112121582031,
      "mean_norm": 45.287214279174805,
      "mean_norm/layer0": 45.287214279174805,
      "multicode_k": 1,
      "output_norm": 19.25519768079122,
      "output_norm/layer0": 19.25519768079122,
      "step": 9450
    },
    {
      "MSE": 607.8594933064783,
      "MSE/layer0": 607.8594933064783,
      "dead_code_fraction": 0.18835,
      "dead_code_fraction/layer0": 0.18835,
      "epoch": 1.47,
      "input_norm": 31.998687744140625,
      "input_norm/layer0": 31.998687744140625,
      "learning_rate": 0.0005,
      "loss": 2.1067,
      "max_norm": 75.15766143798828,
      "max_norm/layer0": 75.15766143798828,
      "mean_norm": 45.32560920715332,
      "mean_norm/layer0": 45.32560920715332,
      "multicode_k": 1,
      "output_norm": 19.27704188664754,
      "output_norm/layer0": 19.27704188664754,
      "step": 9500
    },
    {
      "epoch": 1.47,
      "eval_MSE/layer0": 608.6866096036146,
      "eval_accuracy": 0.5090880757079915,
      "eval_dead_code_fraction/layer0": 0.18755,
      "eval_input_norm/layer0": 31.998685899710146,
      "eval_loss": 2.1350600719451904,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 19.283631281241068,
      "eval_runtime": 158.1797,
      "eval_samples_per_second": 29.226,
      "eval_steps_per_second": 1.827,
      "step": 9500
    },
    {
      "MSE": 607.5302533983886,
      "MSE/layer0": 607.5302533983886,
      "dead_code_fraction": 0.1872,
      "dead_code_fraction/layer0": 0.1872,
      "epoch": 1.48,
      "input_norm": 31.99869025141972,
      "input_norm/layer0": 31.99869025141972,
      "learning_rate": 0.0005,
      "loss": 2.1075,
      "max_norm": 75.2263412475586,
      "max_norm/layer0": 75.2263412475586,
      "mean_norm": 45.363752365112305,
      "mean_norm/layer0": 45.363752365112305,
      "multicode_k": 1,
      "output_norm": 19.2927733112995,
      "output_norm/layer0": 19.2927733112995,
      "step": 9550
    },
    {
      "MSE": 608.902215973978,
      "MSE/layer0": 608.902215973978,
      "dead_code_fraction": 0.187,
      "dead_code_fraction/layer0": 0.187,
      "epoch": 2.0,
      "input_norm": 31.998686492629858,
      "input_norm/layer0": 31.998686492629858,
      "learning_rate": 0.0005,
      "loss": 2.1013,
      "max_norm": 75.294677734375,
      "max_norm/layer0": 75.294677734375,
      "mean_norm": 45.40024948120117,
      "mean_norm/layer0": 45.40024948120117,
      "multicode_k": 1,
      "output_norm": 19.268582361188244,
      "output_norm/layer0": 19.268582361188244,
      "step": 9600
    },
    {
      "MSE": 606.3796120198567,
      "MSE/layer0": 606.3796120198567,
      "dead_code_fraction": 0.18715,
      "dead_code_fraction/layer0": 0.18715,
      "epoch": 2.01,
      "input_norm": 31.998710851669312,
      "input_norm/layer0": 31.998710851669312,
      "learning_rate": 0.0005,
      "loss": 2.17,
      "max_norm": 75.35186004638672,
      "max_norm/layer0": 75.35186004638672,
      "mean_norm": 45.4382266998291,
      "mean_norm/layer0": 45.4382266998291,
      "multicode_k": 1,
      "output_norm": 19.314183537165327,
      "output_norm/layer0": 19.314183537165327,
      "step": 9650
    },
    {
      "MSE": 606.9239878336591,
      "MSE/layer0": 606.9239878336591,
      "dead_code_fraction": 0.1877,
      "dead_code_fraction/layer0": 0.1877,
      "epoch": 2.01,
      "input_norm": 31.99869126637776,
      "input_norm/layer0": 31.99869126637776,
      "learning_rate": 0.0005,
      "loss": 2.0661,
      "max_norm": 75.44601440429688,
      "max_norm/layer0": 75.44601440429688,
      "mean_norm": 45.47653579711914,
      "mean_norm/layer0": 45.47653579711914,
      "multicode_k": 1,
      "output_norm": 19.313949975967407,
      "output_norm/layer0": 19.313949975967407,
      "step": 9700
    },
    {
      "MSE": 606.1468785603844,
      "MSE/layer0": 606.1468785603844,
      "dead_code_fraction": 0.18755,
      "dead_code_fraction/layer0": 0.18755,
      "epoch": 2.02,
      "input_norm": 31.998706903457652,
      "input_norm/layer0": 31.998706903457652,
      "learning_rate": 0.0005,
      "loss": 2.1325,
      "max_norm": 75.6237564086914,
      "max_norm/layer0": 75.6237564086914,
      "mean_norm": 45.51473808288574,
      "mean_norm/layer0": 45.51473808288574,
      "multicode_k": 1,
      "output_norm": 19.331538470586143,
      "output_norm/layer0": 19.331538470586143,
      "step": 9750
    },
    {
      "MSE": 606.2908910115561,
      "MSE/layer0": 606.2908910115561,
      "dead_code_fraction": 0.18715,
      "dead_code_fraction/layer0": 0.18715,
      "epoch": 2.02,
      "input_norm": 31.998702777226768,
      "input_norm/layer0": 31.998702777226768,
      "learning_rate": 0.0005,
      "loss": 2.0999,
      "max_norm": 75.77623748779297,
      "max_norm/layer0": 75.77623748779297,
      "mean_norm": 45.55307388305664,
      "mean_norm/layer0": 45.55307388305664,
      "multicode_k": 1,
      "output_norm": 19.340178826649982,
      "output_norm/layer0": 19.340178826649982,
      "step": 9800
    },
    {
      "MSE": 605.7215723673501,
      "MSE/layer0": 605.7215723673501,
      "dead_code_fraction": 0.18635,
      "dead_code_fraction/layer0": 0.18635,
      "epoch": 2.03,
      "input_norm": 31.998708073298122,
      "input_norm/layer0": 31.998708073298122,
      "learning_rate": 0.0005,
      "loss": 2.1015,
      "max_norm": 75.92095184326172,
      "max_norm/layer0": 75.92095184326172,
      "mean_norm": 45.591548919677734,
      "mean_norm/layer0": 45.591548919677734,
      "multicode_k": 1,
      "output_norm": 19.351260058085124,
      "output_norm/layer0": 19.351260058085124,
      "step": 9850
    },
    {
      "MSE": 605.7307819620769,
      "MSE/layer0": 605.7307819620769,
      "dead_code_fraction": 0.1879,
      "dead_code_fraction/layer0": 0.1879,
      "epoch": 2.03,
      "input_norm": 31.99871432304383,
      "input_norm/layer0": 31.99871432304383,
      "learning_rate": 0.0005,
      "loss": 2.1079,
      "max_norm": 76.06104278564453,
      "max_norm/layer0": 76.06104278564453,
      "mean_norm": 45.62945747375488,
      "mean_norm/layer0": 45.62945747375488,
      "multicode_k": 1,
      "output_norm": 19.36078415234882,
      "output_norm/layer0": 19.36078415234882,
      "step": 9900
    },
    {
      "MSE": 605.7736006673174,
      "MSE/layer0": 605.7736006673174,
      "dead_code_fraction": 0.1873,
      "dead_code_fraction/layer0": 0.1873,
      "epoch": 2.04,
      "input_norm": 31.99871180534363,
      "input_norm/layer0": 31.99871180534363,
      "learning_rate": 0.0005,
      "loss": 2.102,
      "max_norm": 76.22486877441406,
      "max_norm/layer0": 76.22486877441406,
      "mean_norm": 45.66733360290527,
      "mean_norm/layer0": 45.66733360290527,
      "multicode_k": 1,
      "output_norm": 19.36815209388733,
      "output_norm/layer0": 19.36815209388733,
      "step": 9950
    },
    {
      "MSE": 604.9809751383466,
      "MSE/layer0": 604.9809751383466,
      "dead_code_fraction": 0.1872,
      "dead_code_fraction/layer0": 0.1872,
      "epoch": 2.04,
      "input_norm": 31.998728539148978,
      "input_norm/layer0": 31.998728539148978,
      "learning_rate": 0.0005,
      "loss": 2.1536,
      "max_norm": 76.40007019042969,
      "max_norm/layer0": 76.40007019042969,
      "mean_norm": 45.70543670654297,
      "mean_norm/layer0": 45.70543670654297,
      "multicode_k": 1,
      "output_norm": 19.38911464373271,
      "output_norm/layer0": 19.38911464373271,
      "step": 10000
    },
    {
      "epoch": 2.04,
      "eval_MSE/layer0": 604.5096733395267,
      "eval_accuracy": 0.5091345939349958,
      "eval_dead_code_fraction/layer0": 0.18795,
      "eval_input_norm/layer0": 31.99872850438308,
      "eval_loss": 2.132894992828369,
      "eval_multicode_k": 1,
      "eval_output_norm/layer0": 19.389702240368152,
      "eval_runtime": 158.9177,
      "eval_samples_per_second": 29.091,
      "eval_steps_per_second": 1.819,
      "step": 10000
    },
    {
      "MSE": 0.0,
      "MSE/layer0": 0.0,
      "dead_code_fraction": 1.0,
      "dead_code_fraction/layer0": 1.0,
      "epoch": 2.04,
      "input_norm": 0.0,
      "input_norm/layer0": 0.0,
      "max_norm": 76.40007019042969,
      "max_norm/layer0": 76.40007019042969,
      "mean_norm": 45.70543670654297,
      "mean_norm/layer0": 45.70543670654297,
      "multicode_k": 1,
      "output_norm": 0.0,
      "output_norm/layer0": 0.0,
      "step": 10000,
      "total_flos": 7.43098011353088e+16,
      "train_loss": 2.325971780395508,
      "train_runtime": 15639.0026,
      "train_samples_per_second": 61.385,
      "train_steps_per_second": 0.639
    }
  ],
  "logging_steps": 50,
  "max_steps": 10000,
  "num_train_epochs": 9223372036854775807,
  "save_steps": 500,
  "total_flos": 7.43098011353088e+16,
  "trial_name": null,
  "trial_params": null
}